renamed record filter module sources
[idzebra-moved-to-github.git] / index / rectext.c
diff --git a/index/rectext.c b/index/rectext.c
deleted file mode 100644 (file)
index cfa97c0..0000000
+++ /dev/null
@@ -1,264 +0,0 @@
-/* This file is part of the Zebra server.
-   Copyright (C) 1995-2008 Index Data
-
-Zebra is free software; you can redistribute it and/or modify it under
-the terms of the GNU General Public License as published by the Free
-Software Foundation; either version 2, or (at your option) any later
-version.
-
-Zebra is distributed in the hope that it will be useful, but WITHOUT ANY
-WARRANTY; without even the implied warranty of MERCHANTABILITY or
-FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
-for more details.
-
-You should have received a copy of the GNU General Public License
-along with this program; if not, write to the Free Software
-Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
-
-*/
-
-
-#include <stdio.h>
-#include <assert.h>
-#include <ctype.h>
-
-#include <idzebra/util.h>
-#include <idzebra/recctrl.h>
-#include <yaz/oid_db.h>
-
-struct filter_info {
-    char *sep;
-};
-
-static void *filter_init(Res res, RecType recType)
-{
-    struct filter_info *tinfo = (struct filter_info *) xmalloc(sizeof(*tinfo));
-    tinfo->sep = 0;
-    return tinfo;
-}
-
-static ZEBRA_RES filter_config(void *clientData, Res res, const char *args)
-{
-    struct filter_info *tinfo = (struct filter_info*) clientData;
-    xfree(tinfo->sep);
-    tinfo->sep = 0;
-    if (args && *args)
-       tinfo->sep = xstrdup(args);
-    return ZEBRA_OK;
-}
-
-static void filter_destroy(void *clientData)
-{
-    struct filter_info *tinfo = clientData;
-    xfree(tinfo->sep);
-    xfree(tinfo);
-}
-
-struct buf_info {
-    struct recExtractCtrl *p;
-    char *buf;
-    int offset;
-    int max;
-};
-
-static struct buf_info *buf_open(struct recExtractCtrl *p)
-{
-    struct buf_info *fi = (struct buf_info *) xmalloc(sizeof(*fi));
-
-    fi->p = p;
-    fi->buf = (char *) xmalloc(4096);
-    fi->offset = 1;
-    fi->max = 1;
-    return fi;
-}
-
-static int buf_getchar(struct filter_info *tinfo, struct buf_info *fi, char *dst)
-{
-    if (fi->offset >= fi->max)
-    {
-        if (fi->max <= 0)
-            return 0;
-        fi->max = fi->p->stream->readf(fi->p->stream, fi->buf, 4096);
-        fi->offset = 0;
-        if (fi->max <= 0)
-            return 0;
-    }
-    *dst = fi->buf[(fi->offset)++];
-    if (tinfo->sep && *dst == *tinfo->sep)
-    {
-       off_t off = fi->p->stream->tellf(fi->p->stream);
-        off_t end_offset = off - (fi->max - fi->offset);
-       fi->p->stream->endf(fi->p->stream, &end_offset);
-       return 0;
-    }
-    return 1;
-}
-
-static void buf_close(struct buf_info *fi)
-{
-    xfree(fi->buf);
-    xfree(fi);
-}
-
-static int filter_extract(void *clientData, struct recExtractCtrl *p)
-{
-    struct filter_info *tinfo = clientData;
-    char w[512];
-    RecWord recWord;
-    int r;
-    struct buf_info *fi = buf_open(p);
-    int no_read = 0;
-
-#if 0
-    yaz_log(YLOG_LOG, "filter_extract off=%ld",
-           (long) (*fi->p->tellf)(fi->p->fh));
-#endif
-    (*p->init)(p, &recWord);
-    do
-    {
-        int i = 0;
-            
-        r = buf_getchar(tinfo, fi, w);
-        while (r > 0 && i < 511 && w[i] != '\n' && w[i] != '\r')
-        {
-            i++;
-            r = buf_getchar(tinfo, fi, w + i); 
-       }
-        if (i)
-        {
-           no_read += i;
-            recWord.term_buf = w;
-           recWord.term_len = i;
-            (*p->tokenAdd)(&recWord);
-        }
-    } while (r > 0);
-    buf_close(fi);
-    if (no_read == 0)
-       return RECCTRL_EXTRACT_EOF;
-    return RECCTRL_EXTRACT_OK;
-}
-
-static int filter_retrieve(void *clientData, struct recRetrieveCtrl *p)
-{
-    int r, filter_ptr = 0;
-    static char *filter_buf = NULL;
-    static int filter_size = 0;
-    int make_header = 1;
-    int make_body = 1;
-    const char *elementSetName = NULL;
-    int no_lines = 0;
-
-    if (p->comp && p->comp->which == Z_RecordComp_simple &&
-        p->comp->u.simple->which == Z_ElementSetNames_generic)
-        elementSetName = p->comp->u.simple->u.generic;
-
-    if (elementSetName)
-    {
-       /* don't make header for the R(aw) element set name */
-       if (!strcmp(elementSetName, "R"))
-       {
-           make_header = 0;
-           make_body = 1;
-       }
-       /* only make header for the H(eader) element set name */
-       else if (!strcmp(elementSetName, "H"))
-       {
-           make_header = 1;
-           make_body = 0;
-       }
-    }
-    while (1)
-    {
-        if (filter_ptr + 4096 >= filter_size)
-        {
-            char *nb;
-
-            filter_size = 2*filter_size + 8192;
-            nb = (char *) xmalloc(filter_size);
-            if (filter_buf)
-            {
-                memcpy(nb, filter_buf, filter_ptr);
-                xfree(filter_buf);
-            }
-            filter_buf = nb;
-        }
-        if (make_header && filter_ptr == 0)
-        {
-            if (p->score >= 0)
-            {
-                sprintf(filter_buf, "Rank: %d\n", p->score);
-                filter_ptr = strlen(filter_buf);
-            }
-            sprintf(filter_buf + filter_ptr, "Local Number: " ZINT_FORMAT "\n",
-                    p->localno);
-            filter_ptr = strlen(filter_buf);
-           if (p->fname)
-           {
-               sprintf(filter_buf + filter_ptr, "Filename: %s\n", p->fname);
-               filter_ptr = strlen(filter_buf);
-           }
-           strcpy(filter_buf+filter_ptr++, "\n");
-        }
-       if (!make_body)
-           break;
-        r = p->stream->readf(p->stream, filter_buf + filter_ptr, 4096);
-        if (r <= 0)
-            break;
-        filter_ptr += r;
-    }
-    filter_buf[filter_ptr] = '\0';
-    if (elementSetName)
-    {
-        if (!strcmp(elementSetName, "B"))
-            no_lines = 4;
-        if (!strcmp(elementSetName, "M"))
-            no_lines = 20;
-    }
-    if (no_lines)
-    {
-        char *p = filter_buf;
-        int i = 0;
-
-        while (++i <= no_lines && (p = strchr(p, '\n')))
-            p++;
-        if (p)
-        {
-            p[1] = '\0';
-            filter_ptr = p-filter_buf;
-        }
-    }
-    p->output_format = yaz_oid_recsyn_sutrs;
-    p->rec_buf = filter_buf;
-    p->rec_len = filter_ptr; 
-    return 0;
-}
-
-static struct recType filter_type = {
-    0,
-    "text",
-    filter_init,
-    filter_config,
-    filter_destroy,
-    filter_extract,
-    filter_retrieve
-};
-
-RecType
-#ifdef IDZEBRA_STATIC_TEXT
-idzebra_filter_text
-#else
-idzebra_filter
-#endif
-
-[] = {
-    &filter_type,
-    0,
-};
-/*
- * Local variables:
- * c-basic-offset: 4
- * indent-tabs-mode: nil
- * End:
- * vim: shiftwidth=4 tabstop=8 expandtab
- */
-