Break long lines in debian/control
[idzebra-moved-to-github.git] / dict / scan.c
index 5eaa727..76032f3 100644 (file)
@@ -1,74 +1,55 @@
-/*
- * Copyright (C) 1994-1999, Index Data
- * All rights reserved.
- * Sebastian Hammer, Adam Dickmeiss
- *
- * $Log: scan.c,v $
- * Revision 1.12  1999-02-02 14:50:28  adam
- * Updated WIN32 code specific sections. Changed header.
- *
- * Revision 1.11  1998/06/22 11:34:45  adam
- * Changed scan callback function so it doesn't stop further scanning.
- *
- * Revision 1.10  1998/03/06 16:58:04  adam
- * Fixed bug which related to scanning of large indexes.
- *
- * Revision 1.9  1997/10/27 14:33:04  adam
- * Moved towards generic character mapping depending on "structure"
- * field in abstract syntax file. Fixed a few memory leaks. Fixed
- * bug with negative integers when doing searches with relational
- * operators.
- *
- * Revision 1.8  1996/02/02 13:43:52  adam
- * The public functions simply use char instead of Dict_char to represent
- * search strings. Dict_char is used internally only.
- *
- * Revision 1.7  1995/12/11  09:04:50  adam
- * Bug fix: the lookup/scan/lookgrep didn't handle empty dictionary.
- *
- * Revision 1.6  1995/11/20  11:58:04  adam
- * Support for YAZ in standard located directories, such as /usr/local/..
- *
- * Revision 1.5  1995/10/09  16:18:32  adam
- * Function dict_lookup_grep got extra client data parameter.
- *
- * Revision 1.4  1995/10/06  13:52:00  adam
- * Bug fixes. Handler may abort further scanning.
- *
- * Revision 1.3  1995/10/06  11:06:07  adam
- * Bug fixes.
- *
- * Revision 1.2  1995/10/06  10:43:16  adam
- * Minor changes.
- *
- * Revision 1.1  1995/10/06  09:04:18  adam
- * First version of scan.
- *
- */
+/* This file is part of the Zebra server.
+   Copyright (C) 1994-2011 Index Data
+
+   Zebra is free software; you can redistribute it and/or modify it under
+   the terms of the GNU General Public License as published by the Free
+   Software Foundation; either version 2, or (at your option) any later
+   version.
+
+   Zebra is distributed in the hope that it will be useful, but WITHOUT ANY
+   WARRANTY; without even the implied warranty of MERCHANTABILITY or
+   FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
+   for more details.
+
+   You should have received a copy of the GNU General Public License
+   along with this program; if not, write to the Free Software
+   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
+
+*/
+
+
+#if HAVE_CONFIG_H
+#include <config.h>
+#endif
 #include <stdlib.h>
 #include <string.h>
 #include <stdio.h>
 #include <assert.h>
 
-#include <dict.h>
+#include "dict-p.h"
 
-int dict_scan_trav (Dict dict, Dict_ptr ptr, int pos, Dict_char *str, 
-                   int start, int *count, void *client,
-                    int (*userfunc)(char *, const char *, int, void *),
-                   int dir)
+static void scan_direction(Dict dict, Dict_ptr ptr, int pos, Dict_char *str, 
+                           int start, int *count, void *client,
+                           int (*userfunc)(char *, const char *, int, void *),
+                           int dir)
 {
     int lo, hi, j;
     void *p;
     short *indxp;
     char *info;
 
-    dict_bf_readp (dict->dbf, ptr, &p);
+    dict_bf_readp(dict->dbf, ptr, &p);
     hi = DICT_nodir(p)-1;
-    if (start == 0 && dir == -1)
-        lo = hi;
-    else
+    if (start != -1)
         lo = start;
-    indxp = (short*) ((char*) p+DICT_pagesize(dict)-sizeof(short)); 
+    else
+    {
+        if (dir == -1)
+            lo = hi;
+        else
+            lo = 0;
+    }
+    indxp = (short*) ((char*) p+DICT_bsize(p)-sizeof(short)); 
 
     while (lo <= hi && lo >= 0 && *count > 0)
     {
@@ -82,9 +63,13 @@ int dict_scan_trav (Dict dict, Dict_ptr ptr, int pos, Dict_char *str,
             for (j = 0; info[j] != DICT_EOS; j++)
                str[pos+j] = info[j];
             str[pos+j] = DICT_EOS;
-            (*userfunc)((char*) str, info+(j+1)*sizeof(Dict_char),
-                            *count * dir, client);
-            --(*count);
+            if ((*userfunc)((char*) str, info+(j+1)*sizeof(Dict_char),
+                            *count * dir, client))
+            {
+                *count = 0;
+            }
+            else
+                --(*count);
         }
         else
         {
@@ -97,32 +82,46 @@ int dict_scan_trav (Dict dict, Dict_ptr ptr, int pos, Dict_char *str,
             /* char *               information */
 
             info = (char*)p - indxp[-lo];
-            memcpy (&dc, info+sizeof(Dict_ptr), sizeof(Dict_char));
+            memcpy(&dc, info+sizeof(Dict_ptr), sizeof(Dict_char));
             str[pos] = dc;
-           memcpy (&subptr, info, sizeof(Dict_ptr));
-           if (info[sizeof(Dict_ptr)+sizeof(Dict_char)])
+           memcpy(&subptr, info, sizeof(Dict_ptr));
+           if (dir>0 && info[sizeof(Dict_ptr)+sizeof(Dict_char)])
             {
-                 str[pos+1] = DICT_EOS;
-                 if ((*userfunc)((char*) str,
-                                 info+sizeof(Dict_ptr)+sizeof(Dict_char),
-                                 *count * dir, client))
-                     return 1;
-                 --(*count);
+                str[pos+1] = DICT_EOS;
+                if ((*userfunc)((char*) str,
+                                info+sizeof(Dict_ptr)+sizeof(Dict_char),
+                                *count * dir, client))
+                {
+                    *count = 0;
+                }
+                else
+                    --(*count);
             }
-            if (*count > 0 && subptr)
+            if (*count>0 && subptr)
             {
-               dict_scan_trav (dict, subptr, pos+1, str, 0, count, 
-                                client, userfunc, dir);
-                dict_bf_readp (dict->dbf, ptr, &p);
-                indxp = (short*) ((char*) p+DICT_pagesize(dict)-sizeof(short)); 
+               scan_direction(dict, subptr, pos+1, str, -1, count, 
+                               client, userfunc, dir);
+                dict_bf_readp(dict->dbf, ptr, &p);
+                indxp = (short*) ((char*) p+DICT_bsize(p)-sizeof(short)); 
            }
+           if (*count>0 && dir<0 && info[sizeof(Dict_ptr)+sizeof(Dict_char)])
+            {
+                str[pos+1] = DICT_EOS;
+                if ((*userfunc)((char*) str,
+                                info+sizeof(Dict_ptr)+sizeof(Dict_char),
+                                *count * dir, client))
+                {
+                    *count = 0;
+                }
+                else
+                    --(*count);
+            }
         }
         lo += dir;
     }
-    return 0;
 }
 
-int dict_scan_r (Dict dict, Dict_ptr ptr, int pos, Dict_char *str, 
+void dict_scan_r(Dict dict, Dict_ptr ptr, int pos, Dict_char *str, 
                 int *before, int *after, void *client,
                  int (*userfunc)(char *, const char *, int, void *))
 {
@@ -131,12 +130,12 @@ int dict_scan_r (Dict dict, Dict_ptr ptr, int pos, Dict_char *str,
     short *indxp;
     char *info;
 
-    dict_bf_readp (dict->dbf, ptr, &p);
+    dict_bf_readp(dict->dbf, ptr, &p);
     if (!p)
-        return 0;
+        return;
     mid = lo = 0;
     hi = DICT_nodir(p)-1;
-    indxp = (short*) ((char*) p+DICT_pagesize(dict)-sizeof(short));    
+    indxp = (short*) ((char*) p+DICT_bsize(p)-sizeof(short));
     while (lo <= hi)
     {
         mid = (lo+hi)/2;
@@ -146,16 +145,20 @@ int dict_scan_r (Dict dict, Dict_ptr ptr, int pos, Dict_char *str,
             /* unsigned char        length of information */
             /* char *               information */
            info = (char*)p + indxp[-mid];
-           cmp = dict_strcmp ((Dict_char*) info, str + pos);
+           cmp = dict_strcmp((Dict_char*) info, str + pos);
            if (!cmp)
             {
                 if (*after)
                 {
-                    (*userfunc)((char *) str, info+
-                                (dict_strlen((Dict_char*) info)+1)
-                                *sizeof(Dict_char), 
-                                *after, client);
-                    --(*after);
+                    if ((*userfunc)((char *) str, info+
+                                    (dict_strlen((Dict_char*) info)+1)
+                                    *sizeof(Dict_char), 
+                                    *after, client))
+                    {
+                        *after = 0;
+                    }
+                    else
+                        --(*after);
                 }
                 break;
             }
@@ -170,34 +173,53 @@ int dict_scan_r (Dict dict, Dict_ptr ptr, int pos, Dict_char *str,
             /* unsigned char        length of information */
             /* char *               information */
             info = (char*)p - indxp[-mid];
-            memcpy (&dc, info+sizeof(Dict_ptr), sizeof(Dict_char));
+            memcpy(&dc, info+sizeof(Dict_ptr), sizeof(Dict_char));
            cmp = dc - str[pos];
            if (!cmp)
             {
-               memcpy (&subptr, info, sizeof(Dict_ptr));
+               memcpy(&subptr, info, sizeof(Dict_ptr));
                 if (str[pos+1] == DICT_EOS)
                 {
                    if (info[sizeof(Dict_ptr)+sizeof(Dict_char)])
                     {
                         if (*after)
                         {
-                            (*userfunc)((char*) str,
-                                        info+sizeof(Dict_ptr)+
-                                        sizeof(Dict_char),
-                                        *after, client);
-                            --(*after);
+                            if ((*userfunc)((char*) str,
+                                            info+sizeof(Dict_ptr)+
+                                            sizeof(Dict_char),
+                                            *after, client))
+                            {
+                                *after = 0;
+                            }
+                            else
+                                --(*after);
                         }
                     }
                     if (*after && subptr)
-                       if (dict_scan_trav (dict, subptr, pos+1, str, 0, 
-                                            after, client, userfunc, 1))
-                            return 1;
+                       scan_direction(dict, subptr, pos+1, str, -1, 
+                                       after, client, userfunc, 1);
                 }
-               else if (subptr)
+               else
                 {
-                    if (dict_scan_r (dict, subptr, pos+1, str, before, after,
-                                     client, userfunc))
-                        return 1;
+                    if (subptr)
+                        dict_scan_r(dict, subptr, pos+1, str, before, after,
+                                    client, userfunc);
+                   if (info[sizeof(Dict_ptr)+sizeof(Dict_char)])
+                    {
+                        if (*before)
+                        {
+                            str[pos+1] = DICT_EOS;
+                            if ((*userfunc)((char*) str,
+                                            info+sizeof(Dict_ptr)+
+                                            sizeof(Dict_char),
+                                            - *before, client))
+                            {
+                                *before = 0;
+                            }
+                            else
+                                --(*before);
+                        }
+                    }
                 }
                 break;
             }
@@ -210,30 +232,36 @@ int dict_scan_r (Dict dict, Dict_ptr ptr, int pos, Dict_char *str,
     if (lo>hi && cmp < 0)
         ++mid;
     if (*after)
-        if (dict_scan_trav (dict, ptr, pos, str, cmp ? mid : mid+1, after,
-                            client, userfunc, 1))
-            return 1;
-    if (*before && mid > 1)
-        if (dict_scan_trav (dict, ptr, pos, str, mid-1, before, 
-                            client, userfunc, -1))
-            return 1;
-    return 0;
+        scan_direction(dict, ptr, pos, str, cmp ? mid : mid+1, after,
+                       client, userfunc, 1);
+    if (*before && mid > 0)
+        scan_direction(dict, ptr, pos, str, mid-1, before, 
+                       client, userfunc, -1);
 }
 
-int dict_scan (Dict dict, char *str, int *before, int *after, void *client,
-               int (*f)(char *name, const char *info, int pos, void *client))
+int dict_scan(Dict dict, char *str, int *before, int *after, void *client,
+              int (*f)(char *name, const char *info, int pos, void *client))
 {
     int i;
 
-    logf (LOG_DEBUG, "dict_scan");
+    yaz_log(YLOG_DEBUG, "dict_scan");
     for (i = 0; str[i]; i++)
     {
-       logf (LOG_DEBUG, " %3d  %c", str[i],
-             (str[i] > ' ' && str[i] < 127) ? str[i] : '?');
+       yaz_log(YLOG_DEBUG, "start_term pos %d %3d  %c", i, str[i],
+                (str[i] > ' ' && str[i] < 127) ? str[i] : '?');
     }
-    if (dict->head.last <= 1)
+    if (!dict->head.root)
         return 0;
-    return dict_scan_r (dict, 1, 0, (Dict_char *) str, before, after, client,
-                        f);
+    dict_scan_r(dict, dict->head.root, 0, (Dict_char *) str,
+                before, after, client, f);
+    return 0;
 }
+/*
+ * Local variables:
+ * c-basic-offset: 4
+ * c-file-style: "Stroustrup"
+ * indent-tabs-mode: nil
+ * End:
+ * vim: shiftwidth=4 tabstop=8 expandtab
+ */