X-Git-Url: http://git.indexdata.com/?a=blobdiff_plain;f=index%2Fkinput.c;h=9b7b8b2721c5f6fade873af65624a5907278eb6a;hb=b8e1425a7f78791afbf45dc11acd82808e455c65;hp=e8d154a8a712bb2c5b0dda2260db3782591154be;hpb=764b78fb481cf1084a5a583ffefbe8a0f32af28c;p=idzebra-moved-to-github.git diff --git a/index/kinput.c b/index/kinput.c index e8d154a..9b7b8b2 100644 --- a/index/kinput.c +++ b/index/kinput.c @@ -3,7 +3,7 @@ * All rights reserved. * Sebastian Hammer, Adam Dickmeiss, Heikki Levanto * - * $Id: kinput.c,v 1.49 2002-04-16 22:31:42 adam Exp $ + * $Id: kinput.c,v 1.51 2002-07-12 18:12:22 heikki Exp $ * * Bugs * - Allocates a lot of memory for the merge process, but never releases it. @@ -435,6 +435,27 @@ int heap_inpc (struct heap_info *hi) return 0; } +/* for debugging only */ +static void print_dict_item (ZebraMaps zm, const char *s) +{ + int reg_type = s[1]; + char keybuf[IT_MAX_WORD+1]; + char *to = keybuf; + const char *from = s + 2; + + while (*from) + { + const char *res = zebra_maps_output (zm, reg_type, &from); + if (!res) + *to++ = *from++; + else + while (*res) + *to++ = *res++; + } + *to = '\0'; + yaz_log (LOG_LOG, "%s", keybuf); +} + int heap_inpb (struct heap_info *hi) { struct heap_cread_info hci; @@ -457,6 +478,10 @@ int heap_inpb (struct heap_info *hi) strcpy (this_name, hci.cur_name); assert (hci.cur_name[1]); hi->no_diffs++; + +#if 0 + print_dict_item (hi->reg->zebra_maps, hci.cur_name); +#endif if ((dict_info = dict_lookup (hi->reg->dict, hci.cur_name))) { memcpy (&isamc_p, dict_info+1, sizeof(ISAMC_P)); @@ -503,35 +528,59 @@ int heap_inpd (struct heap_info *hi) while (hci.more) { char this_name[INP_NAME_MAX]; - ISAMD_P isamd_p, isamd_p2; char *dict_info; + char dictentry[ISAMD_MAX_DICT_LEN+1]; + char dictlen; strcpy (this_name, hci.cur_name); + + /* print_dict_item (hi->reg->zebra_maps, hci.cur_name); */ + /*!*/ /* FIXME: depend on isamd-debug */ + assert (hci.cur_name[1]); hi->no_diffs++; if ((dict_info = dict_lookup (hi->reg->dict, hci.cur_name))) { - memcpy (&isamd_p, dict_info+1, sizeof(ISAMD_P)); - isamd_p2 = isamd_append (hi->reg->isamd, isamd_p, isamd_i); - if (!isamd_p2) + dictlen=dict_info[0]; + memcpy (dictentry, dict_info+1, dictlen ); +#ifdef SKIPTHIS + logf(LOG_LOG,"dictentry before. len=%d: %d %d %d %d %d %d %d %d %d", + dictlen,dictentry[0], dictentry[1], dictentry[2], + dictentry[3], dictentry[4], dictentry[5], + dictentry[6], dictentry[7], dictentry[8]); /*!*/ +#endif + dictlen= isamd_append(hi->reg->isamd, dictentry, dictlen, isamd_i); + /* logf dictentry after */ + if (dictlen) { - hi->no_deletions++; - if (!dict_delete (hi->reg->dict, this_name)) - abort(); + hi->no_updates++; + if ( (dictlen!=dict_info[0]) || + (0!=memcmp(dictentry, dict_info+1, dictlen)) ) + { + dict_insert(hi->reg->dict, this_name, + dictlen,dictentry); + } } - else + else { - hi->no_updates++; - if (isamd_p2 != isamd_p) - dict_insert (hi->reg->dict, this_name, - sizeof(ISAMD_P), &isamd_p2); + hi->no_deletions++; + if (!dict_delete (hi->reg->dict, this_name)) + { + logf (LOG_FATAL, "dict_delete failed"); + abort(); + } } } else { - isamd_p = isamd_append (hi->reg->isamd, 0, isamd_i); + dictlen=0; + memset (dictentry, '\0', ISAMD_MAX_DICT_LEN); + dictlen= isamd_append(hi->reg->isamd, dictentry, dictlen, isamd_i); + /* logf dictentry first */ hi->no_insertions++; - dict_insert (hi->reg->dict, this_name, sizeof(ISAMD_P), &isamd_p); + if (dictlen) + dict_insert(hi->reg->dict, this_name, + dictlen,dictentry); } } xfree (isamd_i);