X-Git-Url: http://git.indexdata.com/?p=idzebra-moved-to-github.git;a=blobdiff_plain;f=index%2Fzinfo.c;h=cfede292629a8ebc0a625772f37ec71fc59e667c;hp=f2ae6c85564e9e9c5f9a8026730bba69fdac7a73;hb=96e4c5479e111511f5df3531b6648931251b9e5d;hpb=febdebf04b0c264efce4a58d602117f4a7f7fbdb diff --git a/index/zinfo.c b/index/zinfo.c index f2ae6c8..cfede29 100644 --- a/index/zinfo.c +++ b/index/zinfo.c @@ -1,29 +1,43 @@ -/* - * Copyright (C) 1994-1996, Index Data I/S - * All rights reserved. - * Sebastian Hammer, Adam Dickmeiss - * - * $Log: zinfo.c,v $ - * Revision 1.3 1996-05-22 08:21:59 adam - * Added public ZebDatabaseInfo structure. - * - * Revision 1.2 1996/05/14 06:16:41 adam - * Compact use/set bytes used in search service. - * - * Revision 1.1 1996/05/13 14:23:07 adam - * Work on compaction of set/use bytes in dictionary. - * - */ +/* This file is part of the Zebra server. + Copyright (C) 1994-2011 Index Data -#include +Zebra is free software; you can redistribute it and/or modify it under +the terms of the GNU General Public License as published by the Free +Software Foundation; either version 2, or (at your option) any later +version. + +Zebra is distributed in the hope that it will be useful, but WITHOUT ANY +WARRANTY; without even the implied warranty of MERCHANTABILITY or +FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License +for more details. + +You should have received a copy of the GNU General Public License +along with this program; if not, write to the Free Software +Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA + +*/ + +#if HAVE_CONFIG_H +#include +#endif +#include #include +#include +#include +#include +#include #include "zinfo.h" +#define ZINFO_DEBUG 0 + struct zebSUInfo { - int set; - int use; + char *index_type; + zinfo_index_category_t cat; + char *str; int ordinal; + zint doc_occurrences; + zint term_occurrences; }; struct zebSUInfoB { @@ -31,270 +45,1605 @@ struct zebSUInfoB { struct zebSUInfoB *next; }; -struct zebDatabaseInfoB { +typedef struct zebAccessObjectB *zebAccessObject; +struct zebAccessObjectB { + void *handle; + zint sysno; + Odr_oid *oid; + zebAccessObject next; +}; + +typedef struct zebAccessInfoB *zebAccessInfo; +struct zebAccessInfoB { + zebAccessObject attributeSetIds; + zebAccessObject schemas; +}; + +typedef struct { struct zebSUInfoB *SUInfo; - char *databaseName; - int sysno; - int readFlag; + zint sysno; int dirty; - struct zebDatabaseInfo info; + int readFlag; + data1_node *data1_tree; +} *zebAttributeDetails; + +struct zebDatabaseInfoB { + zebAttributeDetails attributeDetails; + int ordinalDatabase; + char *databaseName; + data1_node *data1_database; + zint recordCount; /* records in db */ + zint recordBytes; /* size of records */ + zint sysno; /* sysno of database info */ + int readFlag; /* 1: read is needed when referenced; 0 if not */ + int dirty; /* 1: database is dirty: write is needed */ struct zebDatabaseInfoB *next; + zebAccessInfo accessInfo; +}; + +struct zebraExplainAttset { + char *name; + int ordinal; + struct zebraExplainAttset *next; +}; + +struct zebraCategoryListInfo { + int dirty; + zint sysno; + data1_node *data1_categoryList; }; -struct zebTargetInfo { - int dictNum; - int dirty; +struct zebraExplainInfo { + int ordinalSU; + int ordinalDatabase; + zint runNumber; + int dirty; + int write_flag; Records records; + data1_handle dh; + Res res; + struct zebraExplainAttset *attsets; + NMEM nmem; + data1_node *data1_target; + struct zebraCategoryListInfo *categoryList; struct zebDatabaseInfoB *databaseInfo; struct zebDatabaseInfoB *curDatabaseInfo; + zebAccessInfo accessInfo; + char date[15]; /* YYYY MMDD HH MM SS */ + ZebraExplainUpdateFunc *updateFunc; + void *updateHandle; }; -void zebTargetInfo_close (ZebTargetInfo *zti, int writeFlag) +static void zebraExplain_initCommonInfo(ZebraExplainInfo zei, data1_node *n); +static void zebraExplain_initAccessInfo(ZebraExplainInfo zei, data1_node *n); + +static data1_node *read_sgml_rec(data1_handle dh, NMEM nmem, Record rec) +{ + return data1_read_sgml(dh, nmem, rec->info[recInfo_storeData]); +} + +static void zebraExplain_writeDatabase(ZebraExplainInfo zei, + struct zebDatabaseInfoB *zdi, + int key_flush); +static void zebraExplain_writeAttributeDetails(ZebraExplainInfo zei, + zebAttributeDetails zad, + const char *databaseName, + int key_flush); +static void zebraExplain_writeTarget(ZebraExplainInfo zei, int key_flush); +static void zebraExplain_writeAttributeSet(ZebraExplainInfo zei, + zebAccessObject o, + int key_flush); +static void zebraExplain_writeCategoryList(ZebraExplainInfo zei, + struct zebraCategoryListInfo *zcl, + int key_flush); + + +static Record createRecord(Records records, zint *sysno) +{ + Record rec; + if (*sysno) + { + rec = rec_get(records, *sysno); + if (!rec) + return 0; + xfree(rec->info[recInfo_storeData]); + } + else + { + rec = rec_new(records); + if (!rec) + return 0; + *sysno = rec->sysno; + + rec->info[recInfo_fileType] = + rec_strdup("grs.sgml", &rec->size[recInfo_fileType]); + rec->info[recInfo_databaseName] = + rec_strdup("IR-Explain-1", + &rec->size[recInfo_databaseName]); + } + return rec; +} + +void zebraExplain_flush(ZebraExplainInfo zei, void *handle) +{ + if (!zei) + return; + zei->updateHandle = handle; + if (zei->write_flag) + { + struct zebDatabaseInfoB *zdi; + zebAccessObject o; + + /* write each database info record */ + for (zdi = zei->databaseInfo; zdi; zdi = zdi->next) + { + zebraExplain_writeDatabase(zei, zdi, 1); + zebraExplain_writeAttributeDetails(zei, zdi->attributeDetails, + zdi->databaseName, 1); + } + zebraExplain_writeTarget(zei, 1); + zebraExplain_writeCategoryList(zei, + zei->categoryList, + 1); + assert(zei->accessInfo); + for (o = zei->accessInfo->attributeSetIds; o; o = o->next) + if (!o->sysno) + zebraExplain_writeAttributeSet(zei, o, 1); + for (o = zei->accessInfo->schemas; o; o = o->next) + if (!o->sysno) + { +/* zebraExplain_writeSchema(zei, o, 1); */ + } + + for (zdi = zei->databaseInfo; zdi; zdi = zdi->next) + { + zebraExplain_writeDatabase(zei, zdi, 0); + zebraExplain_writeAttributeDetails(zei, zdi->attributeDetails, + zdi->databaseName, 0); + } + zebraExplain_writeTarget(zei, 0); + } +} + +void zebraExplain_close(ZebraExplainInfo zei) +{ +#if ZINFO_DEBUG + yaz_log(YLOG_LOG, "zebraExplain_close"); +#endif + if (!zei) + return; + zebraExplain_flush(zei, zei->updateHandle); + nmem_destroy(zei->nmem); +} + +void zebraExplain_mergeOids(ZebraExplainInfo zei, data1_node *n, + zebAccessObject *op) +{ + data1_node *np; + + for (np = n->child; np; np = np->next) + { + char str[64]; + int len; + Odr_oid *oid; + zebAccessObject ao; + + if (np->which != DATA1N_tag || strcmp(np->u.tag.tag, "oid")) + continue; + len = np->child->u.data.len; + if (len > 63) + len = 63; + memcpy(str, np->child->u.data.data, len); + str[len] = '\0'; + + oid = odr_getoidbystr_nmem(zei->nmem, str); + + for (ao = *op; ao; ao = ao->next) + if (!oid_oidcmp(oid, ao->oid)) + { + ao->sysno = 1; + break; + } + if (!ao) + { + ao = (zebAccessObject) nmem_malloc(zei->nmem, sizeof(*ao)); + ao->handle = 0; + ao->sysno = 1; + ao->oid = oid; + ao->next = *op; + *op = ao; + } + } +} + +void zebraExplain_mergeAccessInfo(ZebraExplainInfo zei, data1_node *n, + zebAccessInfo *accessInfo) +{ + data1_node *np; + + if (!n) + { + *accessInfo = (zebAccessInfo) + nmem_malloc(zei->nmem, sizeof(**accessInfo)); + (*accessInfo)->attributeSetIds = 0; + (*accessInfo)->schemas = 0; + } + else + { + if (!(n = data1_search_tag(zei->dh, n->child, "accessInfo"))) + return; + if ((np = data1_search_tag(zei->dh, n->child, "attributeSetIds"))) + zebraExplain_mergeOids(zei, np, + &(*accessInfo)->attributeSetIds); + if ((np = data1_search_tag(zei->dh, n->child, "schemas"))) + zebraExplain_mergeOids(zei, np, + &(*accessInfo)->schemas); + } +} + +/* Explain structure + root record + of type targetInfo + and has sysno = 1 + + databaseList (list of databases) +*/ +/* +Example root: +explain: + targetInfo: TargetInfo + name: Zebra + namedResultSets: 1 + multipleDbSearch: 1 + nicknames: + name: Zebra + commonInfo: + dateAdded: 20030630190601 + dateChanged: 20030630190601 + languageCode: EN + accessinfo: + unitSystems: + string: ISO + attributeSetIds: + oid: 1.2.840.10003.3.2 + oid: 1.2.840.10003.3.5 + oid: 1.2.840.10003.3.1 + schemas: + oid: 1.2.840.10003.13.1000.81.2 + oid: 1.2.840.10003.13.2 + zebraInfo: + version: 1.3.12 + databaseList: + database: + name: Default + id: 50 + attributeDetailsId: 51 + database: + name: IR-Explain-1 + id: 52 + attributeDetailsId: 53 + ordinalSU: 38 + runNumber: 1 +nextResultSetPosition = 2 +*/ + +ZebraExplainInfo zebraExplain_open( + Records records, data1_handle dh, + Res res, + int writeFlag, + void *updateHandle, + ZebraExplainUpdateFunc *updateFunc) { - struct zebDatabaseInfoB *zdi, *zdi1; + Record trec; + ZebraExplainInfo zei; + struct zebDatabaseInfoB **zdip; + time_t our_time; + struct tm *tm; + NMEM nmem = nmem_create(); + +#if ZINFO_DEBUG + yaz_log(YLOG_LOG, "zebraExplain_open wr=%d", writeFlag); +#endif + zei = (ZebraExplainInfo) nmem_malloc(nmem, sizeof(*zei)); + zei->databaseInfo = 0; + zei->write_flag = writeFlag; + zei->updateHandle = updateHandle; + zei->updateFunc = updateFunc; + zei->dirty = 0; + zei->ordinalDatabase = 1; + zei->curDatabaseInfo = 0; + zei->records = records; + zei->nmem = nmem; + zei->dh = dh; - if (writeFlag) + data1_get_absyn(zei->dh, "explain", DATA1_XPATH_INDEXING_DISABLE); + + zei->attsets = 0; + zei->res = res; + zei->categoryList = (struct zebraCategoryListInfo *) + nmem_malloc(zei->nmem, sizeof(*zei->categoryList)); + zei->categoryList->sysno = 0; + zei->categoryList->dirty = 0; + zei->categoryList->data1_categoryList = 0; + + if ( atoi(res_get_def(res, "notimestamps", "0") )== 0) + { + time(&our_time); + tm = localtime(&our_time); + sprintf(zei->date, "%04d%02d%02d%02d%02d%02d", + tm->tm_year+1900, tm->tm_mon+1, tm->tm_mday, + tm->tm_hour, tm->tm_min, tm->tm_sec); + } else { + sprintf(zei->date, "%04d%02d%02d%02d%02d%02d", + 0, 0, 0, 0, 0, 0); + } + zdip = &zei->databaseInfo; + trec = rec_get_root(records); /* get "root" record */ + + zei->ordinalSU = 1; + zei->runNumber = 0; + + zebraExplain_mergeAccessInfo(zei, 0, &zei->accessInfo); + if (trec) /* targetInfo already exists ... */ { - char p0[4096], *p = p0; + data1_node *node_tgtinfo, *node_zebra, *node_list, *np; - memcpy (p, &zti->dictNum, sizeof(zti->dictNum)); - p += sizeof(zti->dictNum); - for (zdi = zti->databaseInfo; zdi; zdi=zdi->next) + zei->data1_target = read_sgml_rec(zei->dh, zei->nmem, trec); +#if 0 + if (!zei->data1_target || !zei->data1_target->u.root.absyn) +#else + if (!zei->data1_target) +#endif + { + yaz_log(YLOG_FATAL, "Explain schema missing. Check profilePath"); + nmem_destroy(zei->nmem); + return 0; + } +#if ZINFO_DEBUG + data1_pr_tree(zei->dh, zei->data1_target, stderr); +#endif + node_tgtinfo = data1_search_tag(zei->dh, zei->data1_target, + "/targetInfo"); + if (!node_tgtinfo) { - if (zdi->dirty) - { - char q0[4096], *q = q0; - struct zebSUInfoB *zsui; - Record drec; - int no = 0; - - if (zdi->sysno) - drec = rec_get (zti->records, zdi->sysno); - else - { - drec = rec_new (zti->records); - zdi->sysno = drec->sysno; - } - assert (drec); - for (zsui = zdi->SUInfo; zsui; zsui=zsui->next) - no++; - memcpy (q, &zdi->info, sizeof(zdi->info)); - q += sizeof(zdi->info); - memcpy (q, &no, sizeof(no)); - q += sizeof(no); - for (zsui = zdi->SUInfo; zsui; zsui=zsui->next) - { - memcpy (q, &zsui->info, sizeof(zsui->info)); - q += sizeof(zsui->info); - } - xfree (drec->info[0]); - drec->size[0] = q-q0; - drec->info[0] = xmalloc (drec->size[0]); - memcpy (drec->info[0], q0, drec->size[0]); - rec_put (zti->records, &drec); - } - strcpy (p, zdi->databaseName); - p += strlen(p)+1; - memcpy (p, &zdi->sysno, sizeof(zdi->sysno)); - p += sizeof(zdi->sysno); + yaz_log(YLOG_FATAL, "Node node_tgtinfo missing"); + nmem_destroy(zei->nmem); + return 0; } - *p++ = '\0'; - if (zti->dirty) + zebraExplain_mergeAccessInfo(zei, node_tgtinfo, + &zei->accessInfo); + + node_zebra = data1_search_tag(zei->dh, node_tgtinfo->child, + "zebraInfo"); + if (!node_zebra) { - Record grec = rec_get (zti->records, 1); - - assert (grec); - xfree (grec->info[0]); - grec->size[0] = p-p0; - grec->info[0] = xmalloc (grec->size[0]); - memcpy (grec->info[0], p0, grec->size[0]); - rec_put (zti->records, &grec); + yaz_log(YLOG_FATAL, "Node node_zebra missing"); + nmem_destroy(zei->nmem); + return 0; } + np = 0; + if (node_zebra) + { + node_list = data1_search_tag(zei->dh, node_zebra->child, + "databaseList"); + if (node_list) + np = node_list->child; + } + for(; np; np = np->next) + { + data1_node *node_name = 0; + data1_node *node_id = 0; + data1_node *node_aid = 0; + data1_node *np2; + if (np->which != DATA1N_tag || strcmp(np->u.tag.tag, "database")) + continue; + for(np2 = np->child; np2; np2 = np2->next) + { + if (np2->which != DATA1N_tag) + continue; + if (!strcmp(np2->u.tag.tag, "name")) + node_name = np2->child; + else if (!strcmp(np2->u.tag.tag, "id")) + node_id = np2->child; + else if (!strcmp(np2->u.tag.tag, "attributeDetailsId")) + node_aid = np2->child; + } + assert(node_id && node_name && node_aid); + + *zdip =(struct zebDatabaseInfoB *) + nmem_malloc(zei->nmem, sizeof(**zdip)); + (*zdip)->readFlag = 1; + (*zdip)->dirty = 0; + (*zdip)->data1_database = 0; + (*zdip)->recordCount = 0; + (*zdip)->recordBytes = 0; + zebraExplain_mergeAccessInfo(zei, 0, &(*zdip)->accessInfo); + + (*zdip)->databaseName = (char *) + nmem_malloc(zei->nmem, 1+node_name->u.data.len); + memcpy((*zdip)->databaseName, node_name->u.data.data, + node_name->u.data.len); + (*zdip)->databaseName[node_name->u.data.len] = '\0'; + (*zdip)->sysno = atoi_zn(node_id->u.data.data, + node_id->u.data.len); + (*zdip)->attributeDetails = (zebAttributeDetails) + nmem_malloc(zei->nmem, sizeof(*(*zdip)->attributeDetails)); + (*zdip)->attributeDetails->sysno = atoi_zn(node_aid->u.data.data, + node_aid->u.data.len); + (*zdip)->attributeDetails->readFlag = 1; + (*zdip)->attributeDetails->dirty = 0; + (*zdip)->attributeDetails->SUInfo = 0; + + zdip = &(*zdip)->next; + } + if (node_zebra) + { + np = data1_search_tag(zei->dh, node_zebra->child, + "ordinalSU"); + np = np->child; + assert(np && np->which == DATA1N_data); + zei->ordinalSU = atoi_n(np->u.data.data, np->u.data.len); + + np = data1_search_tag(zei->dh, node_zebra->child, + "ordinalDatabase"); + np = np->child; + assert(np && np->which == DATA1N_data); + zei->ordinalDatabase = atoi_n(np->u.data.data, np->u.data.len); + + np = data1_search_tag(zei->dh, node_zebra->child, + "runNumber"); + np = np->child; + assert(np && np->which == DATA1N_data); + zei->runNumber = atoi_zn(np->u.data.data, np->u.data.len); + yaz_log(YLOG_DEBUG, "read runnumber=" ZINT_FORMAT, zei->runNumber); + *zdip = 0; + } + rec_free(&trec); } - for (zdi = zti->databaseInfo; zdi; zdi = zdi1) + else /* create initial targetInfo */ { - struct zebSUInfoB *zsui, *zsui1; + data1_node *node_tgtinfo; - zdi1 = zdi->next; - for (zsui = zdi->SUInfo; zsui; zsui = zsui1) - { - zsui1 = zsui->next; - xfree (zsui); - } - xfree (zdi->databaseName); - xfree (zdi); + *zdip = 0; + if (writeFlag) + { + char *sgml_buf; + int sgml_len; + + zei->data1_target = + data1_read_sgml(zei->dh, zei->nmem, + "TargetInfo\n" + "Zebra\n" + "1\n" + "1\n" + "Zebra\n" + "\n" ); + if (!zei->data1_target) + { + yaz_log(YLOG_FATAL, "Explain schema missing. Check profilePath"); + nmem_destroy(zei->nmem); + return 0; + } + node_tgtinfo = data1_search_tag(zei->dh, zei->data1_target, + "/targetInfo"); + assert(node_tgtinfo); + + zebraExplain_initCommonInfo(zei, node_tgtinfo); + zebraExplain_initAccessInfo(zei, node_tgtinfo); + + /* write now because we want to be sure about the sysno */ + trec = rec_new(records); + if (!trec) + { + yaz_log(YLOG_FATAL, "Cannot create root Explain record"); + nmem_destroy(zei->nmem); + return 0; + } + trec->info[recInfo_fileType] = + rec_strdup("grs.sgml", &trec->size[recInfo_fileType]); + trec->info[recInfo_databaseName] = + rec_strdup("IR-Explain-1", &trec->size[recInfo_databaseName]); + + sgml_buf = data1_nodetoidsgml(dh, zei->data1_target, 0, &sgml_len); + trec->info[recInfo_storeData] = (char *) xmalloc(sgml_len); + memcpy(trec->info[recInfo_storeData], sgml_buf, sgml_len); + trec->size[recInfo_storeData] = sgml_len; + + rec_put(records, &trec); + rec_free(&trec); + } + + zebraExplain_newDatabase(zei, "IR-Explain-1", 0); + + if (!zei->categoryList->dirty) + { + struct zebraCategoryListInfo *zcl = zei->categoryList; + data1_node *node_cl; + + zcl->dirty = 1; + zcl->data1_categoryList = + data1_read_sgml(zei->dh, zei->nmem, + "CategoryList\n" + "\n"); + + if (zcl->data1_categoryList) + { + node_cl = data1_search_tag(zei->dh, zcl->data1_categoryList, + "/categoryList"); + assert(node_cl); + zebraExplain_initCommonInfo(zei, node_cl); + } + } } - xfree (zti); + return zei; } -ZebTargetInfo *zebTargetInfo_open (Records records, int writeFlag) +static void zebraExplain_readAttributeDetails(ZebraExplainInfo zei, + zebAttributeDetails zad) { Record rec; - ZebTargetInfo *zti; - struct zebDatabaseInfoB **zdi; + struct zebSUInfoB **zsuip = &zad->SUInfo; + data1_node *node_adinfo, *node_zebra, *node_list, *np; - zti = xmalloc (sizeof(*zti)); - zti->dirty = 0; - zti->curDatabaseInfo = NULL; - zti->records = records; + assert(zad->sysno); + rec = rec_get(zei->records, zad->sysno); - zdi = &zti->databaseInfo; - - rec = rec_get (records, 1); - if (rec) + zad->data1_tree = read_sgml_rec(zei->dh, zei->nmem, rec); + + node_adinfo = data1_search_tag(zei->dh, zad->data1_tree, + "/attributeDetails"); + node_zebra = data1_search_tag(zei->dh, node_adinfo->child, + "zebraInfo"); + node_list = data1_search_tag(zei->dh, node_zebra->child, + "attrlist"); + for (np = node_list->child; np; np = np->next) { - const char *p; + data1_node *node_str = 0; + data1_node *node_ordinal = 0; + data1_node *node_type = 0; + data1_node *node_cat = 0; + data1_node *node_doc_occurrences = 0; + data1_node *node_term_occurrences = 0; + data1_node *np2; + + if (np->which != DATA1N_tag || strcmp(np->u.tag.tag, "attr")) + continue; + for (np2 = np->child; np2; np2 = np2->next) + { + if (np2->which != DATA1N_tag || !np2->child || + np2->child->which != DATA1N_data) + continue; + if (!strcmp(np2->u.tag.tag, "str")) + node_str = np2->child; + else if (!strcmp(np2->u.tag.tag, "ordinal")) + node_ordinal = np2->child; + else if (!strcmp(np2->u.tag.tag, "type")) + node_type = np2->child; + else if (!strcmp(np2->u.tag.tag, "cat")) + node_cat = np2->child; + else if (!strcmp(np2->u.tag.tag, "dococcurrences")) + node_doc_occurrences = np2->child; + else if (!strcmp(np2->u.tag.tag, "termoccurrences")) + node_term_occurrences = np2->child; + else + { + yaz_log(YLOG_LOG, "Unknown tag '%s' in attributeDetails", + np2->u.tag.tag); + } + } + assert(node_ordinal); + + *zsuip = (struct zebSUInfoB *) + nmem_malloc(zei->nmem, sizeof(**zsuip)); + + if (node_type && node_type->u.data.len > 0) + (*zsuip)->info.index_type = + nmem_strdupn(zei->nmem, + node_type->u.data.data, + node_type->u.data.len); + else + { + yaz_log(YLOG_WARN, "Missing attribute 'type' in attribute info"); + (*zsuip)->info.index_type = "w"; + } + if (node_cat && node_cat->u.data.len > 0) + { + zinfo_index_category_t cat; - p = rec->info[0]; + data1_node *np = node_cat; + if (!strncmp(np->u.data.data, "index", np->u.data.len)) + cat = zinfo_index_category_index; + else if (!strncmp(np->u.data.data, "sort", np->u.data.len)) + cat = zinfo_index_category_sort; + else if (!strncmp(np->u.data.data, "alwaysmatches", + np->u.data.len)) + cat = zinfo_index_category_alwaysmatches; + else if (!strncmp(np->u.data.data, "anchor", + np->u.data.len)) + cat = zinfo_index_category_anchor; + else + { + yaz_log(YLOG_WARN, "Bad index cateogry '%.*s'", + np->u.data.len, np->u.data.data); + cat = zinfo_index_category_index; + } + (*zsuip)->info.cat = cat; + } + else + (*zsuip)->info.cat = zinfo_index_category_index; - memcpy (&zti->dictNum, p, sizeof(zti->dictNum)); - p += sizeof(zti->dictNum); - while (*p) + if (node_doc_occurrences) { - *zdi = xmalloc (sizeof(**zdi)); - (*zdi)->SUInfo = NULL; - (*zdi)->databaseName = xstrdup (p); - p += strlen(p)+1; - memcpy (&(*zdi)->sysno, p, sizeof((*zdi)->sysno)); - p += sizeof((*zdi)->sysno); - (*zdi)->readFlag = 1; - (*zdi)->dirty = 0; - zdi = &(*zdi)->next; + data1_node *np = node_doc_occurrences; + (*zsuip)->info.doc_occurrences = atoi_zn(np->u.data.data, + np->u.data.len); } - assert (p - rec->info[0] == rec->size[0]-1); - } - else - { - zti->dictNum = 1; - if (writeFlag) + if (node_term_occurrences) { - rec = rec_new (records); - rec->info[0] = xmalloc (1+sizeof(zti->dictNum)); - memcpy (rec->info[0], &zti->dictNum, sizeof(zti->dictNum)); - rec->info[0][sizeof(zti->dictNum)] = '\0'; - rec->size[0] = sizeof(zti->dictNum)+1; - rec_put (records, &rec); + data1_node *np = node_term_occurrences; + (*zsuip)->info.term_occurrences = atoi_zn(np->u.data.data, + np->u.data.len); } + if (node_str) + { + (*zsuip)->info.str = nmem_strdupn(zei->nmem, + node_str->u.data.data, + node_str->u.data.len); + } + else + { + yaz_log(YLOG_WARN, "Missing set/use/str in attribute info"); + continue; + } + (*zsuip)->info.ordinal = atoi_n(node_ordinal->u.data.data, + node_ordinal->u.data.len); + zsuip = &(*zsuip)->next; } - *zdi = NULL; - rec_rm (&rec); - return zti; + *zsuip = 0; + zad->readFlag = 0; + rec_free(&rec); } -static void zebTargetInfo_readDatabase (ZebTargetInfo *zti, - struct zebDatabaseInfoB *zdi) +static void zebraExplain_readDatabase(ZebraExplainInfo zei, + struct zebDatabaseInfoB *zdi) { - const char *p; - struct zebSUInfoB **zsuip = &zdi->SUInfo; - int i, no; Record rec; + data1_node *node_dbinfo, *node_zebra, *np; - rec = rec_get (zti->records, zdi->sysno); - assert (rec); - p = rec->info[0]; - memcpy (&zdi->info, p, sizeof(zdi->info)); - p += sizeof(zdi->info); - memcpy (&no, p, sizeof(no)); - p += sizeof(no); - for (i = 0; iinfo, p, sizeof((*zsuip)->info)); - p += sizeof((*zsuip)->info); - zsuip = &(*zsuip)->next; + assert(zdi->sysno); + rec = rec_get(zei->records, zdi->sysno); + + zdi->data1_database = read_sgml_rec(zei->dh, zei->nmem, rec); + + node_dbinfo = data1_search_tag(zei->dh, zdi->data1_database, + "/databaseInfo"); + assert(node_dbinfo); + zebraExplain_mergeAccessInfo(zei, node_dbinfo, &zdi->accessInfo); + + node_zebra = data1_search_tag(zei->dh, node_dbinfo->child, + "zebraInfo"); + if (node_zebra + && (np = data1_search_tag(zei->dh, node_zebra->child, + "recordBytes")) + && np->child && np->child->which == DATA1N_data) + zdi->recordBytes = atoi_zn(np->child->u.data.data, + np->child->u.data.len); + + if (node_zebra + && (np = data1_search_tag(zei->dh, node_zebra->child, + "ordinalDatabase")) + && np->child && np->child->which == DATA1N_data) + zdi->ordinalDatabase = atoi_n(np->child->u.data.data, + np->child->u.data.len); + + if ((np = data1_search_tag(zei->dh, node_dbinfo->child, + "recordCount")) && + (np = data1_search_tag(zei->dh, np->child, + "recordCountActual")) && + np->child->which == DATA1N_data) + { + zdi->recordCount = atoi_zn(np->child->u.data.data, + np->child->u.data.len); } - *zsuip = NULL; zdi->readFlag = 0; - rec_rm (&rec); + rec_free(&rec); +} + +int zebraExplain_removeDatabase(ZebraExplainInfo zei, void *update_handle) +{ + struct zebDatabaseInfoB **zdip = &zei->databaseInfo; + + while (*zdip) + { + if (*zdip == zei->curDatabaseInfo) + { + struct zebDatabaseInfoB *zdi = *zdip; + Record rec; + + zei->dirty = 1; + zei->updateHandle = update_handle; + + if (zdi->attributeDetails) + { + /* remove attribute details keys and delete it */ + zebAttributeDetails zad = zdi->attributeDetails; + + rec = rec_get(zei->records, zad->sysno); + (*zei->updateFunc)(zei->updateHandle, rec, 0); + rec_del(zei->records, &rec); + } + /* remove database record keys and delete it */ + rec = rec_get(zei->records, zdi->sysno); + (*zei->updateFunc)(zei->updateHandle, rec, 0); + rec_del(zei->records, &rec); + + /* remove from list */ + *zdip = zdi->next; + + /* current database is IR-Explain-1 */ + return 0; + } + zdip = &(*zdip)->next; + } + return -1; } -int zebTargetInfo_curDatabase (ZebTargetInfo *zti, const char *database) +int zebraExplain_curDatabase(ZebraExplainInfo zei, const char *database) { struct zebDatabaseInfoB *zdi; + const char *database_n = strrchr(database, '/'); + + if (database_n) + database_n++; + else + database_n = database; - assert (zti); - if (zti->curDatabaseInfo && - !strcmp (zti->curDatabaseInfo->databaseName, database)) + assert(zei); + if (zei->curDatabaseInfo && + !STRCASECMP(zei->curDatabaseInfo->databaseName, database)) return 0; - for (zdi = zti->databaseInfo; zdi; zdi=zdi->next) + for (zdi = zei->databaseInfo; zdi; zdi=zdi->next) { - if (!strcmp (zdi->databaseName, database)) + if (!STRCASECMP(zdi->databaseName, database_n)) break; } if (!zdi) return -1; +#if ZINFO_DEBUG + yaz_log(YLOG_LOG, "zebraExplain_curDatabase: %s", database); +#endif if (zdi->readFlag) - zebTargetInfo_readDatabase (zti, zdi); - zti->curDatabaseInfo = zdi; + { +#if ZINFO_DEBUG + yaz_log(YLOG_LOG, "zebraExplain_readDatabase: %s", database); +#endif + zebraExplain_readDatabase(zei, zdi); + } + if (zdi->attributeDetails->readFlag) + { +#if ZINFO_DEBUG + yaz_log(YLOG_LOG, "zebraExplain_readAttributeDetails: %s", database); +#endif + zebraExplain_readAttributeDetails(zei, zdi->attributeDetails); + } + zei->curDatabaseInfo = zdi; return 0; } -int zebTargetInfo_newDatabase (ZebTargetInfo *zti, const char *database) +static void zebraExplain_initCommonInfo(ZebraExplainInfo zei, data1_node *n) +{ + data1_node *c = data1_mk_tag(zei->dh, zei->nmem, "commonInfo", 0, n); + data1_mk_tag_data_text(zei->dh, c, "dateAdded", zei->date, zei->nmem); + data1_mk_tag_data_text(zei->dh, c, "dateChanged", zei->date, zei->nmem); + data1_mk_tag_data_text(zei->dh, c, "languageCode", "EN", zei->nmem); +} + +static void zebraExplain_updateCommonInfo(ZebraExplainInfo zei, data1_node *n) +{ + data1_node *c = data1_search_tag(zei->dh, n->child, "commonInfo"); + assert(c); + data1_mk_tag_data_text_uni(zei->dh, c, "dateChanged", zei->date, + zei->nmem); +} + +static void zebraExplain_initAccessInfo(ZebraExplainInfo zei, data1_node *n) +{ + data1_node *c = data1_mk_tag(zei->dh, zei->nmem, "accessInfo", 0, n); + data1_node *d = data1_mk_tag(zei->dh, zei->nmem, "unitSystems", 0, c); + data1_mk_tag_data_text(zei->dh, d, "string", "ISO", zei->nmem); +} + +static void zebraExplain_updateAccessInfo(ZebraExplainInfo zei, data1_node *n, + zebAccessInfo accessInfo) +{ + data1_node *c = data1_search_tag(zei->dh, n->child, "accessInfo"); + data1_node *d; + zebAccessObject p; + + if (!c) + { + data1_pr_tree(zei->dh, n, stdout); + zebra_exit("zebraExplain_updateAccessInfo"); + } + + if ((p = accessInfo->attributeSetIds)) + { + d = data1_mk_tag_uni(zei->dh, zei->nmem, "attributeSetIds", c); + for (; p; p = p->next) + data1_mk_tag_data_oid(zei->dh, d, "oid", p->oid, zei->nmem); + } + if ((p = accessInfo->schemas)) + { + d = data1_mk_tag_uni(zei->dh, zei->nmem, "schemas", c); + for (; p; p = p->next) + data1_mk_tag_data_oid(zei->dh, d, "oid", p->oid, zei->nmem); + } +} + +int zebraExplain_newDatabase(ZebraExplainInfo zei, const char *database, + int explain_database) { struct zebDatabaseInfoB *zdi; + data1_node *node_dbinfo, *node_adinfo; + const char *database_n = strrchr(database, '/'); + + if (database_n) + database_n++; + else + database_n = database; - assert (zti); - for (zdi = zti->databaseInfo; zdi; zdi=zdi->next) +#if ZINFO_DEBUG + yaz_log(YLOG_LOG, "zebraExplain_newDatabase: %s", database); +#endif + assert(zei); + for (zdi = zei->databaseInfo; zdi; zdi=zdi->next) { - if (!strcmp (zdi->databaseName, database)) + if (!STRCASECMP(zdi->databaseName, database_n)) break; } if (zdi) return -1; - zdi = xmalloc (sizeof(*zdi)); - zdi->next = zti->databaseInfo; - zti->databaseInfo = zdi; + /* it's new really. make it */ + zdi = (struct zebDatabaseInfoB *) nmem_malloc(zei->nmem, sizeof(*zdi)); + zdi->next = zei->databaseInfo; + zei->databaseInfo = zdi; zdi->sysno = 0; + zdi->recordCount = 0; + zdi->recordBytes = 0; zdi->readFlag = 0; - zdi->databaseName = xstrdup (database); - zdi->SUInfo = NULL; + zdi->databaseName = nmem_strdup(zei->nmem, database_n); + + zdi->ordinalDatabase = zei->ordinalDatabase++; + + zebraExplain_mergeAccessInfo(zei, 0, &zdi->accessInfo); + + assert(zei->dh); + assert(zei->nmem); + + zdi->data1_database = + data1_read_sgml(zei->dh, zei->nmem, + "DatabaseInfo\n" + "\n"); + if (!zdi->data1_database) + return -2; + + node_dbinfo = data1_search_tag(zei->dh, zdi->data1_database, + "/databaseInfo"); + assert(node_dbinfo); + + zebraExplain_initCommonInfo(zei, node_dbinfo); + zebraExplain_initAccessInfo(zei, node_dbinfo); + + data1_mk_tag_data_text(zei->dh, node_dbinfo, "name", + database, zei->nmem); + + if (explain_database) + data1_mk_tag_data_text(zei->dh, node_dbinfo, "explainDatabase", + "", zei->nmem); + + data1_mk_tag_data_text(zei->dh, node_dbinfo, "userFee", + "0", zei->nmem); + + data1_mk_tag_data_text(zei->dh, node_dbinfo, "available", + "1", zei->nmem); + +#if ZINFO_DEBUG + data1_pr_tree(zei->dh, zdi->data1_database, stderr); +#endif zdi->dirty = 1; - zti->dirty = 1; - zti->curDatabaseInfo = zdi; + zei->dirty = 1; + zei->curDatabaseInfo = zdi; + + zdi->attributeDetails = (zebAttributeDetails) + nmem_malloc(zei->nmem, sizeof(*zdi->attributeDetails)); + zdi->attributeDetails->readFlag = 0; + zdi->attributeDetails->sysno = 0; + zdi->attributeDetails->dirty = 1; + zdi->attributeDetails->SUInfo = 0; + zdi->attributeDetails->data1_tree = + data1_read_sgml(zei->dh, zei->nmem, + "AttributeDetails\n" + "\n"); + + node_adinfo = data1_search_tag(zei->dh, zdi->attributeDetails->data1_tree, + "/attributeDetails"); + assert(node_adinfo); + + zebraExplain_initCommonInfo(zei, node_adinfo); + + data1_mk_tag_data_text(zei->dh, node_adinfo, "name", database, zei->nmem); + + return 0; +} + + +static void zebraExplain_writeCategoryList(ZebraExplainInfo zei, + struct zebraCategoryListInfo *zcl, + int key_flush) +{ + char *sgml_buf; + int sgml_len; + int i; + Record drec; + data1_node *node_ci, *node_categoryList; + zint sysno = 0; + static char *category[] = { + "CategoryList", + "TargetInfo", + "DatabaseInfo", + "AttributeDetails", + 0 + }; + + assert(zcl); + if (!zcl->dirty) + return ; + zcl->dirty = 0; + node_categoryList = zcl->data1_categoryList; + +#if ZINFO_DEBUG + yaz_log(YLOG_LOG, "zebraExplain_writeCategoryList"); +#endif + + drec = createRecord(zei->records, &sysno); + if (!drec) + return; + + node_ci = data1_search_tag(zei->dh, node_categoryList, + "/categoryList"); + assert (node_ci); + node_ci = data1_mk_tag(zei->dh, zei->nmem, "categories", 0 /* attr */, + node_ci); + assert (node_ci); + + for (i = 0; category[i]; i++) + { + data1_node *node_cat = data1_mk_tag(zei->dh, zei->nmem, "category", + 0 /* attr */, node_ci); + + data1_mk_tag_data_text(zei->dh, node_cat, "name", + category[i], zei->nmem); + } + /* extract *searchable* keys from it. We do this here, because + record count, etc. is affected */ + if (key_flush) + (*zei->updateFunc)(zei->updateHandle, drec, node_categoryList); + + /* convert to "SGML" and write it */ +#if ZINFO_DEBUG + data1_pr_tree(zei->dh, node_categoryList, stderr); +#endif + sgml_buf = data1_nodetoidsgml(zei->dh, node_categoryList, 0, &sgml_len); + drec->info[recInfo_storeData] = (char *) xmalloc(sgml_len); + memcpy(drec->info[recInfo_storeData], sgml_buf, sgml_len); + drec->size[recInfo_storeData] = sgml_len; + + rec_put(zei->records, &drec); +} + +static void zebraExplain_writeAttributeDetails(ZebraExplainInfo zei, + zebAttributeDetails zad, + const char *databaseName, + int key_flush) +{ + char *sgml_buf; + int sgml_len; + Record drec; + data1_node *node_adinfo, *node_list, *node_zebra; + struct zebSUInfoB *zsui; + + if (!zad->dirty) + return; + + zad->dirty = 0; +#if ZINFO_DEBUG + yaz_log(YLOG_LOG, "zebraExplain_writeAttributeDetails"); + data1_pr_tree(zei->dh, zad->data1_tree, stderr); +#endif + + drec = createRecord(zei->records, &zad->sysno); + if (!drec) + return; + assert(zad->data1_tree); + + node_adinfo = data1_search_tag(zei->dh, zad->data1_tree, + "/attributeDetails"); + zebraExplain_updateCommonInfo(zei, node_adinfo); + + /* zebra info (private) .. no children yet.. so se don't index zebraInfo */ + node_zebra = data1_mk_tag_uni(zei->dh, zei->nmem, + "zebraInfo", node_adinfo); + + /* extract *searchable* keys from it. We do this here, because + record count, etc. is affected */ + if (key_flush) + (*zei->updateFunc)(zei->updateHandle, drec, zad->data1_tree); + node_list = data1_mk_tag_uni(zei->dh, zei->nmem, + "attrlist", node_zebra); + for (zsui = zad->SUInfo; zsui; zsui = zsui->next) + { + data1_node *node_attr; + node_attr = data1_mk_tag(zei->dh, zei->nmem, "attr", 0 /* attr */, + node_list); + + data1_mk_tag_data_text(zei->dh, node_attr, "type", + zsui->info.index_type, zei->nmem); + data1_mk_tag_data_text(zei->dh, node_attr, "str", + zsui->info.str, zei->nmem); + data1_mk_tag_data_int(zei->dh, node_attr, "ordinal", + zsui->info.ordinal, zei->nmem); + + data1_mk_tag_data_zint(zei->dh, node_attr, "dococcurrences", + zsui->info.doc_occurrences, zei->nmem); + data1_mk_tag_data_zint(zei->dh, node_attr, "termoccurrences", + zsui->info.term_occurrences, zei->nmem); + switch(zsui->info.cat) + { + case zinfo_index_category_index: + data1_mk_tag_data_text(zei->dh, node_attr, "cat", + "index", zei->nmem); break; + case zinfo_index_category_sort: + data1_mk_tag_data_text(zei->dh, node_attr, "cat", + "sort", zei->nmem); break; + case zinfo_index_category_alwaysmatches: + data1_mk_tag_data_text(zei->dh, node_attr, "cat", + "alwaysmatches", zei->nmem); break; + case zinfo_index_category_anchor: + data1_mk_tag_data_text(zei->dh, node_attr, "cat", + "anchor", zei->nmem); break; + } + } + /* convert to "SGML" and write it */ +#if ZINFO_DEBUG + data1_pr_tree(zei->dh, zad->data1_tree, stderr); +#endif + sgml_buf = data1_nodetoidsgml(zei->dh, zad->data1_tree, + 0, &sgml_len); + drec->info[recInfo_storeData] = (char *) xmalloc(sgml_len); + memcpy(drec->info[recInfo_storeData], sgml_buf, sgml_len); + drec->size[recInfo_storeData] = sgml_len; + + rec_put(zei->records, &drec); +} + +static void zebraExplain_writeDatabase(ZebraExplainInfo zei, + struct zebDatabaseInfoB *zdi, + int key_flush) +{ + char *sgml_buf; + int sgml_len; + Record drec; + data1_node *node_dbinfo, *node_count, *node_zebra; + + if (!zdi->dirty) + return; + + zdi->dirty = 0; +#if ZINFO_DEBUG + yaz_log(YLOG_LOG, "zebraExplain_writeDatabase %s", zdi->databaseName); +#endif + drec = createRecord(zei->records, &zdi->sysno); + if (!drec) + return; + assert(zdi->data1_database); + + node_dbinfo = data1_search_tag(zei->dh, zdi->data1_database, + "/databaseInfo"); + + assert(node_dbinfo); + zebraExplain_updateCommonInfo(zei, node_dbinfo); + zebraExplain_updateAccessInfo(zei, node_dbinfo, zdi->accessInfo); + + /* record count */ + node_count = data1_mk_tag_uni(zei->dh, zei->nmem, + "recordCount", node_dbinfo); + data1_mk_tag_data_zint(zei->dh, node_count, "recordCountActual", + zdi->recordCount, zei->nmem); + + /* zebra info (private) */ + node_zebra = data1_mk_tag_uni(zei->dh, zei->nmem, + "zebraInfo", node_dbinfo); + + /* extract *searchable* keys from it. We do this here, because + record count, etc. is affected */ + if (key_flush) + (*zei->updateFunc)(zei->updateHandle, drec, zdi->data1_database); + data1_mk_tag_data_zint(zei->dh, node_zebra, + "recordBytes", zdi->recordBytes, zei->nmem); + + data1_mk_tag_data_zint(zei->dh, node_zebra, + "ordinalDatabase", zdi->ordinalDatabase, zei->nmem); + + /* convert to "SGML" and write it */ +#if ZINFO_DEBUG + data1_pr_tree(zei->dh, zdi->data1_database, stderr); +#endif + sgml_buf = data1_nodetoidsgml(zei->dh, zdi->data1_database, + 0, &sgml_len); + drec->info[recInfo_storeData] = (char *) xmalloc(sgml_len); + memcpy(drec->info[recInfo_storeData], sgml_buf, sgml_len); + drec->size[recInfo_storeData] = sgml_len; + + rec_put(zei->records, &drec); +} + +static void writeAttributeValues(ZebraExplainInfo zei, + data1_node *node_values, + data1_attset *attset) +{ + data1_att *atts; + data1_attset_child *c; + + if (!attset) + return; + + for (c = attset->children; c; c = c->next) + writeAttributeValues(zei, node_values, c->child); + for (atts = attset->atts; atts; atts = atts->next) + { + data1_node *node_value; + + node_value = data1_mk_tag(zei->dh, zei->nmem, "attributeValue", + 0 /* attr */, node_values); + data1_mk_tag_data_text(zei->dh, node_value, "name", + atts->name, zei->nmem); + node_value = data1_mk_tag(zei->dh, zei->nmem, "value", + 0 /* attr */, node_value); + data1_mk_tag_data_int(zei->dh, node_value, "numeric", + atts->value, zei->nmem); + } +} + + +static void zebraExplain_writeAttributeSet(ZebraExplainInfo zei, + zebAccessObject o, + int key_flush) +{ + char *sgml_buf; + int sgml_len; + Record drec; + data1_node *node_root, *node_attinfo, *node_attributes, *node_atttype; + data1_node *node_values; + struct data1_attset *attset = 0; + + if (o->oid) + attset = data1_attset_search_id(zei->dh, o->oid); + +#if ZINFO_DEBUG + yaz_log(YLOG_LOG, "zebraExplain_writeAttributeSet %s", + attset ? attset->name : ""); +#endif + + drec = createRecord(zei->records, &o->sysno); + if (!drec) + return; + node_root = + data1_read_sgml(zei->dh, zei->nmem, + "AttributeSetInfo\n" + "\n" ); + + node_attinfo = data1_search_tag(zei->dh, node_root, + "/attributeSetInfo"); + + assert(node_attinfo); + zebraExplain_initCommonInfo(zei, node_attinfo); + zebraExplain_updateCommonInfo(zei, node_attinfo); + + data1_mk_tag_data_oid(zei->dh, node_attinfo, + "oid", o->oid, zei->nmem); + if (attset && attset->name) + data1_mk_tag_data_text(zei->dh, node_attinfo, + "name", attset->name, zei->nmem); + + node_attributes = data1_mk_tag_uni(zei->dh, zei->nmem, + "attributes", node_attinfo); + node_atttype = data1_mk_tag_uni(zei->dh, zei->nmem, + "attributeType", node_attributes); + data1_mk_tag_data_text(zei->dh, node_atttype, + "name", "Use", zei->nmem); + data1_mk_tag_data_text(zei->dh, node_atttype, + "description", "Use Attribute", zei->nmem); + data1_mk_tag_data_int(zei->dh, node_atttype, + "type", 1, zei->nmem); + node_values = data1_mk_tag(zei->dh, zei->nmem, + "attributeValues", 0 /* attr */, node_atttype); + if (attset) + writeAttributeValues(zei, node_values, attset); + + /* extract *searchable* keys from it. We do this here, because + record count, etc. is affected */ + if (key_flush) + (*zei->updateFunc)(zei->updateHandle, drec, node_root); + /* convert to "SGML" and write it */ +#if ZINFO_DEBUG + data1_pr_tree(zei->dh, node_root, stderr); +#endif + sgml_buf = data1_nodetoidsgml(zei->dh, node_root, 0, &sgml_len); + drec->info[recInfo_storeData] = (char *) xmalloc(sgml_len); + memcpy(drec->info[recInfo_storeData], sgml_buf, sgml_len); + drec->size[recInfo_storeData] = sgml_len; + + rec_put(zei->records, &drec); +} + +static void zebraExplain_writeTarget(ZebraExplainInfo zei, int key_flush) +{ + struct zebDatabaseInfoB *zdi; + data1_node *node_tgtinfo, *node_list, *node_zebra; + Record trec; + int sgml_len; + char *sgml_buf; + + if (!zei->dirty) + return; + zei->dirty = 0; + + trec = rec_get_root(zei->records); + xfree(trec->info[recInfo_storeData]); + + node_tgtinfo = data1_search_tag(zei->dh, zei->data1_target, + "/targetInfo"); + assert(node_tgtinfo); + + zebraExplain_updateCommonInfo(zei, node_tgtinfo); + zebraExplain_updateAccessInfo(zei, node_tgtinfo, zei->accessInfo); + + node_zebra = data1_mk_tag_uni(zei->dh, zei->nmem, + "zebraInfo", node_tgtinfo); + /* convert to "SGML" and write it */ + if (key_flush) + (*zei->updateFunc)(zei->updateHandle, trec, zei->data1_target); + + data1_mk_tag_data_text(zei->dh, node_zebra, "version", + ZEBRAVER, zei->nmem); + node_list = data1_mk_tag(zei->dh, zei->nmem, + "databaseList", 0 /* attr */, node_zebra); + for (zdi = zei->databaseInfo; zdi; zdi = zdi->next) + { + data1_node *node_db; + node_db = data1_mk_tag(zei->dh, zei->nmem, + "database", 0 /* attr */, node_list); + data1_mk_tag_data_text(zei->dh, node_db, "name", + zdi->databaseName, zei->nmem); + data1_mk_tag_data_zint(zei->dh, node_db, "id", + zdi->sysno, zei->nmem); + data1_mk_tag_data_zint(zei->dh, node_db, "attributeDetailsId", + zdi->attributeDetails->sysno, zei->nmem); + } + data1_mk_tag_data_int(zei->dh, node_zebra, "ordinalSU", + zei->ordinalSU, zei->nmem); + + data1_mk_tag_data_int(zei->dh, node_zebra, "ordinalDatabase", + zei->ordinalDatabase, zei->nmem); + + data1_mk_tag_data_zint(zei->dh, node_zebra, "runNumber", + zei->runNumber, zei->nmem); + +#if ZINFO_DEBUG + data1_pr_tree(zei->dh, zei->data1_target, stderr); +#endif + sgml_buf = data1_nodetoidsgml(zei->dh, zei->data1_target, + 0, &sgml_len); + trec->info[recInfo_storeData] = (char *) xmalloc(sgml_len); + memcpy(trec->info[recInfo_storeData], sgml_buf, sgml_len); + trec->size[recInfo_storeData] = sgml_len; + + rec_put(zei->records, &trec); +} + +int zebraExplain_lookup_attr_str(ZebraExplainInfo zei, + zinfo_index_category_t cat, + const char *index_type, + const char *str) +{ + struct zebSUInfoB **zsui; + + assert(zei->curDatabaseInfo); + for (zsui = &zei->curDatabaseInfo->attributeDetails->SUInfo; + *zsui; zsui = &(*zsui)->next) + if ( (index_type == 0 + || !strcmp((*zsui)->info.index_type, index_type)) + && (*zsui)->info.cat == cat + && !yaz_matchstr((*zsui)->info.str, str)) + { + struct zebSUInfoB *zsui_this = *zsui; + + /* take it out of the list and move to front */ + *zsui = (*zsui)->next; + zsui_this->next = zei->curDatabaseInfo->attributeDetails->SUInfo; + zei->curDatabaseInfo->attributeDetails->SUInfo = zsui_this; + + return zsui_this->info.ordinal; + } + return -1; +} + +int zebraExplain_trav_ord(ZebraExplainInfo zei, void *handle, + int (*f)(void *handle, int ord, + const char *index_type, + const char *string_index, + zinfo_index_category_t cat)) +{ + struct zebDatabaseInfoB *zdb = zei->curDatabaseInfo; + if (zdb) + { + struct zebSUInfoB *zsui = zdb->attributeDetails->SUInfo; + for ( ;zsui; zsui = zsui->next) + (*f)(handle, zsui->info.ordinal, + zsui->info.index_type, zsui->info.str, + zsui->info.cat); + } return 0; } -int zebTargetInfo_lookupSU (ZebTargetInfo *zti, int set, int use) + +struct zebSUInfoB *zebraExplain_get_sui_info(ZebraExplainInfo zei, int ord, + int dirty_mark, + const char **db) +{ + struct zebDatabaseInfoB *zdb; + + for (zdb = zei->databaseInfo; zdb; zdb = zdb->next) + { + struct zebSUInfoB **zsui; + + if (zdb->attributeDetails->readFlag) + zebraExplain_readAttributeDetails(zei, zdb->attributeDetails); + + for (zsui = &zdb->attributeDetails->SUInfo; *zsui; + zsui = &(*zsui)->next) + if ((*zsui)->info.ordinal == ord) + { + struct zebSUInfoB *zsui_this = *zsui; + + /* take it out of the list and move to front */ + *zsui = (*zsui)->next; + zsui_this->next = zdb->attributeDetails->SUInfo; + zdb->attributeDetails->SUInfo = zsui_this; + + if (dirty_mark) + zdb->attributeDetails->dirty = 1; + if (db) + *db = zdb->databaseName; + return zsui_this; + } + } + return 0; +} + + + +int zebraExplain_ord_adjust_occurrences(ZebraExplainInfo zei, int ord, + int term_delta, int doc_delta) +{ + struct zebSUInfoB *zsui = zebraExplain_get_sui_info(zei, ord, 1, 0); + if (zsui) + { + zsui->info.term_occurrences += term_delta; + zsui->info.doc_occurrences += doc_delta; + return 0; + } + return -1; +} + +int zebraExplain_ord_get_occurrences(ZebraExplainInfo zei, int ord, + zint *term_occurrences, + zint *doc_occurrences) +{ + struct zebSUInfoB *zsui = zebraExplain_get_sui_info(zei, ord, 0, 0); + if (zsui) + { + *term_occurrences = zsui->info.term_occurrences; + *doc_occurrences = zsui->info.doc_occurrences; + return 0; + } + return -1; +} + +zint zebraExplain_ord_get_doc_occurrences(ZebraExplainInfo zei, int ord) +{ + struct zebSUInfoB *zsui = zebraExplain_get_sui_info(zei, ord, 0, 0); + if (zsui) + return zsui->info.doc_occurrences; + return 0; +} + +zint zebraExplain_ord_get_term_occurrences(ZebraExplainInfo zei, int ord) +{ + struct zebSUInfoB *zsui = zebraExplain_get_sui_info(zei, ord, 0, 0); + if (zsui) + return zsui->info.term_occurrences; + return 0; +} + +int zebraExplain_lookup_ord(ZebraExplainInfo zei, int ord, + const char **index_type, + const char **db, + const char **string_index) { struct zebSUInfoB *zsui; - assert (zti->curDatabaseInfo); - for (zsui = zti->curDatabaseInfo->SUInfo; zsui; zsui=zsui->next) - if (zsui->info.use == use && zsui->info.set == set) - return zsui->info.ordinal; + if (index_type) + *index_type = 0; + if (string_index) + *string_index = 0; + + zsui = zebraExplain_get_sui_info(zei, ord, 0, db); + if (zsui) + { + if (string_index) + *string_index = zsui->info.str; + if (index_type) + *index_type = zsui->info.index_type; + return 0; + } return -1; } -int zebTargetInfo_addSU (ZebTargetInfo *zti, int set, int use) + + +zebAccessObject zebraExplain_announceOid(ZebraExplainInfo zei, + zebAccessObject *op, + Odr_oid *oid) +{ + zebAccessObject ao; + + for (ao = *op; ao; ao = ao->next) + if (!oid_oidcmp(oid, ao->oid)) + break; + if (!ao) + { + ao = (zebAccessObject) nmem_malloc(zei->nmem, sizeof(*ao)); + ao->handle = 0; + ao->sysno = 0; + ao->oid = odr_oiddup_nmem(zei->nmem, oid); + ao->next = *op; + *op = ao; + } + return ao; +} + +struct zebSUInfoB *zebraExplain_add_sui_info(ZebraExplainInfo zei, + zinfo_index_category_t cat, + const char *index_type) { struct zebSUInfoB *zsui; - assert (zti->curDatabaseInfo); - for (zsui = zti->curDatabaseInfo->SUInfo; zsui; zsui=zsui->next) - if (zsui->info.use == use && zsui->info.set == set) - return -1; - zsui = xmalloc (sizeof(*zsui)); - zsui->next = zti->curDatabaseInfo->SUInfo; - zti->curDatabaseInfo->SUInfo = zsui; - zti->curDatabaseInfo->dirty = 1; - zti->dirty = 1; - zsui->info.set = set; - zsui->info.use = use; - zsui->info.ordinal = (zti->dictNum)++; + assert(zei->curDatabaseInfo); + zsui = (struct zebSUInfoB *) nmem_malloc(zei->nmem, sizeof(*zsui)); + zsui->next = zei->curDatabaseInfo->attributeDetails->SUInfo; + zei->curDatabaseInfo->attributeDetails->SUInfo = zsui; + zei->curDatabaseInfo->attributeDetails->dirty = 1; + zei->dirty = 1; + zsui->info.index_type = nmem_strdup(zei->nmem, index_type); + zsui->info.cat = cat; + zsui->info.doc_occurrences = 0; + zsui->info.term_occurrences = 0; + zsui->info.ordinal = (zei->ordinalSU)++; + return zsui; +} + +int zebraExplain_add_attr_str(ZebraExplainInfo zei, + zinfo_index_category_t cat, + const char *index_type, + const char *index_name) +{ + struct zebSUInfoB *zsui = zebraExplain_add_sui_info(zei, cat, index_type); + + zsui->info.str = nmem_strdup(zei->nmem, index_name); return zsui->info.ordinal; } -ZebDatabaseInfo *zebTargetInfo_getDB (ZebTargetInfo *zti) +void zebraExplain_addSchema(ZebraExplainInfo zei, Odr_oid *oid) +{ + zebraExplain_announceOid(zei, &zei->accessInfo->schemas, oid); + zebraExplain_announceOid(zei, &zei->curDatabaseInfo-> + accessInfo->schemas, oid); +} + +void zebraExplain_recordBytesIncrement(ZebraExplainInfo zei, int adjust_num) { - assert (zti->curDatabaseInfo); + assert(zei->curDatabaseInfo); - return &zti->curDatabaseInfo->info; + if (adjust_num) + { + zei->curDatabaseInfo->recordBytes += adjust_num; + zei->curDatabaseInfo->dirty = 1; + } } -void zebTargetInfo_setDB (ZebTargetInfo *zti, ZebDatabaseInfo *zdi) +void zebraExplain_recordCountIncrement(ZebraExplainInfo zei, int adjust_num) { - assert (zti->curDatabaseInfo); + assert(zei->curDatabaseInfo); - zti->curDatabaseInfo->dirty = 1; - memcpy (&zti->curDatabaseInfo->info, zdi, sizeof(*zdi)); + if (adjust_num) + { + zei->curDatabaseInfo->recordCount += adjust_num; + zei->curDatabaseInfo->dirty = 1; + } } + +zint zebraExplain_runNumberIncrement(ZebraExplainInfo zei, int adjust_num) +{ + if (adjust_num) + { + zei->dirty = 1; + } + return zei->runNumber += adjust_num; +} + +RecordAttr *rec_init_attr(ZebraExplainInfo zei, Record rec) +{ + RecordAttr *recordAttr; + + if (rec->info[recInfo_attr]) + return (RecordAttr *) rec->info[recInfo_attr]; + recordAttr = (RecordAttr *) xmalloc(sizeof(*recordAttr)); + + memset(recordAttr, '\0', sizeof(*recordAttr)); + rec->info[recInfo_attr] = (char *) recordAttr; + rec->size[recInfo_attr] = sizeof(*recordAttr); + + recordAttr->recordSize = 0; + recordAttr->recordOffset = 0; + recordAttr->runNumber = zei->runNumber; + recordAttr->staticrank = 0; + return recordAttr; +} + +static void att_loadset(void *p, const char *n, const char *name) +{ + data1_handle dh = (data1_handle) p; + if (!data1_get_attset(dh, name)) + yaz_log(YLOG_WARN, "Directive attset failed for %s", name); +} + +int zebraExplain_get_database_ord(ZebraExplainInfo zei) +{ + if (!zei->curDatabaseInfo) + return -1; + return zei->curDatabaseInfo->ordinalDatabase; +} + +void zebraExplain_loadAttsets(data1_handle dh, Res res) +{ + res_trav(res, "attset", dh, att_loadset); +} + +/* + zebraExplain_addSU adds to AttributeDetails for a database and + adds attributeSet (in AccessInfo area) to DatabaseInfo if it doesn't + exist for the database. + + If the database doesn't exist globally (in TargetInfo) an + AttributeSetInfo must be added (globally). + */ +/* + * Local variables: + * c-basic-offset: 4 + * c-file-style: "Stroustrup" + * indent-tabs-mode: nil + * End: + * vim: shiftwidth=4 tabstop=8 expandtab + */ +