X-Git-Url: http://git.indexdata.com/?p=idzebra-moved-to-github.git;a=blobdiff_plain;f=index%2Fmod_dom.c;h=de2a872ec4fd3a8c157069b4b064b8ac2bd36158;hp=95c8a06bad0b5f3c042197946e055f74d24d45d0;hb=a5c8c78e8671af863fc61b2ad8b24f92f827f7b2;hpb=26325895a68fa527a1cd26ea2ccbe80b51db44bd diff --git a/index/mod_dom.c b/index/mod_dom.c index 95c8a06..de2a872 100644 --- a/index/mod_dom.c +++ b/index/mod_dom.c @@ -1,5 +1,5 @@ /* This file is part of the Zebra server. - Copyright (C) 1995-2008 Index Data + Copyright (C) 1994-2011 Index Data Zebra is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free @@ -17,6 +17,9 @@ Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA */ +#if HAVE_CONFIG_H +#include +#endif #include #include #include @@ -399,11 +402,11 @@ static int process_meta(struct filter_info *tinfo, xmlDocPtr doc, xmlNodePtr nod if (ret == 0) { xmlDocPtr sub_doc = - xmlParseMemory( wrbuf_buf(result), wrbuf_len(result)); + xmlParseMemory(wrbuf_buf(result), wrbuf_len(result)); if (sub_doc) { xmlNodePtr t = xmlDocGetRootElement(sub_doc); - xmlAddChild(node, xmlCopyNode(t, 1)); + xmlReplaceNode(node, xmlCopyNode(t, 1)); xmlFreeDoc(sub_doc); } } @@ -813,10 +816,18 @@ static void index_value_of(struct filter_info *tinfo, { xmlChar *text = xmlNodeGetContent(node); size_t text_len = strlen((const char *)text); - + /* if there is no text, we do not need to proceed */ if (text_len) { + /* keep seqno base so that all text will have + identical seqno's for multiple fields , e.g + .. */ + + zint seqno_base = recword->seqno; + zint seqno_max = recword->seqno; + + const char *look = index_p; const char *bval; const char *eval; @@ -864,6 +875,7 @@ static void index_value_of(struct filter_info *tinfo, /* actually indexing the text given */ + recword->seqno = seqno_base; recword->index_name = (const char *)index; if (*type) recword->index_type = (const char *) type; @@ -878,12 +890,16 @@ static void index_value_of(struct filter_info *tinfo, (extctr->tokenAdd)(recword); + if (seqno_max < recword->seqno) + seqno_max = recword->seqno; + /* eat whitespaces */ if (*look && ' ' == *look) { look++; } } + recword->seqno = seqno_max; } xmlFree(text); } @@ -908,7 +924,13 @@ static void set_record_info(struct filter_info *tinfo, if (id_p && *id_p) - sscanf((const char *)id_p, "%255s", extctr->match_criteria); + { + size_t l = strlen(id_p); + if (l >= sizeof(extctr->match_criteria)) + l = sizeof(extctr->match_criteria)-1; + memcpy(extctr->match_criteria, id_p, l); + extctr->match_criteria[l] = '\0'; + } if (rank_p && *rank_p) extctr->staticrank = atozint((const char *)rank_p); @@ -1008,9 +1030,6 @@ static int attr_content_pi(const char **c_ptr, const char *name, const char *look = *c_ptr; int ret = 0; - *value = '\0'; - while (*look && ' ' == *look) - look++; if (strlen(look) > name_len) { if (look[name_len] == '=' && !memcmp(look, name, name_len)) @@ -1027,8 +1046,6 @@ static int attr_content_pi(const char **c_ptr, const char *name, ret = 1; } } - while (*look && ' ' == *look) - look++; *c_ptr = look; return ret; } @@ -1056,18 +1073,27 @@ static void process_xml_pi_node(struct filter_info *tinfo, *rank = '\0'; *type = '\0'; look += 6; - while (*look) + for (;;) + { + /* eat whitespace */ + while (' ' == *look) + look++; + if (*look == '\0') + break; if (attr_content_pi(&look, "id", id, sizeof(id))) ; else if (attr_content_pi(&look, "rank", rank, sizeof(rank))) ; else if (attr_content_pi(&look, "type", type, sizeof(type))) + ; + else { dom_log(YLOG_WARN, tinfo, node, "content '%s', can not parse '%s'", pi_p, look); break; } + } set_record_info(tinfo, extctr, node, id, rank, type); } /* parsing index instruction */ @@ -1166,15 +1192,13 @@ static int convert_extract_doc(struct filter_info *tinfo, { xmlChar *buf_out; int len_out; + xmlDocDumpMemory(doc, &buf_out, &len_out); #if 0 FILE *outf = fopen("extract.xml", "w"); - xmlDocDumpMemory(doc, &buf_out, &len_out); fwrite(buf_out, 1, len_out, outf); -#endif - yaz_log(YLOG_LOG, "Extract Doc: %.*s", len_out, buf_out); -#if 0 fclose(outf); #endif + yaz_log(YLOG_LOG, "Extract Doc: %.*s", len_out, buf_out); } if (p->setStoreData) @@ -1407,7 +1431,8 @@ static int filter_extract(void *clientData, struct recExtractCtrl *p) static int ioread_ret(void *context, char *buffer, int len) { struct recRetrieveCtrl *p = context; - return p->stream->readf(p->stream, buffer, len); + int r = p->stream->readf(p->stream, buffer, len); + return r; } static int ioclose_ret(void *context) @@ -1445,7 +1470,7 @@ static int filter_retrieve(void *clientData, struct recRetrieveCtrl *p) { p->diagnostic = YAZ_BIB1_SPECIFIED_ELEMENT_SET_NAME_NOT_VALID_FOR_SPECIFIED_; - p->addinfo = odr_strdup(p->odr, esn); + p->addinfo = odr_strdup_null(p->odr, esn); return 0; } @@ -1539,7 +1564,7 @@ static struct recType filter_type = { }; RecType -#ifdef IDZEBRA_STATIC_DOM +#if IDZEBRA_STATIC_DOM idzebra_filter_dom #else idzebra_filter @@ -1552,6 +1577,7 @@ idzebra_filter /* * Local variables: * c-basic-offset: 4 + * c-file-style: "Stroustrup" * indent-tabs-mode: nil * End: * vim: shiftwidth=4 tabstop=8 expandtab