X-Git-Url: http://git.indexdata.com/?a=blobdiff_plain;f=recctrl%2Fxslt.c;h=5528c8893c5fe52fe2b7e171098a4c0d5ec8d0c0;hb=9b9f570a2960c2c8a7026b2faee943794b08ce49;hp=62c8dd04793e920a3e4dae1d0e20dea219fb8ded;hpb=0f3b8bcc6fe2e3beeec7c834d9a64dca48a4f1b7;p=idzebra-moved-to-github.git diff --git a/recctrl/xslt.c b/recctrl/xslt.c index 62c8dd0..5528c88 100644 --- a/recctrl/xslt.c +++ b/recctrl/xslt.c @@ -1,4 +1,4 @@ -/* $Id: xslt.c,v 1.1 2005-04-28 08:20:40 adam Exp $ +/* $Id: xslt.c,v 1.5 2005-05-01 07:38:51 adam Exp $ Copyright (C) 1995-2005 Index Data ApS @@ -25,7 +25,12 @@ Free Software Foundation, 59 Temple Place - Suite 330, Boston, MA #include #include +#include +#include +#include +#ifdef LIBXML_READER_ENABLED #include +#endif #include #include @@ -33,19 +38,60 @@ Free Software Foundation, 59 Temple Place - Suite 330, Boston, MA struct filter_info { xsltStylesheetPtr stylesheet_xsp; +#ifdef LIBXML_READER_ENABLED xmlTextReaderPtr reader; +#endif char *fname; int split_depth; + ODR odr; }; -static const char *zebra_index_ns = "http://indexdata.dk/zebra/indexing/1"; +#define ZEBRA_INDEX_NS "http://indexdata.dk/zebra/indexing/1" +#define ZEBRA_SCHEMA_IDENTITY_NS "http://indexdata.dk/zebra/identity/1" +static const char *zebra_index_ns = ZEBRA_INDEX_NS; + +static void set_param_str(const char **params, const char *name, + const char *value, ODR odr) +{ + char *quoted = odr_malloc(odr, 3 + strlen(value)); + sprintf(quoted, "'%s'", value); + while (*params) + params++; + params[0] = name; + params[1] = quoted; + params[2] = 0; +} + +static void set_param_int(const char **params, const char *name, + zint value, ODR odr) +{ + char *quoted = odr_malloc(odr, 30); /* 25 digits enough for 2^64 */ + while (*params) + params++; + sprintf(quoted, "'" ZINT_FORMAT "'", value); + params[0] = name; + params[1] = quoted; + params[2] = 0; +} -static void *filter_init (Res res, RecType recType) + +static void *filter_init_xslt(Res res, RecType recType) { struct filter_info *tinfo = (struct filter_info *) xmalloc(sizeof(*tinfo)); tinfo->stylesheet_xsp = 0; +#ifdef LIBXML_READER_ENABLED tinfo->reader = 0; +#endif tinfo->fname = 0; + tinfo->split_depth = 0; + tinfo->odr = odr_createmem(ODR_ENCODE); + return tinfo; +} + +static void *filter_init_xslt1(Res res, RecType recType) +{ + struct filter_info *tinfo = (struct filter_info *) + filter_init_xslt(res, recType); tinfo->split_depth = 1; return tinfo; } @@ -72,7 +118,12 @@ static void filter_destroy(void *clientData) struct filter_info *tinfo = clientData; if (tinfo->stylesheet_xsp) xsltFreeStylesheet(tinfo->stylesheet_xsp); +#ifdef LIBXML_READER_ENABLED + if (tinfo->reader) + xmlFreeTextReader(tinfo->reader); +#endif xfree(tinfo->fname); + odr_destroy(tinfo->odr); xfree(tinfo); } @@ -133,16 +184,48 @@ static void index_node(struct filter_info *tinfo, struct recExtractCtrl *ctrl, } } -static int filter_extract(void *clientData, struct recExtractCtrl *p) +static int extract_doc(struct filter_info *tinfo, struct recExtractCtrl *p, + xmlDocPtr doc) { - static const char *params[] = { - "schema", "'http://indexdata.dk/zebra/indexing/1'", - 0 - }; - struct filter_info *tinfo = clientData; RecWord recWord; - int ret; + const char *params[10]; + xmlChar *buf_out; + int len_out; + + params[0] = 0; + set_param_str(params, "schema", ZEBRA_INDEX_NS, tinfo->odr); + (*p->init)(p, &recWord); + recWord.reg_type = 'w'; + + if (tinfo->stylesheet_xsp) + { + xmlDocPtr resDoc = + xsltApplyStylesheet(tinfo->stylesheet_xsp, + doc, params); + if (p->flagShowRecords) + { + xmlDocDumpMemory(resDoc, &buf_out, &len_out); + fwrite(buf_out, len_out, 1, stdout); + xmlFree(buf_out); + } + index_node(tinfo, p, xmlDocGetRootElement(resDoc), &recWord); + xmlFreeDoc(resDoc); + } + xmlDocDumpMemory(doc, &buf_out, &len_out); + if (p->flagShowRecords) + fwrite(buf_out, len_out, 1, stdout); + (*p->setStoreData)(p, buf_out, len_out); + xmlFree(buf_out); + + xmlFreeDoc(doc); + return RECCTRL_EXTRACT_OK; +} + +#ifdef LIBXML_READER_ENABLED +static int extract_split(struct filter_info *tinfo, struct recExtractCtrl *p) +{ + int ret; if (p->first_record) { if (tinfo->reader) @@ -159,9 +242,6 @@ static int filter_extract(void *clientData, struct recExtractCtrl *p) if (!tinfo->stylesheet_xsp) return RECCTRL_EXTRACT_ERROR_GENERIC; - (*p->init)(p, &recWord); - recWord.reg_type = 'w'; - ret = xmlTextReaderRead(tinfo->reader); while (ret == 1) { int type = xmlTextReaderNodeType(tinfo->reader); @@ -169,37 +249,13 @@ static int filter_extract(void *clientData, struct recExtractCtrl *p) if (tinfo->split_depth == 0 || (type == XML_READER_TYPE_ELEMENT && tinfo->split_depth == depth)) { - xmlChar *buf_out; - int len_out; - xmlNodePtr ptr = xmlTextReaderExpand(tinfo->reader); xmlNodePtr ptr2 = xmlCopyNode(ptr, 1); xmlDocPtr doc = xmlNewDoc("1.0"); xmlDocSetRootElement(doc, ptr2); - - if (tinfo->stylesheet_xsp) - { - xmlDocPtr resDoc = - xsltApplyStylesheet(tinfo->stylesheet_xsp, - doc, params); - if (p->flagShowRecords) - { - xmlDocDumpMemory(resDoc, &buf_out, &len_out); - fwrite(buf_out, len_out, 1, stdout); - xmlFree(buf_out); - } - index_node(tinfo, p, xmlDocGetRootElement(resDoc), &recWord); - xmlFreeDoc(resDoc); - } - xmlDocDumpMemory(doc, &buf_out, &len_out); - if (p->flagShowRecords) - fwrite(buf_out, len_out, 1, stdout); - (*p->setStoreData)(p, buf_out, len_out); - xmlFree(buf_out); - xmlFreeDoc(doc); - return RECCTRL_EXTRACT_OK; + return extract_doc(tinfo, p, doc); } ret = xmlTextReaderRead(tinfo->reader); } @@ -207,6 +263,44 @@ static int filter_extract(void *clientData, struct recExtractCtrl *p) tinfo->reader = 0; return RECCTRL_EXTRACT_EOF; } +#endif + +static int extract_full(struct filter_info *tinfo, struct recExtractCtrl *p) +{ + if (p->first_record) /* only one record per stream */ + { + xmlDocPtr doc = xmlReadIO(ioread_ex, ioclose_ex, p /* I/O handler */, + 0 /* URL */, + 0 /* encoding */, + XML_PARSE_XINCLUDE); + if (!doc) + { + return RECCTRL_EXTRACT_ERROR_GENERIC; + } + return extract_doc(tinfo, p, doc); + } + else + return RECCTRL_EXTRACT_EOF; +} + +static int filter_extract(void *clientData, struct recExtractCtrl *p) +{ + struct filter_info *tinfo = clientData; + + odr_reset(tinfo->odr); + + if (tinfo->split_depth == 0) + return extract_full(tinfo, p); + else + { +#ifdef LIBXML_READER_ENABLED + return extract_split(tinfo, p); +#else + /* no xmlreader so we can't split it */ + return RECCTRL_EXTRACT_ERROR_GENERIC; +#endif + } +} static int ioread_ret(void *context, char *buffer, int len) { @@ -221,18 +315,14 @@ static int ioclose_ret(void *context) static int filter_retrieve (void *clientData, struct recRetrieveCtrl *p) { - static const char *params[] = { - "schema", "'F'", - 0 - }; + const char *esn = ZEBRA_SCHEMA_IDENTITY_NS; + const char *params[10]; struct filter_info *tinfo = clientData; xmlDocPtr resDoc; xmlDocPtr doc; if (p->comp) { - const char *esn; - char *esn_quoted; if (p->comp->which != Z_RecordComp_simple || p->comp->u.simple->which != Z_ElementSetNames_generic) { @@ -240,10 +330,16 @@ static int filter_retrieve (void *clientData, struct recRetrieveCtrl *p) return 0; } esn = p->comp->u.simple->u.generic; - esn_quoted = odr_malloc(p->odr, 3 + strlen(esn)); - sprintf(esn_quoted, "'%s'", esn); - params[1] = esn_quoted; } + + params[0] = 0; + set_param_str(params, "schema", esn, p->odr); + if (p->fname) + set_param_str(params, "filename", p->fname, p->odr); + if (p->score >= 0) + set_param_int(params, "score", p->score, p->odr); + set_param_int(params, "size", p->recordSize, p->odr); + if (!tinfo->stylesheet_xsp) { p->diagnostic = YAZ_BIB1_SYSTEM_ERROR_IN_PRESENTING_RECORDS; @@ -258,8 +354,15 @@ static int filter_retrieve (void *clientData, struct recRetrieveCtrl *p) p->diagnostic = YAZ_BIB1_SYSTEM_ERROR_IN_PRESENTING_RECORDS; return 0; } - resDoc = xsltApplyStylesheet(tinfo->stylesheet_xsp, - doc, params); + + if (!strcmp(esn, ZEBRA_SCHEMA_IDENTITY_NS)) + resDoc = doc; + else + { + resDoc = xsltApplyStylesheet(tinfo->stylesheet_xsp, + doc, params); + xmlFreeDoc(doc); + } if (!resDoc) { p->diagnostic = YAZ_BIB1_SYSTEM_ERROR_IN_PRESENTING_RECORDS; @@ -295,14 +398,23 @@ static int filter_retrieve (void *clientData, struct recRetrieveCtrl *p) p->diagnostic = YAZ_BIB1_RECORD_SYNTAX_UNSUPP; } xmlFreeDoc(resDoc); - xmlFreeDoc(doc); return 0; } -static struct recType filter_type = { +static struct recType filter_type_xslt = { 0, "xslt", - filter_init, + filter_init_xslt, + filter_config, + filter_destroy, + filter_extract, + filter_retrieve +}; + +static struct recType filter_type_xslt1 = { + 0, + "xslt1", + filter_init_xslt1, filter_config, filter_destroy, filter_extract, @@ -317,6 +429,9 @@ idzebra_filter #endif [] = { - &filter_type, + &filter_type_xslt, +#ifdef LIBXML_READER_ENABLED + &filter_type_xslt1, +#endif 0, };