X-Git-Url: http://git.indexdata.com/?a=blobdiff_plain;f=util%2Fmarcdump.c;h=3de8d7631375c77609e324f7a226e58932570a21;hb=4e82b831a8ac31e25b246a631acde354d8161688;hp=7cc154ec62ace766fcd34b9bed7b368ca634b151;hpb=aabf1ddf38ac10199480c78045c09456c86524a8;p=yaz-moved-to-github.git diff --git a/util/marcdump.c b/util/marcdump.c index 7cc154e..3de8d76 100644 --- a/util/marcdump.c +++ b/util/marcdump.c @@ -1,59 +1,36 @@ /* - * Copyright (c) 1995-2001, Index Data + * Copyright (C) 1995-2005, Index Data ApS * See the file LICENSE for details. - * Sebastian Hammer, Adam Dickmeiss - * - * $Log: marcdump.c,v $ - * Revision 1.13 2001-02-10 01:21:59 adam - * Dumper only keeps one record at a time in memory. - * - * Revision 1.12 2000/10/02 11:07:45 adam - * Added peer_name member for bend_init handler. Changed the YAZ - * client so that tcp: can be avoided in target spec. - * - * Revision 1.11 2000/07/04 08:53:22 adam - * Fixed bug. - * - * Revision 1.10 2000/02/29 13:44:55 adam - * Check for config.h (currently not generated). - * - * Revision 1.9 1999/11/30 13:47:12 adam - * Improved installation. Moved header files to include/yaz. - * - * Revision 1.8 1999/05/26 07:49:35 adam - * C++ compilation. - * - * Revision 1.7 1998/02/11 11:53:36 adam - * Changed code so that it compiles as C++. - * - * Revision 1.6 1997/12/12 06:32:33 adam - * Added include of string.h. - * - * Revision 1.5 1997/09/24 13:29:40 adam - * Added verbose option -v to marcdump utility. - * - * Revision 1.4 1995/11/01 13:55:05 quinn - * Minor adjustments - * - * Revision 1.3 1995/05/16 08:51:12 quinn - * License, documentation, and memory fixes - * - * Revision 1.2 1995/05/15 11:56:56 quinn - * Debuggng & adjustments. - * - * Revision 1.1 1995/04/10 10:28:47 quinn - * Added copy of CCL and MARC display * + * $Id: marcdump.c,v 1.26 2005-01-15 19:47:15 adam Exp $ */ #if HAVE_CONFIG_H #include #endif +#if HAVE_XML2 +#include +#include + +#include +#include + +#endif + #include #include #include #include +#include + +#if HAVE_LOCALE_H +#include +#endif +#if HAVE_LANGINFO_H +#include +#endif + #include #include #include @@ -65,86 +42,252 @@ #ifndef SEEK_END #define SEEK_END 2 #endif - + +static void usage(const char *prog) +{ + fprintf (stderr, "Usage: %s [-c cfile] [-f from] [-t to] [-x] [-O] [-X] [-I] [-v] file...\n", + prog); +} + +#if HAVE_XML2 +void print_xpath_nodes(xmlNodeSetPtr nodes, FILE* output) { + xmlNodePtr cur; + int size; + int i; + + assert(output); + size = (nodes) ? nodes->nodeNr : 0; + + fprintf(output, "Result (%d nodes):\n", size); + for(i = 0; i < size; ++i) { + assert(nodes->nodeTab[i]); + + if(nodes->nodeTab[i]->type == XML_NAMESPACE_DECL) + { + xmlNsPtr ns; + + ns = (xmlNsPtr)nodes->nodeTab[i]; + cur = (xmlNodePtr)ns->next; + if(cur->ns) { + fprintf(output, "= namespace \"%s\"=\"%s\" for node %s:%s\n", + ns->prefix, ns->href, cur->ns->href, cur->name); + } else { + fprintf(output, "= namespace \"%s\"=\"%s\" for node %s\n", + ns->prefix, ns->href, cur->name); + } + } + else if(nodes->nodeTab[i]->type == XML_ELEMENT_NODE) + { + cur = nodes->nodeTab[i]; + if(cur->ns) { + fprintf(output, "= element node \"%s:%s\"\n", + cur->ns->href, cur->name); + } + else + { + fprintf(output, "= element node \"%s\"\n", + cur->name); + } + } + else + { + cur = nodes->nodeTab[i]; + fprintf(output, "= node \"%s\": type %d\n", cur->name, cur->type); + } + } +} +#endif + int main (int argc, char **argv) { int r; + int libxml_dom_test = 0; + int print_offset = 0; char *arg; int verbose = 0; FILE *inf; char buf[100001]; char *prog = *argv; int no = 0; + int xml = 0; FILE *cfile = 0; + char *from = 0, *to = 0; + int num = 1; + +#if HAVE_LOCALE_H + setlocale(LC_CTYPE, ""); +#endif +#if HAVE_LANGINFO_H +#ifdef CODESET + to = nl_langinfo(CODESET); +#endif +#endif - while ((r = options("vc:", argv, argc, &arg)) != -2) + while ((r = options("pvc:xOXIf:t:2", argv, argc, &arg)) != -2) { int count; no++; switch (r) { + case 'f': + from = arg; + break; + case 't': + to = arg; + break; case 'c': if (cfile) fclose (cfile); cfile = fopen (arg, "w"); break; + case 'x': + xml = YAZ_MARC_SIMPLEXML; + break; + case 'O': + xml = YAZ_MARC_OAIMARC; + break; + case 'X': + xml = YAZ_MARC_MARCXML; + break; + case 'I': + xml = YAZ_MARC_ISO2709; + break; + case 'p': + print_offset = 1; + break; + case '2': + libxml_dom_test = 1; + break; case 0: - inf = fopen (arg, "r"); + inf = fopen (arg, "rb"); count = 0; if (!inf) { fprintf (stderr, "%s: cannot open %s:%s\n", prog, arg, strerror (errno)); - exit (1); + exit(1); } if (cfile) fprintf (cfile, "char *marc_records[] = {\n"); - while (1) - { - int len; - - r = fread (buf, 1, 5, inf); - if (r < 5) - break; - len = atoi_n(buf, 5); - if (len < 25 || len > 100000) - break; - len = len - 5; - r = fread (buf + 5, 1, len, inf); - if (r < len) - break; - r = marc_display_ex (buf, stdout, verbose); - if (r <= 0) - break; - if (cfile) - { - char *p = buf; - int i; - if (count) - fprintf (cfile, ","); - fprintf (cfile, "{\n"); - for (i = 0; i < r; i++) + if (1) + { + yaz_marc_t mt = yaz_marc_create(); + yaz_iconv_t cd = 0; + + if (from && to) + { + cd = yaz_iconv_open(to, from); + if (!cd) + { + fprintf(stderr, "conversion from %s to %s " + "unsupported\n", from, to); + exit(2); + } + yaz_marc_iconv(mt, cd); + } + yaz_marc_xml(mt, xml); + yaz_marc_debug(mt, verbose); + while (1) + { + int len; + char *result; + int rlen; + + r = fread (buf, 1, 5, inf); + if (r < 5) + { + if (r && print_offset) + printf ("Extra %d bytes", r); + break; + } + if (print_offset) + { + long off = ftell(inf); + printf ("Record %d offset %ld\n", num, (long) off); + } + len = atoi_n(buf, 5); + if (len < 25 || len > 100000) + break; + len = len - 5; + r = fread (buf + 5, 1, len, inf); + if (r < len) + break; + r = yaz_marc_decode_buf (mt, buf, -1, &result, &rlen); + if (r <= 0) + break; + fwrite (result, rlen, 1, stdout); +#if HAVE_XML2 + if (libxml_dom_test) { - if ((i & 15) == 0) - fprintf (cfile, " \""); - fprintf (cfile, "\\x%02X", p[i] & 255); - - if (i < r - 1 && (i & 15) == 15) - fprintf (cfile, "\"\n"); - + xmlDocPtr doc = xmlParseMemory(result, rlen); + if (!doc) + fprintf(stderr, "xmLParseMemory failed\n"); + else + { + int i; + xmlXPathContextPtr xpathCtx; + xmlXPathObjectPtr xpathObj; + static const char *xpathExpr[] = { + "/record/datafield[@tag='245']/subfield[@code='a']", + "/record/datafield[@tag='100']/subfield", + "/record/datafield[@tag='245']/subfield[@code='a']", + "/record/datafield[@tag='650']/subfield", + "/record/datafield[@tag='650']", + 0}; + + xpathCtx = xmlXPathNewContext(doc); + + for (i = 0; xpathExpr[i]; i++) { + xpathObj = xmlXPathEvalExpression(xpathExpr[i], xpathCtx); + if(xpathObj == NULL) { + fprintf(stderr,"Error: unable to evaluate xpath expression \"%s\"\n", xpathExpr[i]); + } + else + { + print_xpath_nodes(xpathObj->nodesetval, stdout); + xmlXPathFreeObject(xpathObj); + } + } + xmlXPathFreeContext(xpathCtx); + xmlFreeDoc(doc); + } + } +#endif + if (cfile) + { + char *p = buf; + int i; + if (count) + fprintf (cfile, ","); + fprintf (cfile, "\n"); + for (i = 0; i < r; i++) + { + if ((i & 15) == 0) + fprintf (cfile, " \""); + fprintf (cfile, "\\x%02X", p[i] & 255); + + if (i < r - 1 && (i & 15) == 15) + fprintf (cfile, "\"\n"); + } - fprintf (cfile, "\"\n}"); - } - count++; + fprintf (cfile, "\"\n"); + } + num++; + } + count++; + if (cd) + yaz_iconv_close(cd); + yaz_marc_destroy(mt); } if (cfile) fprintf (cfile, "};\n"); + fclose(inf); break; case 'v': verbose++; break; default: - fprintf (stderr, "Usage: %s [-c cfile] [-v] file...\n", prog); + usage(prog); exit (1); } } @@ -152,7 +295,7 @@ int main (int argc, char **argv) fclose (cfile); if (!no) { - fprintf (stderr, "Usage: %s [-v] file...\n", prog); + usage(prog); exit (1); } exit (0);