/*
- * Copyright (c) 1995-2000, Index Data
+ * Copyright (c) 1995-2004, Index Data
* See the file LICENSE for details.
- * Sebastian Hammer, Adam Dickmeiss
- *
- * $Log: marcdump.c,v $
- * Revision 1.11 2000-07-04 08:53:22 adam
- * Fixed bug.
- *
- * Revision 1.10 2000/02/29 13:44:55 adam
- * Check for config.h (currently not generated).
- *
- * Revision 1.9 1999/11/30 13:47:12 adam
- * Improved installation. Moved header files to include/yaz.
- *
- * Revision 1.8 1999/05/26 07:49:35 adam
- * C++ compilation.
- *
- * Revision 1.7 1998/02/11 11:53:36 adam
- * Changed code so that it compiles as C++.
- *
- * Revision 1.6 1997/12/12 06:32:33 adam
- * Added include of string.h.
- *
- * Revision 1.5 1997/09/24 13:29:40 adam
- * Added verbose option -v to marcdump utility.
- *
- * Revision 1.4 1995/11/01 13:55:05 quinn
- * Minor adjustments
- *
- * Revision 1.3 1995/05/16 08:51:12 quinn
- * License, documentation, and memory fixes
- *
- * Revision 1.2 1995/05/15 11:56:56 quinn
- * Debuggng & adjustments.
- *
- * Revision 1.1 1995/04/10 10:28:47 quinn
- * Added copy of CCL and MARC display
*
+ * $Id: marcdump.c,v 1.25 2004-08-07 08:18:20 adam Exp $
*/
#if HAVE_CONFIG_H
#include <config.h>
#endif
+#if HAVE_XML2
+#include <libxml/parser.h>
+#include <libxml/tree.h>
+
+#include <libxml/xpath.h>
+#include <libxml/xpathInternals.h>
+
+#endif
+
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <errno.h>
+#include <assert.h>
+
+#if HAVE_LOCALE_H
+#include <locale.h>
+#endif
+#if HAVE_LANGINFO_H
+#include <langinfo.h>
+#endif
+
#include <yaz/marcdisp.h>
+#include <yaz/yaz-util.h>
#include <yaz/xmalloc.h>
#include <yaz/options.h>
#ifndef SEEK_END
#define SEEK_END 2
#endif
-
+
+/*
+ * Write the one-line command synopsis to stderr.
+ *
+ * prog  text substituted for the program name in the message.
+ */
+static void usage(const char *prog)
+{
+    static const char synopsis[] =
+        "Usage: %s [-c cfile] [-f from] [-t to] [-x] [-O] [-X] [-I] [-v] file...\n";
+
+    fprintf(stderr, synopsis, prog);
+}
+
+#if HAVE_XML2
+/*
+ * Return s as a plain C string suitable for a "%s" conversion.
+ * A NULL pointer is mapped to the literal "(null)" so that it is never
+ * handed to fprintf, which would be undefined behaviour.
+ */
+static const char *xpath_text(const xmlChar *s)
+{
+    return s ? (const char *) s : "(null)";
+}
+
+/*
+ * Print a summary of an XPath node set.
+ *
+ * nodes   node set to list; a NULL set is reported as having 0 nodes.
+ * output  stream to write to; must not be NULL (checked with assert).
+ *
+ * Writes a "Result (N nodes):" header followed by one line per node.
+ * Namespace declarations, element nodes and all remaining node types
+ * each use their own line format.  Strings that are NULL (for example
+ * a namespace without a prefix) are printed as "(null)".
+ */
+void print_xpath_nodes(xmlNodeSetPtr nodes, FILE* output) {
+    int size;
+    int i;
+
+    assert(output);
+    size = (nodes) ? nodes->nodeNr : 0;
+
+    fprintf(output, "Result (%d nodes):\n", size);
+    for (i = 0; i < size; ++i) {
+        xmlNodePtr cur = nodes->nodeTab[i];
+
+        assert(cur);
+
+        if (cur->type == XML_NAMESPACE_DECL)
+        {
+            xmlNsPtr ns = (xmlNsPtr) cur;
+            /* The entry is really an xmlNs; its next field is read here as
+             * the node the declaration belongs to.
+             * NOTE(review): relies on how libxml2 fills namespace nodes in
+             * XPath results - confirm against the libxml2 version in use. */
+            xmlNodePtr owner = (xmlNodePtr) ns->next;
+
+            if (owner && owner->ns) {
+                fprintf(output, "= namespace \"%s\"=\"%s\" for node %s:%s\n",
+                        xpath_text(ns->prefix), xpath_text(ns->href),
+                        xpath_text(owner->ns->href), xpath_text(owner->name));
+            } else {
+                /* No owner, or owner without a namespace: node name only. */
+                fprintf(output, "= namespace \"%s\"=\"%s\" for node %s\n",
+                        xpath_text(ns->prefix), xpath_text(ns->href),
+                        xpath_text(owner ? owner->name : NULL));
+            }
+        }
+        else if (cur->type == XML_ELEMENT_NODE)
+        {
+            if (cur->ns) {
+                fprintf(output, "= element node \"%s:%s\"\n",
+                        xpath_text(cur->ns->href), xpath_text(cur->name));
+            }
+            else
+            {
+                fprintf(output, "= element node \"%s\"\n",
+                        xpath_text(cur->name));
+            }
+        }
+        else
+        {
+            fprintf(output, "= node \"%s\": type %d\n",
+                    xpath_text(cur->name), (int) cur->type);
+        }
+    }
+}
+#endif
+
int main (int argc, char **argv)
{
- int ret;
+ int r;
+ int libxml_dom_test = 0;
+ int print_offset = 0;
char *arg;
int verbose = 0;
FILE *inf;
- long file_size;
- char *buf, *p;
+ char buf[100001];
char *prog = *argv;
- int count = 0;
int no = 0;
+ int xml = 0;
+ FILE *cfile = 0;
+ char *from = 0, *to = 0;
+ int num = 1;
+
+#if HAVE_LOCALE_H
+ setlocale(LC_CTYPE, "");
+#endif
+#if HAVE_LANGINFO_H
+#ifdef CODESET
+ to = nl_langinfo(CODESET);
+#endif
+#endif
- while ((ret = options("v", argv, argc, &arg)) != -2)
+ while ((r = options("pvc:xOXIf:t:2", argv, argc, &arg)) != -2)
{
+ int count;
no++;
- switch (ret)
+ switch (r)
{
+ case 'f':
+ from = arg;
+ break;
+ case 't':
+ to = arg;
+ break;
+ case 'c':
+ if (cfile)
+ fclose (cfile);
+ cfile = fopen (arg, "w");
+ break;
+ case 'x':
+ xml = YAZ_MARC_SIMPLEXML;
+ break;
+ case 'O':
+ xml = YAZ_MARC_OAIMARC;
+ break;
+ case 'X':
+ xml = YAZ_MARC_MARCXML;
+ break;
+ case 'I':
+ xml = YAZ_MARC_ISO2709;
+ break;
+ case 'p':
+ print_offset = 1;
+ break;
+ case '2':
+ libxml_dom_test = 1;
+ break;
case 0:
- inf = fopen (arg, "r");
+ inf = fopen (arg, "rb");
+ count = 0;
if (!inf)
{
fprintf (stderr, "%s: cannot open %s:%s\n",
prog, arg, strerror (errno));
- exit (1);
- }
- if (fseek (inf, 0L, SEEK_END))
- {
- fprintf (stderr, "%s: cannot seek in %s:%s\n",
- prog, arg, strerror (errno));
- exit (1);
- }
- file_size = ftell (inf);
- if (fseek (inf, 0L, SEEK_SET))
- {
- fprintf (stderr, "%s: cannot seek in %s:%s\n",
- prog, arg, strerror (errno));
- exit (1);
+ exit(1);
}
- buf = (char *)xmalloc (file_size);
- if (!buf)
- {
- fprintf (stderr, "%s: cannot xmalloc: %s\n",
- prog, strerror (errno));
- exit (1);
- }
- if ((long) fread (buf, 1, file_size, inf) != file_size)
- {
- fprintf (stderr, "%s: cannot read %s: %s\n",
- prog, arg, strerror (errno));
- exit (1);
- }
- for (p = buf; (ret = marc_display_ex (p, stdout, verbose)) > 0;)
- {
- p += ret;
- count++;
+ if (cfile)
+ fprintf (cfile, "char *marc_records[] = {\n");
+ if (1)
+ {
+ yaz_marc_t mt = yaz_marc_create();
+ yaz_iconv_t cd = 0;
+
+ if (from && to)
+ {
+ cd = yaz_iconv_open(to, from);
+ if (!cd)
+ {
+ fprintf(stderr, "conversion from %s to %s "
+ "unsupported\n", from, to);
+ exit(2);
+ }
+ yaz_marc_iconv(mt, cd);
+ }
+ yaz_marc_xml(mt, xml);
+ yaz_marc_debug(mt, verbose);
+ while (1)
+ {
+ int len;
+ char *result;
+ int rlen;
+
+ r = fread (buf, 1, 5, inf);
+ if (r < 5)
+ {
+ if (r && print_offset)
+ printf ("Extra %d bytes", r);
+ break;
+ }
+ if (print_offset)
+ {
+ long off = ftell(inf);
+ printf ("Record %d offset %ld\n", num, (long) off);
+ }
+ len = atoi_n(buf, 5);
+ if (len < 25 || len > 100000)
+ break;
+ len = len - 5;
+ r = fread (buf + 5, 1, len, inf);
+ if (r < len)
+ break;
+ r = yaz_marc_decode_buf (mt, buf, -1, &result, &rlen);
+ if (r <= 0)
+ break;
+ fwrite (result, rlen, 1, stdout);
+#if HAVE_XML2
+ if (libxml_dom_test)
+ {
+ xmlDocPtr doc = xmlParseMemory(result, rlen);
+ if (!doc)
+ fprintf(stderr, "xmLParseMemory failed\n");
+ else
+ {
+ int i;
+ xmlXPathContextPtr xpathCtx;
+ xmlXPathObjectPtr xpathObj;
+ static const char *xpathExpr[] = {
+ "/record/datafield[@tag='245']/subfield[@code='a']",
+ "/record/datafield[@tag='100']/subfield",
+ "/record/datafield[@tag='245']/subfield[@code='a']",
+ "/record/datafield[@tag='650']/subfield",
+ "/record/datafield[@tag='650']",
+ 0};
+
+ xpathCtx = xmlXPathNewContext(doc);
+
+ for (i = 0; xpathExpr[i]; i++) {
+ xpathObj = xmlXPathEvalExpression(xpathExpr[i], xpathCtx);
+ if(xpathObj == NULL) {
+ fprintf(stderr,"Error: unable to evaluate xpath expression \"%s\"\n", xpathExpr[i]);
+ }
+ else
+ {
+ print_xpath_nodes(xpathObj->nodesetval, stdout);
+ xmlXPathFreeObject(xpathObj);
+ }
+ }
+ xmlXPathFreeContext(xpathCtx);
+ xmlFreeDoc(doc);
+ }
+ }
+#endif
+ if (cfile)
+ {
+ char *p = buf;
+ int i;
+ if (count)
+ fprintf (cfile, ",");
+ fprintf (cfile, "\n");
+ for (i = 0; i < r; i++)
+ {
+ if ((i & 15) == 0)
+ fprintf (cfile, " \"");
+ fprintf (cfile, "\\x%02X", p[i] & 255);
+
+ if (i < r - 1 && (i & 15) == 15)
+ fprintf (cfile, "\"\n");
+
+ }
+ fprintf (cfile, "\"\n");
+ }
+ num++;
+ }
+ count++;
+ if (cd)
+ yaz_iconv_close(cd);
+ yaz_marc_destroy(mt);
}
- fclose (inf);
- xfree (buf);
+ if (cfile)
+ fprintf (cfile, "};\n");
+ fclose(inf);
break;
case 'v':
verbose++;
break;
default:
- fprintf (stderr, "Usage: %s [-v] file...\n", prog);
+ usage(prog);
exit (1);
}
}
+ if (cfile)
+ fclose (cfile);
if (!no)
{
- fprintf (stderr, "Usage: %s [-v] file...\n", prog);
+ usage(prog);
exit (1);
}
exit (0);