Added SGML-output filter.
authorSebastian Hammer <quinn@indexdata.com>
Wed, 13 Dec 1995 15:38:43 +0000 (15:38 +0000)
committerSebastian Hammer <quinn@indexdata.com>
Wed, 13 Dec 1995 15:38:43 +0000 (15:38 +0000)
retrieval/d1_write.c [new file with mode: 0644]

diff --git a/retrieval/d1_write.c b/retrieval/d1_write.c
new file mode 100644 (file)
index 0000000..544fba3
--- /dev/null
@@ -0,0 +1,138 @@
+/*
+ * Copyright (c) 1995, Index Data.
+ * See the file LICENSE for details.
+ * Sebastian Hammer, Adam Dickmeiss
+ *
+ * $Log: d1_write.c,v $
+ * Revision 1.1  1995-12-13 15:38:43  quinn
+ * Added SGML-output filter.
+ *
+ *
+ */
+
+#include <string.h>
+#include <ctype.h>
+
+#include <data1.h>
+#include <wrbuf.h>
+
+#define IDSGML_MARGIN 75
+
+static int wordlen(char *b)
+{
+    int l = 0;
+
+    while (*b && !isspace(*b))
+       l++, b++;
+    return l;
+}
+
+static int nodetoidsgml(data1_node *n, int select, WRBUF b, int col)
+{
+    data1_node *c;
+    char line[1024];
+
+    for (c = n->child; c; c = c->next)
+    {
+       char *tag;
+
+       if (c->which == DATA1N_tag)
+       {
+           if (select && c->u.tag.node_selected)
+               continue;
+           if (c->u.tag.element && c->u.tag.element->tag)
+               tag = c->u.tag.element->tag->names->name; /* first name */
+           else
+               tag = c->u.tag.tag; /* local string tag */
+           if (data1_matchstr(tag, "wellknown")) /* skip wellknown */
+           {
+               sprintf(line, "<%s>\n", tag);
+               wrbuf_write(b, line, strlen(line));
+               col = 0;
+           }
+           if (nodetoidsgml(c, select, b, col) < 0)
+               return -1;
+           wrbuf_write(b, "</>\n", 5);
+           col = 0;
+       }
+       else if (c->which == DATA1N_data)
+       {
+           char *p = c->u.data.data;
+           int l = c->u.data.len;
+           int first = 1;
+
+           if (c->u.data.what == DATA1I_text)
+           {
+               while (l)
+               {
+                   int wlen;
+
+                   while (l && isspace(*p))
+                       p++, l--;
+                   if (!l)
+                       break;
+                   /* break if we'll cross margin and word is not too long */
+                   if (col + (wlen = wordlen(p)) > IDSGML_MARGIN && wlen <
+                       IDSGML_MARGIN)
+                   {
+                       sprintf(line, "\n");
+                       col = 0;
+                       wrbuf_write(b, line, strlen(line));
+                       first = 1;
+                   }
+                   if (!first)
+                   {
+                       wrbuf_putc(b, ' ');
+                       col++;
+                   }
+                   while (l && !isspace(*p))
+                   {
+#if 0
+                       if (col > NTOBUF_MARGIN)
+                       {
+                           wrbuf_putc(b, '=');
+                           wrbuf_putc(b, '\n');
+                           sprintf(line, "%*s", indent * NTOBUF_INDENT, "");
+                           wrbuf_write(b, line, strlen(line));
+                           col = indent * NTOBUF_INDENT;
+                       }
+#endif
+                       wrbuf_putc(b, *p);
+                       p++;
+                       l--;
+                       col++;
+                   }
+                   first = 0;
+               }
+               wrbuf_write(b, "\n", 1);
+               col = 0;
+           }
+           else if (c->u.data.what == DATA1I_num)
+           {
+               wrbuf_putc(b, ' ');
+               wrbuf_write(b, c->u.data.data, c->u.data.len);
+           }
+       }
+    }
+    return 0;
+}
+
+char *data1_nodetoidsgml(data1_node *n, int select, int *len)
+{
+    static WRBUF b = 0;
+    char line[1024];
+
+    if (!b)
+       b = wrbuf_alloc();
+    else
+       wrbuf_rewind(b);
+    
+    sprintf(line, "<%s>\n", n->u.root.type);
+    wrbuf_write(b, line, strlen(line));
+    if (nodetoidsgml(n, select, b, 0))
+       return 0;
+    sprintf(line, "</%s>\n", n->u.root.type);
+    wrbuf_write(b, line, strlen(line));
+    *len = wrbuf_len(b);
+    return wrbuf_buf(b);
+}