Directive s=pw sets structure to phrase if term includes blank(s).
[yaz-moved-to-github.git] / retrieval / d1_write.c
index b631903..eb64130 100644 (file)
@@ -1,10 +1,24 @@
 /*
- * Copyright (c) 1995-1998, Index Data.
+ * Copyright (c) 1995-1999, Index Data.
  * See the file LICENSE for details.
  * Sebastian Hammer, Adam Dickmeiss
  *
  * $Log: d1_write.c,v $
- * Revision 1.5  1998-06-05 08:57:43  adam
+ * Revision 1.9  2000-11-29 14:22:47  adam
+ * Implemented XML/SGML attributes for data1 so that d1_read reads them
+ * and d1_write generates proper attributes for XML/SGML records. Added
+ * register locking for threaded version.
+ *
+ * Revision 1.8  1999/11/30 13:47:12  adam
+ * Improved installation. Moved header files to include/yaz.
+ *
+ * Revision 1.7  1999/10/21 12:06:29  adam
+ * Retrieval module no longer uses ctype.h - functions.
+ *
+ * Revision 1.6  1999/07/06 12:16:00  adam
+ * Improved layout generated record in SGML/XML format.
+ *
+ * Revision 1.5  1998/06/05 08:57:43  adam
  * Fixed problem with function wordlen.
  *
  * Revision 1.4  1998/05/18 13:07:08  adam
  */
 
 #include <string.h>
-#include <ctype.h>
 
-#include <data1.h>
-#include <wrbuf.h>
+#include <yaz/data1.h>
+#include <yaz/wrbuf.h>
 
 #define IDSGML_MARGIN 75
 
@@ -36,7 +49,7 @@ static int wordlen(char *b, int max)
 {
     int l = 0;
 
-    while (l < max && !isspace(*b))
+    while (l < max && !d1_isspace(*b))
        l++, b++;
     return l;
 }
@@ -58,76 +71,86 @@ static int nodetoidsgml(data1_node *n, int select, WRBUF b, int col)
                tag = c->u.tag.element->tag->names->name; /* first name */
            else
                tag = c->u.tag.tag; /* local string tag */
-           if (data1_matchstr(tag, "wellknown")) /* skip wellknown */
+           if (!data1_matchstr(tag, "wellknown")) /* skip wellknown */
            {
-               sprintf(line, "<%s>\n", tag);
+               if (nodetoidsgml(c, select, b, col) < 0)
+                   return -1;
+           }
+           else
+           {
+#if DATA1_USING_XATTR
+               data1_xattr *p;
+#endif
+               sprintf (line, "%*s<", col, "");
+               wrbuf_puts (b, line);
+               wrbuf_puts (b, tag);
+#if DATA1_USING_XATTR
+               for (p = c->u.tag.attributes; p; p = p->next)
+               {
+                   wrbuf_putc (b, ' ');
+                   wrbuf_puts (b, p->name);
+                   wrbuf_putc (b, '=');
+                   wrbuf_putc (b, '"');
+                   wrbuf_puts (b, p->value);
+                   wrbuf_putc (b, '"');
+               }
+#endif
+               wrbuf_puts(b, ">\n");
+               if (nodetoidsgml(c, select, b, (col > 40) ? 40 : col+2) < 0)
+                   return -1;
+               sprintf (line, "%*s</%s>\n", col, "", tag);
                wrbuf_write(b, line, strlen(line));
-               col = 0;
            }
-           if (nodetoidsgml(c, select, b, col) < 0)
-               return -1;
-           wrbuf_write(b, "</>\n", 4);
-           col = 0;
        }
        else if (c->which == DATA1N_data)
        {
            char *p = c->u.data.data;
            int l = c->u.data.len;
            int first = 1;
+           int lcol = col;
 
+           sprintf(line, "%*s", col, "");
+           wrbuf_write(b, line, strlen(line));
            switch (c->u.data.what)
            {
            case DATA1I_text:
                while (l)
                {
                    int wlen;
-
-                   while (l && isspace(*p))
+                   
+                   while (l && d1_isspace(*p))
                        p++, l--;
                    if (!l)
                        break;
                    /* break if we'll cross margin and word is not too long */
-                   if (col + (wlen = wordlen(p, l)) > IDSGML_MARGIN && wlen <
+                   if (lcol + (wlen = wordlen(p, l)) > IDSGML_MARGIN && wlen <
                        IDSGML_MARGIN)
                    {
-                       sprintf(line, "\n");
-                       col = 0;
+                       sprintf(line, "\n%*s", col, "");
+                       lcol = col;
                        wrbuf_write(b, line, strlen(line));
                        first = 1;
                    }
                    if (!first)
                    {
                        wrbuf_putc(b, ' ');
-                       col++;
+                       lcol++;
                    }
-                   while (l && !isspace(*p))
+                   while (l && !d1_isspace(*p))
                    {
-#if 0
-                       if (col > NTOBUF_MARGIN)
-                       {
-                           wrbuf_putc(b, '=');
-                           wrbuf_putc(b, '\n');
-                           sprintf(line, "%*s", indent * NTOBUF_INDENT, "");
-                           wrbuf_write(b, line, strlen(line));
-                           col = indent * NTOBUF_INDENT;
-                       }
-#endif
                        wrbuf_putc(b, *p);
                        p++;
                        l--;
-                       col++;
+                       lcol++;
                    }
                    first = 0;
                }
                wrbuf_write(b, "\n", 1);
-               col = 0;
                break;
            case DATA1I_num:
-               wrbuf_putc(b, ' ');
                wrbuf_write(b, c->u.data.data, c->u.data.len);
                break;
            case DATA1I_oid:
-               wrbuf_putc(b, ' ');
                wrbuf_write(b, c->u.data.data, c->u.data.len);
            }
        }
@@ -139,7 +162,7 @@ char *data1_nodetoidsgml (data1_handle dh, data1_node *n, int select, int *len)
 {
     WRBUF b = data1_get_wrbuf (dh);
     char line[1024];
-
+    
     wrbuf_rewind(b);
     
     sprintf(line, "<%s>\n", n->u.root.type);