Added charmap facility to delete leading articles

[idzebra-moved-to-github.git] / doc / administration.xml
diff --git a/doc/administration.xml b/doc/administration.xml

index 2486f70..dca0506 100644 (file)
--- a/doc/administration.xml
+++ b/doc/administration.xml
@@ -1,7 +1,13 @@
  <chapter id="administration">
- <!-- $Id: administration.xml,v 1.4 2002-04-09 19:20:22 adam Exp $ -->
+ <!-- $Id: administration.xml,v 1.17 2004-01-22 16:23:23 heikki Exp $ -->
   <title>Administrating Zebra</title>
- 
+ <!-- ### It's a bit daft that this chapter (which describes half of
+          the configuration-file formats) is separated from
+          "recordmodel.xml" (which describes the other half) by the
+          instructions on running zebraidx and zebrasrv.  Some careful
+          re-ordering is required here.
+ -->
+
   <para>
    Unlike many simpler retrieval systems, Zebra supports safe, incremental
    updates to an existing index.
@@ -100,7 +106,7 @@
    <para>
     You can edit the configuration file with a normal text editor.
     Parameter names and values are separated by colons in the file. Lines
-   starting with a hash sign (<literal>&num;</literal>) are
+   starting with a hash sign (<literal>#</literal>) are
     treated as comments.
    </para>
    
@@ -146,13 +152,17 @@
     explained further in the following sections.
    </para>
    
+  <!--
+   FIXME - Didn't Adam make something to have multiple databases in multiple dirs...
+  -->
+  
    <para>
     <variablelist>
      
      <varlistentry>
       <term>
        <emphasis>group</emphasis>
-      .recordType&lsqb;<emphasis>.name</emphasis>&rsqb;:
+      .recordType[<emphasis>.name</emphasis>]:
        <replaceable>type</replaceable>
       </term>
       <listitem>
@@ -186,6 +196,7 @@
       <listitem>
        <para>
         Specifies the Z39.50 database name.
+       <!-- FIXME - now we can have multiple databases in one server. -H -->
        </para>
       </listitem>
      </varlistentry>
@@ -198,6 +209,7 @@
         group of records. If you plan to update/delete this type of
         records later this should be specified as 1; otherwise it
         should be 0 (default), to save register space.
+       <!-- ### this is the first mention of "register" -->
         See <xref linkend="file-ids"/>.
        </para>
       </listitem>
@@ -217,6 +229,7 @@
       </listitem>
      </varlistentry>
      <varlistentry>
+     <!-- ### probably a better place to define "register" -->
       <term>register: <replaceable>register-location</replaceable></term>
       <listitem>
        <para>
@@ -248,7 +261,7 @@
       <term>keyTmpDir: <replaceable>directory</replaceable></term>
       <listitem>
        <para>
-       Directory in which temporary files used during zebraidx' update
+       Directory in which temporary files used during zebraidx's update
         phase are stored. 
        </para>
       </listitem>
@@ -263,7 +276,7 @@
       </listitem>
      </varlistentry>
      <varlistentry>
-     <term>profilePath: <literal>path</literal></term>
+     <term>profilePath: <replaceable>path</replaceable></term>
       <listitem>
        <para>
         Specifies a path of profile specification files. 
@@ -292,6 +305,19 @@
         Specifies <replaceable>size</replaceable> of internal memory
         to use for the zebraidx program.
         The amount is given in megabytes - default is 4 (4 MB).
+       The more memory, the faster large updates happen, up to about
+       half the free memory available on the computer.
+      </para>
+     </listitem>
+    </varlistentry>
+    <varlistentry>
+     <term>tempfiles: <replaceable>Yes/Auto/No</replaceable></term>
+     <listitem>
+      <para>
+       Tells Zebra whether it should use temporary files when indexing. The
+       default is Auto, in which case Zebra uses temporary files only
+       if it would need more than <replaceable>memMax</replaceable>
+       megabytes of memory. This should be good for most uses.
        </para>
       </listitem>
      </varlistentry>
@@ -302,13 +328,34 @@
        <para>
         Specifies a directory base for Zebra. All relative paths
         given (in profilePath, register, shadow) are based on this
-       directory. This setting is useful if if you Zebra server
+       directory. This setting is useful if your Zebra server
         is running in a different directory from where
         <literal>zebra.cfg</literal> is located.
        </para>
       </listitem>
      </varlistentry>
  
+     <!--
+     no longer supported.
+    <varlistentry>
+     <term>tagsysno: 0|1</term>
+     <listitem>
+      <para>
+       Specifies whether Zebra should include system-number data in XML
+       and GRS-1 records returned to clients, represented by the
+       <literal>&lt;localControlNumber&gt;</literal> element in XML
+       and the <literal>(1,14)</literal> tag in GRS-1.
+       The content of these elements is an internally-generated
+       integer uniquely identifying the record within its database.
+       It is included by default but may be turned off, with
+       <literal>tagsysno: 0</literal> for databases in which a local
+       control number is explicitly specified in the input records
+       themselves.
+      </para>
+     </listitem>
+    </varlistentry>
+     -->
+     
     </variablelist>
    </para>
    
@@ -324,8 +371,9 @@
     That is, when a client wishes to retrieve a record
     following a search operation, the files are accessed from the place
     where you originally put them - if you remove the files (without
-   running <literal>zebraidx</literal> again, the client
-   will receive a diagnostic message.
+   running <literal>zebraidx</literal> again), the server will return
+   diagnostic number 14 (<quote>System error in presenting records</quote>) to
+   the client.
    </para>
    
    <para>
@@ -370,7 +418,7 @@
    <para>
     
     <screen>
-    profilePath: /usr/local/yaz
+    profilePath: /usr/local/idzebra/tab
      attset: bib1.att
      simple.recordType: text
      simple.database: textbase
@@ -428,9 +476,13 @@
     in the configuration file. In addition, you should set
     <literal>storeKeys</literal> to <literal>1</literal>, since the Zebra
     indexer must save additional information about the contents of each record
-   in order to modify the indices correctly at a later time.
+   in order to modify the indexes correctly at a later time.
    </para>
    
+   <!--
+    FIXME - There must be a simpler way to do this with Adam's string tags -H
+     -->
+
    <para>
     For example, to update records of group <literal>esdd</literal>
     located below
@@ -466,6 +518,7 @@
     and then run <literal>zebraidx</literal> with the
     <literal>update</literal> command.
    </para>
+  <!-- ### what happens if a file contains multiple records? -->
  </sect1>
   
   <sect1 id="generic-ids">
@@ -635,19 +688,22 @@
     each directory in the order specified and use the next specified
     directories as needed.
     The <emphasis>size</emphasis> is an integer followed by a qualifier
-   code, <literal>M</literal> for megabytes,
+   code, 
+   <literal>b</literal> for bytes,
    <literal>k</literal> for kilobytes,
+   <literal>M</literal> for megabytes,
+   <literal>G</literal> for gigabytes.
    </para>
    
    <para>
     For instance, if you have allocated two disks for your register, and
     the first disk is mounted
-   on <literal>/d1</literal> and has 200 MB of free space and the
-   second, mounted on <literal>/d2</literal> has 300 MB, you could
+   on <literal>/d1</literal> and has 2 GB of free space and the
+   second, mounted on <literal>/d2</literal>, has 3.6 GB, you could
     put this entry in your configuration file:
     
     <screen>
-    register: /d1:200M /d2:300M
+    register: /d1:2G /d2:3600M
     </screen>
     
    </para>
@@ -764,14 +820,13 @@
      In order to make changes to the system take effect for the
      users, you'll have to submit a "commit" command after a
      (sequence of) update operation(s).
-    You can ask the indexer to commit the changes immediately
-    after the update operation:
     </para>
     
     <para>
      
      <screen>
-     $ zebraidx update /d1/records update /d2/more-records commit
+     $ zebraidx update /d1/records 
+     $ zebraidx commit
      </screen>
      
     </para>
@@ -783,7 +838,7 @@
     <para>
      
      <screen>
-     $ zebraidx -g books update /d1/records update /d2/more-records
+     $ zebraidx -g books update /d1/records /d2/more-records
       $ zebraidx -g fun update /d3/fun-records
       $ zebraidx commit
      </screen>