Update m4

[idzebra-moved-to-github.git] / doc / administration.xml
diff --git a/doc/administration.xml b/doc/administration.xml

index fbb02e2..762ba7d 100644 (file)
--- a/doc/administration.xml
+++ b/doc/administration.xml
@@ -1,5 +1,4 @@
  <chapter id="administration">
- <!-- $Id: administration.xml,v 1.54 2007-12-19 09:30:29 adam Exp $ -->
   <title>Administrating &zebra;</title>
   <!-- ### It's a bit daft that this chapter (which describes half of
            the configuration-file formats) is separated from
@@ -313,6 +312,19 @@
       </varlistentry>
  
       <varlistentry>
+      <term>sortmax: <replaceable>integer</replaceable></term>
+      <listitem>
+       <para>
+    Specifies the maximum number of records that will be sorted
+    in a result set.  If the result set contains more than 
+    <replaceable>integer</replaceable> records, records after the
+    limit will not be sorted.  If omitted, the default value is
+    1,000.
+       </para>
+      </listitem>
+     </varlistentry>
+
+     <varlistentry>
        <term>staticrank: <replaceable>integer</replaceable></term>
        <listitem>
         <para>
@@ -326,13 +338,13 @@
  
  
       <varlistentry>
-      <term>estimatehits:: <replaceable>integer</replaceable></term>
+      <term>estimatehits: <replaceable>integer</replaceable></term>
        <listitem>
         <para>
-       Controls whether &zebra; should calculate approximite hit counts and
+       Controls whether &zebra; should calculate approximate hit counts and
         at which hit count it is to be enabled.
-       A value of 0 disables approximiate hit counts.
-       For a positive value approximaite hit count is enabled
+       A value of 0 disables approximate hit counts.
+       For a positive value approximate hit count is enabled
         if it is known to be larger than <replaceable>integer</replaceable>.
         </para>
         <para>
@@ -426,7 +438,7 @@
       <replaceable>permstring</replaceable></term>
       <listitem>
        <para>
-       Specifies permissions (priviledge) for a user that are allowed
+       Specifies permissions (privilege) for a user that are allowed
         to access &zebra; via the passwd system. There are two kinds
         of permissions currently: read (r) and write (w). By default
         users not listed in a permission directive are given the read
@@ -441,13 +453,53 @@
      </varlistentry>
  
      <varlistentry>
-      <term>dbaccess <replaceable>accessfile</replaceable></term>
+      <term>dbaccess: <replaceable>accessfile</replaceable></term>
        <listitem>
          <para>
           Names a file which lists database subscriptions for individual users.
-         The access file should consists of lines of the form <literal>username:
-         dbnames</literal>, where dbnames is a list of database names, seprated by
-         '+'. No whitespace is allowed in the database list.
+         The access file should consist of lines of the form
+          <literal>username: dbnames</literal>, where dbnames is a list of
+          database names, separated by '+'. No whitespace is allowed in the
+          database list.
+       </para>
+      </listitem>
+    </varlistentry>
+
+    <varlistentry>
+      <term>encoding: <replaceable>charsetname</replaceable></term>
+      <listitem>
+        <para>
+         Tells &zebra; to interpret the terms in Z39.50 queries as
+         having been encoded using the specified character
+         encoding.  The default is <literal>ISO-8859-1</literal>; one
+         useful alternative is <literal>UTF-8</literal>.
+       </para>
+      </listitem>
+    </varlistentry>
+
+    <varlistentry>
+      <term>storeKeys: <replaceable>value</replaceable></term>
+      <listitem>
+        <para>
+          Specifies whether &zebra; keeps a copy of indexed keys.
+          Use a value of 1 to enable; 0 to disable. If the storeKeys
+          setting is omitted, it is enabled. Enabled storeKeys
+          are required for updating and deleting records.  Disable
+          storeKeys only to save space, and only if you plan to index data once.
+       </para>
+      </listitem>
+    </varlistentry>
+
+    <varlistentry>
+      <term>storeData: <replaceable>value</replaceable></term>
+      <listitem>
+        <para>
+          Specifies whether &zebra; keeps a copy of indexed records.
+          Use a value of 1 to enable; 0 to disable. If the storeData setting is
+          omitted, it is enabled. A storeData setting of 0 (disabled) makes
+          &zebra; fetch records from the original location in the file
+          system using filename, file offset and file length. For the
+          DOM and ALVIS filters, the storeData setting is ignored.
         </para>
        </listitem>
      </varlistentry>
@@ -774,9 +826,7 @@
     The value of the <literal>register</literal> setting is a sequence
     of tokens. Each token takes the form:
     
-   <screen>
-    <emphasis>dir</emphasis><literal>:</literal><emphasis>size</emphasis> 
-   </screen>
+   <emphasis>dir</emphasis><literal>:</literal><emphasis>size</emphasis> 
     
     The <emphasis>dir</emphasis> specifies a directory in which index files
     will be stored and the <emphasis>size</emphasis> specifies the maximum
@@ -1030,7 +1080,7 @@
    <title>Static Ranking</title>
    
     <para>
-    &zebra; uses internally inverted indexes to look up term occurencies
+    &zebra; internally uses inverted indexes to look up term frequencies
      in documents. Multiple queries from different indexes can be
      combined by the binary boolean operations <literal>AND</literal>, 
      <literal>OR</literal> and/or <literal>NOT</literal> (which
@@ -1121,7 +1171,7 @@
     <para>
       The default <literal>rank-1</literal> ranking module implements a 
      TF/IDF (Term Frequency over Inverse Document Frequency) like
-     algorithm. In contrast to the usual defintion of TF/IDF
+     algorithm. In contrast to the usual definition of TF/IDF
       algorithms, which only considers searching in one full-text
       index, this one works on multiple indexes at the same time.
       More precisely, 
@@ -1834,7 +1884,7 @@ where g = rset_count(terms[i]->rset) is the count of all documents in this speci
     <sect2 id="administration-extended-services-debugging">
      <title>Extended services debugging guide</title>
      <para>
-     When debugging ES over PHP we recomment the following order of tests:
+     When debugging ES over PHP we recommend the following order of tests:
      </para>
  
      <itemizedlist>
@@ -1855,14 +1905,14 @@ where g = rset_count(terms[i]->rset) is the count of all documents in this speci
         <literal>yaz-client</literal> as described in
         <xref linkend="administration-extended-services-yaz-client"/>,
         and
-       remeber the <literal>-a</literal> option which tells you what
+       remember the <literal>-a</literal> option which tells you what
         goes over the wire! Notice also the section on permissions:
         try 
         <screen>
          perm.anonymous: rw
         </screen>
         in <literal>zebra.cfg</literal> to make sure you do not run into 
-       permission  problems (but never expose such an unsecure setup on the 
+       permission  problems (but never expose such an insecure setup on the 
         internet!!!). Then, make sure to set the general
         <literal>recordType</literal> instruction, pointing correctly
         to the GRS-1 filters,