X-Git-Url: http://git.indexdata.com/?p=idzebra-moved-to-github.git;a=blobdiff_plain;f=index%2Fmain.c;h=8cdc1061319f262ad3308feaf55d7a32bafbd8b3;hp=71e8325da7e7f73b6df52877b6479e4c2403478a;hb=519fefb91135ad52134b9fc4e82b3874f5525a2b;hpb=fb99bfcb44d29215f411d82646c59f2f74f5a25c diff --git a/index/main.c b/index/main.c index 71e8325..8cdc106 100644 --- a/index/main.c +++ b/index/main.c @@ -1,39 +1,42 @@ -/* - * Copyright (C) 1995, Index Data I/S - * All rights reserved. - * Sebastian Hammer, Adam Dickmeiss - * - * $Log: main.c,v $ - * Revision 1.7 1995-09-05 15:28:39 adam - * More work on search engine. - * - * Revision 1.6 1995/09/04 12:33:43 adam - * Various cleanup. YAZ util used instead. - * - * Revision 1.5 1995/09/04 09:10:39 adam - * More work on index add/del/update. - * Merge sort implemented. - * Initial work on z39 server. - * - * Revision 1.4 1995/09/01 14:06:36 adam - * Split of work into more files. - * - * Revision 1.3 1995/09/01 10:57:07 adam - * Minor changes. - * - * Revision 1.2 1995/09/01 10:30:24 adam - * More work on indexing. Not working yet. - * - * Revision 1.1 1995/08/31 14:50:24 adam - * New simple file index tool. - * - */ +/* $Id: main.c,v 1.100 2002-10-22 12:51:08 adam Exp $ + Copyright (C) 1995,1996,1997,1998,1999,2000,2001,2002 + Index Data Aps + +This file is part of the Zebra server. + +Zebra is free software; you can redistribute it and/or modify it under +the terms of the GNU General Public License as published by the Free +Software Foundation; either version 2, or (at your option) any later +version. + +Zebra is distributed in the hope that it will be useful, but WITHOUT ANY +WARRANTY; without even the implied warranty of MERCHANTABILITY or +FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License +for more details. + +You should have received a copy of the GNU General Public License +along with Zebra; see the file LICENSE.zebra. If not, write to the +Free Software Foundation, 59 Temple Place - Suite 330, Boston, MA +02111-1307, USA. +*/ + + #include +#include #include +#ifdef WIN32 +#include +#else #include +#include +#endif +#include +#if HAVE_SYS_TIMES_H +#include +#endif -#include -#include "index.h" +#include +#include "zebraapi.h" char *prog; @@ -42,77 +45,249 @@ int main (int argc, char **argv) int ret; int cmd = 0; char *arg; - char *base_name = NULL; - char *base_path = NULL; + char *configName = 0; + int nsections = 0; + int disableCommit = 0; + char *mem_max = 0; + + int trans_started=0; +#if HAVE_SYS_TIMES_H + struct tms tms1, tms2; + struct timeval start_time, end_time; + long usec; +#endif +#ifndef WIN32 + char nbuf[100]; +#endif + struct recordGroup rGroupDef; + ZebraService zs = 0; + ZebraHandle zh = 0; + + nmem_init (); + +#ifdef WIN32 +#else + sprintf(nbuf, "%.40s(%d)", *argv, getpid()); + yaz_log_init_prefix (nbuf); +#endif +#if HAVE_SYS_TIMES_H + times(&tms1); + gettimeofday(&start_time, 0); +#endif + + rGroupDef.groupName = NULL; + rGroupDef.databaseName = NULL; + rGroupDef.path = NULL; + rGroupDef.recordId = NULL; + rGroupDef.recordType = NULL; + rGroupDef.flagStoreData = -1; + rGroupDef.flagStoreKeys = -1; + rGroupDef.flagRw = 1; + rGroupDef.databaseNamePath = 0; + rGroupDef.explainDatabase = 0; + rGroupDef.fileVerboseLimit = 100000; + rGroupDef.followLinks = -1; prog = *argv; - while ((ret = options ("r:v:", argv, argc, &arg)) != -2) + if (argc < 2) + { + fprintf (stderr, "%s [options] command ...\n" + "Commands:\n" + " update Update index with files below .\n" + " If is empty filenames are read from stdin.\n" + " delete Delete index with files below .\n" + " commit Commit changes\n" + " clean Clean shadow files\n" + "Options:\n" + " -t Index files as (grs or text).\n" + " -c Read configuration file .\n" + " -g Index files according to group settings.\n" + " -d Records belong to Z39.50 database .\n" + " -m Use before flushing keys to disk.\n" + " -n Don't use shadow system.\n" + " -s Show analysis on stdout, but do no work.\n" + " -v Set logging to .\n" + " -l Write log to .\n" + " -L Don't follow symbolic links.\n" + " -f Display information for the first records.\n" + " -V Show version.\n", *argv + ); + exit (1); + } + while ((ret = options ("sVt:c:g:d:m:v:nf:l:L" + , argv, argc, &arg)) != -2) { if (ret == 0) { - if (!base_name) + if(cmd == 0) /* command */ { - base_name = arg; - - common_resource = res_open (base_name); - if (!common_resource) + if (!zs) { - logf (LOG_FATAL, "Cannot open resource `%s'", base_name); - exit (1); + const char *config = configName ? configName : "zebra.cfg"; + logf (LOG_LOG, "Zebra version %s %s", + ZEBRAVER, ZEBRADATE); + zs = zebra_start (config); + if (!zs) + { + yaz_log (LOG_FATAL, "Cannot read config %s", config); + exit (1); + } + zh = zebra_open (zs); + if (disableCommit) + zebra_shadow_enable (zh, 0); } - } - else if(cmd == 0) /* command */ - { - if (!strcmp (arg, "add")) + + if (rGroupDef.databaseName) { - cmd = 'a'; + if (zebra_select_database (zh, rGroupDef.databaseName)) + { + logf(LOG_FATAL, "Could not select database %s errCode=%d", + rGroupDef.databaseName, zebra_errCode(zh) ); + exit (1); + } } - else if (!strcmp (arg, "del")) + else { + if (zebra_select_database (zh, "Default")) + { + logf(LOG_FATAL, "Could not select database Default errCode=%d", + zebra_errCode(zh) ); + exit (1); + } + } + if (mem_max) + zebra_set_resource(zh, "memmax",mem_max); + + if (!strcmp (arg, "update")) + cmd = 'u'; + else if (!strcmp (arg, "update1")) + cmd = 'U'; + else if (!strcmp (arg, "update2")) + cmd = 'm'; + else if (!strcmp (arg, "dump")) + cmd = 's'; + else if (!strcmp (arg, "del") || !strcmp(arg, "delete")) cmd = 'd'; + else if (!strcmp (arg, "init")) + { + zebra_init (zh); + } + else if (!strcmp (arg, "commit")) + { + zebra_commit (zh); + } + else if (!strcmp (arg, "clean")) + { + assert (!"todo"); + } + else if (!strcmp (arg, "stat") || !strcmp (arg, "status")) + { + zebra_register_statistics (zh,0); + } + else if (!strcmp (arg, "dump") || !strcmp (arg, "dumpdict")) + { + zebra_register_statistics (zh,1); + } + else if (!strcmp (arg, "compact")) + { + zebra_compact (zh); } else { - logf (LOG_FATAL, "Unknown command: %s", arg); + logf (LOG_FATAL, "unknown command: %s", arg); exit (1); } } - else + else { - unlink ("keys.tmp"); - key_open ("keys.tmp"); - repository (cmd, arg, base_path); - cmd = 0; + rGroupDef.path = arg; + zebra_set_group (zh, &rGroupDef); + if (!trans_started) + { + trans_started=1; + zebra_begin_trans (zh); + } + + switch (cmd) + { + case 'u': + zebra_repository_update (zh); + break; + case 'd': + zebra_repository_delete (zh); + break; + case 's': + logf (LOG_LOG, "dumping %s", rGroupDef.path); + zebra_repository_show (zh); + nsections = 0; + break; + default: + nsections = 0; + } + log_event_end (NULL, NULL); } } - else if (ret == 'v') - { - log_init (log_mask_str(arg), prog, NULL); - } - else if (ret == 'r') + else if (ret == 'V') { - base_path = arg; + printf("Zebra %s %s\n", ZEBRAVER, ZEBRADATE); + printf(" (C) 1994-2002, Index Data ApS\n"); +#ifdef WIN32 +#ifdef _DEBUG + printf(" WIN32 Debug\n"); +#else + printf(" WIN32 Release\n"); +#endif +#endif +#if HAVE_BZLIB_H + printf("libbzip2\n" + " (C) 1996-1999 Julian R Seward. All rights reserved.\n"); +#endif } + else if (ret == 'v') + yaz_log_init_level (yaz_log_mask_str(arg)); + else if (ret == 'l') + yaz_log_init_file (arg); + else if (ret == 'm') + mem_max = arg; + else if (ret == 'd') + rGroupDef.databaseName = arg; + else if (ret == 's') + rGroupDef.flagRw = 0; + else if (ret == 'g') + rGroupDef.groupName = arg; + else if (ret == 'f') + rGroupDef.fileVerboseLimit = atoi(arg); + else if (ret == 'c') + configName = arg; + else if (ret == 't') + rGroupDef.recordType = arg; + else if (ret == 'n') + disableCommit = 1; + else if (ret == 'L') + rGroupDef.followLinks = 0; else - { - logf (LOG_FATAL, "Unknown option '-%s'", arg); - exit (1); - } - } - if (!base_name) + logf (LOG_WARN, "unknown option '-%s'", arg); + } /* while arg */ + + if (trans_started) + zebra_end_trans (zh); + + zebra_close (zh); + zebra_stop (zs); +#if HAVE_SYS_TIMES_H + if (trans_started) { - fprintf (stderr, "index [-v log] [-r repository] " - "base cmd1 dir1 cmd2 dir2 ...\n"); - exit (1); + gettimeofday(&end_time, 0); + usec = (end_time.tv_sec - start_time.tv_sec) * 1000000L + + end_time.tv_usec - start_time.tv_usec; + times(&tms2); + yaz_log (LOG_LOG, "zebraidx times: %5.2f %5.2f %5.2f", + (double) usec / 1000000.0, + (double) (tms2.tms_utime - tms1.tms_utime)/100, + (double) (tms2.tms_stime - tms1.tms_stime)/100); } - key_flush (); - if (!key_close ()) - exit (0); - logf (LOG_DEBUG, "Sorting"); - if (!key_sort ("keys.tmp", 1000000)) - exit (0); - logf (LOG_DEBUG, "Input"); - key_input (FNAME_WORD_DICT, FNAME_WORD_ISAM, "keys.tmp", 50); +#endif exit (0); + return 0; }