X-Git-Url: http://git.indexdata.com/?p=yaz-moved-to-github.git;a=blobdiff_plain;f=util%2Fyaz-icu.c;h=10fa2f599ffa53da33e09ada8850af81893c0f07;hp=4f0368e3d579e401447a14a984a53e9d46ac5bf3;hb=36f0d152f5f2b4d6ef4bcb01a041f4c16c1deaf8;hpb=e310bbc88afee1090799a0183d75c35d5eb060d9 diff --git a/util/yaz-icu.c b/util/yaz-icu.c index 4f0368e..10fa2f5 100644 --- a/util/yaz-icu.c +++ b/util/yaz-icu.c @@ -1,8 +1,6 @@ -/* - * Copyright (C) 1995-2007, Index Data ApS +/* This file is part of the YAZ toolkit. + * Copyright (C) 1995-2009 Index Data * See the file LICENSE for details. - * - * $Id: yaz-icu.c,v 1.16 2008-01-14 22:58:06 adam Exp $ */ #if HAVE_CONFIG_H @@ -32,6 +30,7 @@ static struct config_t { char conffile[1024]; char print[1024]; int xmloutput; + int sortoutput; yaz_icu_chain_t chain; FILE * infile; FILE * outfile; @@ -45,6 +44,7 @@ void print_option_error(const struct config_t *p_config) fprintf(stderr, "yaz-icu\n" " [-c (path/to/config/file.xml)]\n" " [-p (a|c|l|t)] print ICU info \n" + " [-s] Show sort normalization key\n" " [-x] XML output\n" "\n" "Examples:\n" @@ -73,13 +73,14 @@ void read_params(int argc, char **argv, struct config_t *p_config) p_config->conffile[0] = 0; p_config->print[0] = 0; p_config->xmloutput = 0; + p_config->sortoutput = 0; p_config->chain = 0; p_config->infile = stdin; p_config->outfile = stdout; /* set up command line parameters */ - while ((ret = options("c:p:x", argv, argc, &arg)) != -2) + while ((ret = options("c:p:xs", argv, argc, &arg)) != -2) { switch (ret) { @@ -89,10 +90,14 @@ void read_params(int argc, char **argv, struct config_t *p_config) case 'p': strcpy(p_config->print, arg); break; + case 's': + p_config->sortoutput = 1; + break; case 'x': p_config->xmloutput = 1; break; default: + printf("Got %d\n", ret); print_option_error(p_config); } } @@ -395,7 +400,7 @@ static void print_icu_xml_locales(const struct config_t *p_config) if(U_FAILURE(status)) { fprintf(stderr, "ICU Error: %d %s\n", status, u_errorName(status)); - exit(status); + exit(2); } } @@ -438,23 +443,23 @@ static void process_text_file(const struct config_t *p_config) long unsigned int line_count = 0; UErrorCode status = U_ZERO_ERROR; - int success = 0; - if (! xml_node) + if (!xml_node) { printf("Could not parse XML config file '%s' \n", config.conffile); - exit (1); + exit(1); } config.chain = icu_chain_xml_config(xml_node, 1, &status); - if (config.chain && U_SUCCESS(status)) - success = 1; - else { + if (!config.chain || !U_SUCCESS(status)) + { printf("Could not set up ICU chain from config file '%s' \n", config.conffile); - exit (1); + if (!U_SUCCESS(status)) + printf("ICU Error: %d %s\n", status, u_errorName(status)); + exit(1); } if (p_config->xmloutput) @@ -466,49 +471,70 @@ static void process_text_file(const struct config_t *p_config) /* read input lines for processing */ while ((line=fgets(linebuf, sizeof(linebuf)-1, config.infile))) { - success = icu_chain_assign_cstr(config.chain, line, &status); + WRBUF sw = wrbuf_alloc(); + WRBUF cdata = wrbuf_alloc(); + int success = icu_chain_assign_cstr(config.chain, line, &status); line_count++; while (success && icu_chain_next_token(config.chain, &status)) { - WRBUF sw = wrbuf_alloc(); if (U_FAILURE(status)) success = 0; - else { + else + { const char *sortkey = icu_chain_token_sortkey(config.chain); wrbuf_rewind(sw); wrbuf_puts_escaped(sw, sortkey); token_count++; if (p_config->xmloutput) { - /* should XML encode this. Bug #1902 */ fprintf(config.outfile, - "\n", - token_count, - line_count, - icu_chain_token_norm(config.chain), - icu_chain_token_display(config.chain), - wrbuf_cstr(sw)); + "sortoutput) + { + wrbuf_rewind(cdata); + wrbuf_xmlputs(cdata, wrbuf_cstr(sw)); + fprintf(config.outfile, " sortkey=\"%s\"", + wrbuf_cstr(cdata)); + } + fprintf(config.outfile, "/>\n"); } else - fprintf(config.outfile, "%lu %lu '%s' '%s' '%s'\n", + { + fprintf(config.outfile, "%lu %lu '%s' '%s'", token_count, line_count, icu_chain_token_norm(config.chain), - icu_chain_token_display(config.chain), - wrbuf_cstr(sw)); + icu_chain_token_display(config.chain)); + if (p_config->sortoutput) + { + fprintf(config.outfile, " '%s'", wrbuf_cstr(sw)); + } + fprintf(config.outfile, "\n"); + } } - wrbuf_destroy(sw); } - + wrbuf_destroy(sw); + wrbuf_destroy(cdata); } if (p_config->xmloutput) - fprintf(config.outfile, + fprintf(config.outfile, "\n" "\n"); - + icu_chain_destroy(config.chain); xmlFreeDoc(doc); if (line) @@ -538,15 +564,17 @@ int main(int argc, char **argv) "re-configure and re-compile\n"); + exit(3); #endif /* YAZ_HAVE_ICU */ - return(0); + return 0; } /* * Local variables: * c-basic-offset: 4 + * c-file-style: "Stroustrup" * indent-tabs-mode: nil * End: * vim: shiftwidth=4 tabstop=8 expandtab