zoom: authenticationMode YAZ-686
[yaz-moved-to-github.git] / src / zoom-sru.c
1 /* This file is part of the YAZ toolkit.
2  * Copyright (C) 1995-2013 Index Data
3  * See the file LICENSE for details.
4  */
5 /**
6  * \file zoom-sru.c
7  * \brief Implements ZOOM SRU
8  */
9 #if HAVE_CONFIG_H
10 #include <config.h>
11 #endif
12
13 #include <assert.h>
14 #include <string.h>
15 #include <errno.h>
16 #include "zoom-p.h"
17
18 #include <yaz/log.h>
19 #include <yaz/pquery.h>
20
21 #if YAZ_HAVE_XML2
22 static void set_SRU_error(ZOOM_connection c, Z_SRW_diagnostic *d)
23 {
24     const char *uri = d->uri;
25     if (uri)
26         ZOOM_set_dset_error(c, ZOOM_uri_to_code(uri), uri, d->details, 0);
27 }
28 #endif
29
30
31 #if YAZ_HAVE_XML2
32 static zoom_ret send_srw(ZOOM_connection c, Z_SRW_PDU *sr)
33 {
34     Z_GDU *gdu;
35     const char *database =  ZOOM_options_get(c->options, "databaseName");
36
37     gdu = z_get_HTTP_Request_uri(c->odr_out, c->host_port,
38                                  database,
39                                  c->proxy ? 1 : 0);
40
41     if (c->sru_mode == zoom_sru_get)
42     {
43         yaz_sru_get_encode(gdu->u.HTTP_Request, sr, c->odr_out, c->charset);
44     }
45     else if (c->sru_mode == zoom_sru_post)
46     {
47         yaz_sru_post_encode(gdu->u.HTTP_Request, sr, c->odr_out, c->charset);
48     }
49     else if (c->sru_mode == zoom_sru_soap)
50     {
51         yaz_sru_soap_encode(gdu->u.HTTP_Request, sr, c->odr_out, c->charset);
52     }
53     else if (c->sru_mode == zoom_sru_solr)
54     {
55         yaz_solr_encode_request(gdu->u.HTTP_Request, sr, c->odr_out, c->charset);
56     }
57     return ZOOM_send_GDU(c, gdu);
58 }
59 #endif
60
61 #if YAZ_HAVE_XML2
62 static Z_SRW_PDU *ZOOM_srw_get_pdu(ZOOM_connection c, int type)
63 {
64     Z_SRW_PDU *sr = yaz_srw_get_pdu(c->odr_out, type, c->sru_version);
65     if (c->url_authentication && c->user)
66     {
67         Z_SRW_extra_arg **ea = &sr->extra_args;
68         while (*ea)
69             ea = &(*ea)->next;
70         *ea = (Z_SRW_extra_arg *) odr_malloc(c->odr_out, sizeof(**ea));
71         (*ea)->name = "x-username";
72         (*ea)->value = c->user;
73         ea = &(*ea)->next;
74         if (c->password)
75         {
76             *ea = (Z_SRW_extra_arg *) odr_malloc(c->odr_out, sizeof(**ea));
77             (*ea)->name = "x-password";
78             (*ea)->value = c->password;
79             ea = &(*ea)->next;
80         }
81         *ea = 0;
82     }
83     else
84     {
85         sr->username = c->user;
86         sr->password = c->password;
87     }
88     return sr;
89 }
90 #endif
91
92 #if YAZ_HAVE_XML2
93 zoom_ret ZOOM_connection_srw_send_scan(ZOOM_connection c)
94 {
95     ZOOM_scanset scan;
96     Z_SRW_PDU *sr = 0;
97     const char *option_val = 0;
98     Z_Query *z_query;
99
100     if (!c->tasks)
101         return zoom_complete;
102     assert (c->tasks->which == ZOOM_TASK_SCAN);
103     scan = c->tasks->u.scan.scan;
104
105     sr = ZOOM_srw_get_pdu(c, Z_SRW_scan_request);
106
107     z_query = ZOOM_query_get_Z_Query(scan->query);
108     /* SRU scan can only carry CQL and PQF */
109     if (z_query->which == Z_Query_type_104)
110     {
111         sr->u.scan_request->query_type = Z_SRW_query_type_cql;
112         sr->u.scan_request->scanClause.cql =
113             odr_strdup(c->odr_out, ZOOM_query_get_query_string(scan->query));
114     }
115     else if (z_query->which == Z_Query_type_1
116              || z_query->which == Z_Query_type_101)
117     {
118         sr->u.scan_request->query_type = Z_SRW_query_type_pqf;
119         sr->u.scan_request->scanClause.pqf =
120             odr_strdup(c->odr_out, ZOOM_query_get_query_string(scan->query));
121     }
122     else
123     {
124         ZOOM_set_error(c, ZOOM_ERROR_UNSUPPORTED_QUERY, 0);
125         return zoom_complete;
126     }
127
128     sr->u.scan_request->maximumTerms = odr_intdup(
129         c->odr_out, ZOOM_options_get_int(scan->options, "number", 10));
130
131     sr->u.scan_request->responsePosition = odr_intdup(
132         c->odr_out, ZOOM_options_get_int(scan->options, "position", 1));
133
134     option_val = ZOOM_options_get(scan->options, "extraArgs");
135     yaz_encode_sru_extra(sr, c->odr_out, option_val);
136     return send_srw(c, sr);
137 }
138 #else
139 zoom_ret ZOOM_connection_srw_send_scan(ZOOM_connection c)
140 {
141     return zoom_complete;
142 }
143 #endif
144
145 #if YAZ_HAVE_XML2
146 zoom_ret ZOOM_connection_srw_send_search(ZOOM_connection c)
147 {
148     const char *facets = 0;
149     int i;
150     int *start, *count;
151     ZOOM_resultset resultset = 0;
152     Z_SRW_PDU *sr = 0;
153     const char *option_val = 0;
154     const char *schema = 0;
155     Z_Query *z_query;
156     Z_FacetList *facet_list = 0;
157     if (c->error)                  /* don't continue on error */
158         return zoom_complete;
159     assert(c->tasks);
160     switch(c->tasks->which)
161     {
162     case ZOOM_TASK_SEARCH:
163         resultset = c->tasks->u.search.resultset;
164         if (!resultset->setname)
165             resultset->setname = xstrdup("default");
166         ZOOM_options_set(resultset->options, "setname", resultset->setname);
167         start = &c->tasks->u.search.start;
168         count = &c->tasks->u.search.count;
169         facets = ZOOM_options_get(resultset->options, "facets");
170         if (facets)
171             facet_list = yaz_pqf_parse_facet_list(c->odr_out, facets);
172         schema = c->tasks->u.search.schema;
173         break;
174     case ZOOM_TASK_RETRIEVE:
175         resultset = c->tasks->u.retrieve.resultset;
176         schema = c->tasks->u.retrieve.schema;
177
178         start = &c->tasks->u.retrieve.start;
179         count = &c->tasks->u.retrieve.count;
180
181         if (*start >= resultset->size)
182             return zoom_complete;
183         if (*start + *count > resultset->size)
184             *count = resultset->size - *start;
185
186         for (i = 0; i < *count; i++)
187         {
188             ZOOM_record rec =
189                 ZOOM_record_cache_lookup(resultset, i + *start,
190                                          c->tasks->u.retrieve.syntax,
191                                          c->tasks->u.retrieve.elementSetName,
192                                          schema);
193             if (!rec)
194                 break;
195             else
196             {
197                 ZOOM_Event event = ZOOM_Event_create(ZOOM_EVENT_RECV_RECORD);
198                 ZOOM_connection_put_event(c, event);
199             }
200         }
201         *start += i;
202         *count -= i;
203
204         if (*count == 0)
205             return zoom_complete;
206         break;
207     default:
208         return zoom_complete;
209     }
210     assert(resultset->query);
211
212     sr = ZOOM_srw_get_pdu(c, Z_SRW_searchRetrieve_request);
213     z_query = ZOOM_query_get_Z_Query(resultset->query);
214
215     if (z_query->which == Z_Query_type_104
216         && z_query->u.type_104->which == Z_External_CQL)
217     {
218         sr->u.request->query_type = Z_SRW_query_type_cql;
219         sr->u.request->query.cql = z_query->u.type_104->u.cql;
220     }
221     else if (z_query->which == Z_Query_type_1 && z_query->u.type_1)
222     {
223         sr->u.request->query_type = Z_SRW_query_type_pqf;
224         sr->u.request->query.pqf =
225             odr_strdup(c->odr_out,
226                        ZOOM_query_get_query_string(resultset->query));
227     }
228     else
229     {
230         ZOOM_set_error(c, ZOOM_ERROR_UNSUPPORTED_QUERY, 0);
231         return zoom_complete;
232     }
233
234     option_val = ZOOM_query_get_sru11(resultset->query);
235     if (option_val)
236     {
237         sr->u.request->sort_type = Z_SRW_sort_type_sort;
238         sr->u.request->sort.sortKeys = odr_strdup(c->odr_out, option_val);
239     }
240     sr->u.request->startRecord = odr_intdup(c->odr_out, *start + 1);
241     sr->u.request->maximumRecords = odr_intdup(
242         c->odr_out, (resultset->step > 0 && resultset->step < *count) ?
243         resultset->step : *count);
244     sr->u.request->recordSchema = odr_strdup_null(c->odr_out, schema);
245     sr->u.request->facetList = facet_list;
246
247     option_val = ZOOM_resultset_option_get(resultset, "recordPacking");
248     if (option_val)
249         sr->u.request->recordPacking = odr_strdup(c->odr_out, option_val);
250
251     option_val = ZOOM_resultset_option_get(resultset, "extraArgs");
252     yaz_encode_sru_extra(sr, c->odr_out, option_val);
253     return send_srw(c, sr);
254 }
255 #else
256 zoom_ret ZOOM_connection_srw_send_search(ZOOM_connection c)
257 {
258     return zoom_complete;
259 }
260 #endif
261
262 #if YAZ_HAVE_XML2
263 static zoom_ret handle_srw_response(ZOOM_connection c,
264                                     Z_SRW_searchRetrieveResponse *res)
265 {
266     ZOOM_resultset resultset = 0;
267     int i;
268     NMEM nmem;
269     ZOOM_Event event;
270     int *start, *count;
271     const char *syntax, *elementSetName, *schema;
272
273     if (!c->tasks)
274         return zoom_complete;
275
276     switch(c->tasks->which)
277     {
278     case ZOOM_TASK_SEARCH:
279         resultset = c->tasks->u.search.resultset;
280         start = &c->tasks->u.search.start;
281         count = &c->tasks->u.search.count;
282         syntax = c->tasks->u.search.syntax;
283         elementSetName = c->tasks->u.search.elementSetName;
284         schema = c->tasks->u.search.schema;
285         /* Required not for reporting client hit count multiple times into session */
286         if (!c->tasks->u.search.recv_search_fired) {
287             yaz_log(YLOG_DEBUG, "posting ZOOM_EVENT_RECV_SEARCH");
288             event = ZOOM_Event_create(ZOOM_EVENT_RECV_SEARCH);
289             ZOOM_connection_put_event(c, event);
290             c->tasks->u.search.recv_search_fired = 1;
291         }
292         if (res->facetList)
293             ZOOM_handle_facet_list(resultset, res->facetList);
294         break;
295     case ZOOM_TASK_RETRIEVE:
296         resultset = c->tasks->u.retrieve.resultset;
297         start = &c->tasks->u.retrieve.start;
298         count = &c->tasks->u.retrieve.count;
299         syntax = c->tasks->u.retrieve.syntax;
300         elementSetName = c->tasks->u.retrieve.elementSetName;
301         schema = c->tasks->u.retrieve.schema;
302         break;
303     default:
304         return zoom_complete;
305     }
306
307     resultset->size = 0;
308
309     if (res->resultSetId)
310         ZOOM_resultset_option_set(resultset, "resultSetId", res->resultSetId);
311
312     yaz_log(c->log_details, "%p handle_srw_response got SRW response OK", c);
313
314     if (res->num_diagnostics > 0)
315     {
316         set_SRU_error(c, &res->diagnostics[0]);
317     }
318     else
319     {
320         if (res->numberOfRecords) {
321             resultset->size = *res->numberOfRecords;
322         }
323         if (res->suggestions) {
324             ZOOM_resultset_option_set(resultset, "suggestions", res->suggestions);
325         }
326         for (i = 0; i<res->num_records; i++)
327         {
328             int pos = *start + i;
329             Z_SRW_record *sru_rec;
330             Z_SRW_diagnostic *diag = 0;
331             int num_diag;
332
333             Z_NamePlusRecord *npr = (Z_NamePlusRecord *)
334                 odr_malloc(c->odr_in, sizeof(Z_NamePlusRecord));
335
336             /* only trust recordPosition if >= calculated position */
337             if (res->records[i].recordPosition &&
338                 *res->records[i].recordPosition >= pos + 1)
339                 pos = *res->records[i].recordPosition - 1;
340
341             sru_rec = &res->records[i];
342
343             npr->databaseName = 0;
344             npr->which = Z_NamePlusRecord_databaseRecord;
345             npr->u.databaseRecord = (Z_External *)
346                 odr_malloc(c->odr_in, sizeof(Z_External));
347             npr->u.databaseRecord->descriptor = 0;
348             npr->u.databaseRecord->direct_reference =
349                 odr_oiddup(c->odr_in, yaz_oid_recsyn_xml);
350             npr->u.databaseRecord->indirect_reference = 0;
351             npr->u.databaseRecord->which = Z_External_octet;
352
353             npr->u.databaseRecord->u.octet_aligned = (Odr_oct *)
354                 odr_malloc(c->odr_in, sizeof(Odr_oct));
355             npr->u.databaseRecord->u.octet_aligned->buf = (unsigned char*)
356                 sru_rec->recordData_buf;
357             npr->u.databaseRecord->u.octet_aligned->len =
358                 npr->u.databaseRecord->u.octet_aligned->size =
359                 sru_rec->recordData_len;
360
361             if (sru_rec->recordSchema
362                 && !strcmp(sru_rec->recordSchema,
363                            "info:srw/schema/1/diagnostics-v1.1"))
364             {
365                 sru_decode_surrogate_diagnostics(sru_rec->recordData_buf,
366                                                  sru_rec->recordData_len,
367                                                  &diag, &num_diag,
368                                                  resultset->odr);
369             }
370             ZOOM_record_cache_add(resultset, npr, pos, syntax, elementSetName,
371                                   schema, diag);
372         }
373         *count -= i;
374         *start += i;
375         if (*count + *start > resultset->size)
376             *count = resultset->size - *start;
377         yaz_log(YLOG_DEBUG, "SRU result set size " ODR_INT_PRINTF " start %d count %d", resultset->size, *start, *count);
378         if (*count < 0)
379             *count = 0;
380         nmem = odr_extract_mem(c->odr_in);
381         nmem_transfer(odr_getmem(resultset->odr), nmem);
382         nmem_destroy(nmem);
383
384         if (*count > 0)
385             return ZOOM_connection_srw_send_search(c);
386     }
387     return zoom_complete;
388 }
389 #endif
390
391 #if YAZ_HAVE_XML2
392 static void handle_srw_scan_response(ZOOM_connection c,
393                                      Z_SRW_scanResponse *res)
394 {
395     NMEM nmem = odr_extract_mem(c->odr_in);
396     ZOOM_scanset scan;
397
398     if (!c->tasks || c->tasks->which != ZOOM_TASK_SCAN)
399         return;
400     scan = c->tasks->u.scan.scan;
401
402     if (res->num_diagnostics > 0)
403         set_SRU_error(c, &res->diagnostics[0]);
404
405     scan->scan_response = 0;
406     scan->srw_scan_response = res;
407     nmem_transfer(odr_getmem(scan->odr), nmem);
408
409     ZOOM_options_set_int(scan->options, "number", res->num_terms);
410     nmem_destroy(nmem);
411 }
412 #endif
413
414 int ZOOM_handle_sru(ZOOM_connection c, Z_HTTP_Response *hres,
415                     zoom_ret *cret, char **addinfo)
416 {
417 #if YAZ_HAVE_XML2
418     int ret = 0;
419
420     /* not redirect (normal response) */
421     if (!yaz_srw_check_content_type(hres))
422     {
423         *addinfo = "content-type";
424         ret = -1;
425     }
426     else if (c->sru_mode == zoom_sru_solr)
427     {
428         Z_SRW_PDU *sr;
429         ret = yaz_solr_decode_response(c->odr_in, hres, &sr);
430         if (ret == 0)
431         {
432             if (sr->which == Z_SRW_searchRetrieve_response)
433                 *cret = handle_srw_response(c, sr->u.response);
434             else if (sr->which == Z_SRW_scan_response)
435                 handle_srw_scan_response(c, sr->u.scan_response);
436         }
437     }
438     else
439     {
440         Z_SOAP *soap_package = 0;
441         ODR o = c->odr_in;
442         Z_SOAP_Handler soap_handlers[3] = {
443             {YAZ_XMLNS_SRU_v1_response, 0, (Z_SOAP_fun) yaz_srw_codec},
444             {YAZ_XMLNS_SRU_v2_response, 0, (Z_SOAP_fun) yaz_srw_codec},
445             {0, 0, 0}
446         };
447         ret = z_soap_codec(o, &soap_package,
448                            &hres->content_buf, &hres->content_len,
449                            soap_handlers);
450         if (!ret && soap_package->which == Z_SOAP_generic)
451         {
452             Z_SRW_PDU *sr = (Z_SRW_PDU*) soap_package->u.generic->p;
453
454             ZOOM_options_set(c->options, "sru_version", sr->srw_version);
455             ZOOM_options_setl(c->options, "sru_extra_response_data",
456                               sr->extraResponseData_buf, sr->extraResponseData_len);
457             if (sr->which == Z_SRW_searchRetrieve_response)
458                 *cret = handle_srw_response(c, sr->u.response);
459             else if (sr->which == Z_SRW_scan_response)
460                 handle_srw_scan_response(c, sr->u.scan_response);
461             else
462                 ret = -1;
463         }
464         else if (!ret && (soap_package->which == Z_SOAP_fault
465                           || soap_package->which == Z_SOAP_error))
466         {
467             ZOOM_set_HTTP_error(c, hres->code,
468                                 soap_package->u.fault->fault_code,
469                                 soap_package->u.fault->fault_string);
470         }
471         else
472         {
473             size_t max_chars = 1000;
474             size_t sz = hres->content_len;
475             if (sz > max_chars - 1)
476                 sz = max_chars;
477             *addinfo = odr_malloc(c->odr_in, sz + 4);
478             memcpy(*addinfo, hres->content_buf, sz);
479             if (sz == max_chars)
480                 strcpy(*addinfo + sz, "...");
481             else
482                 strcpy(*addinfo + sz, "");
483             ret = -1;
484         }
485     }
486     return ret;
487 #else
488     return -1;
489 #endif
490 }
491
492 /*
493  * Local variables:
494  * c-basic-offset: 4
495  * c-file-style: "Stroustrup"
496  * indent-tabs-mode: nil
497  * End:
498  * vim: shiftwidth=4 tabstop=8 expandtab
499  */
500