More self-contained test
[metaproxy-moved-to-github.git] / src / test_filter_rewrite.cpp
1 /* This file is part of Metaproxy.
2    Copyright (C) 2005-2013 Index Data
3
4 Metaproxy is free software; you can redistribute it and/or modify it under
5 the terms of the GNU General Public License as published by the Free
6 Software Foundation; either version 2, or (at your option) any later
7 version.
8
9 Metaproxy is distributed in the hope that it will be useful, but WITHOUT ANY
10 WARRANTY; without even the implied warranty of MERCHANTABILITY or
11 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
12 for more details.
13
14 You should have received a copy of the GNU General Public License
15 along with this program; if not, write to the Free Software
16 Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
17 */
18
19 #include "config.hpp"
20 #include <iostream>
21 #include <stdexcept>
22
23 #include "filter_http_client.hpp"
24 #include "filter_http_rewrite.hpp"
25 #include <metaproxy/util.hpp>
26 #include "router_chain.hpp"
27 #include <metaproxy/package.hpp>
28
29 #include <boost/regex.hpp>
30 #include <boost/lexical_cast.hpp>
31
32 #include <yaz/log.h>
33
34 #define BOOST_AUTO_TEST_MAIN
35 #define BOOST_TEST_DYN_LINK
36
37 #include <boost/test/auto_unit_test.hpp>
38
39 using namespace boost::unit_test;
40 namespace mp = metaproxy_1;
41
42 struct TestConfig {
43     TestConfig()   
44     {
45         std::cout << "global setup\n"; 
46         yaz_log_init_level(YLOG_ALL);
47     }
48     ~TestConfig() 
49     { 
50         std::cout << "global teardown\n"; 
51     }
52 };
53
54 BOOST_GLOBAL_FIXTURE( TestConfig );
55
56 BOOST_AUTO_TEST_CASE( test_filter_rewrite_1 )
57 {
58     try
59     {
60         std::cout << "Running non-xml config test case" << std::endl;
61         mp::RouterChain router;
62         mp::filter::HttpRewrite fhr;
63         
64         //configure the filter
65         mp::filter::HttpRewrite::spair_vec vec_req;
66         vec_req.push_back(std::make_pair(
67         "(?<proto>http\\:\\/\\/s?)(?<pxhost>[^\\/?#]+)\\/(?<pxpath>[^\\/]+)"
68         "\\/(?<host>[^\\/]+)(?<path>.*)",
69         "${proto}${host}${path}"
70         ));
71         vec_req.push_back(std::make_pair(
72         "(?:Host\\: )(.*)",
73         "Host: ${host}"
74         ));
75
76         mp::filter::HttpRewrite::spair_vec vec_res;
77         vec_res.push_back(std::make_pair(
78         "(?<proto>http\\:\\/\\/s?)(?<host>[^\\/?# \"'>]+)\\/(?<path>[^ \"'>]+)",
79         "${proto}${pxhost}/${pxpath}/${host}/${path}"
80         ));
81         
82         fhr.configure(vec_req, vec_res);
83         
84         router.append(fhr);
85
86         // create an http request
87         mp::Package pack;
88
89         mp::odr odr;
90         Z_GDU *gdu_req = z_get_HTTP_Request_uri(odr, 
91         "http://proxyhost/proxypath/targetsite/page1.html", 0, 1);
92
93         pack.request() = gdu_req;
94
95         //create the http response
96
97         /* response, content  */
98         const char *resp_buf =
99             /*123456789012345678 */
100             "HTTP/1.1 200 OK\r\n"
101             "Content-Length: 3000\r\n"
102             "Content-Type: text/html\r\n"
103             "Link: <http://targetsite/file.xml>; rel=absolute\r\r"
104             "Link: </dir/file.xml>; rel=relative\r\r"
105             "\r\n"
106             "<html><head><title>Hello proxy!</title>"
107             "<style>"
108             "body {"
109             "  background-image:url('http://targetsite/images/bg.png');"
110             "}"
111             "</style>"
112             "</head>"
113             "<script>var jslink=\"http://targetsite/webservice.xml\";</script>"
114             "<body>"
115             "<p>Welcome to our website. It doesn't make it easy to get pro"
116             "xified"
117             "<a href=\"http://targetsite/page2.html\">"
118             "  An absolute link</a>"
119             "<a target=_blank href='http://targetsite/page3.html\">"
120             "  Another abs link</a>"
121             "<a href=\"/docs/page4.html\" />"
122             "</body></html>";
123
124         /* response, content  */
125         const char *resp_buf_rew =
126             /*123456789012345678 */
127             "HTTP/1.1 200 OK\r\n"
128             "Content-Length: 3000\r\n"
129             "Content-Type: text/html\r\n"
130             "Link: <http://proxyhost/proxypath/targetsite/file.xml>; rel=absolute\r\r"
131             "Link: </dir/file.xml>; rel=relative\r\r"
132             "\r\n"
133             "<html><head><title>Hello proxy!</title>"
134             "<style>"
135             "body {"
136             "  background-image:url('http://proxyhost/proxypath/targetsite/images/bg.png');"
137             "}"
138             "</style>"
139             "</head>"
140             "<script>var jslink=\"http://proxyhost/proxypath/targetsite/webservice.xml\";</script>"
141             "<body>"
142             "<p>Welcome to our website. It doesn't make it easy to get pro"
143             "xified"
144             "<a href=\"http://proxyhost/proxypath/targetsite/page.html\">"
145             "  An absolute link</a>"
146             "<a target=_blank href='http://proxyhost/proxypath/targetsite/anotherpage.html\">"
147             "  Another abs link</a>"
148             "<a href=\"/docs/page2.html\" />"
149             "</body></html>";
150
151         int r;
152         Z_GDU *gdu_res;
153         ODR odr2 = odr_createmem(ODR_DECODE);
154         odr_setbuf(odr2, (char *) resp_buf, strlen(resp_buf), 0);
155         r = z_GDU(odr2, &gdu_res, 0, 0);
156
157         BOOST_CHECK(r == 0);
158         if (r)
159         {
160             BOOST_CHECK_EQUAL(gdu_res->which, Z_GDU_HTTP_Response);
161         }
162
163         pack.response() = gdu_res;
164
165         //feed to the router
166         pack.router(router).move();
167
168         //analyze the response
169         Z_GDU *gdu_res_rew = pack.response().get();
170         BOOST_CHECK(gdu_res_rew);
171         BOOST_CHECK_EQUAL(gdu_res_rew->which, Z_GDU_HTTP_Response);
172         
173         Z_HTTP_Response *hres = gdu_res_rew->u.HTTP_Response;
174         BOOST_CHECK(hres);
175
176         //how to compare the buffers:
177
178         odr_destroy(odr2);
179     }
180     catch (std::exception & e) {
181         std::cout << e.what();
182         std::cout << std::endl;
183         BOOST_CHECK (false);
184     }
185 }
186
187 BOOST_AUTO_TEST_CASE( test_filter_rewrite_2 )
188 {
189     try
190     {
191         std::cout << "Running xml config test case" << std::endl;
192         mp::RouterChain router;
193         mp::filter::HttpRewrite fhr;
194
195         std::string xmlconf =
196             "<?xml version='1.0'?>\n"
197             "<filter xmlns='http://indexdata.com/metaproxy'\n"
198             "        id='rewrite1' type='http_rewrite'>\n"
199             " <request>\n"
200             "   <rewrite from='"
201     "(?&lt;proto>https?://)(?&lt;pxhost>[^ /?#]+)/(?&lt;pxpath>[^ /]+)"
202     "/(?&lt;host>[^ /]+)(?&lt;path>[^ ]*)'\n"
203             "            to='${proto}${host}${path}' />\n"
204             "   <rewrite from='(?:Host: )(.*)'\n"
205             "            to='Host: ${host}' />\n" 
206             " </request>\n"
207             " <response>\n"
208             "   <rewrite from='"
209     "(?&lt;proto>https?://)(?&lt;host>[^/?# &quot;&apos;>]+)/(?&lt;path>[^  &quot;&apos;>]+)'\n"
210             "            to='${proto}${pxhost}/${pxpath}/${host}/${path}' />\n" 
211             " </response>\n"
212             "</filter>\n"
213         ;
214
215         std::cout << xmlconf;
216
217         // reading and parsing XML conf
218         xmlDocPtr doc = xmlParseMemory(xmlconf.c_str(), xmlconf.size());
219         BOOST_CHECK(doc);
220         xmlNode *root_element = xmlDocGetRootElement(doc);
221         fhr.configure(root_element, true, "");
222         xmlFreeDoc(doc);
223         
224         router.append(fhr);
225
226         // create an http request
227         mp::Package pack;
228
229         mp::odr odr;
230         Z_GDU *gdu_req = z_get_HTTP_Request_uri(odr, 
231         "http://proxyhost/proxypath/targetsite/page1.html", 0, 1);
232
233         pack.request() = gdu_req;
234
235         //create the http response
236
237         /* response, content  */
238         const char *resp_buf =
239             /*123456789012345678 */
240             "HTTP/1.1 200 OK\r\n"
241             "Content-Length: 3000\r\n"
242             "Content-Type: text/html\r\n"
243             "Link: <http://targetsite/file.xml>; rel=absolute\r\r"
244             "Link: </dir/file.xml>; rel=relative\r\r"
245             "\r\n"
246             "<html><head><title>Hello proxy!</title>"
247             "<style>"
248             "body {"
249             "  background-image:url('http://targetsite/images/bg.png');"
250             "}"
251             "</style>"
252             "</head>"
253             "<script>var jslink=\"http://targetsite/webservice.xml\";</script>"
254             "<body>"
255             "<p>Welcome to our website. It doesn't make it easy to get pro"
256             "xified"
257             "<a href=\"http://targetsite/page2.html\">"
258             "  An absolute link</a>"
259             "<a target=_blank href='http://targetsite/page3.html\">"
260             "  Another abs link</a>"
261             "<a href=\"/docs/page4.html\" />"
262             "</body></html>";
263
264         /* response, content  */
265         const char *resp_buf_rew =
266             /*123456789012345678 */
267             "HTTP/1.1 200 OK\r\n"
268             "Content-Length: 3000\r\n"
269             "Content-Type: text/html\r\n"
270             "Link: <http://proxyhost/proxypath/targetsite/file.xml>; rel=absolute\r\r"
271             "Link: </dir/file.xml>; rel=relative\r\r"
272             "\r\n"
273             "<html><head><title>Hello proxy!</title>"
274             "<style>"
275             "body {"
276             "  background-image:url('http://proxyhost/proxypath/targetsite/images/bg.png');"
277             "}"
278             "</style>"
279             "</head>"
280             "<script>var jslink=\"http://proxyhost/proxypath/targetsite/webservice.xml\";</script>"
281             "<body>"
282             "<p>Welcome to our website. It doesn't make it easy to get pro"
283             "xified"
284             "<a href=\"http://proxyhost/proxypath/targetsite/page.html\">"
285             "  An absolute link</a>"
286             "<a target=_blank href='http://proxyhost/proxypath/targetsite/anotherpage.html\">"
287             "  Another abs link</a>"
288             "<a href=\"/docs/page2.html\" />"
289             "</body></html>";
290
291         int r;
292         Z_GDU *gdu_res;
293         ODR odr2 = odr_createmem(ODR_DECODE);
294         odr_setbuf(odr2, (char *) resp_buf, strlen(resp_buf), 0);
295         r = z_GDU(odr2, &gdu_res, 0, 0);
296
297         BOOST_CHECK(r == 0);
298         if (r)
299         {
300             BOOST_CHECK_EQUAL(gdu_res->which, Z_GDU_HTTP_Response);
301         }
302
303         pack.response() = gdu_res;
304
305         //feed to the router
306         pack.router(router).move();
307
308         //analyze the response
309         Z_GDU *gdu_res_rew = pack.response().get();
310         BOOST_CHECK(gdu_res_rew);
311         BOOST_CHECK_EQUAL(gdu_res_rew->which, Z_GDU_HTTP_Response);
312         
313         Z_HTTP_Response *hres = gdu_res_rew->u.HTTP_Response;
314         BOOST_CHECK(hres);
315
316         //how to compare the buffers:
317
318         odr_destroy(odr2);
319     }
320     catch (std::exception & e) {
321         std::cout << e.what();
322         std::cout << std::endl;
323         BOOST_CHECK (false);
324     }
325 }
326
327
328 /*
329  * Local variables:
330  * c-basic-offset: 4
331  * c-file-style: "Stroustrup"
332  * indent-tabs-mode: nil
333  * End:
334  * vim: shiftwidth=4 tabstop=8 expandtab
335  */
336