X-Git-Url: http://jsfdemo.indexdata.com/?a=blobdiff_plain;f=src%2Ftest_filter_rewrite.cpp;h=430e7846dfd2911fdfc3c952923675737579702c;hb=0ce322844494022dc85a9c776d9ff041aad17520;hp=67755ddc89f70bb95b5153c5612c9303848ec8f4;hpb=6ca510d9c7b0c706fc86caebb728028404b09fb2;p=metaproxy-moved-to-github.git diff --git a/src/test_filter_rewrite.cpp b/src/test_filter_rewrite.cpp index 67755dd..430e784 100644 --- a/src/test_filter_rewrite.cpp +++ b/src/test_filter_rewrite.cpp @@ -21,6 +21,7 @@ Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA #include #include "filter_http_client.hpp" +#include "filter_http_rewrite.hpp" #include #include "router_chain.hpp" #include @@ -28,6 +29,8 @@ Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA #include #include +#include + #define BOOST_AUTO_TEST_MAIN #define BOOST_TEST_DYN_LINK @@ -36,352 +39,301 @@ Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA using namespace boost::unit_test; namespace mp = metaproxy_1; -typedef std::pair string_pair; -typedef std::vector spair_vec; -typedef spair_vec::iterator spv_iter; - -class FilterHeaderRewrite: public mp::filter::Base { -public: - void process(mp::Package & package) const { - Z_GDU *gdu = package.request().get(); - //map of request/response vars - std::map vars; - //we have an http req - if (gdu && gdu->which == Z_GDU_HTTP_Request) - { - Z_HTTP_Request *hreq = gdu->u.HTTP_Request; - mp::odr o; - //rewrite the request line - std::string path; - if (strstr(hreq->path, "http://") == hreq->path) - { - std::cout << "Path in the method line is absolute, " - "possibly a proxy request\n"; - path += hreq->path; - } - else - { - //TODO what about proto - path += z_HTTP_header_lookup(hreq->headers, "Host"); - path += hreq->path; - } - std::cout << "Proxy request URL is " << path << std::endl; - std::string npath = - test_patterns(vars, path, req_uri_pats, req_groups_bynum); - std::cout << "Resp request URL is " << npath << std::endl; - if (!npath.empty()) - hreq->path = odr_strdup(o, npath.c_str()); - std::cout << ">> Request headers" << std::endl; - //iterate headers - for (Z_HTTP_Header *header = hreq->headers; - header != 0; - header = header->next) - { - std::cout << header->name << ": " << header->value << std::endl; - std::string out = test_patterns(vars, - std::string(header->value), - req_uri_pats, req_groups_bynum); - if (!out.empty()) - header->value = odr_strdup(o, out.c_str()); - } - package.request() = gdu; - } - package.move(); - gdu = package.response().get(); - if (gdu && gdu->which == Z_GDU_HTTP_Response) - { - Z_HTTP_Response *hr = gdu->u.HTTP_Response; - std::cout << "Response " << hr->code; - std::cout << "<< Respose headers" << std::endl; - mp::odr o; - //iterate headers - for (Z_HTTP_Header *header = hr->headers; - header != 0; - header = header->next) - { - std::cout << header->name << ": " << header->value << std::endl; - std::string out = test_patterns(vars, - std::string(header->value), - res_uri_pats, res_groups_bynum); - if (!out.empty()) - header->value = odr_strdup(o, out.c_str()); - } - package.response() = gdu; - } - }; - - void configure(const xmlNode* ptr, bool test_only, const char *path) {}; - - /** - * Tests pattern from the vector in order and executes recipe on - the first match. - */ - const std::string test_patterns( - std::map & vars, - const std::string & txt, - const spair_vec & uri_pats, - const std::vector > & groups_bynum_vec) - const - { - for (int i = 0; i < uri_pats.size(); i++) - { - std::string out = search_replace(vars, txt, - uri_pats[i].first, uri_pats[i].second, - groups_bynum_vec[i]); - if (!out.empty()) return out; - } - return ""; - } - - - const std::string search_replace( - std::map & vars, - const std::string & txt, - const std::string & uri_re, - const std::string & uri_pat, - const std::map & groups_bynum) const - { - //exec regex against value - boost::regex re(uri_re); - boost::smatch what; - std::string::const_iterator start, end; - start = txt.begin(); - end = txt.end(); - std::string out; - while (regex_search(start, end, what, re)) //find next full match - { - unsigned i; - for (i = 1; i < what.size(); ++i) - { - //check if the group is named - std::map::const_iterator it - = groups_bynum.find(i); - if (it != groups_bynum.end()) - { //it is - std::string name = it->second; - if (!what[i].str().empty()) - vars[name] = what[i]; - } - - } - //prepare replacement string - std::string rvalue = sub_vars(uri_pat, vars); - //rewrite value - std::string rhvalue = what.prefix().str() - + rvalue + what.suffix().str(); - std::cout << "! Rewritten '"+what.str(0)+"' to '"+rvalue+"'\n"; - out += rhvalue; - start = what[0].second; //move search forward - } - return out; - } - - static void parse_groups( - const spair_vec & uri_pats, - std::vector > & groups_bynum_vec) +struct TestConfig { + TestConfig() { - for (int h = 0; h < uri_pats.size(); h++) - { - int gnum = 0; - bool esc = false; - //regex is first, subpat is second - std::string str = uri_pats[h].first; - //for each pair we have an indexing map - std::map groups_bynum; - for (int i = 0; i < str.size(); ++i) - { - if (!esc && str[i] == '\\') - { - esc = true; - continue; - } - if (!esc && str[i] == '(') //group starts - { - gnum++; - if (i+1 < str.size() && str[i+1] == '?') //group with attrs - { - i++; - if (i+1 < str.size() && str[i+1] == ':') //non-capturing - { - if (gnum > 0) gnum--; - i++; - continue; - } - if (i+1 < str.size() && str[i+1] == 'P') //optional, python - i++; - if (i+1 < str.size() && str[i+1] == '<') //named - { - i++; - std::string gname; - bool term = false; - while (++i < str.size()) - { - if (str[i] == '>') { term = true; break; } - if (!isalnum(str[i])) - throw mp::filter::FilterException - ("Only alphanumeric chars allowed, found " - " in '" - + str - + "' at " - + boost::lexical_cast(i)); - gname += str[i]; - } - if (!term) - throw mp::filter::FilterException - ("Unterminated group name '" + gname - + " in '" + str +"'"); - groups_bynum[gnum] = gname; - std::cout << "Found named group '" << gname - << "' at $" << gnum << std::endl; - } - } - } - esc = false; - } - groups_bynum_vec.push_back(groups_bynum); - } + std::cout << "global setup\n"; + yaz_log_init_level(YLOG_ALL); } - - static std::string sub_vars (const std::string & in, - const std::map & vars) - { - std::string out; - bool esc = false; - for (int i = 0; i < in.size(); ++i) - { - if (!esc && in[i] == '\\') - { - esc = true; - continue; - } - if (!esc && in[i] == '$') //var - { - if (i+1 < in.size() && in[i+1] == '{') //ref prefix - { - ++i; - std::string name; - bool term = false; - while (++i < in.size()) - { - if (in[i] == '}') { term = true; break; } - name += in[i]; - } - if (!term) throw mp::filter::FilterException - ("Unterminated var ref in '"+in+"' at " - + boost::lexical_cast(i)); - std::map::const_iterator it - = vars.find(name); - if (it != vars.end()) - { - out += it->second; - } - } - else - { - throw mp::filter::FilterException - ("Malformed or trimmed var ref in '" - +in+"' at "+boost::lexical_cast(i)); - } - continue; - } - //passthru - out += in[i]; - esc = false; - } - return out; + ~TestConfig() + { + std::cout << "global teardown\n"; } - - void configure( - const spair_vec req_uri_pats, - const spair_vec res_uri_pats) - { - //TODO should we really copy them out? - this->req_uri_pats = req_uri_pats; - this->res_uri_pats = res_uri_pats; - //pick up names - parse_groups(req_uri_pats, req_groups_bynum); - parse_groups(res_uri_pats, res_groups_bynum); - }; - -private: - std::map vars; - spair_vec req_uri_pats; - spair_vec res_uri_pats; - std::vector > req_groups_bynum; - std::vector > res_groups_bynum; - }; +BOOST_GLOBAL_FIXTURE( TestConfig ); BOOST_AUTO_TEST_CASE( test_filter_rewrite_1 ) { try { - FilterHeaderRewrite fhr; - } - catch ( ... ) { - BOOST_CHECK (false); - } -} - -BOOST_AUTO_TEST_CASE( test_filter_rewrite_2 ) -{ - try - { + std::cout << "Running non-xml config test case" << std::endl; mp::RouterChain router; - - FilterHeaderRewrite fhr; + mp::filter::HttpRewrite fhr; - spair_vec vec_req; + //configure the filter + mp::filter::HttpRewrite::spair_vec vec_req; vec_req.push_back(std::make_pair( "(?http\\:\\/\\/s?)(?[^\\/?#]+)\\/(?[^\\/]+)" - "\\/(?.+)", - "${proto}${target}" + "\\/(?[^\\/]+)(?.*)", + "${proto}${host}${path}" )); vec_req.push_back(std::make_pair( - "proxyhost", - "localhost" + "(?:Host\\: )(.*)", + "Host: ${host}" )); - spair_vec vec_res; + mp::filter::HttpRewrite::spair_vec vec_res; vec_res.push_back(std::make_pair( - "(?http\\:\\/\\/s?)(?[^\\/?#]+)\\/(?[^ >]+)", - "http://${pxhost}/${pxpath}/${host}/${path}" + "(?http\\:\\/\\/s?)(?[^\\/?# \"'>]+)\\/(?[^ \"'>]+)", + "${proto}${pxhost}/${pxpath}/${host}/${path}" )); fhr.configure(vec_req, vec_res); + + router.append(fhr); - mp::filter::HTTPClient hc; + // create an http request + mp::Package pack; + + mp::odr odr; + Z_GDU *gdu_req = z_get_HTTP_Request_uri(odr, + "http://proxyhost/proxypath/targetsite/page1.html", 0, 1); + + pack.request() = gdu_req; + + //create the http response + + const char *resp_buf = + "HTTP/1.1 200 OK\r\n" + "Content-Length: 441\r\n" + "Content-Type: text/html\r\n" + "Link: ; rel=absolute\r\n" + "Link: ; rel=relative\r\n" + "\r\n" + "Hello proxy!" + "" + "" + "" + "" + "

Welcome to our website. It doesn't make it easy to get pro" + "xified" + "" + " An absolute link" + "" + "" + "" + "" + "

Welcome to our website. It doesn't make it easy to get pro" + "xified" + "" + " An absolute link" + "\n" + "\n" + " \n" + " \n" + " \n" + " \n" + " \n" + " \n" + " \n" + "\n" + ; + + std::cout << xmlconf; + + // reading and parsing XML conf + xmlDocPtr doc = xmlParseMemory(xmlconf.c_str(), xmlconf.size()); + BOOST_CHECK(doc); + xmlNode *root_element = xmlDocGetRootElement(doc); + fhr.configure(root_element, true, ""); + xmlFreeDoc(doc); router.append(fhr); - router.append(hc); // create an http request mp::Package pack; mp::odr odr; Z_GDU *gdu_req = z_get_HTTP_Request_uri(odr, - "http://proxyhost/proxypath/localhost:80/~jakub/targetsite.php", 0, 1); + "http://proxyhost/proxypath/targetsite/page1.html", 0, 1); pack.request() = gdu_req; + //create the http response + + const char *resp_buf = + "HTTP/1.1 200 OK\r\n" + "Content-Length: 50\r\n" + "Content-Type: text/html\r\n" + "Link: ; rel=absolute\r\n" + "Link: ; rel=relative\r\n" + "\r\n" + "Hello proxy!" + "" + "" + "" + "" + "

Welcome to our website. It doesn't make it easy to get pro" + "xified" + "" + " An absolute link" + "" + "" + "" + "" + "

Welcome to our website. It doesn't make it easy to get pro" + "xified" + "" + " An absolute link" + "