-rw-r--r-- | lib/consumer.cc | 105 |
1 files changed, 44 insertions, 61 deletions
diff --git a/lib/consumer.cc b/lib/consumer.cc index 20f4174..c155157 100644 --- a/lib/consumer.cc +++ b/lib/consumer.cc | |||
@@ -1,152 +1,135 @@ | |||
1 | #include <algorithm> | 1 | #include <algorithm> |
2 | #include <cassert> | 2 | #include <cassert> |
3 | #include <cstring> | 3 | #include <cstring> |
4 | #include <opkele/util.h> | 4 | #include <opkele/util.h> |
5 | #include <opkele/curl.h> | 5 | #include <opkele/curl.h> |
6 | #include <opkele/exception.h> | 6 | #include <opkele/exception.h> |
7 | #include <opkele/data.h> | 7 | #include <opkele/data.h> |
8 | #include <opkele/consumer.h> | 8 | #include <opkele/consumer.h> |
9 | #include <openssl/sha.h> | 9 | #include <openssl/sha.h> |
10 | #include <openssl/hmac.h> | 10 | #include <openssl/hmac.h> |
11 | #include <iostream> | 11 | #include <iostream> |
12 | 12 | ||
13 | #include "config.h" | 13 | #include "config.h" |
14 | 14 | ||
15 | #include <pcre.h> | 15 | #include <pcre.h> |
16 | 16 | ||
17 | namespace opkele { | 17 | namespace opkele { |
18 | using namespace std; | 18 | using namespace std; |
19 | using util::curl_t; | ||
19 | 20 | ||
/**
 * Owning buffer for the offset vector handed to pcre_exec().
 *
 * The requested size is rounded up to an even number and then enlarged by
 * half, so the allocated length is always a multiple of three ints.
 * Offsets are stored pairwise: element 2*i is the start and element 2*i+1
 * the end of match @c i.
 *
 * Copies are deep: each object owns its own buffer, so copying or assigning
 * never results in the same array being deleted twice.
 */
class pcre_matches_t {
    public:
    /** Offset vector; null for a default-constructed object. */
    int *_ov;
    /** Number of ints allocated in _ov. */
    int _s;

    /** Creates an empty object without a buffer. */
    pcre_matches_t() : _ov(0), _s(0) { }

    /**
     * Allocates a zero-filled buffer.
     * @param s requested number of offset slots; rounded up to even and
     *          multiplied by 1.5 to obtain the real allocation size.
     */
    pcre_matches_t(int s) : _ov(0), _s(s) {
        if(_s&1) ++_s;
        _s += _s>>1;
        // Value-initialise so the accessors are well defined before the
        // first pcre_exec() call fills the vector.
        _ov = new int[_s]();
    }

    /** Deep copy: duplicates the other object's buffer. */
    pcre_matches_t(const pcre_matches_t& x) : _ov(0), _s(x._s) {
        if(x._ov) {
            _ov = new int[_s];
            std::copy(x._ov,x._ov+_s,_ov);
        }
    }

    ~pcre_matches_t() throw() { delete[] _ov; }

    /** Deep-copy assignment; safe against self-assignment. */
    pcre_matches_t& operator=(const pcre_matches_t& x) {
        if(this!=&x) {
            // Allocate first so *this is untouched if allocation throws.
            int *fresh = 0;
            if(x._ov) {
                fresh = new int[x._s];
                std::copy(x._ov,x._ov+x._s,fresh);
            }
            delete[] _ov;
            _ov = fresh;
            _s = x._s;
        }
        return *this;
    }

    /** @return start offset of match @a i. */
    int begin(int i) const { return _ov[i<<1]; }
    /** @return end offset of match @a i. */
    int end(int i) const { return _ov[(i<<1)+1]; }
    /** @return length (end minus start) of match @a i. */
    int length(int i) const { int t=i<<1; return _ov[t+1]-_ov[t]; }
};
37 | 38 | ||
38 | class pcre_t { | 39 | class pcre_t { |
39 | public: | 40 | public: |
40 | pcre *_p; | 41 | pcre *_p; |
41 | 42 | ||
42 | pcre_t() : _p(0) { } | 43 | pcre_t() : _p(0) { } |
43 | pcre_t(pcre *p) : _p(p) { } | 44 | pcre_t(pcre *p) : _p(p) { } |
44 | pcre_t(const char *re,int opts) : _p(0) { | 45 | pcre_t(const char *re,int opts) : _p(0) { |
45 | static const char *errptr; static int erroffset; | 46 | static const char *errptr; static int erroffset; |
46 | _p = pcre_compile(re,opts,&errptr,&erroffset,NULL); | 47 | _p = pcre_compile(re,opts,&errptr,&erroffset,NULL); |
47 | if(!_p) | 48 | if(!_p) |
48 | throw internal_error(OPKELE_CP_ string("Failed to compile regexp: ")+errptr); | 49 | throw internal_error(OPKELE_CP_ string("Failed to compile regexp: ")+errptr); |
49 | } | 50 | } |
50 | ~pcre_t() throw() { if(_p) (*pcre_free)(_p); } | 51 | ~pcre_t() throw() { if(_p) (*pcre_free)(_p); } |
51 | 52 | ||
52 | pcre_t& operator=(pcre *p) { if(_p) (*pcre_free)(_p); _p=p; return *this; } | 53 | pcre_t& operator=(pcre *p) { if(_p) (*pcre_free)(_p); _p=p; return *this; } |
53 | 54 | ||
54 | operator const pcre*(void) const { return _p; } | 55 | operator const pcre*(void) const { return _p; } |
55 | operator pcre*(void) { return _p; } | 56 | operator pcre*(void) { return _p; } |
56 | 57 | ||
57 | int exec(const string& s,pcre_matches_t& m) { | 58 | int exec(const string& s,pcre_matches_t& m) { |
58 | if(!_p) | 59 | if(!_p) |
59 | throw internal_error(OPKELE_CP_ "Trying to execute absent regexp"); | 60 | throw internal_error(OPKELE_CP_ "Trying to execute absent regexp"); |
60 | return pcre_exec(_p,NULL,s.c_str(),s.length(),0,0,m._ov,m._s); | 61 | return pcre_exec(_p,NULL,s.c_str(),s.length(),0,0,m._ov,m._s); |
61 | } | 62 | } |
62 | }; | 63 | }; |
63 | 64 | ||
64 | static CURLcode curl_misc_sets(CURL* c) { | ||
65 | CURLcode r; | ||
66 | (r=curl_easy_setopt(c,CURLOPT_FOLLOWLOCATION,1)) | ||
67 | || (r=curl_easy_setopt(c,CURLOPT_MAXREDIRS,5)) | ||
68 | || (r=curl_easy_setopt(c,CURLOPT_DNS_CACHE_TIMEOUT,120)) | ||
69 | || (r=curl_easy_setopt(c,CURLOPT_DNS_USE_GLOBAL_CACHE,1)) | ||
70 | || (r=curl_easy_setopt(c,CURLOPT_USERAGENT,PACKAGE_NAME"/"PACKAGE_SRC_VERSION)) | ||
71 | || (r=curl_easy_setopt(c,CURLOPT_TIMEOUT,20)) | ||
72 | #ifdefDISABLE_CURL_SSL_VERIFYHOST | ||
73 | || (r=curl_easy_setopt(c,CURLOPT_SSL_VERIFYHOST,0)) | ||
74 | #endif | ||
75 | #ifdefDISABLE_CURL_SSL_VERIFYPEER | ||
76 | || (r=curl_easy_setopt(c,CURLOPT_SSL_VERIFYPEER,0)) | ||
77 | #endif | ||
78 | ; | ||
79 | return r; | ||
80 | } | ||
81 | |||
/**
 * libcurl write callback that appends received data to a std::string,
 * never letting the string grow beyond 16384 bytes.
 *
 * @param ptr    received data
 * @param size   size of one data item
 * @param nmemb  number of data items
 * @param stream the destination, a pointer to std::string
 * @return number of bytes actually appended. This is less than size*nmemb
 *         once the cap is reached, which libcurl reports as a write error.
 */
static size_t _curl_tostring(void *ptr,size_t size,size_t nmemb,void *stream) {
    static const size_t max_bytes = 16384;
    std::string *str = static_cast<std::string*>(stream);
    const size_t bytes = size*nmemb;
    // Saturate at zero: a plain subtraction would wrap around in size_t if
    // the string were already longer than the cap, disabling the limit.
    const size_t room = (str->length()<max_bytes) ? (max_bytes-str->length()) : 0;
    const size_t get = std::min(room,bytes);
    str->append(static_cast<const char*>(ptr),get);
    return get;
}
89 | 72 | ||
90 | assoc_t consumer_t::associate(const string& server) { | 73 | assoc_t consumer_t::associate(const string& server) { |
91 | util::dh_t dh = DH_new(); | 74 | util::dh_t dh = DH_new(); |
92 | if(!dh) | 75 | if(!dh) |
93 | throw exception_openssl(OPKELE_CP_ "failed to DH_new()"); | 76 | throw exception_openssl(OPKELE_CP_ "failed to DH_new()"); |
94 | dh->p = util::dec_to_bignum(data::_default_p); | 77 | dh->p = util::dec_to_bignum(data::_default_p); |
95 | dh->g = util::dec_to_bignum(data::_default_g); | 78 | dh->g = util::dec_to_bignum(data::_default_g); |
96 | if(!DH_generate_key(dh)) | 79 | if(!DH_generate_key(dh)) |
97 | throw exception_openssl(OPKELE_CP_ "failed to DH_generate_key()"); | 80 | throw exception_openssl(OPKELE_CP_ "failed to DH_generate_key()"); |
98 | string request = | 81 | string request = |
99 | "openid.mode=associate" | 82 | "openid.mode=associate" |
100 | "&openid.assoc_type=HMAC-SHA1" | 83 | "&openid.assoc_type=HMAC-SHA1" |
101 | "&openid.session_type=DH-SHA1" | 84 | "&openid.session_type=DH-SHA1" |
102 | "&openid.dh_consumer_public="; | 85 | "&openid.dh_consumer_public="; |
103 | request += util::url_encode(util::bignum_to_base64(dh->pub_key)); | 86 | request += util::url_encode(util::bignum_to_base64(dh->pub_key)); |
104 | util::curl_t curl = curl_easy_init(); | 87 | curl_t curl = curl_t::easy_init(); |
105 | if(!curl) | 88 | if(!curl) |
106 | throw exception_curl(OPKELE_CP_ "failed to curl_easy_init()"); | 89 | throw exception_curl(OPKELE_CP_ "failed to initialize curl"); |
107 | string response; | 90 | string response; |
108 | CURLcode r; | 91 | CURLcode r; |
109 | (r=curl_misc_sets(curl)) | 92 | (r=curl.misc_sets()) |
110 | || (r=curl_easy_setopt(curl,CURLOPT_URL,server.c_str())) | 93 | || (r=curl.easy_setopt(CURLOPT_URL,server.c_str())) |
111 | || (r=curl_easy_setopt(curl,CURLOPT_POST,1)) | 94 | || (r=curl.easy_setopt(CURLOPT_POST,1)) |
112 | || (r=curl_easy_setopt(curl,CURLOPT_POSTFIELDS,request.data())) | 95 | || (r=curl.easy_setopt(CURLOPT_POSTFIELDS,request.data())) |
113 | || (r=curl_easy_setopt(curl,CURLOPT_POSTFIELDSIZE,request.length())) | 96 | || (r=curl.easy_setopt(CURLOPT_POSTFIELDSIZE,request.length())) |
114 | || (r=curl_easy_setopt(curl,CURLOPT_WRITEFUNCTION,_curl_tostring)) | 97 | || (r=curl.easy_setopt(CURLOPT_WRITEFUNCTION,_curl_tostring)) |
115 | || (r=curl_easy_setopt(curl,CURLOPT_WRITEDATA,&response)) | 98 | || (r=curl.easy_setopt(CURLOPT_WRITEDATA,&response)) |
116 | ; | 99 | ; |
117 | if(r) | 100 | if(r) |
118 | throw exception_curl(OPKELE_CP_ "failed to curl_easy_setopt()",r); | 101 | throw exception_curl(OPKELE_CP_ "failed to set curly options",r); |
119 | if( (r=curl_easy_perform(curl)) ) | 102 | if( (r=curl.easy_perform()) ) |
120 | throw exception_curl(OPKELE_CP_ "failed to curl_easy_perform()",r); | 103 | throw exception_curl(OPKELE_CP_ "failed to perform curly request",r); |
121 | params_t p; p.parse_keyvalues(response); | 104 | params_t p; p.parse_keyvalues(response); |
122 | if(p.has_param("assoc_type") && p.get_param("assoc_type")!="HMAC-SHA1") | 105 | if(p.has_param("assoc_type") && p.get_param("assoc_type")!="HMAC-SHA1") |
123 | throw bad_input(OPKELE_CP_ "unsupported assoc_type"); | 106 | throw bad_input(OPKELE_CP_ "unsupported assoc_type"); |
124 | string st; | 107 | string st; |
125 | if(p.has_param("session_type")) st = p.get_param("session_type"); | 108 | if(p.has_param("session_type")) st = p.get_param("session_type"); |
126 | if((!st.empty()) && st!="DH-SHA1") | 109 | if((!st.empty()) && st!="DH-SHA1") |
127 | throw bad_input(OPKELE_CP_ "unsupported session_type"); | 110 | throw bad_input(OPKELE_CP_ "unsupported session_type"); |
128 | secret_t secret; | 111 | secret_t secret; |
129 | if(st.empty()) { | 112 | if(st.empty()) { |
130 | secret.from_base64(p.get_param("mac_key")); | 113 | secret.from_base64(p.get_param("mac_key")); |
131 | }else{ | 114 | }else{ |
132 | util::bignum_t s_pub = util::base64_to_bignum(p.get_param("dh_server_public")); | 115 | util::bignum_t s_pub = util::base64_to_bignum(p.get_param("dh_server_public")); |
133 | vector<unsigned char> ck(DH_size(dh)+1); | 116 | vector<unsigned char> ck(DH_size(dh)+1); |
134 | unsigned char *ckptr = &(ck.front())+1; | 117 | unsigned char *ckptr = &(ck.front())+1; |
135 | int cklen = DH_compute_key(ckptr,s_pub,dh); | 118 | int cklen = DH_compute_key(ckptr,s_pub,dh); |
136 | if(cklen<0) | 119 | if(cklen<0) |
137 | throw exception_openssl(OPKELE_CP_ "failed to DH_compute_key()"); | 120 | throw exception_openssl(OPKELE_CP_ "failed to DH_compute_key()"); |
138 | if(cklen && (*ckptr)&0x80) { | 121 | if(cklen && (*ckptr)&0x80) { |
139 | (*(--ckptr)) = 0; ++cklen; | 122 | (*(--ckptr)) = 0; ++cklen; |
140 | } | 123 | } |
141 | unsigned char key_sha1[SHA_DIGEST_LENGTH]; | 124 | unsigned char key_sha1[SHA_DIGEST_LENGTH]; |
142 | SHA1(ckptr,cklen,key_sha1); | 125 | SHA1(ckptr,cklen,key_sha1); |
143 | secret.enxor_from_base64(key_sha1,p.get_param("enc_mac_key")); | 126 | secret.enxor_from_base64(key_sha1,p.get_param("enc_mac_key")); |
144 | } | 127 | } |
145 | int expires_in = 0; | 128 | int expires_in = 0; |
146 | if(p.has_param("expires_in")) { | 129 | if(p.has_param("expires_in")) { |
147 | expires_in = util::string_to_long(p.get_param("expires_in")); | 130 | expires_in = util::string_to_long(p.get_param("expires_in")); |
148 | }else if(p.has_param("issued") && p.has_param("expiry")) { | 131 | }else if(p.has_param("issued") && p.has_param("expiry")) { |
149 | expires_in = util::w3c_to_time(p.get_param("expiry"))-util::w3c_to_time(p.get_param("issued")); | 132 | expires_in = util::w3c_to_time(p.get_param("expiry"))-util::w3c_to_time(p.get_param("issued")); |
150 | }else | 133 | }else |
151 | throw bad_input(OPKELE_CP_ "no expiration information"); | 134 | throw bad_input(OPKELE_CP_ "no expiration information"); |
152 | return store_assoc(server,p.get_param("assoc_handle"),secret,expires_in); | 135 | return store_assoc(server,p.get_param("assoc_handle"),secret,expires_in); |
@@ -232,112 +215,112 @@ namespace opkele { | |||
232 | f += (co==string::npos)?slist.substr(pp):slist.substr(pp,co-pp); | 215 | f += (co==string::npos)?slist.substr(pp):slist.substr(pp,co-pp); |
233 | p[f] = pin.get_param(f); | 216 | p[f] = pin.get_param(f); |
234 | if(co==string::npos) | 217 | if(co==string::npos) |
235 | break; | 218 | break; |
236 | pp = co+1; | 219 | pp = co+1; |
237 | } | 220 | } |
238 | p["openid.assoc_handle"] = pin.get_param("openid.assoc_handle"); | 221 | p["openid.assoc_handle"] = pin.get_param("openid.assoc_handle"); |
239 | p["openid.sig"] = pin.get_param("openid.sig"); | 222 | p["openid.sig"] = pin.get_param("openid.sig"); |
240 | p["openid.signed"] = pin.get_param("openid.signed"); | 223 | p["openid.signed"] = pin.get_param("openid.signed"); |
241 | try { | 224 | try { |
242 | string ih = pin.get_param("openid.invalidate_handle"); | 225 | string ih = pin.get_param("openid.invalidate_handle"); |
243 | p["openid.invalidate_handle"] = ih; | 226 | p["openid.invalidate_handle"] = ih; |
244 | }catch(failed_lookup& fl) { } | 227 | }catch(failed_lookup& fl) { } |
245 | try { | 228 | try { |
246 | check_authentication(server,p); | 229 | check_authentication(server,p); |
247 | }catch(failed_check_authentication& fca) { | 230 | }catch(failed_check_authentication& fca) { |
248 | throw id_res_failed(OPKELE_CP_ "failed to check_authentication()"); | 231 | throw id_res_failed(OPKELE_CP_ "failed to check_authentication()"); |
249 | } | 232 | } |
250 | } | 233 | } |
251 | if(ext) ext->id_res_hook(pin,ps,identity); | 234 | if(ext) ext->id_res_hook(pin,ps,identity); |
252 | } | 235 | } |
253 | 236 | ||
254 | void consumer_t::check_authentication(const string& server,const params_t& p) { | 237 | void consumer_t::check_authentication(const string& server,const params_t& p) { |
255 | string request = "openid.mode=check_authentication"; | 238 | string request = "openid.mode=check_authentication"; |
256 | for(params_t::const_iterator i=p.begin();i!=p.end();++i) { | 239 | for(params_t::const_iterator i=p.begin();i!=p.end();++i) { |
257 | if(i->first!="openid.mode") { | 240 | if(i->first!="openid.mode") { |
258 | request += '&'; | 241 | request += '&'; |
259 | request += i->first; | 242 | request += i->first; |
260 | request += '='; | 243 | request += '='; |
261 | request += util::url_encode(i->second); | 244 | request += util::url_encode(i->second); |
262 | } | 245 | } |
263 | } | 246 | } |
264 | util::curl_t curl = curl_easy_init(); | 247 | curl_t curl = curl_t::easy_init(); |
265 | if(!curl) | 248 | if(!curl) |
266 | throw exception_curl(OPKELE_CP_ "failed to curl_easy_init()"); | 249 | throw exception_curl(OPKELE_CP_ "failed to initialize curl"); |
267 | string response; | 250 | string response; |
268 | CURLcode r; | 251 | CURLcode r; |
269 | (r=curl_misc_sets(curl)) | 252 | (r=curl.misc_sets()) |
270 | || (r=curl_easy_setopt(curl,CURLOPT_URL,server.c_str())) | 253 | || (r=curl.easy_setopt(CURLOPT_URL,server.c_str())) |
271 | || (r=curl_easy_setopt(curl,CURLOPT_POST,1)) | 254 | || (r=curl.easy_setopt(CURLOPT_POST,1)) |
272 | || (r=curl_easy_setopt(curl,CURLOPT_POSTFIELDS,request.data())) | 255 | || (r=curl.easy_setopt(CURLOPT_POSTFIELDS,request.data())) |
273 | || (r=curl_easy_setopt(curl,CURLOPT_POSTFIELDSIZE,request.length())) | 256 | || (r=curl.easy_setopt(CURLOPT_POSTFIELDSIZE,request.length())) |
274 | || (r=curl_easy_setopt(curl,CURLOPT_WRITEFUNCTION,_curl_tostring)) | 257 | || (r=curl.easy_setopt(CURLOPT_WRITEFUNCTION,_curl_tostring)) |
275 | || (r=curl_easy_setopt(curl,CURLOPT_WRITEDATA,&response)) | 258 | || (r=curl.easy_setopt(CURLOPT_WRITEDATA,&response)) |
276 | ; | 259 | ; |
277 | if(r) | 260 | if(r) |
278 | throw exception_curl(OPKELE_CP_ "failed to curl_easy_setopt()",r); | 261 | throw exception_curl(OPKELE_CP_ "failed to set curly options",r); |
279 | if( (r=curl_easy_perform(curl)) ) | 262 | if( (r=curl.easy_perform()) ) |
280 | throw exception_curl(OPKELE_CP_ "failed to curl_easy_perform()",r); | 263 | throw exception_curl(OPKELE_CP_ "failed to perform curly request",r); |
281 | params_t pp; pp.parse_keyvalues(response); | 264 | params_t pp; pp.parse_keyvalues(response); |
282 | if(pp.has_param("invalidate_handle")) | 265 | if(pp.has_param("invalidate_handle")) |
283 | invalidate_assoc(server,pp.get_param("invalidate_handle")); | 266 | invalidate_assoc(server,pp.get_param("invalidate_handle")); |
284 | if(pp.has_param("is_valid")) { | 267 | if(pp.has_param("is_valid")) { |
285 | if(pp.get_param("is_valid")=="true") | 268 | if(pp.get_param("is_valid")=="true") |
286 | return; | 269 | return; |
287 | }else if(pp.has_param("lifetime")) { | 270 | }else if(pp.has_param("lifetime")) { |
288 | if(util::string_to_long(pp.get_param("lifetime"))) | 271 | if(util::string_to_long(pp.get_param("lifetime"))) |
289 | return; | 272 | return; |
290 | } | 273 | } |
291 | throw failed_check_authentication(OPKELE_CP_ "failed to verify response"); | 274 | throw failed_check_authentication(OPKELE_CP_ "failed to verify response"); |
292 | } | 275 | } |
293 | 276 | ||
294 | void consumer_t::retrieve_links(const string& url,string& server,string& delegate) { | 277 | void consumer_t::retrieve_links(const string& url,string& server,string& delegate) { |
295 | server.erase(); | 278 | server.erase(); |
296 | delegate.erase(); | 279 | delegate.erase(); |
297 | util::curl_t curl = curl_easy_init(); | 280 | curl_t curl = curl_t::easy_init(); |
298 | if(!curl) | 281 | if(!curl) |
299 | throw exception_curl(OPKELE_CP_ "failed to curl_easy_init()"); | 282 | throw exception_curl(OPKELE_CP_ "failed to initialize curl"); |
300 | string html; | 283 | string html; |
301 | CURLcode r; | 284 | CURLcode r; |
302 | (r=curl_misc_sets(curl)) | 285 | (r=curl.misc_sets()) |
303 | || (r=curl_easy_setopt(curl,CURLOPT_URL,url.c_str())) | 286 | || (r=curl.easy_setopt(CURLOPT_URL,url.c_str())) |
304 | || (r=curl_easy_setopt(curl,CURLOPT_WRITEFUNCTION,_curl_tostring)) | 287 | || (r=curl.easy_setopt(CURLOPT_WRITEFUNCTION,_curl_tostring)) |
305 | || (r=curl_easy_setopt(curl,CURLOPT_WRITEDATA,&html)) | 288 | || (r=curl.easy_setopt(CURLOPT_WRITEDATA,&html)) |
306 | ; | 289 | ; |
307 | if(r) | 290 | if(r) |
308 | throw exception_curl(OPKELE_CP_ "failed to curl_easy_setopt()",r); | 291 | throw exception_curl(OPKELE_CP_ "failed to set curly options",r); |
309 | r = curl_easy_perform(curl); | 292 | r = curl.easy_perform(); |
310 | if(r && r!=CURLE_WRITE_ERROR) | 293 | if(r && r!=CURLE_WRITE_ERROR) |
311 | throw exception_curl(OPKELE_CP_ "failed to curl_easy_perform()",r); | 294 | throw exception_curl(OPKELE_CP_ "failed to perform curly request",r); |
312 | static const char *re_bre = "<\\s*body\\b", *re_hdre = "<\\s*head[^>]*>", | 295 | static const char *re_bre = "<\\s*body\\b", *re_hdre = "<\\s*head[^>]*>", |
313 | *re_lre = "<\\s*link\\b([^>]+)>", | 296 | *re_lre = "<\\s*link\\b([^>]+)>", |
314 | *re_rre = "\\brel\\s*=\\s*['\"]([^'\"]+)['\"]", | 297 | *re_rre = "\\brel\\s*=\\s*['\"]([^'\"]+)['\"]", |
315 | *re_hre = "\\bhref\\s*=\\s*['\"]\\s*([^'\"\\s]+)\\s*['\"]"; | 298 | *re_hre = "\\bhref\\s*=\\s*['\"]\\s*([^'\"\\s]+)\\s*['\"]"; |
316 | pcre_matches_t m1(3), m2(3); | 299 | pcre_matches_t m1(3), m2(3); |
317 | pcre_t bre(re_bre,PCRE_CASELESS); | 300 | pcre_t bre(re_bre,PCRE_CASELESS); |
318 | if(bre.exec(html,m1)>0) | 301 | if(bre.exec(html,m1)>0) |
319 | html.erase(m1.begin(0)); | 302 | html.erase(m1.begin(0)); |
320 | pcre_t hdre(re_hdre,PCRE_CASELESS); | 303 | pcre_t hdre(re_hdre,PCRE_CASELESS); |
321 | if(hdre.exec(html,m1)<=0) | 304 | if(hdre.exec(html,m1)<=0) |
322 | throw bad_input(OPKELE_CP_ "failed to find <head>"); | 305 | throw bad_input(OPKELE_CP_ "failed to find <head>"); |
323 | html.erase(0,m1.end(0)+1); | 306 | html.erase(0,m1.end(0)+1); |
324 | pcre_t lre(re_lre,PCRE_CASELESS), rre(re_rre,PCRE_CASELESS), hre(re_hre,PCRE_CASELESS); | 307 | pcre_t lre(re_lre,PCRE_CASELESS), rre(re_rre,PCRE_CASELESS), hre(re_hre,PCRE_CASELESS); |
325 | bool gotit = false; | 308 | bool gotit = false; |
326 | while( (!gotit) && lre.exec(html,m1)>=2 ) { | 309 | while( (!gotit) && lre.exec(html,m1)>=2 ) { |
327 | static const char *whitespace = " \t"; | 310 | static const char *whitespace = " \t"; |
328 | string attrs(html,m1.begin(1),m1.length(1)); | 311 | string attrs(html,m1.begin(1),m1.length(1)); |
329 | html.erase(0,m1.end(0)+1); | 312 | html.erase(0,m1.end(0)+1); |
330 | if(!( rre.exec(attrs,m1)>=2 && hre.exec(attrs,m2)>=2 )) | 313 | if(!( rre.exec(attrs,m1)>=2 && hre.exec(attrs,m2)>=2 )) |
331 | continue; | 314 | continue; |
332 | string rels(attrs,m1.begin(1),m1.length(1)); | 315 | string rels(attrs,m1.begin(1),m1.length(1)); |
333 | for(string::size_type ns = rels.find_first_not_of(whitespace); | 316 | for(string::size_type ns = rels.find_first_not_of(whitespace); |
334 | ns!=string::npos; | 317 | ns!=string::npos; |
335 | ns=rels.find_first_not_of(whitespace,ns)) { | 318 | ns=rels.find_first_not_of(whitespace,ns)) { |
336 | string::size_type s = rels.find_first_of(whitespace,ns); | 319 | string::size_type s = rels.find_first_of(whitespace,ns); |
337 | string rel; | 320 | string rel; |
338 | if(s==string::npos) { | 321 | if(s==string::npos) { |
339 | rel.assign(rels,ns,string::npos); | 322 | rel.assign(rels,ns,string::npos); |
340 | ns=string::npos; | 323 | ns=string::npos; |
341 | }else{ | 324 | }else{ |
342 | rel.assign(rels,ns,s-ns); | 325 | rel.assign(rels,ns,s-ns); |
343 | ns=s; | 326 | ns=s; |
@@ -371,55 +354,55 @@ namespace opkele { | |||
371 | // strip leading and trailing spaces | 354 | // strip leading and trailing spaces |
372 | string::size_type i = rv.find_first_not_of(" \t\r\n"); | 355 | string::size_type i = rv.find_first_not_of(" \t\r\n"); |
373 | if(i==string::npos) | 356 | if(i==string::npos) |
374 | throw bad_input(OPKELE_CP_ "empty URL"); | 357 | throw bad_input(OPKELE_CP_ "empty URL"); |
375 | if(i) | 358 | if(i) |
376 | rv.erase(0,i); | 359 | rv.erase(0,i); |
377 | i = rv.find_last_not_of(" \t\r\n"); | 360 | i = rv.find_last_not_of(" \t\r\n"); |
378 | assert(i!=string::npos); | 361 | assert(i!=string::npos); |
379 | if(i<(rv.length()-1)) | 362 | if(i<(rv.length()-1)) |
380 | rv.erase(i+1); | 363 | rv.erase(i+1); |
381 | // add missing http:// | 364 | // add missing http:// |
382 | i = rv.find("://"); | 365 | i = rv.find("://"); |
383 | if(i==string::npos) { // primitive. but do we need more? | 366 | if(i==string::npos) { // primitive. but do we need more? |
384 | rv.insert(0,"http://"); | 367 | rv.insert(0,"http://"); |
385 | i = sizeof("http://")-1; | 368 | i = sizeof("http://")-1; |
386 | }else{ | 369 | }else{ |
387 | i += sizeof("://")-1; | 370 | i += sizeof("://")-1; |
388 | } | 371 | } |
389 | string::size_type qm = rv.find('?',i); | 372 | string::size_type qm = rv.find('?',i); |
390 | string::size_type sl = rv.find('/',i); | 373 | string::size_type sl = rv.find('/',i); |
391 | if(qm!=string::npos) { | 374 | if(qm!=string::npos) { |
392 | if(sl==string::npos || sl>qm) | 375 | if(sl==string::npos || sl>qm) |
393 | rv.insert(qm,1,'/'); | 376 | rv.insert(qm,1,'/'); |
394 | }else{ | 377 | }else{ |
395 | if(sl==string::npos) | 378 | if(sl==string::npos) |
396 | rv += '/'; | 379 | rv += '/'; |
397 | } | 380 | } |
398 | return rv; | 381 | return rv; |
399 | } | 382 | } |
400 | 383 | ||
401 | string consumer_t::canonicalize(const string& url) { | 384 | string consumer_t::canonicalize(const string& url) { |
402 | string rv = normalize(url); | 385 | string rv = normalize(url); |
403 | util::curl_t curl = curl_easy_init(); | 386 | curl_t curl = curl_t::easy_init(); |
404 | if(!curl) | 387 | if(!curl) |
405 | throw exception_curl(OPKELE_CP_ "failed to curl_easy_init()"); | 388 | throw exception_curl(OPKELE_CP_ "failed to initialize curl()"); |
406 | string html; | 389 | string html; |
407 | CURLcode r; | 390 | CURLcode r; |
408 | (r=curl_misc_sets(curl)) | 391 | (r=curl.misc_sets()) |
409 | || (r=curl_easy_setopt(curl,CURLOPT_URL,rv.c_str())) | 392 | || (r=curl.easy_setopt(CURLOPT_URL,rv.c_str())) |
410 | || (r=curl_easy_setopt(curl,CURLOPT_NOBODY,1)) | 393 | || (r=curl.easy_setopt(CURLOPT_NOBODY,1)) |
411 | ; | 394 | ; |
412 | if(r) | 395 | if(r) |
413 | throw exception_curl(OPKELE_CP_ "failed to curl_easy_setopt()",r); | 396 | throw exception_curl(OPKELE_CP_ "failed to set curly options",r); |
414 | r = curl_easy_perform(curl); | 397 | r = curl.easy_perform(); |
415 | if(r) | 398 | if(r) |
416 | throw exception_curl(OPKELE_CP_ "failed to curl_easy_perform()",r); | 399 | throw exception_curl(OPKELE_CP_ "failed to perform curly request",r); |
417 | const char *eu = 0; | 400 | const char *eu = 0; |
418 | r = curl_easy_getinfo(curl,CURLINFO_EFFECTIVE_URL,&eu); | 401 | r = curl.easy_getinfo(CURLINFO_EFFECTIVE_URL,&eu); |
419 | if(r) | 402 | if(r) |
420 | throw exception_curl(OPKELE_CP_ "failed to curl_easy_getinfo(..CURLINFO_EFFECTIVE_URL..)",r); | 403 | throw exception_curl(OPKELE_CP_ "failed to get CURLINFO_EFFECTIVE_URL",r); |
421 | rv = eu; | 404 | rv = eu; |
422 | return normalize(rv); | 405 | return normalize(rv); |
423 | } | 406 | } |
424 | 407 | ||
425 | } | 408 | } |