summary | refs | log | tree | commit | diff | about
path: root/lib
author: Michael Krelin <hacker@klever.net> 2008-12-02 21:36:54 (UTC)
committer: Michael Krelin <hacker@klever.net> 2008-12-02 21:36:54 (UTC)
commit: a2a524f744849e81ec91a7afbaf641d1b57e14b1 (patch) (unidiff)
tree: d023154d9485179fdd3001d5816a0ebec05e5d5c /lib
parent: 47bf5ab634dc5cc3bd5d71894b2d6681f7a83024 (diff)
download: libopkele-a2a524f744849e81ec91a7afbaf641d1b57e14b1.zip
libopkele-a2a524f744849e81ec91a7afbaf641d1b57e14b1.tar.gz
libopkele-a2a524f744849e81ec91a7afbaf641d1b57e14b1.tar.bz2
added passthrough unknown encoding handler to discovery parser
Diffstat (limited to 'lib') (more/less context) (ignore whitespace changes)
-rw-r--r-- lib/discovery.cc 8
1 files changed, 8 insertions, 0 deletions
diff --git a/lib/discovery.cc b/lib/discovery.cc
index bd1f917..cbdceb3 100644
--- a/lib/discovery.cc
+++ b/lib/discovery.cc
@@ -1,587 +1,595 @@
1#include <list> 1#include <list>
2#include <opkele/curl.h> 2#include <opkele/curl.h>
3#include <opkele/expat.h> 3#include <opkele/expat.h>
4#include <opkele/uris.h> 4#include <opkele/uris.h>
5#include <opkele/discovery.h> 5#include <opkele/discovery.h>
6#include <opkele/exception.h> 6#include <opkele/exception.h>
7#include <opkele/util.h> 7#include <opkele/util.h>
8#include <opkele/data.h> 8#include <opkele/data.h>
9#include <opkele/debug.h> 9#include <opkele/debug.h>
10 10
11#include "config.h" 11#include "config.h"
12 12
13#include <opkele/tidy.h> 13#include <opkele/tidy.h>
14 14
15#define XRDS_HEADER "X-XRDS-Location" 15#define XRDS_HEADER "X-XRDS-Location"
16#define CT_HEADER "Content-Type" 16#define CT_HEADER "Content-Type"
17 17
18namespace opkele { 18namespace opkele {
19 using std::list; 19 using std::list;
20 using xrd::XRD_t; 20 using xrd::XRD_t;
21 using xrd::service_t; 21 using xrd::service_t;
22 22
23 /* TODO: the whole discovery thing needs cleanup and optimization due to 23 /* TODO: the whole discovery thing needs cleanup and optimization due to
24 * many changes of concept. */ 24 * many changes of concept. */
25 25
26 static const size_t max_html = 16384; 26 static const size_t max_html = 16384;
27 27
28 static const struct service_type_t { 28 static const struct service_type_t {
29 const char *uri; 29 const char *uri;
30 const char *forceid; 30 const char *forceid;
31 } op_service_types[] = { 31 } op_service_types[] = {
32 { STURI_OPENID20_OP, IDURI_SELECT20 }, 32 { STURI_OPENID20_OP, IDURI_SELECT20 },
33 { STURI_OPENID20, 0 }, 33 { STURI_OPENID20, 0 },
34 { STURI_OPENID11, 0 }, 34 { STURI_OPENID11, 0 },
35 { STURI_OPENID10, 0 } 35 { STURI_OPENID10, 0 }
36 }; 36 };
37 enum { 37 enum {
38 st_index_1 = 2, st_index_2 = 1 38 st_index_1 = 2, st_index_2 = 1
39 }; 39 };
40 40
41 41
42 static inline bool is_qelement(const XML_Char *n,const char *qen) { 42 static inline bool is_qelement(const XML_Char *n,const char *qen) {
43 return !strcasecmp(n,qen); 43 return !strcasecmp(n,qen);
44 } 44 }
45 static inline bool is_element(const XML_Char *n,const char *en) { 45 static inline bool is_element(const XML_Char *n,const char *en) {
46 if(!strcasecmp(n,en)) return true; 46 if(!strcasecmp(n,en)) return true;
47 int nl = strlen(n), enl = strlen(en); 47 int nl = strlen(n), enl = strlen(en);
48 if( (nl>=(enl+1)) && n[nl-enl-1]=='\t' 48 if( (nl>=(enl+1)) && n[nl-enl-1]=='\t'
49 && !strcasecmp(&n[nl-enl],en) ) 49 && !strcasecmp(&n[nl-enl],en) )
50 return true; 50 return true;
51 return false; 51 return false;
52 } 52 }
53 53
54 static long element_priority(const XML_Char **a) { 54 static long element_priority(const XML_Char **a) {
55 for(;*a;++a) 55 for(;*a;++a)
56 if(!strcasecmp(*(a++),"priority")) { 56 if(!strcasecmp(*(a++),"priority")) {
57 long rv; 57 long rv;
58 return (sscanf(*a,"%ld",&rv)==1)?rv:-1; 58 return (sscanf(*a,"%ld",&rv)==1)?rv:-1;
59 } 59 }
60 return -1; 60 return -1;
61 } 61 }
62 /* TODO: ideally all attributes should be 62 /* TODO: ideally all attributes should be
63 * retrieved in one run */ 63 * retrieved in one run */
64 static const char *element_attr(const XML_Char **a, const char *at) { 64 static const char *element_attr(const XML_Char **a, const char *at) {
65 for(;*a;++a) 65 for(;*a;++a)
66 if(!strcasecmp(*(a++),at)) { 66 if(!strcasecmp(*(a++),at)) {
67 return *a; 67 return *a;
68 } 68 }
69 return 0; 69 return 0;
70 } 70 }
71 71
72 class idigger_t : public util::curl_t, public util::expat_t { 72 class idigger_t : public util::curl_t, public util::expat_t {
73 public: 73 public:
74 string xri_proxy; 74 string xri_proxy;
75 75
76 enum { 76 enum {
77 xmode_html = 1, xmode_xrd = 2, xmode_cid = 4, 77 xmode_html = 1, xmode_xrd = 2, xmode_cid = 4,
78 xmode_noredirs = 8 78 xmode_noredirs = 8
79 }; 79 };
80 int xmode; 80 int xmode;
81 81
82 string xrds_location; 82 string xrds_location;
83 string http_content_type; 83 string http_content_type;
84 service_t html_openid1; 84 service_t html_openid1;
85 service_t html_openid2; 85 service_t html_openid2;
86 string cdata_buf; 86 string cdata_buf;
87 long status_code; 87 long status_code;
88 string status_string; 88 string status_string;
89 89
90 typedef list<string> pt_stack_t; 90 typedef list<string> pt_stack_t;
91 pt_stack_t pt_stack; 91 pt_stack_t pt_stack;
92 int skipping; 92 int skipping;
93 bool parser_choked; 93 bool parser_choked;
94 string save_html; 94 string save_html;
95 95
96 XRD_t *xrd; 96 XRD_t *xrd;
97 service_t *xrd_service; 97 service_t *xrd_service;
98 string* cdata; 98 string* cdata;
99 99
100 idigger_t() 100 idigger_t()
101 : util::curl_t(easy_init()), 101 : util::curl_t(easy_init()),
102 util::expat_t(0), 102 util::expat_t(0),
103 xri_proxy(XRI_PROXY_URL) { 103 xri_proxy(XRI_PROXY_URL) {
104 CURLcode r; 104 CURLcode r;
105 (r=misc_sets()) 105 (r=misc_sets())
106 || (r=set_write()) 106 || (r=set_write())
107 || (r=set_header()) 107 || (r=set_header())
108 ; 108 ;
109 if(r) 109 if(r)
110 throw exception_curl(OPKELE_CP_ "failed to set curly options",r); 110 throw exception_curl(OPKELE_CP_ "failed to set curly options",r);
111 } 111 }
112 ~idigger_t() throw() { } 112 ~idigger_t() throw() { }
113 113
114 void yadiscover(endpoint_discovery_iterator oi,const string& yurl,const char **types,bool redirs) { 114 void yadiscover(endpoint_discovery_iterator oi,const string& yurl,const char **types,bool redirs) {
115 idiscovery_t idis; 115 idiscovery_t idis;
116 idis.xri_identity = false; 116 idis.xri_identity = false;
117 discover_at(idis,yurl,xmode_html|xmode_xrd|(redirs?0:xmode_noredirs)); 117 discover_at(idis,yurl,xmode_html|xmode_xrd|(redirs?0:xmode_noredirs));
118 if(!xrds_location.empty()) { 118 if(!xrds_location.empty()) {
119 idis.clear(); 119 idis.clear();
120 discover_at(idis,xrds_location,xmode_xrd); 120 discover_at(idis,xrds_location,xmode_xrd);
121 } 121 }
122 idis.normalized_id = idis.canonicalized_id = yurl; 122 idis.normalized_id = idis.canonicalized_id = yurl;
123 service_type_t st; 123 service_type_t st;
124 for(st.uri=*types;*types;st.uri=*(++types)) 124 for(st.uri=*types;*types;st.uri=*(++types))
125 queue_endpoints(oi,idis,&st); 125 queue_endpoints(oi,idis,&st);
126 } 126 }
127 127
128 string discover(endpoint_discovery_iterator& oi,const string& identity) { 128 string discover(endpoint_discovery_iterator& oi,const string& identity) {
129 string rv; 129 string rv;
130 idiscovery_t idis; 130 idiscovery_t idis;
131 string::size_type fsc = identity.find_first_not_of(data::_whitespace_chars); 131 string::size_type fsc = identity.find_first_not_of(data::_whitespace_chars);
132 if(fsc==string::npos) 132 if(fsc==string::npos)
133 throw bad_input(OPKELE_CP_ "whitespace-only identity"); 133 throw bad_input(OPKELE_CP_ "whitespace-only identity");
134 string::size_type lsc = identity.find_last_not_of(data::_whitespace_chars); 134 string::size_type lsc = identity.find_last_not_of(data::_whitespace_chars);
135 assert(lsc!=string::npos); 135 assert(lsc!=string::npos);
136 if(!strncasecmp(identity.c_str()+fsc,"xri://",sizeof("xri://")-1)) 136 if(!strncasecmp(identity.c_str()+fsc,"xri://",sizeof("xri://")-1))
137 fsc += sizeof("xri://")-1; 137 fsc += sizeof("xri://")-1;
138 if((fsc+1)>=lsc) 138 if((fsc+1)>=lsc)
139 throw bad_input(OPKELE_CP_ "not a character of importance in identity"); 139 throw bad_input(OPKELE_CP_ "not a character of importance in identity");
140 string id(identity,fsc,lsc-fsc+1); 140 string id(identity,fsc,lsc-fsc+1);
141 idis.clear(); 141 idis.clear();
142 if(strchr(data::_iname_leaders,id[0])) { 142 if(strchr(data::_iname_leaders,id[0])) {
143 /* TODO: further normalize xri identity? Like folding case 143 /* TODO: further normalize xri identity? Like folding case
144 * or whatever... */ 144 * or whatever... */
145 rv = id; 145 rv = id;
146 set<string> cids; 146 set<string> cids;
147 for(const struct service_type_t *st=op_service_types; 147 for(const struct service_type_t *st=op_service_types;
148 st<&op_service_types[sizeof(op_service_types)/sizeof(*op_service_types)];++st) { 148 st<&op_service_types[sizeof(op_service_types)/sizeof(*op_service_types)];++st) {
149 idis.clear(); 149 idis.clear();
150 discover_at( idis, 150 discover_at( idis,
151 xri_proxy + util::url_encode(id)+ 151 xri_proxy + util::url_encode(id)+
152 "?_xrd_t="+util::url_encode(st->uri)+ 152 "?_xrd_t="+util::url_encode(st->uri)+
153 "&_xrd_r=application/xrd%2Bxml" 153 "&_xrd_r=application/xrd%2Bxml"
154 ";sep=true;refs=true", 154 ";sep=true;refs=true",
155 xmode_xrd ); 155 xmode_xrd );
156 if(status_code==241) continue; 156 if(status_code==241) continue;
157 if(status_code!=100) 157 if(status_code!=100)
158 throw failed_xri_resolution(OPKELE_CP_ 158 throw failed_xri_resolution(OPKELE_CP_
159 "XRI resolution failed with '"+status_string+"' message" 159 "XRI resolution failed with '"+status_string+"' message"
160 ", while looking for SEP with type '"+st->uri+"'", status_code); 160 ", while looking for SEP with type '"+st->uri+"'", status_code);
161 if(idis.xrd.canonical_ids.empty()) 161 if(idis.xrd.canonical_ids.empty())
162 throw opkele::failed_discovery(OPKELE_CP_ "No CanonicalID for XRI identity found"); 162 throw opkele::failed_discovery(OPKELE_CP_ "No CanonicalID for XRI identity found");
163 string cid = idis.xrd.canonical_ids.begin()->second; 163 string cid = idis.xrd.canonical_ids.begin()->second;
164 if(cids.find(cid)==cids.end()) { 164 if(cids.find(cid)==cids.end()) {
165 cids.insert(cid); 165 cids.insert(cid);
166 idis.clear(); 166 idis.clear();
167 discover_at( idis, 167 discover_at( idis,
168 xri_proxy + util::url_encode(id)+ 168 xri_proxy + util::url_encode(id)+
169 "?_xrd_t="+util::url_encode(st->uri)+ 169 "?_xrd_t="+util::url_encode(st->uri)+
170 "&_xrd_r=application/xrd%2Bxml" 170 "&_xrd_r=application/xrd%2Bxml"
171 ";sep=true;refs=true", 171 ";sep=true;refs=true",
172 xmode_xrd ); 172 xmode_xrd );
173 if(status_code==241) continue; 173 if(status_code==241) continue;
174 if(status_code!=100) 174 if(status_code!=100)
175 throw failed_xri_resolution(OPKELE_CP_ 175 throw failed_xri_resolution(OPKELE_CP_
176 "XRI resolution failed with '"+status_string+"' message" 176 "XRI resolution failed with '"+status_string+"' message"
177 ", while looking for SEP with type '"+st->uri+"'" 177 ", while looking for SEP with type '"+st->uri+"'"
178 " on canonical id", status_code); 178 " on canonical id", status_code);
179 } 179 }
180 idis.canonicalized_id = cid; 180 idis.canonicalized_id = cid;
181 idis.normalized_id = rv; idis.xri_identity = true; 181 idis.normalized_id = rv; idis.xri_identity = true;
182 queue_endpoints(oi,idis,st); 182 queue_endpoints(oi,idis,st);
183 } 183 }
184 }else{ 184 }else{
185 idis.xri_identity = false; 185 idis.xri_identity = false;
186 if(id.find("://")==string::npos) 186 if(id.find("://")==string::npos)
187 id.insert(0,"http://"); 187 id.insert(0,"http://");
188 string::size_type fp = id.find('#'); 188 string::size_type fp = id.find('#');
189 if(fp!=string::npos) { 189 if(fp!=string::npos) {
190 string::size_type qp = id.find('?'); 190 string::size_type qp = id.find('?');
191 if(qp==string::npos || qp<fp) 191 if(qp==string::npos || qp<fp)
192 id.erase(fp); 192 id.erase(fp);
193 else if(qp>fp) 193 else if(qp>fp)
194 id.erase(fp,qp-fp); 194 id.erase(fp,qp-fp);
195 } 195 }
196 rv = idis.normalized_id = util::rfc_3986_normalize_uri(id); 196 rv = idis.normalized_id = util::rfc_3986_normalize_uri(id);
197 discover_at(idis,id,xmode_html|xmode_xrd); 197 discover_at(idis,id,xmode_html|xmode_xrd);
198 const char * eu = 0; 198 const char * eu = 0;
199 CURLcode r = easy_getinfo(CURLINFO_EFFECTIVE_URL,&eu); 199 CURLcode r = easy_getinfo(CURLINFO_EFFECTIVE_URL,&eu);
200 if(r) 200 if(r)
201 throw exception_curl(OPKELE_CP_ "failed to get CURLINFO_EFFECTIVE_URL",r); 201 throw exception_curl(OPKELE_CP_ "failed to get CURLINFO_EFFECTIVE_URL",r);
202 string cid = util::strip_uri_fragment_part( idis.canonicalized_id = util::rfc_3986_normalize_uri(eu) ); 202 string cid = util::strip_uri_fragment_part( idis.canonicalized_id = util::rfc_3986_normalize_uri(eu) );
203 if(xrds_location.empty()) { 203 if(xrds_location.empty()) {
204 if(idis.xrd.empty()) 204 if(idis.xrd.empty())
205 html2xrd(oi,idis); 205 html2xrd(oi,idis);
206 else{ 206 else{
207 for(const service_type_t *st=op_service_types; 207 for(const service_type_t *st=op_service_types;
208 st<&op_service_types[sizeof(op_service_types)/sizeof(*op_service_types)];++st) 208 st<&op_service_types[sizeof(op_service_types)/sizeof(*op_service_types)];++st)
209 queue_endpoints(oi,idis,st); 209 queue_endpoints(oi,idis,st);
210 } 210 }
211 }else{ 211 }else{
212 idis.clear(); 212 idis.clear();
213 idis.canonicalized_id = cid; 213 idis.canonicalized_id = cid;
214 discover_at(idis,xrds_location,xmode_xrd); 214 discover_at(idis,xrds_location,xmode_xrd);
215 if(idis.xrd.empty()) 215 if(idis.xrd.empty())
216 html2xrd(oi,idis); 216 html2xrd(oi,idis);
217 else{ 217 else{
218 for(const service_type_t *st=op_service_types; 218 for(const service_type_t *st=op_service_types;
219 st<&op_service_types[sizeof(op_service_types)/sizeof(*op_service_types)];++st) 219 st<&op_service_types[sizeof(op_service_types)/sizeof(*op_service_types)];++st)
220 queue_endpoints(oi,idis,st); 220 queue_endpoints(oi,idis,st);
221 } 221 }
222 } 222 }
223 } 223 }
224 return rv; 224 return rv;
225 } 225 }
226 226
227 void discover_at(idiscovery_t& idis,const string& url,int xm) { 227 void discover_at(idiscovery_t& idis,const string& url,int xm) {
228 CURLcode r = easy_setopt(CURLOPT_MAXREDIRS, (xm&xmode_noredirs)?0:5); 228 CURLcode r = easy_setopt(CURLOPT_MAXREDIRS, (xm&xmode_noredirs)?0:5);
229 if(r) 229 if(r)
230 throw exception_curl(OPKELE_CP_ "failed to set curly maxredirs option"); 230 throw exception_curl(OPKELE_CP_ "failed to set curly maxredirs option");
231 if( (r=easy_setopt(CURLOPT_URL,url.c_str())) ) 231 if( (r=easy_setopt(CURLOPT_URL,url.c_str())) )
232 throw exception_curl(OPKELE_CP_ "failed to set curly urlie",r); 232 throw exception_curl(OPKELE_CP_ "failed to set curly urlie",r);
233 233
234 http_content_type.clear(); 234 http_content_type.clear();
235 xmode = xm; 235 xmode = xm;
236 prepare_to_parse(); 236 prepare_to_parse();
237 if(xmode&xmode_html) { 237 if(xmode&xmode_html) {
238 xrds_location.clear(); 238 xrds_location.clear();
239 save_html.clear(); 239 save_html.clear();
240 save_html.reserve(max_html); 240 save_html.reserve(max_html);
241 } 241 }
242 xrd = &idis.xrd; 242 xrd = &idis.xrd;
243 243
244 r = easy_perform(); 244 r = easy_perform();
245 if(r && r!=CURLE_WRITE_ERROR) 245 if(r && r!=CURLE_WRITE_ERROR)
246 throw exception_curl(OPKELE_CP_ "failed to perform curly request",r); 246 throw exception_curl(OPKELE_CP_ "failed to perform curly request",r);
247 247
248 if(!parser_choked) { 248 if(!parser_choked) {
249 parse(0,0,true); 249 parse(0,0,true);
250 }else if(xmode&xmode_html){ 250 }else if(xmode&xmode_html){
251 /* TODO: do not bother if we've seen xml */ 251 /* TODO: do not bother if we've seen xml */
252 try { 252 try {
253 util::tidy_doc_t td = util::tidy_doc_t::create(); 253 util::tidy_doc_t td = util::tidy_doc_t::create();
254 if(!td) 254 if(!td)
255 throw exception_tidy(OPKELE_CP_ "failed to create htmltidy document"); 255 throw exception_tidy(OPKELE_CP_ "failed to create htmltidy document");
256#ifdef NDEBUG 256#ifdef NDEBUG
257 td.opt_set(TidyQuiet,true); 257 td.opt_set(TidyQuiet,true);
258 td.opt_set(TidyShowWarnings,false); 258 td.opt_set(TidyShowWarnings,false);
259#else /* NDEBUG */ 259#else /* NDEBUG */
260 td.opt_set(TidyQuiet,false); 260 td.opt_set(TidyQuiet,false);
261 td.opt_set(TidyShowWarnings,true); 261 td.opt_set(TidyShowWarnings,true);
262#endif /* NDEBUG */ 262#endif /* NDEBUG */
263 td.opt_set(TidyForceOutput,true); 263 td.opt_set(TidyForceOutput,true);
264 td.opt_set(TidyXhtmlOut,true); 264 td.opt_set(TidyXhtmlOut,true);
265 td.opt_set(TidyDoctypeMode,TidyDoctypeOmit); 265 td.opt_set(TidyDoctypeMode,TidyDoctypeOmit);
266 td.opt_set(TidyMark,false); 266 td.opt_set(TidyMark,false);
267 td.opt_set(TidyNumEntities,true); 267 td.opt_set(TidyNumEntities,true);
268 if(td.parse_string(save_html)<=0) 268 if(td.parse_string(save_html)<=0)
269 throw exception_tidy(OPKELE_CP_ "tidy failed to parse document"); 269 throw exception_tidy(OPKELE_CP_ "tidy failed to parse document");
270 if(td.clean_and_repair()<=0) 270 if(td.clean_and_repair()<=0)
271 throw exception_tidy(OPKELE_CP_ "tidy failed to clean and repair"); 271 throw exception_tidy(OPKELE_CP_ "tidy failed to clean and repair");
272 util::tidy_buf_t tide; 272 util::tidy_buf_t tide;
273 if(td.save_buffer(tide)<=0) 273 if(td.save_buffer(tide)<=0)
274 throw exception_tidy(OPKELE_CP_ "tidy failed to save buffer"); 274 throw exception_tidy(OPKELE_CP_ "tidy failed to save buffer");
275 prepare_to_parse(); 275 prepare_to_parse();
276 parse(tide.c_str(),tide.size(),true); 276 parse(tide.c_str(),tide.size(),true);
277 }catch(exception_tidy& et) { } 277 }catch(exception_tidy& et) { }
278 } 278 }
279 save_html.clear(); 279 save_html.clear();
280 } 280 }
281 281
282 void prepare_to_parse() { 282 void prepare_to_parse() {
283 (*(expat_t*)this) = parser_create_ns(); 283 (*(expat_t*)this) = parser_create_ns();
284 set_user_data(); set_element_handler(); 284 set_user_data(); set_element_handler();
285 set_character_data_handler(); 285 set_character_data_handler();
286 set_unknown_encoding_handler();
286 287
287 if(xmode&xmode_html) { 288 if(xmode&xmode_html) {
288 html_openid1.clear(); html_openid2.clear(); 289 html_openid1.clear(); html_openid2.clear();
289 parser_choked = false; 290 parser_choked = false;
290 } 291 }
291 292
292 cdata = 0; xrd_service = 0; skipping = 0; 293 cdata = 0; xrd_service = 0; skipping = 0;
293 pt_stack.clear(); 294 pt_stack.clear();
294 status_code = 100; status_string.clear(); 295 status_code = 100; status_string.clear();
295 } 296 }
296 297
297 void html2xrd(endpoint_discovery_iterator& oi,idiscovery_t& id) { 298 void html2xrd(endpoint_discovery_iterator& oi,idiscovery_t& id) {
298 XRD_t& x = id.xrd; 299 XRD_t& x = id.xrd;
299 if(!html_openid2.uris.empty()) { 300 if(!html_openid2.uris.empty()) {
300 html_openid2.types.insert(STURI_OPENID20); 301 html_openid2.types.insert(STURI_OPENID20);
301 x.services.add(-1,html_openid2); 302 x.services.add(-1,html_openid2);
302 queue_endpoints(oi,id,&op_service_types[st_index_2]); 303 queue_endpoints(oi,id,&op_service_types[st_index_2]);
303 } 304 }
304 if(!html_openid1.uris.empty()) { 305 if(!html_openid1.uris.empty()) {
305 html_openid1.types.insert(STURI_OPENID11); 306 html_openid1.types.insert(STURI_OPENID11);
306 x.services.add(-1,html_openid1); 307 x.services.add(-1,html_openid1);
307 queue_endpoints(oi,id,&op_service_types[st_index_1]); 308 queue_endpoints(oi,id,&op_service_types[st_index_1]);
308 } 309 }
309 } 310 }
310 311
311 size_t write(void *p,size_t s,size_t nm) { 312 size_t write(void *p,size_t s,size_t nm) {
312 /* TODO: limit total size */ 313 /* TODO: limit total size */
313 size_t bytes = s*nm; 314 size_t bytes = s*nm;
314 const char *inbuf = (const char*)p; 315 const char *inbuf = (const char*)p;
315 if(xmode&xmode_html) { 316 if(xmode&xmode_html) {
316 size_t mbts = save_html.capacity()-save_html.size(); 317 size_t mbts = save_html.capacity()-save_html.size();
317 size_t bts = 0; 318 size_t bts = 0;
318 if(mbts>0) { 319 if(mbts>0) {
319 bts = (bytes>mbts)?mbts:bytes; 320 bts = (bytes>mbts)?mbts:bytes;
320 save_html.append(inbuf,bts); 321 save_html.append(inbuf,bts);
321 } 322 }
322 if(skipping<0) return bts; 323 if(skipping<0) return bts;
323 } 324 }
324 if(skipping<0) return 0; 325 if(skipping<0) return 0;
325 bool rp = parse(inbuf,bytes,false); 326 bool rp = parse(inbuf,bytes,false);
326 if(!rp) { 327 if(!rp) {
327 parser_choked = true; 328 parser_choked = true;
328 skipping = -1; 329 skipping = -1;
329 if(!(xmode&xmode_html)) 330 if(!(xmode&xmode_html))
330 bytes = 0; 331 bytes = 0;
331 } 332 }
332 return bytes; 333 return bytes;
333 } 334 }
334 size_t header(void *p,size_t s,size_t nm) { 335 size_t header(void *p,size_t s,size_t nm) {
335 size_t bytes = s*nm; 336 size_t bytes = s*nm;
336 const char *h = (const char*)p; 337 const char *h = (const char*)p;
337 const char *colon = (const char*)memchr(p,':',bytes); 338 const char *colon = (const char*)memchr(p,':',bytes);
338 const char *space = (const char*)memchr(p,' ',bytes); 339 const char *space = (const char*)memchr(p,' ',bytes);
339 if(space && ( (!colon) || space<colon ) ) { 340 if(space && ( (!colon) || space<colon ) ) {
340 xrds_location.clear(); http_content_type.clear(); 341 xrds_location.clear(); http_content_type.clear();
341 }else if(colon) { 342 }else if(colon) {
342 const char *hv = ++colon; 343 const char *hv = ++colon;
343 size_t hnl = colon-h; 344 size_t hnl = colon-h;
344 int rb; 345 int rb;
345 for(rb = bytes-hnl-1;rb>0 && isspace(*hv);++hv,--rb) ; 346 for(rb = bytes-hnl-1;rb>0 && isspace(*hv);++hv,--rb) ;
346 while(rb>0 && isspace(hv[rb-1])) --rb; 347 while(rb>0 && isspace(hv[rb-1])) --rb;
347 if(rb) { 348 if(rb) {
348 if( (hnl>=sizeof(XRDS_HEADER)) 349 if( (hnl>=sizeof(XRDS_HEADER))
349 && !strncasecmp(h,XRDS_HEADER":", 350 && !strncasecmp(h,XRDS_HEADER":",
350 sizeof(XRDS_HEADER)) ) { 351 sizeof(XRDS_HEADER)) ) {
351 xrds_location.assign(hv,rb); 352 xrds_location.assign(hv,rb);
352 }else if( (hnl>=sizeof(CT_HEADER)) 353 }else if( (hnl>=sizeof(CT_HEADER))
353 && !strncasecmp(h,CT_HEADER":", 354 && !strncasecmp(h,CT_HEADER":",
354 sizeof(CT_HEADER)) ) { 355 sizeof(CT_HEADER)) ) {
355 const char *sc = (const char*)memchr( 356 const char *sc = (const char*)memchr(
356 hv,';',rb); 357 hv,';',rb);
357 http_content_type.assign(hv,sc?(sc-hv):rb); 358 http_content_type.assign(hv,sc?(sc-hv):rb);
358 } 359 }
359 } 360 }
360 } 361 }
361 return curl_t::header(p,s,nm); 362 return curl_t::header(p,s,nm);
362 } 363 }
363 364
364 void start_element(const XML_Char *n,const XML_Char **a) { 365 void start_element(const XML_Char *n,const XML_Char **a) {
365 if(skipping<0) return; 366 if(skipping<0) return;
366 if(skipping) { 367 if(skipping) {
367 if(xmode&xmode_html) 368 if(xmode&xmode_html)
368 html_start_element(n,a); 369 html_start_element(n,a);
369 ++skipping; return; 370 ++skipping; return;
370 } 371 }
371 if(pt_stack.empty()) { 372 if(pt_stack.empty()) {
372 if(is_qelement(n,NSURI_XRDS "\tXRDS")) 373 if(is_qelement(n,NSURI_XRDS "\tXRDS"))
373 return; 374 return;
374 if(is_qelement(n,NSURI_XRD "\tXRD")) { 375 if(is_qelement(n,NSURI_XRD "\tXRD")) {
375 assert(xrd); 376 assert(xrd);
376 xrd->clear(); 377 xrd->clear();
377 pt_stack.push_back(n); 378 pt_stack.push_back(n);
378 }else if(xmode&xmode_html) { 379 }else if(xmode&xmode_html) {
379 html_start_element(n,a); 380 html_start_element(n,a);
380 }else{ 381 }else{
381 skipping = -1; 382 skipping = -1;
382 } 383 }
383 }else{ 384 }else{
384 int pt_s = pt_stack.size(); 385 int pt_s = pt_stack.size();
385 if(pt_s==1) { 386 if(pt_s==1) {
386 if(is_qelement(n,NSURI_XRD "\tCanonicalID")) { 387 if(is_qelement(n,NSURI_XRD "\tCanonicalID")) {
387 assert(xrd); 388 assert(xrd);
388 cdata = &(xrd->canonical_ids.add(element_priority(a),string())); 389 cdata = &(xrd->canonical_ids.add(element_priority(a),string()));
389 }else if(is_qelement(n,NSURI_XRD "\tLocalID")) { 390 }else if(is_qelement(n,NSURI_XRD "\tLocalID")) {
390 assert(xrd); 391 assert(xrd);
391 cdata = &(xrd->local_ids.add(element_priority(a),string())); 392 cdata = &(xrd->local_ids.add(element_priority(a),string()));
392 }else if(is_qelement(n,NSURI_XRD "\tProviderID")) { 393 }else if(is_qelement(n,NSURI_XRD "\tProviderID")) {
393 assert(xrd); 394 assert(xrd);
394 cdata = &(xrd->provider_id); 395 cdata = &(xrd->provider_id);
395 }else if(is_qelement(n,NSURI_XRD "\tService")) { 396 }else if(is_qelement(n,NSURI_XRD "\tService")) {
396 assert(xrd); 397 assert(xrd);
397 xrd_service = &(xrd->services.add(element_priority(a), 398 xrd_service = &(xrd->services.add(element_priority(a),
398 service_t())); 399 service_t()));
399 pt_stack.push_back(n); 400 pt_stack.push_back(n);
400 }else if(is_qelement(n,NSURI_XRD "\tStatus")) { 401 }else if(is_qelement(n,NSURI_XRD "\tStatus")) {
401 for(;*a;) { 402 for(;*a;) {
402 if(!strcasecmp(*(a++),"code")) { 403 if(!strcasecmp(*(a++),"code")) {
403 if(sscanf(*(a++),"%ld",&status_code)==1 && status_code!=100) { 404 if(sscanf(*(a++),"%ld",&status_code)==1 && status_code!=100) {
404 cdata = &status_string; 405 cdata = &status_string;
405 pt_stack.push_back(n); 406 pt_stack.push_back(n);
406 break; 407 break;
407 } 408 }
408 }else 409 }else
409 ++a; 410 ++a;
410 } 411 }
411 }else if(is_qelement(n,NSURI_XRD "\tExpires")) { 412 }else if(is_qelement(n,NSURI_XRD "\tExpires")) {
412 assert(xrd); 413 assert(xrd);
413 cdata_buf.clear(); 414 cdata_buf.clear();
414 cdata = &cdata_buf; 415 cdata = &cdata_buf;
415 }else if(xmode&xmode_html) { 416 }else if(xmode&xmode_html) {
416 html_start_element(n,a); 417 html_start_element(n,a);
417 }else{ 418 }else{
418 skipping = 1; 419 skipping = 1;
419 } 420 }
420 }else if(pt_s==2) { 421 }else if(pt_s==2) {
421 if(is_qelement(pt_stack.back().c_str(), NSURI_XRD "\tService")) { 422 if(is_qelement(pt_stack.back().c_str(), NSURI_XRD "\tService")) {
422 if(is_qelement(n,NSURI_XRD "\tType")) { 423 if(is_qelement(n,NSURI_XRD "\tType")) {
423 assert(xrd); assert(xrd_service); 424 assert(xrd); assert(xrd_service);
424 cdata_buf.clear(); 425 cdata_buf.clear();
425 cdata = &cdata_buf; 426 cdata = &cdata_buf;
426 }else if(is_qelement(n,NSURI_XRD "\tURI")) { 427 }else if(is_qelement(n,NSURI_XRD "\tURI")) {
427 assert(xrd); assert(xrd_service); 428 assert(xrd); assert(xrd_service);
428 const char *append = element_attr(a,"append"); 429 const char *append = element_attr(a,"append");
429 xrd::uri_t& uri = xrd_service->uris.add(element_priority(a),xrd::uri_t("",append?append:"")); 430 xrd::uri_t& uri = xrd_service->uris.add(element_priority(a),xrd::uri_t("",append?append:""));
430 cdata = &uri.uri; 431 cdata = &uri.uri;
431 }else if(is_qelement(n,NSURI_XRD "\tLocalID") 432 }else if(is_qelement(n,NSURI_XRD "\tLocalID")
432 || is_qelement(n,NSURI_OPENID10 "\tDelegate") ) { 433 || is_qelement(n,NSURI_OPENID10 "\tDelegate") ) {
433 assert(xrd); assert(xrd_service); 434 assert(xrd); assert(xrd_service);
434 cdata = &(xrd_service->local_ids.add(element_priority(a),string())); 435 cdata = &(xrd_service->local_ids.add(element_priority(a),string()));
435 }else if(is_qelement(n,NSURI_XRD "\tProviderID")) { 436 }else if(is_qelement(n,NSURI_XRD "\tProviderID")) {
436 assert(xrd); assert(xrd_service); 437 assert(xrd); assert(xrd_service);
437 cdata = &(xrd_service->provider_id); 438 cdata = &(xrd_service->provider_id);
438 }else{ 439 }else{
439 skipping = 1; 440 skipping = 1;
440 } 441 }
441 }else 442 }else
442 skipping = 1; 443 skipping = 1;
443 }else if(xmode&xmode_html) { 444 }else if(xmode&xmode_html) {
444 html_start_element(n,a); 445 html_start_element(n,a);
445 }else{ 446 }else{
446 skipping = 1; 447 skipping = 1;
447 } 448 }
448 } 449 }
449 } 450 }
450 void end_element(const XML_Char *n) { 451 void end_element(const XML_Char *n) {
451 if(skipping<0) return; 452 if(skipping<0) return;
452 if(skipping) { 453 if(skipping) {
453 --skipping; return; 454 --skipping; return;
454 } 455 }
455 if(is_qelement(n,NSURI_XRD "\tType")) { 456 if(is_qelement(n,NSURI_XRD "\tType")) {
456 assert(xrd); assert(xrd_service); assert(cdata==&cdata_buf); 457 assert(xrd); assert(xrd_service); assert(cdata==&cdata_buf);
457 xrd_service->types.insert(cdata_buf); 458 xrd_service->types.insert(cdata_buf);
458 }else if(is_qelement(n,NSURI_XRD "\tService")) { 459 }else if(is_qelement(n,NSURI_XRD "\tService")) {
459 assert(xrd); assert(xrd_service); 460 assert(xrd); assert(xrd_service);
460 assert(!pt_stack.empty()); 461 assert(!pt_stack.empty());
461 assert(pt_stack.back()==(NSURI_XRD "\tService")); 462 assert(pt_stack.back()==(NSURI_XRD "\tService"));
462 pt_stack.pop_back(); 463 pt_stack.pop_back();
463 xrd_service = 0; 464 xrd_service = 0;
464 }else if(is_qelement(n,NSURI_XRD "\tStatus")) { 465 }else if(is_qelement(n,NSURI_XRD "\tStatus")) {
465 assert(xrd); 466 assert(xrd);
466 if(is_qelement(pt_stack.back().c_str(),n)) { 467 if(is_qelement(pt_stack.back().c_str(),n)) {
467 assert(cdata==&status_string); 468 assert(cdata==&status_string);
468 pt_stack.pop_back(); 469 pt_stack.pop_back();
469 if(status_code!=100) 470 if(status_code!=100)
470 skipping = -1; 471 skipping = -1;
471 } 472 }
472 }else if(is_qelement(n,NSURI_XRD "\tExpires")) { 473 }else if(is_qelement(n,NSURI_XRD "\tExpires")) {
473 assert(xrd); 474 assert(xrd);
474 xrd->expires = util::w3c_to_time(cdata_buf); 475 xrd->expires = util::w3c_to_time(cdata_buf);
475 }else if((xmode&xmode_html) && is_element(n,"head")) { 476 }else if((xmode&xmode_html) && is_element(n,"head")) {
476 skipping = -1; 477 skipping = -1;
477 } 478 }
478 cdata = 0; 479 cdata = 0;
479 } 480 }
480 void character_data(const XML_Char *s,int l) { 481 void character_data(const XML_Char *s,int l) {
481 if(skipping) return; 482 if(skipping) return;
482 if(cdata) cdata->append(s,l); 483 if(cdata) cdata->append(s,l);
483 } 484 }
484 485
485 void html_start_element(const XML_Char *n,const XML_Char **a) { 486 void html_start_element(const XML_Char *n,const XML_Char **a) {
486 if(is_element(n,"meta")) { 487 if(is_element(n,"meta")) {
487 bool heq = false; 488 bool heq = false;
488 string l; 489 string l;
489 for(;*a;a+=2) { 490 for(;*a;a+=2) {
490 if(!( strcasecmp(a[0],"http-equiv") 491 if(!( strcasecmp(a[0],"http-equiv")
491 || strcasecmp(a[1],XRDS_HEADER) )) 492 || strcasecmp(a[1],XRDS_HEADER) ))
492 heq = true; 493 heq = true;
493 else if(!strcasecmp(a[0],"content")) 494 else if(!strcasecmp(a[0],"content"))
494 l.assign(a[1]); 495 l.assign(a[1]);
495 } 496 }
496 if(heq) 497 if(heq)
497 xrds_location = l; 498 xrds_location = l;
498 }else if(is_element(n,"link")) { 499 }else if(is_element(n,"link")) {
499 string rels; 500 string rels;
500 string href; 501 string href;
501 for(;*a;a+=2) { 502 for(;*a;a+=2) {
502 if( !strcasecmp(a[0],"rel") ) { 503 if( !strcasecmp(a[0],"rel") ) {
503 rels.assign(a[1]); 504 rels.assign(a[1]);
504 }else if( !strcasecmp(a[0],"href") ) { 505 }else if( !strcasecmp(a[0],"href") ) {
505 const char *ns = a[1]; 506 const char *ns = a[1];
506 for(;*ns && isspace(*ns);++ns) ; 507 for(;*ns && isspace(*ns);++ns) ;
507 href.assign(ns); 508 href.assign(ns);
508 string::size_type lns=href.find_last_not_of(data::_whitespace_chars); 509 string::size_type lns=href.find_last_not_of(data::_whitespace_chars);
509 href.erase(lns+1); 510 href.erase(lns+1);
510 } 511 }
511 } 512 }
512 for(string::size_type ns=rels.find_first_not_of(data::_whitespace_chars); 513 for(string::size_type ns=rels.find_first_not_of(data::_whitespace_chars);
513 ns!=string::npos; ns=rels.find_first_not_of(data::_whitespace_chars,ns)) { 514 ns!=string::npos; ns=rels.find_first_not_of(data::_whitespace_chars,ns)) {
514 string::size_type s = rels.find_first_of(data::_whitespace_chars,ns); 515 string::size_type s = rels.find_first_of(data::_whitespace_chars,ns);
515 string rel; 516 string rel;
516 if(s==string::npos) { 517 if(s==string::npos) {
517 rel.assign(rels,ns,string::npos); 518 rel.assign(rels,ns,string::npos);
518 ns = string::npos; 519 ns = string::npos;
519 }else{ 520 }else{
520 rel.assign(rels,ns,s-ns); 521 rel.assign(rels,ns,s-ns);
521 ns = s; 522 ns = s;
522 } 523 }
523 if(rel=="openid.server") 524 if(rel=="openid.server")
524 html_openid1.uris.add(-1,xrd::uri_t(href)); 525 html_openid1.uris.add(-1,xrd::uri_t(href));
525 else if(rel=="openid.delegate") 526 else if(rel=="openid.delegate")
526 html_openid1.local_ids.add(-1,href); 527 html_openid1.local_ids.add(-1,href);
527 else if(rel=="openid2.provider") 528 else if(rel=="openid2.provider")
528 html_openid2.uris.add(-1,xrd::uri_t(href)); 529 html_openid2.uris.add(-1,xrd::uri_t(href));
529 else if(rel=="openid2.local_id") 530 else if(rel=="openid2.local_id")
530 html_openid2.local_ids.add(-1,href); 531 html_openid2.local_ids.add(-1,href);
531 } 532 }
532 }else if(is_element(n,"body")) { 533 }else if(is_element(n,"body")) {
533 skipping = -1; 534 skipping = -1;
534 } 535 }
535 } 536 }
536 537
537 void queue_endpoints(endpoint_discovery_iterator& oi, 538 void queue_endpoints(endpoint_discovery_iterator& oi,
538 const idiscovery_t &id, 539 const idiscovery_t &id,
539 const service_type_t *st) { 540 const service_type_t *st) {
540 openid_endpoint_t ep; 541 openid_endpoint_t ep;
541 ep.claimed_id = id.canonicalized_id; 542 ep.claimed_id = id.canonicalized_id;
542 for(xrd::services_t::const_iterator isvc=id.xrd.services.begin(); 543 for(xrd::services_t::const_iterator isvc=id.xrd.services.begin();
543 isvc!=id.xrd.services.end(); ++isvc) { 544 isvc!=id.xrd.services.end(); ++isvc) {
544 const xrd::service_t svc = isvc->second; 545 const xrd::service_t svc = isvc->second;
545 if(svc.types.find(st->uri)==svc.types.end()) continue; 546 if(svc.types.find(st->uri)==svc.types.end()) continue;
546 for(xrd::uris_t::const_iterator iu=svc.uris.begin();iu!=svc.uris.end();++iu) { 547 for(xrd::uris_t::const_iterator iu=svc.uris.begin();iu!=svc.uris.end();++iu) {
547 ep.uri = iu->second.uri; 548 ep.uri = iu->second.uri;
548 if(id.xri_identity) { 549 if(id.xri_identity) {
549 if(iu->second.append=="qxri") { 550 if(iu->second.append=="qxri") {
550 ep.uri += id.normalized_id; 551 ep.uri += id.normalized_id;
551 } /* TODO: else handle other append attribute values */ 552 } /* TODO: else handle other append attribute values */
552 } 553 }
553 if(st->forceid) { 554 if(st->forceid) {
554 ep.local_id = ep.claimed_id = st->forceid; 555 ep.local_id = ep.claimed_id = st->forceid;
555 *(oi++) = ep; 556 *(oi++) = ep;
556 }else{ 557 }else{
557 if(svc.local_ids.empty()) { 558 if(svc.local_ids.empty()) {
558 ep.local_id = ep.claimed_id; 559 ep.local_id = ep.claimed_id;
559 *(oi++) = ep; 560 *(oi++) = ep;
560 }else{ 561 }else{
561 for(xrd::local_ids_t::const_iterator ilid=svc.local_ids.begin(); 562 for(xrd::local_ids_t::const_iterator ilid=svc.local_ids.begin();
562 ilid!=svc.local_ids.end(); ++ilid) { 563 ilid!=svc.local_ids.end(); ++ilid) {
563 ep.local_id = ilid->second; 564 ep.local_id = ilid->second;
564 *(oi++) = ep; 565 *(oi++) = ep;
565 } 566 }
566 } 567 }
567 } 568 }
568 } 569 }
569 } 570 }
570 } 571 }
571 572
573 int unknown_encoding(const XML_Char *n,XML_Encoding *i) {
574 for(int ii=0;ii < sizeof(i->map)/sizeof(i->map[0]);++ii)
575 i->map[ii] = ii;
576 i->convert = 0; i->release = 0;
577 return XML_STATUS_OK;
578 }
579
572 }; 580 };
573 581
574 string idiscover(endpoint_discovery_iterator oi,const string& identity) { 582 string idiscover(endpoint_discovery_iterator oi,const string& identity) {
575 idigger_t idigger; 583 idigger_t idigger;
576 return idigger.discover(oi,identity); 584 return idigger.discover(oi,identity);
577 } 585 }
578 586
579 void yadiscover(endpoint_discovery_iterator oi,const string& yurl,const char **types,bool redirs) try { 587 void yadiscover(endpoint_discovery_iterator oi,const string& yurl,const char **types,bool redirs) try {
580 idigger_t idigger; 588 idigger_t idigger;
581 idigger.yadiscover(oi,yurl,types,redirs); 589 idigger.yadiscover(oi,yurl,types,redirs);
582 }catch(exception_curl& ec) { 590 }catch(exception_curl& ec) {
583 if(redirs || ec._error!=CURLE_TOO_MANY_REDIRECTS) 591 if(redirs || ec._error!=CURLE_TOO_MANY_REDIRECTS)
584 throw; 592 throw;
585 } 593 }
586 594
587} 595}