summaryrefslogtreecommitdiffabout
path: root/parsing.c
authorLars Hjemli <hjemli@gmail.com>2007-11-05 21:27:43 (UTC)
committer Jonathan Bastien-Filiatrault <joe@x2a.org>2007-11-05 23:13:31 (UTC)
commita2ebbd6948da96172108db5e9c02c141923ad05c (patch) (unidiff)
tree9c40233ffcd35f1b20bb07a04bdb8c23d649e1ee /parsing.c
parent7858a309d7671109950ec940f893c2d112d36b99 (diff)
downloadcgit-a2ebbd6948da96172108db5e9c02c141923ad05c.zip
cgit-a2ebbd6948da96172108db5e9c02c141923ad05c.tar.gz
cgit-a2ebbd6948da96172108db5e9c02c141923ad05c.tar.bz2
Use utf8::reencode_string from git
This replaces the iconv-support in cgit with similar functions already existing in git. Signed-off-by: Lars Hjemli <hjemli@gmai.com>
Diffstat (limited to 'parsing.c') (more/less context) (ignore whitespace changes)
-rw-r--r--parsing.c64
1 files changed, 4 insertions, 60 deletions
diff --git a/parsing.c b/parsing.c
index c731084..e8c7ab9 100644
--- a/parsing.c
+++ b/parsing.c
@@ -1,42 +1,40 @@
1/* config.c: parsing of config files 1/* config.c: parsing of config files
2 * 2 *
3 * Copyright (C) 2006 Lars Hjemli 3 * Copyright (C) 2006 Lars Hjemli
4 * 4 *
5 * Licensed under GNU General Public License v2 5 * Licensed under GNU General Public License v2
6 * (see COPYING for full license text) 6 * (see COPYING for full license text)
7 */ 7 */
8 8
9#include <iconv.h>
10
11#include "cgit.h" 9#include "cgit.h"
12 10
13int next_char(FILE *f) 11int next_char(FILE *f)
14{ 12{
15 int c = fgetc(f); 13 int c = fgetc(f);
16 if (c=='\r') { 14 if (c=='\r') {
17 c = fgetc(f); 15 c = fgetc(f);
18 if (c!='\n') { 16 if (c!='\n') {
19 ungetc(c, f); 17 ungetc(c, f);
20 c = '\r'; 18 c = '\r';
21 } 19 }
22 } 20 }
23 return c; 21 return c;
24} 22}
25 23
26void skip_line(FILE *f) 24void skip_line(FILE *f)
27{ 25{
28 int c; 26 int c;
29 27
30 while((c=next_char(f)) && c!='\n' && c!=EOF) 28 while((c=next_char(f)) && c!='\n' && c!=EOF)
31 ; 29 ;
32} 30}
33 31
34int read_config_line(FILE *f, char *line, const char **value, int bufsize) 32int read_config_line(FILE *f, char *line, const char **value, int bufsize)
35{ 33{
36 int i = 0, isname = 0; 34 int i = 0, isname = 0;
37 35
38 *value = NULL; 36 *value = NULL;
39 while(i<bufsize-1) { 37 while(i<bufsize-1) {
40 int c = next_char(f); 38 int c = next_char(f);
41 if (!isname && (c=='#' || c==';')) { 39 if (!isname && (c=='#' || c==';')) {
42 skip_line(f); 40 skip_line(f);
@@ -149,120 +147,64 @@ void cgit_parse_url(const char *url)
149 if (!url || url[0] == '\0') 147 if (!url || url[0] == '\0')
150 return; 148 return;
151 149
152 cgit_repo = cgit_get_repoinfo(url); 150 cgit_repo = cgit_get_repoinfo(url);
153 if (cgit_repo) { 151 if (cgit_repo) {
154 cgit_query_repo = cgit_repo->url; 152 cgit_query_repo = cgit_repo->url;
155 return; 153 return;
156 } 154 }
157 155
158 cmd = strchr(url, '/'); 156 cmd = strchr(url, '/');
159 while (!cgit_repo && cmd) { 157 while (!cgit_repo && cmd) {
160 cmd[0] = '\0'; 158 cmd[0] = '\0';
161 cgit_repo = cgit_get_repoinfo(url); 159 cgit_repo = cgit_get_repoinfo(url);
162 if (cgit_repo == NULL) { 160 if (cgit_repo == NULL) {
163 cmd[0] = '/'; 161 cmd[0] = '/';
164 cmd = strchr(cmd + 1, '/'); 162 cmd = strchr(cmd + 1, '/');
165 continue; 163 continue;
166 } 164 }
167 165
168 cgit_query_repo = cgit_repo->url; 166 cgit_query_repo = cgit_repo->url;
169 p = strchr(cmd + 1, '/'); 167 p = strchr(cmd + 1, '/');
170 if (p) { 168 if (p) {
171 p[0] = '\0'; 169 p[0] = '\0';
172 if (p[1]) 170 if (p[1])
173 cgit_query_path = trim_end(p + 1, '/'); 171 cgit_query_path = trim_end(p + 1, '/');
174 } 172 }
175 cgit_cmd = cgit_get_cmd_index(cmd + 1); 173 cgit_cmd = cgit_get_cmd_index(cmd + 1);
176 cgit_query_page = xstrdup(cmd + 1); 174 cgit_query_page = xstrdup(cmd + 1);
177 return; 175 return;
178 } 176 }
179} 177}
180 178
181static char *iconv_msg(char *msg, const char *encoding)
182{
183 iconv_t msg_conv = iconv_open(PAGE_ENCODING, encoding);
184 size_t inlen = strlen(msg);
185 char *in;
186 char *out;
187 size_t inleft;
188 size_t outleft;
189 char *buf;
190 char *ret;
191 size_t buf_sz;
192 int again, fail;
193
194 if(msg_conv == (iconv_t)-1)
195 return NULL;
196
197 buf_sz = inlen * 2;
198 buf = xmalloc(buf_sz+1);
199 do {
200 in = msg;
201 inleft = inlen;
202
203 out = buf;
204 outleft = buf_sz;
205 iconv(msg_conv, &in, &inleft, &out, &outleft);
206
207 if(inleft == 0) {
208 fail = 0;
209 again = 0;
210 } else if(inleft != 0 && errno == E2BIG) {
211 fail = 0;
212 again = 1;
213
214 buf_sz *= 2;
215 free(buf);
216 buf = xmalloc(buf_sz+1);
217 } else {
218 fail = 1;
219 again = 0;
220 }
221 } while(again && !fail);
222
223 if(fail) {
224 free(buf);
225 ret = NULL;
226 } else {
227 buf = xrealloc(buf, out - buf);
228 *out = 0;
229 ret = buf;
230 }
231
232 iconv_close(msg_conv);
233
234 return ret;
235}
236
237char *substr(const char *head, const char *tail) 179char *substr(const char *head, const char *tail)
238{ 180{
239 char *buf; 181 char *buf;
240 182
241 buf = xmalloc(tail - head + 1); 183 buf = xmalloc(tail - head + 1);
242 strncpy(buf, head, tail - head); 184 strncpy(buf, head, tail - head);
243 buf[tail - head] = '\0'; 185 buf[tail - head] = '\0';
244 return buf; 186 return buf;
245} 187}
246 188
247struct commitinfo *cgit_parse_commit(struct commit *commit) 189struct commitinfo *cgit_parse_commit(struct commit *commit)
248{ 190{
249 struct commitinfo *ret; 191 struct commitinfo *ret;
250 char *p = commit->buffer, *t = commit->buffer; 192 char *p = commit->buffer, *t = commit->buffer;
251 193
252 ret = xmalloc(sizeof(*ret)); 194 ret = xmalloc(sizeof(*ret));
253 ret->commit = commit; 195 ret->commit = commit;
254 ret->author = NULL; 196 ret->author = NULL;
255 ret->author_email = NULL; 197 ret->author_email = NULL;
256 ret->committer = NULL; 198 ret->committer = NULL;
257 ret->committer_email = NULL; 199 ret->committer_email = NULL;
258 ret->subject = NULL; 200 ret->subject = NULL;
259 ret->msg = NULL; 201 ret->msg = NULL;
260 ret->msg_encoding = NULL; 202 ret->msg_encoding = NULL;
261 203
262 if (p == NULL) 204 if (p == NULL)
263 return ret; 205 return ret;
264 206
265 if (strncmp(p, "tree ", 5)) 207 if (strncmp(p, "tree ", 5))
266 die("Bad commit: %s", sha1_to_hex(commit->object.sha1)); 208 die("Bad commit: %s", sha1_to_hex(commit->object.sha1));
267 else 209 else
268 p += 46; // "tree " + hex[40] + "\n" 210 p += 46; // "tree " + hex[40] + "\n"
@@ -292,71 +234,73 @@ struct commitinfo *cgit_parse_commit(struct commit *commit)
292 p = strchr(t, '\n') + 1; 234 p = strchr(t, '\n') + 1;
293 } 235 }
294 236
295 if (!strncmp(p, "encoding ", 9)) { 237 if (!strncmp(p, "encoding ", 9)) {
296 p += 9; 238 p += 9;
297 t = strchr(p, '\n') + 1; 239 t = strchr(p, '\n') + 1;
298 ret->msg_encoding = substr(p, t); 240 ret->msg_encoding = substr(p, t);
299 p = t; 241 p = t;
300 } else 242 } else
301 ret->msg_encoding = xstrdup(PAGE_ENCODING); 243 ret->msg_encoding = xstrdup(PAGE_ENCODING);
302 244
303 while (*p && (*p != '\n')) 245 while (*p && (*p != '\n'))
304 p = strchr(p, '\n') + 1; // skip unknown header fields 246 p = strchr(p, '\n') + 1; // skip unknown header fields
305 247
306 while (*p == '\n') 248 while (*p == '\n')
307 p = strchr(p, '\n') + 1; 249 p = strchr(p, '\n') + 1;
308 250
309 t = strchr(p, '\n'); 251 t = strchr(p, '\n');
310 if (t) { 252 if (t) {
311 if (*t == '\0') 253 if (*t == '\0')
312 ret->subject = "** empty **"; 254 ret->subject = "** empty **";
313 else 255 else
314 ret->subject = substr(p, t); 256 ret->subject = substr(p, t);
315 p = t + 1; 257 p = t + 1;
316 258
317 while (*p == '\n') 259 while (*p == '\n')
318 p = strchr(p, '\n') + 1; 260 p = strchr(p, '\n') + 1;
319 ret->msg = xstrdup(p); 261 ret->msg = xstrdup(p);
320 } else 262 } else
321 ret->subject = substr(p, p+strlen(p)); 263 ret->subject = substr(p, p+strlen(p));
322 264
323 if(strcmp(ret->msg_encoding, PAGE_ENCODING)) { 265 if(strcmp(ret->msg_encoding, PAGE_ENCODING)) {
324 t = iconv_msg(ret->subject, ret->msg_encoding); 266 t = reencode_string(ret->subject, PAGE_ENCODING,
267 ret->msg_encoding);
325 if(t) { 268 if(t) {
326 free(ret->subject); 269 free(ret->subject);
327 ret->subject = t; 270 ret->subject = t;
328 } 271 }
329 272
330 t = iconv_msg(ret->msg, ret->msg_encoding); 273 t = reencode_string(ret->msg, PAGE_ENCODING,
274 ret->msg_encoding);
331 if(t) { 275 if(t) {
332 free(ret->msg); 276 free(ret->msg);
333 ret->msg = t; 277 ret->msg = t;
334 } 278 }
335 } 279 }
336 280
337 return ret; 281 return ret;
338} 282}
339 283
340 284
341struct taginfo *cgit_parse_tag(struct tag *tag) 285struct taginfo *cgit_parse_tag(struct tag *tag)
342{ 286{
343 void *data; 287 void *data;
344 enum object_type type; 288 enum object_type type;
345 unsigned long size; 289 unsigned long size;
346 char *p, *t; 290 char *p, *t;
347 struct taginfo *ret; 291 struct taginfo *ret;
348 292
349 data = read_sha1_file(tag->object.sha1, &type, &size); 293 data = read_sha1_file(tag->object.sha1, &type, &size);
350 if (!data || type != OBJ_TAG) { 294 if (!data || type != OBJ_TAG) {
351 free(data); 295 free(data);
352 return 0; 296 return 0;
353 } 297 }
354 298
355 ret = xmalloc(sizeof(*ret)); 299 ret = xmalloc(sizeof(*ret));
356 ret->tagger = NULL; 300 ret->tagger = NULL;
357 ret->tagger_email = NULL; 301 ret->tagger_email = NULL;
358 ret->tagger_date = 0; 302 ret->tagger_date = 0;
359 ret->msg = NULL; 303 ret->msg = NULL;
360 304
361 p = data; 305 p = data;
362 306