Jason A. Donenfeld | d01a6ee | 2014-01-10 04:59:34 +0100 | [diff] [blame] | 1 | /* parsing.c: parsing of config files |
Lars Hjemli | 7640d90 | 2006-12-10 22:41:14 +0100 | [diff] [blame] | 2 | * |
Lukas Fleischer | f7f26f8 | 2014-01-08 15:10:49 +0100 | [diff] [blame] | 3 | * Copyright (C) 2006-2014 cgit Development Team <cgit@lists.zx2c4.com> |
Lars Hjemli | 7640d90 | 2006-12-10 22:41:14 +0100 | [diff] [blame] | 4 | * |
| 5 | * Licensed under GNU General Public License v2 |
| 6 | * (see COPYING for full license text) |
| 7 | */ |
| 8 | |
Lars Hjemli | 0d169ad | 2006-12-09 15:18:17 +0100 | [diff] [blame] | 9 | #include "cgit.h" |
| 10 | |
Lars Hjemli | 30ccdca | 2007-05-18 03:00:54 +0200 | [diff] [blame] | 11 | /* |
| 12 | * url syntax: [repo ['/' cmd [ '/' path]]] |
| 13 | * repo: any valid repo url, may contain '/' |
| 14 | * cmd: log | commit | diff | tree | view | blob | snapshot |
| 15 | * path: any valid path, may contain '/' |
| 16 | * |
| 17 | */ |
| 18 | void cgit_parse_url(const char *url) |
| 19 | { |
Julian Maurice | 1045179 | 2014-03-28 23:18:29 +0100 | [diff] [blame] | 20 | char *c, *cmd, *p; |
| 21 | struct cgit_repo *repo; |
Lars Hjemli | 30ccdca | 2007-05-18 03:00:54 +0200 | [diff] [blame] | 22 | |
Lars Hjemli | d1f3bbe | 2008-02-16 13:56:09 +0100 | [diff] [blame] | 23 | ctx.repo = NULL; |
Lars Hjemli | 30ccdca | 2007-05-18 03:00:54 +0200 | [diff] [blame] | 24 | if (!url || url[0] == '\0') |
| 25 | return; |
| 26 | |
Lars Hjemli | d1f3bbe | 2008-02-16 13:56:09 +0100 | [diff] [blame] | 27 | ctx.repo = cgit_get_repoinfo(url); |
| 28 | if (ctx.repo) { |
| 29 | ctx.qry.repo = ctx.repo->url; |
Lars Hjemli | 30ccdca | 2007-05-18 03:00:54 +0200 | [diff] [blame] | 30 | return; |
| 31 | } |
| 32 | |
Julian Maurice | 1045179 | 2014-03-28 23:18:29 +0100 | [diff] [blame] | 33 | cmd = NULL; |
| 34 | c = strchr(url, '/'); |
| 35 | while (c) { |
| 36 | c[0] = '\0'; |
| 37 | repo = cgit_get_repoinfo(url); |
| 38 | if (repo) { |
| 39 | ctx.repo = repo; |
| 40 | cmd = c; |
Lars Hjemli | 30ccdca | 2007-05-18 03:00:54 +0200 | [diff] [blame] | 41 | } |
Julian Maurice | 1045179 | 2014-03-28 23:18:29 +0100 | [diff] [blame] | 42 | c[0] = '/'; |
| 43 | c = strchr(c + 1, '/'); |
| 44 | } |
Lars Hjemli | 30ccdca | 2007-05-18 03:00:54 +0200 | [diff] [blame] | 45 | |
Julian Maurice | 1045179 | 2014-03-28 23:18:29 +0100 | [diff] [blame] | 46 | if (ctx.repo) { |
Lars Hjemli | d1f3bbe | 2008-02-16 13:56:09 +0100 | [diff] [blame] | 47 | ctx.qry.repo = ctx.repo->url; |
Lars Hjemli | 30ccdca | 2007-05-18 03:00:54 +0200 | [diff] [blame] | 48 | p = strchr(cmd + 1, '/'); |
| 49 | if (p) { |
| 50 | p[0] = '\0'; |
Lars Hjemli | 3de63b2 | 2007-05-18 13:06:45 +0200 | [diff] [blame] | 51 | if (p[1]) |
Lars Hjemli | d14d77f | 2008-02-16 11:53:40 +0100 | [diff] [blame] | 52 | ctx.qry.path = trim_end(p + 1, '/'); |
Lars Hjemli | 30ccdca | 2007-05-18 03:00:54 +0200 | [diff] [blame] | 53 | } |
Lars Hjemli | e0e4478 | 2008-03-24 01:09:39 +0100 | [diff] [blame] | 54 | if (cmd[1]) |
| 55 | ctx.qry.page = xstrdup(cmd + 1); |
Lars Hjemli | 30ccdca | 2007-05-18 03:00:54 +0200 | [diff] [blame] | 56 | return; |
| 57 | } |
| 58 | } |
| 59 | |
/*
 * Return a newly allocated, NUL-terminated copy of the bytes in the
 * half-open range [head, tail).  An inverted range (tail before head)
 * yields an empty string.  The caller owns the returned buffer.
 */
static char *substr(const char *head, const char *tail)
{
	size_t len;
	char *copy;

	if (tail < head)
		return xstrdup("");

	len = tail - head;
	copy = xmalloc(len + 1);
	strncpy(copy, head, len);
	copy[len] = '\0';
	return copy;
}
| 71 | |
/*
 * Parse the remainder of an identity header line of the form
 *
 *     Name <email> timestamp ...\n
 *
 * starting at t (the text right after the "author "-style keyword).
 *
 * A small state machine walks the line:
 *   mode 1: looking for '<'  -> *name gets the text before it, minus the
 *           single character directly preceding '<'
 *   mode 2: looking for '>'  -> *email gets the text from '<' up to and
 *           including '>'
 *   mode 3: looking for the first digit -> *date gets the number parsed
 *           from there
 *   mode 4: everything else up to the end of the line is skipped
 *
 * If the line ends while still in mode 1 or 2, the text collected so far is
 * stored as the name or email respectively.  Outputs are only written when
 * the corresponding part is found, so callers must pre-initialize them.
 * *name and *email receive freshly allocated strings.
 *
 * Returns a pointer just past the terminating '\n', or to the terminating
 * NUL if the input ends without a newline.
 */
static const char *parse_user(const char *t, char **name, char **email, unsigned long *date)
{
	const char *p = t;
	int mode = 1;

	while (p && *p) {
		if (mode == 1 && *p == '<') {
			*name = substr(t, p - 1);
			t = p;
			mode++;
		} else if (mode == 1 && *p == '\n') {
			*name = substr(t, p);
			p++;
			break;
		} else if (mode == 2 && *p == '>') {
			*email = substr(t, p + 1);
			t = p;
			mode++;
		} else if (mode == 2 && *p == '\n') {
			*email = substr(t, p);
			p++;
			break;
		} else if (mode == 3 && isdigit((unsigned char)*p)) {
			/*
			 * The cast keeps isdigit() defined for bytes >= 0x80 on
			 * platforms where char is signed.  strtoul() matches the
			 * unsigned long destination and has defined behavior on
			 * overflow, unlike atol().
			 */
			*date = strtoul(p, NULL, 10);
			mode++;
		} else if (*p == '\n') {
			p++;
			break;
		}
		p++;
	}
	return p;
}
| 105 | |
#ifdef NO_ICONV
/* Built without iconv: every reencode() call expands to nothing. */
#define reencode(a, b, c)
#else
/*
 * Convert *txt from src_enc to dst_enc in place.
 *
 * On a successful conversion the old buffer is freed and *txt is pointed at
 * the converted string.  *txt is left untouched when it is NULL, when either
 * encoding is NULL, when both encodings compare equal (case-insensitively),
 * or when reencode_string() returns NULL.
 *
 * Returns *txt, or NULL if txt itself is NULL.
 */
static const char *reencode(char **txt, const char *src_enc, const char *dst_enc)
{
	char *converted;

	if (!txt)
		return NULL;

	if (*txt && src_enc && dst_enc && strcasecmp(src_enc, dst_enc) != 0) {
		/* reencode_string() takes the target encoding before the source */
		converted = reencode_string(*txt, dst_enc, src_enc);
		if (converted) {
			free(*txt);
			*txt = converted;
		}
	}
	return *txt;
}
#endif
Lars Hjemli | a8305a9 | 2008-09-14 09:45:37 +0200 | [diff] [blame] | 131 | |
Lars Hjemli | 2101e26 | 2006-12-15 18:17:36 +0100 | [diff] [blame] | 132 | struct commitinfo *cgit_parse_commit(struct commit *commit) |
| 133 | { |
| 134 | struct commitinfo *ret; |
John Keeping | 865afe0 | 2014-07-27 11:56:19 +0100 | [diff] [blame^] | 135 | const char *p = get_cached_commit_buffer(commit, NULL); |
| 136 | const char *t; |
Lars Hjemli | 2101e26 | 2006-12-15 18:17:36 +0100 | [diff] [blame] | 137 | |
| 138 | ret = xmalloc(sizeof(*ret)); |
| 139 | ret->commit = commit; |
Lars Hjemli | 66091f9 | 2007-01-16 18:41:01 +0100 | [diff] [blame] | 140 | ret->author = NULL; |
| 141 | ret->author_email = NULL; |
| 142 | ret->committer = NULL; |
| 143 | ret->committer_email = NULL; |
| 144 | ret->subject = NULL; |
| 145 | ret->msg = NULL; |
Jonathan Bastien-Filiatrault | 3845e17 | 2007-10-26 18:09:06 -0400 | [diff] [blame] | 146 | ret->msg_encoding = NULL; |
Lars Hjemli | 2101e26 | 2006-12-15 18:17:36 +0100 | [diff] [blame] | 147 | |
Ondrej Jirman | 6130231 | 2007-05-26 03:27:49 +0200 | [diff] [blame] | 148 | if (p == NULL) |
| 149 | return ret; |
| 150 | |
Christian Hesse | 79c985e | 2014-05-29 17:35:46 +0200 | [diff] [blame] | 151 | if (!starts_with(p, "tree ")) |
Lars Hjemli | 2101e26 | 2006-12-15 18:17:36 +0100 | [diff] [blame] | 152 | die("Bad commit: %s", sha1_to_hex(commit->object.sha1)); |
| 153 | else |
| 154 | p += 46; // "tree " + hex[40] + "\n" |
| 155 | |
Christian Hesse | 79c985e | 2014-05-29 17:35:46 +0200 | [diff] [blame] | 156 | while (starts_with(p, "parent ")) |
Lars Hjemli | 2101e26 | 2006-12-15 18:17:36 +0100 | [diff] [blame] | 157 | p += 48; // "parent " + hex[40] + "\n" |
| 158 | |
Christian Hesse | 79c985e | 2014-05-29 17:35:46 +0200 | [diff] [blame] | 159 | if (p && starts_with(p, "author ")) { |
Lars Hjemli | a8305a9 | 2008-09-14 09:45:37 +0200 | [diff] [blame] | 160 | p = parse_user(p + 7, &ret->author, &ret->author_email, |
| 161 | &ret->author_date); |
Lars Hjemli | 2101e26 | 2006-12-15 18:17:36 +0100 | [diff] [blame] | 162 | } |
| 163 | |
Christian Hesse | 79c985e | 2014-05-29 17:35:46 +0200 | [diff] [blame] | 164 | if (p && starts_with(p, "committer ")) { |
Lukas Fleischer | 2a7dd4b | 2014-01-15 23:09:08 +0100 | [diff] [blame] | 165 | p = parse_user(p + 10, &ret->committer, &ret->committer_email, |
Lars Hjemli | a8305a9 | 2008-09-14 09:45:37 +0200 | [diff] [blame] | 166 | &ret->committer_date); |
Lars Hjemli | 2101e26 | 2006-12-15 18:17:36 +0100 | [diff] [blame] | 167 | } |
| 168 | |
Christian Hesse | 79c985e | 2014-05-29 17:35:46 +0200 | [diff] [blame] | 169 | if (p && starts_with(p, "encoding ")) { |
Jonathan Bastien-Filiatrault | aa5cc32 | 2007-10-26 18:10:26 -0400 | [diff] [blame] | 170 | p += 9; |
Lars Hjemli | a8305a9 | 2008-09-14 09:45:37 +0200 | [diff] [blame] | 171 | t = strchr(p, '\n'); |
| 172 | if (t) { |
| 173 | ret->msg_encoding = substr(p, t + 1); |
| 174 | p = t + 1; |
| 175 | } |
| 176 | } |
Jonathan Bastien-Filiatrault | aa5cc32 | 2007-10-26 18:10:26 -0400 | [diff] [blame] | 177 | |
Julius Plenz | 0a79942 | 2011-03-10 17:03:23 +0100 | [diff] [blame] | 178 | /* if no special encoding is found, assume UTF-8 */ |
Jason A. Donenfeld | bdae1d8 | 2013-03-03 23:21:33 -0500 | [diff] [blame] | 179 | if (!ret->msg_encoding) |
Julius Plenz | 0a79942 | 2011-03-10 17:03:23 +0100 | [diff] [blame] | 180 | ret->msg_encoding = xstrdup("UTF-8"); |
| 181 | |
Lars Hjemli | a8305a9 | 2008-09-14 09:45:37 +0200 | [diff] [blame] | 182 | // skip unknown header fields |
| 183 | while (p && *p && (*p != '\n')) { |
| 184 | p = strchr(p, '\n'); |
| 185 | if (p) |
| 186 | p++; |
| 187 | } |
Lars Hjemli | 13d2b0b | 2007-10-24 21:14:44 +0200 | [diff] [blame] | 188 | |
Lars Hjemli | a8305a9 | 2008-09-14 09:45:37 +0200 | [diff] [blame] | 189 | // skip empty lines between headers and message |
| 190 | while (p && *p == '\n') |
| 191 | p++; |
| 192 | |
| 193 | if (!p) |
| 194 | return ret; |
Lars Hjemli | 2101e26 | 2006-12-15 18:17:36 +0100 | [diff] [blame] | 195 | |
| 196 | t = strchr(p, '\n'); |
Ondrej Jirman | 3ce6fc1 | 2007-05-26 02:19:38 +0200 | [diff] [blame] | 197 | if (t) { |
Lars Hjemli | a8305a9 | 2008-09-14 09:45:37 +0200 | [diff] [blame] | 198 | ret->subject = substr(p, t); |
Lars Hjemli | 66091f9 | 2007-01-16 18:41:01 +0100 | [diff] [blame] | 199 | p = t + 1; |
Lars Hjemli | 2101e26 | 2006-12-15 18:17:36 +0100 | [diff] [blame] | 200 | |
Lars Hjemli | a8305a9 | 2008-09-14 09:45:37 +0200 | [diff] [blame] | 201 | while (p && *p == '\n') { |
| 202 | p = strchr(p, '\n'); |
| 203 | if (p) |
| 204 | p++; |
| 205 | } |
| 206 | if (p) |
| 207 | ret->msg = xstrdup(p); |
Ondrej Jirman | 3ce6fc1 | 2007-05-26 02:19:38 +0200 | [diff] [blame] | 208 | } else |
Lars Hjemli | a8305a9 | 2008-09-14 09:45:37 +0200 | [diff] [blame] | 209 | ret->subject = xstrdup(p); |
Ondrej Jirman | 3ce6fc1 | 2007-05-26 02:19:38 +0200 | [diff] [blame] | 210 | |
Julius Plenz | 0a79942 | 2011-03-10 17:03:23 +0100 | [diff] [blame] | 211 | reencode(&ret->author, ret->msg_encoding, PAGE_ENCODING); |
| 212 | reencode(&ret->author_email, ret->msg_encoding, PAGE_ENCODING); |
| 213 | reencode(&ret->committer, ret->msg_encoding, PAGE_ENCODING); |
| 214 | reencode(&ret->committer_email, ret->msg_encoding, PAGE_ENCODING); |
| 215 | reencode(&ret->subject, ret->msg_encoding, PAGE_ENCODING); |
| 216 | reencode(&ret->msg, ret->msg_encoding, PAGE_ENCODING); |
Jonathan Bastien-Filiatrault | 7858a30 | 2007-10-26 18:13:41 -0400 | [diff] [blame] | 217 | |
Lars Hjemli | 2101e26 | 2006-12-15 18:17:36 +0100 | [diff] [blame] | 218 | return ret; |
| 219 | } |
Lars Hjemli | a69061f | 2007-01-17 01:09:51 +0100 | [diff] [blame] | 220 | |
| 221 | |
| 222 | struct taginfo *cgit_parse_tag(struct tag *tag) |
| 223 | { |
| 224 | void *data; |
Lars Hjemli | 61c3ca9 | 2007-05-08 22:40:59 +0200 | [diff] [blame] | 225 | enum object_type type; |
Lars Hjemli | a69061f | 2007-01-17 01:09:51 +0100 | [diff] [blame] | 226 | unsigned long size; |
John Keeping | 93d8ef8 | 2014-07-27 11:56:18 +0100 | [diff] [blame] | 227 | const char *p; |
Lars Hjemli | a69061f | 2007-01-17 01:09:51 +0100 | [diff] [blame] | 228 | struct taginfo *ret; |
| 229 | |
Lars Hjemli | 61c3ca9 | 2007-05-08 22:40:59 +0200 | [diff] [blame] | 230 | data = read_sha1_file(tag->object.sha1, &type, &size); |
| 231 | if (!data || type != OBJ_TAG) { |
Lars Hjemli | a69061f | 2007-01-17 01:09:51 +0100 | [diff] [blame] | 232 | free(data); |
| 233 | return 0; |
| 234 | } |
Lars Hjemli | 47a81c7 | 2007-05-15 23:28:40 +0200 | [diff] [blame] | 235 | |
Lars Hjemli | a69061f | 2007-01-17 01:09:51 +0100 | [diff] [blame] | 236 | ret = xmalloc(sizeof(*ret)); |
| 237 | ret->tagger = NULL; |
| 238 | ret->tagger_email = NULL; |
| 239 | ret->tagger_date = 0; |
| 240 | ret->msg = NULL; |
| 241 | |
| 242 | p = data; |
| 243 | |
Lars Hjemli | ebd7b0f | 2007-02-03 16:11:41 +0100 | [diff] [blame] | 244 | while (p && *p) { |
Lars Hjemli | a69061f | 2007-01-17 01:09:51 +0100 | [diff] [blame] | 245 | if (*p == '\n') |
| 246 | break; |
| 247 | |
Christian Hesse | 79c985e | 2014-05-29 17:35:46 +0200 | [diff] [blame] | 248 | if (starts_with(p, "tagger ")) { |
Lars Hjemli | a8305a9 | 2008-09-14 09:45:37 +0200 | [diff] [blame] | 249 | p = parse_user(p + 7, &ret->tagger, &ret->tagger_email, |
| 250 | &ret->tagger_date); |
| 251 | } else { |
| 252 | p = strchr(p, '\n'); |
| 253 | if (p) |
| 254 | p++; |
Lars Hjemli | a69061f | 2007-01-17 01:09:51 +0100 | [diff] [blame] | 255 | } |
Lars Hjemli | a69061f | 2007-01-17 01:09:51 +0100 | [diff] [blame] | 256 | } |
| 257 | |
Lars Hjemli | a8305a9 | 2008-09-14 09:45:37 +0200 | [diff] [blame] | 258 | // skip empty lines between headers and message |
| 259 | while (p && *p == '\n') |
| 260 | p++; |
Lars Hjemli | 13d2b0b | 2007-10-24 21:14:44 +0200 | [diff] [blame] | 261 | |
Lars Hjemli | ebd7b0f | 2007-02-03 16:11:41 +0100 | [diff] [blame] | 262 | if (p && *p) |
Lars Hjemli | a69061f | 2007-01-17 01:09:51 +0100 | [diff] [blame] | 263 | ret->msg = xstrdup(p); |
| 264 | free(data); |
| 265 | return ret; |
| 266 | } |