blob: 3dbd12293186baad1a5cb07c67890b8b033d4083 [file] [log] [blame]
Jason A. Donenfeldd01a6ee2014-01-10 04:59:34 +01001/* parsing.c: parsing of config files
Lars Hjemli7640d902006-12-10 22:41:14 +01002 *
Lukas Fleischerf7f26f82014-01-08 15:10:49 +01003 * Copyright (C) 2006-2014 cgit Development Team <cgit@lists.zx2c4.com>
Lars Hjemli7640d902006-12-10 22:41:14 +01004 *
5 * Licensed under GNU General Public License v2
6 * (see COPYING for full license text)
7 */
8
Lars Hjemli0d169ad2006-12-09 15:18:17 +01009#include "cgit.h"
10
Lars Hjemli30ccdca2007-05-18 03:00:54 +020011/*
12 * url syntax: [repo ['/' cmd [ '/' path]]]
13 * repo: any valid repo url, may contain '/'
14 * cmd: log | commit | diff | tree | view | blob | snapshot
15 * path: any valid path, may contain '/'
16 *
17 */
18void cgit_parse_url(const char *url)
19{
Julian Maurice10451792014-03-28 23:18:29 +010020 char *c, *cmd, *p;
21 struct cgit_repo *repo;
Lars Hjemli30ccdca2007-05-18 03:00:54 +020022
Lars Hjemlid1f3bbe2008-02-16 13:56:09 +010023 ctx.repo = NULL;
Lars Hjemli30ccdca2007-05-18 03:00:54 +020024 if (!url || url[0] == '\0')
25 return;
26
Lars Hjemlid1f3bbe2008-02-16 13:56:09 +010027 ctx.repo = cgit_get_repoinfo(url);
28 if (ctx.repo) {
29 ctx.qry.repo = ctx.repo->url;
Lars Hjemli30ccdca2007-05-18 03:00:54 +020030 return;
31 }
32
Julian Maurice10451792014-03-28 23:18:29 +010033 cmd = NULL;
34 c = strchr(url, '/');
35 while (c) {
36 c[0] = '\0';
37 repo = cgit_get_repoinfo(url);
38 if (repo) {
39 ctx.repo = repo;
40 cmd = c;
Lars Hjemli30ccdca2007-05-18 03:00:54 +020041 }
Julian Maurice10451792014-03-28 23:18:29 +010042 c[0] = '/';
43 c = strchr(c + 1, '/');
44 }
Lars Hjemli30ccdca2007-05-18 03:00:54 +020045
Julian Maurice10451792014-03-28 23:18:29 +010046 if (ctx.repo) {
Lars Hjemlid1f3bbe2008-02-16 13:56:09 +010047 ctx.qry.repo = ctx.repo->url;
Lars Hjemli30ccdca2007-05-18 03:00:54 +020048 p = strchr(cmd + 1, '/');
49 if (p) {
50 p[0] = '\0';
Lars Hjemli3de63b22007-05-18 13:06:45 +020051 if (p[1])
Lars Hjemlid14d77f2008-02-16 11:53:40 +010052 ctx.qry.path = trim_end(p + 1, '/');
Lars Hjemli30ccdca2007-05-18 03:00:54 +020053 }
Lars Hjemlie0e44782008-03-24 01:09:39 +010054 if (cmd[1])
55 ctx.qry.page = xstrdup(cmd + 1);
Lars Hjemli30ccdca2007-05-18 03:00:54 +020056 return;
57 }
58}
59
/*
 * Return a newly allocated, NUL-terminated copy of the characters in
 * [head, tail). If tail lies before head an empty string is returned.
 */
static char *substr(const char *head, const char *tail)
{
	size_t len;
	char *copy;

	if (tail < head)
		return xstrdup("");

	len = tail - head;
	copy = xmalloc(len + 1);
	/* strncpy stops at an embedded NUL and zero-pads the remainder */
	strncpy(copy, head, len);
	copy[len] = '\0';
	return copy;
}
71
/*
 * Parse the remainder of an ident line of the form
 *     name <email> timestamp ...\n
 * starting at t.
 *
 * *name receives the text before '<' (minus the character directly in
 * front of it), *email receives the address including the enclosing
 * '<' and '>', and *date receives atol() of the first digit run after
 * the '>'. If the line ends early, the field being scanned at that point
 * is filled with the text up to the newline; later fields are left
 * untouched.
 *
 * Returns a pointer just past the terminating newline, or to the
 * terminating NUL if no newline was seen (NULL if t is NULL).
 */
static const char *parse_user(const char *t, char **name, char **email, unsigned long *date)
{
	enum { IN_NAME = 1, IN_EMAIL, BEFORE_DATE, AFTER_DATE };
	const char *field = t;	/* start of the field currently scanned */
	const char *cur;
	int state = IN_NAME;

	for (cur = t; cur && *cur; cur++) {
		if (*cur == '\n') {
			/* end of line: flush whatever field was open */
			if (state == IN_NAME)
				*name = substr(field, cur);
			else if (state == IN_EMAIL)
				*email = substr(field, cur);
			return cur + 1;
		}

		switch (state) {
		case IN_NAME:
			if (*cur == '<') {
				*name = substr(field, cur - 1);
				field = cur;
				state = IN_EMAIL;
			}
			break;
		case IN_EMAIL:
			if (*cur == '>') {
				*email = substr(field, cur + 1);
				field = cur;
				state = BEFORE_DATE;
			}
			break;
		case BEFORE_DATE:
			if (isdigit(*cur)) {
				*date = atol(cur);
				state = AFTER_DATE;
			}
			break;
		default:
			/* everything after the timestamp is ignored */
			break;
		}
	}
	return cur;
}
105
#ifdef NO_ICONV
/* Without iconv support re-encoding is compiled out entirely. */
#define reencode(a, b, c)
#else
/*
 * Convert *txt from src_enc to dst_enc in place.
 *
 * On a successful conversion the old string is freed and *txt is pointed
 * at the converted copy. *txt is left untouched when it is NULL, when
 * either encoding is NULL, when both encodings compare equal ignoring
 * case, or when reencode_string() returns NULL.
 *
 * Returns the (possibly replaced) *txt, or NULL if txt itself is NULL.
 */
static const char *reencode(char **txt, const char *src_enc, const char *dst_enc)
{
	char *converted;

	if (txt == NULL)
		return NULL;

	/* nothing to do: no text, unknown encoding, or identical encodings */
	if (*txt == NULL || src_enc == NULL || dst_enc == NULL ||
	    strcasecmp(src_enc, dst_enc) == 0)
		return *txt;

	converted = reencode_string(*txt, dst_enc, src_enc);
	if (converted == NULL)
		return *txt;

	free(*txt);
	*txt = converted;
	return converted;
}
#endif
Lars Hjemlia8305a92008-09-14 09:45:37 +0200131
Lars Hjemli2101e262006-12-15 18:17:36 +0100132struct commitinfo *cgit_parse_commit(struct commit *commit)
133{
134 struct commitinfo *ret;
John Keeping865afe02014-07-27 11:56:19 +0100135 const char *p = get_cached_commit_buffer(commit, NULL);
136 const char *t;
Lars Hjemli2101e262006-12-15 18:17:36 +0100137
138 ret = xmalloc(sizeof(*ret));
139 ret->commit = commit;
Lars Hjemli66091f92007-01-16 18:41:01 +0100140 ret->author = NULL;
141 ret->author_email = NULL;
142 ret->committer = NULL;
143 ret->committer_email = NULL;
144 ret->subject = NULL;
145 ret->msg = NULL;
Jonathan Bastien-Filiatrault3845e172007-10-26 18:09:06 -0400146 ret->msg_encoding = NULL;
Lars Hjemli2101e262006-12-15 18:17:36 +0100147
Ondrej Jirman61302312007-05-26 03:27:49 +0200148 if (p == NULL)
149 return ret;
150
Christian Hesse79c985e2014-05-29 17:35:46 +0200151 if (!starts_with(p, "tree "))
Lars Hjemli2101e262006-12-15 18:17:36 +0100152 die("Bad commit: %s", sha1_to_hex(commit->object.sha1));
153 else
154 p += 46; // "tree " + hex[40] + "\n"
155
Christian Hesse79c985e2014-05-29 17:35:46 +0200156 while (starts_with(p, "parent "))
Lars Hjemli2101e262006-12-15 18:17:36 +0100157 p += 48; // "parent " + hex[40] + "\n"
158
Christian Hesse79c985e2014-05-29 17:35:46 +0200159 if (p && starts_with(p, "author ")) {
Lars Hjemlia8305a92008-09-14 09:45:37 +0200160 p = parse_user(p + 7, &ret->author, &ret->author_email,
161 &ret->author_date);
Lars Hjemli2101e262006-12-15 18:17:36 +0100162 }
163
Christian Hesse79c985e2014-05-29 17:35:46 +0200164 if (p && starts_with(p, "committer ")) {
Lukas Fleischer2a7dd4b2014-01-15 23:09:08 +0100165 p = parse_user(p + 10, &ret->committer, &ret->committer_email,
Lars Hjemlia8305a92008-09-14 09:45:37 +0200166 &ret->committer_date);
Lars Hjemli2101e262006-12-15 18:17:36 +0100167 }
168
Christian Hesse79c985e2014-05-29 17:35:46 +0200169 if (p && starts_with(p, "encoding ")) {
Jonathan Bastien-Filiatraultaa5cc322007-10-26 18:10:26 -0400170 p += 9;
Lars Hjemlia8305a92008-09-14 09:45:37 +0200171 t = strchr(p, '\n');
172 if (t) {
173 ret->msg_encoding = substr(p, t + 1);
174 p = t + 1;
175 }
176 }
Jonathan Bastien-Filiatraultaa5cc322007-10-26 18:10:26 -0400177
Julius Plenz0a799422011-03-10 17:03:23 +0100178 /* if no special encoding is found, assume UTF-8 */
Jason A. Donenfeldbdae1d82013-03-03 23:21:33 -0500179 if (!ret->msg_encoding)
Julius Plenz0a799422011-03-10 17:03:23 +0100180 ret->msg_encoding = xstrdup("UTF-8");
181
Lars Hjemlia8305a92008-09-14 09:45:37 +0200182 // skip unknown header fields
183 while (p && *p && (*p != '\n')) {
184 p = strchr(p, '\n');
185 if (p)
186 p++;
187 }
Lars Hjemli13d2b0b2007-10-24 21:14:44 +0200188
Lars Hjemlia8305a92008-09-14 09:45:37 +0200189 // skip empty lines between headers and message
190 while (p && *p == '\n')
191 p++;
192
193 if (!p)
194 return ret;
Lars Hjemli2101e262006-12-15 18:17:36 +0100195
196 t = strchr(p, '\n');
Ondrej Jirman3ce6fc12007-05-26 02:19:38 +0200197 if (t) {
Lars Hjemlia8305a92008-09-14 09:45:37 +0200198 ret->subject = substr(p, t);
Lars Hjemli66091f92007-01-16 18:41:01 +0100199 p = t + 1;
Lars Hjemli2101e262006-12-15 18:17:36 +0100200
Lars Hjemlia8305a92008-09-14 09:45:37 +0200201 while (p && *p == '\n') {
202 p = strchr(p, '\n');
203 if (p)
204 p++;
205 }
206 if (p)
207 ret->msg = xstrdup(p);
Ondrej Jirman3ce6fc12007-05-26 02:19:38 +0200208 } else
Lars Hjemlia8305a92008-09-14 09:45:37 +0200209 ret->subject = xstrdup(p);
Ondrej Jirman3ce6fc12007-05-26 02:19:38 +0200210
Julius Plenz0a799422011-03-10 17:03:23 +0100211 reencode(&ret->author, ret->msg_encoding, PAGE_ENCODING);
212 reencode(&ret->author_email, ret->msg_encoding, PAGE_ENCODING);
213 reencode(&ret->committer, ret->msg_encoding, PAGE_ENCODING);
214 reencode(&ret->committer_email, ret->msg_encoding, PAGE_ENCODING);
215 reencode(&ret->subject, ret->msg_encoding, PAGE_ENCODING);
216 reencode(&ret->msg, ret->msg_encoding, PAGE_ENCODING);
Jonathan Bastien-Filiatrault7858a302007-10-26 18:13:41 -0400217
Lars Hjemli2101e262006-12-15 18:17:36 +0100218 return ret;
219}
Lars Hjemlia69061f2007-01-17 01:09:51 +0100220
221
222struct taginfo *cgit_parse_tag(struct tag *tag)
223{
224 void *data;
Lars Hjemli61c3ca92007-05-08 22:40:59 +0200225 enum object_type type;
Lars Hjemlia69061f2007-01-17 01:09:51 +0100226 unsigned long size;
John Keeping93d8ef82014-07-27 11:56:18 +0100227 const char *p;
Lars Hjemlia69061f2007-01-17 01:09:51 +0100228 struct taginfo *ret;
229
Lars Hjemli61c3ca92007-05-08 22:40:59 +0200230 data = read_sha1_file(tag->object.sha1, &type, &size);
231 if (!data || type != OBJ_TAG) {
Lars Hjemlia69061f2007-01-17 01:09:51 +0100232 free(data);
233 return 0;
234 }
Lars Hjemli47a81c72007-05-15 23:28:40 +0200235
Lars Hjemlia69061f2007-01-17 01:09:51 +0100236 ret = xmalloc(sizeof(*ret));
237 ret->tagger = NULL;
238 ret->tagger_email = NULL;
239 ret->tagger_date = 0;
240 ret->msg = NULL;
241
242 p = data;
243
Lars Hjemliebd7b0f2007-02-03 16:11:41 +0100244 while (p && *p) {
Lars Hjemlia69061f2007-01-17 01:09:51 +0100245 if (*p == '\n')
246 break;
247
Christian Hesse79c985e2014-05-29 17:35:46 +0200248 if (starts_with(p, "tagger ")) {
Lars Hjemlia8305a92008-09-14 09:45:37 +0200249 p = parse_user(p + 7, &ret->tagger, &ret->tagger_email,
250 &ret->tagger_date);
251 } else {
252 p = strchr(p, '\n');
253 if (p)
254 p++;
Lars Hjemlia69061f2007-01-17 01:09:51 +0100255 }
Lars Hjemlia69061f2007-01-17 01:09:51 +0100256 }
257
Lars Hjemlia8305a92008-09-14 09:45:37 +0200258 // skip empty lines between headers and message
259 while (p && *p == '\n')
260 p++;
Lars Hjemli13d2b0b2007-10-24 21:14:44 +0200261
Lars Hjemliebd7b0f2007-02-03 16:11:41 +0100262 if (p && *p)
Lars Hjemlia69061f2007-01-17 01:09:51 +0100263 ret->msg = xstrdup(p);
264 free(data);
265 return ret;
266}