all repos — cgit @ b431282c91deea24916578395d88084261410968

a hyperfast web frontend for git written in c

parsing.c (view raw)

/* parsing.c: parsing of request URLs, commit objects and tag objects
 *
 * Copyright (C) 2006-2014 cgit Development Team <cgit@lists.zx2c4.com>
 *
 * Licensed under GNU General Public License v2
 *   (see COPYING for full license text)
 */
  8
  9#include "cgit.h"
 10
 11/*
 12 * url syntax: [repo ['/' cmd [ '/' path]]]
 13 *   repo: any valid repo url, may contain '/'
 14 *   cmd:  log | commit | diff | tree | view | blob | snapshot
 15 *   path: any valid path, may contain '/'
 16 *
 17 */
 18void cgit_parse_url(const char *url)
 19{
 20	char *c, *cmd, *p;
 21	struct cgit_repo *repo;
 22
 23	ctx.repo = NULL;
 24	if (!url || url[0] == '\0')
 25		return;
 26
 27	ctx.repo = cgit_get_repoinfo(url);
 28	if (ctx.repo) {
 29		ctx.qry.repo = ctx.repo->url;
 30		return;
 31	}
 32
 33	cmd = NULL;
 34	c = strchr(url, '/');
 35	while (c) {
 36		c[0] = '\0';
 37		repo = cgit_get_repoinfo(url);
 38		if (repo) {
 39			ctx.repo = repo;
 40			cmd = c;
 41		}
 42		c[0] = '/';
 43		c = strchr(c + 1, '/');
 44	}
 45
 46	if (ctx.repo) {
 47		ctx.qry.repo = ctx.repo->url;
 48		p = strchr(cmd + 1, '/');
 49		if (p) {
 50			p[0] = '\0';
 51			if (p[1])
 52				ctx.qry.path = trim_end(p + 1, '/');
 53		}
 54		if (cmd[1])
 55			ctx.qry.page = xstrdup(cmd + 1);
 56		return;
 57	}
 58}
 59
 60static char *substr(const char *head, const char *tail)
 61{
 62	char *buf;
 63
 64	if (tail < head)
 65		return xstrdup("");
 66	buf = xmalloc(tail - head + 1);
 67	strncpy(buf, head, tail - head);
 68	buf[tail - head] = '\0';
 69	return buf;
 70}
 71
 72static char *parse_user(char *t, char **name, char **email, unsigned long *date)
 73{
 74	char *p = t;
 75	int mode = 1;
 76
 77	while (p && *p) {
 78		if (mode == 1 && *p == '<') {
 79			*name = substr(t, p - 1);
 80			t = p;
 81			mode++;
 82		} else if (mode == 1 && *p == '\n') {
 83			*name = substr(t, p);
 84			p++;
 85			break;
 86		} else if (mode == 2 && *p == '>') {
 87			*email = substr(t, p + 1);
 88			t = p;
 89			mode++;
 90		} else if (mode == 2 && *p == '\n') {
 91			*email = substr(t, p);
 92			p++;
 93			break;
 94		} else if (mode == 3 && isdigit(*p)) {
 95			*date = atol(p);
 96			mode++;
 97		} else if (*p == '\n') {
 98			p++;
 99			break;
100		}
101		p++;
102	}
103	return p;
104}
105
#ifdef NO_ICONV
#define reencode(a, b, c)
#else
/*
 * Convert *txt from src_enc to dst_enc in place.
 *
 * On a successful conversion the old string is freed and *txt is replaced
 * by the string returned from reencode_string(). *txt is left untouched
 * when it is NULL, when either encoding name is NULL, when both names are
 * equal ignoring case, or when reencode_string() returns NULL.
 *
 * Returns *txt, or NULL when txt itself is NULL.
 */
static const char *reencode(char **txt, const char *src_enc, const char *dst_enc)
{
	char *converted;

	if (txt == NULL)
		return NULL;

	/* strcasecmp is only reached once both encoding names are non-NULL */
	if (*txt == NULL || src_enc == NULL || dst_enc == NULL ||
	    strcasecmp(src_enc, dst_enc) == 0)
		return *txt;

	converted = reencode_string(*txt, dst_enc, src_enc);
	if (converted != NULL) {
		free(*txt);
		*txt = converted;
	}
	return *txt;
}
#endif
131
132struct commitinfo *cgit_parse_commit(struct commit *commit)
133{
134	struct commitinfo *ret;
135	char *p = commit->buffer, *t;
136
137	ret = xmalloc(sizeof(*ret));
138	ret->commit = commit;
139	ret->author = NULL;
140	ret->author_email = NULL;
141	ret->committer = NULL;
142	ret->committer_email = NULL;
143	ret->subject = NULL;
144	ret->msg = NULL;
145	ret->msg_encoding = NULL;
146
147	if (p == NULL)
148		return ret;
149
150	if (prefixcmp(p, "tree "))
151		die("Bad commit: %s", sha1_to_hex(commit->object.sha1));
152	else
153		p += 46; // "tree " + hex[40] + "\n"
154
155	while (!prefixcmp(p, "parent "))
156		p += 48; // "parent " + hex[40] + "\n"
157
158	if (p && !prefixcmp(p, "author ")) {
159		p = parse_user(p + 7, &ret->author, &ret->author_email,
160			&ret->author_date);
161	}
162
163	if (p && !prefixcmp(p, "committer ")) {
164		p = parse_user(p + 10, &ret->committer, &ret->committer_email,
165			&ret->committer_date);
166	}
167
168	if (p && !prefixcmp(p, "encoding ")) {
169		p += 9;
170		t = strchr(p, '\n');
171		if (t) {
172			ret->msg_encoding = substr(p, t + 1);
173			p = t + 1;
174		}
175	}
176
177	/* if no special encoding is found, assume UTF-8 */
178	if (!ret->msg_encoding)
179		ret->msg_encoding = xstrdup("UTF-8");
180
181	// skip unknown header fields
182	while (p && *p && (*p != '\n')) {
183		p = strchr(p, '\n');
184		if (p)
185			p++;
186	}
187
188	// skip empty lines between headers and message
189	while (p && *p == '\n')
190		p++;
191
192	if (!p)
193		return ret;
194
195	t = strchr(p, '\n');
196	if (t) {
197		ret->subject = substr(p, t);
198		p = t + 1;
199
200		while (p && *p == '\n') {
201			p = strchr(p, '\n');
202			if (p)
203				p++;
204		}
205		if (p)
206			ret->msg = xstrdup(p);
207	} else
208		ret->subject = xstrdup(p);
209
210	reencode(&ret->author, ret->msg_encoding, PAGE_ENCODING);
211	reencode(&ret->author_email, ret->msg_encoding, PAGE_ENCODING);
212	reencode(&ret->committer, ret->msg_encoding, PAGE_ENCODING);
213	reencode(&ret->committer_email, ret->msg_encoding, PAGE_ENCODING);
214	reencode(&ret->subject, ret->msg_encoding, PAGE_ENCODING);
215	reencode(&ret->msg, ret->msg_encoding, PAGE_ENCODING);
216
217	return ret;
218}
219
220
221struct taginfo *cgit_parse_tag(struct tag *tag)
222{
223	void *data;
224	enum object_type type;
225	unsigned long size;
226	char *p;
227	struct taginfo *ret;
228
229	data = read_sha1_file(tag->object.sha1, &type, &size);
230	if (!data || type != OBJ_TAG) {
231		free(data);
232		return 0;
233	}
234
235	ret = xmalloc(sizeof(*ret));
236	ret->tagger = NULL;
237	ret->tagger_email = NULL;
238	ret->tagger_date = 0;
239	ret->msg = NULL;
240
241	p = data;
242
243	while (p && *p) {
244		if (*p == '\n')
245			break;
246
247		if (!prefixcmp(p, "tagger ")) {
248			p = parse_user(p + 7, &ret->tagger, &ret->tagger_email,
249				&ret->tagger_date);
250		} else {
251			p = strchr(p, '\n');
252			if (p)
253				p++;
254		}
255	}
256
257	// skip empty lines between headers and message
258	while (p && *p == '\n')
259		p++;
260
261	if (p && *p)
262		ret->msg = xstrdup(p);
263	free(data);
264	return ret;
265}