gitweb.ps.run Git - ps-cgit/blob - parsing.c
Use split_ident_line() in parse_user()
[ps-cgit] / parsing.c
1 /* parsing.c: parsing of config files
2  *
3  * Copyright (C) 2006-2014 cgit Development Team <cgit@lists.zx2c4.com>
4  *
5  * Licensed under GNU General Public License v2
6  *   (see COPYING for full license text)
7  */
8
9 #include "cgit.h"
10
11 /*
12  * url syntax: [repo ['/' cmd [ '/' path]]]
13  *   repo: any valid repo url, may contain '/'
14  *   cmd:  log | commit | diff | tree | view | blob | snapshot
15  *   path: any valid path, may contain '/'
16  *
17  */
18 void cgit_parse_url(const char *url)
19 {
20         char *c, *cmd, *p;
21         struct cgit_repo *repo;
22
23         ctx.repo = NULL;
24         if (!url || url[0] == '\0')
25                 return;
26
27         ctx.repo = cgit_get_repoinfo(url);
28         if (ctx.repo) {
29                 ctx.qry.repo = ctx.repo->url;
30                 return;
31         }
32
33         cmd = NULL;
34         c = strchr(url, '/');
35         while (c) {
36                 c[0] = '\0';
37                 repo = cgit_get_repoinfo(url);
38                 if (repo) {
39                         ctx.repo = repo;
40                         cmd = c;
41                 }
42                 c[0] = '/';
43                 c = strchr(c + 1, '/');
44         }
45
46         if (ctx.repo) {
47                 ctx.qry.repo = ctx.repo->url;
48                 p = strchr(cmd + 1, '/');
49                 if (p) {
50                         p[0] = '\0';
51                         if (p[1])
52                                 ctx.qry.path = trim_end(p + 1, '/');
53                 }
54                 if (cmd[1])
55                         ctx.qry.page = xstrdup(cmd + 1);
56                 return;
57         }
58 }
59
/*
 * Return a newly allocated, NUL-terminated copy of the characters in
 * the range [head, tail). When tail lies before head an empty string
 * is returned instead. Copying uses strncpy(), so a NUL byte inside
 * the range ends the copied text early.
 */
static char *substr(const char *head, const char *tail)
{
	size_t len;
	char *copy;

	if (tail < head)
		return xstrdup("");

	len = tail - head;
	copy = xmalloc(len + 1);
	strncpy(copy, head, len);
	copy[len] = '\0';
	return copy;
}
71
72 static const char *parse_user(const char *t, char **name, char **email, unsigned long *date)
73 {
74         const char *line_end = strchrnul(t, '\n');
75         struct ident_split ident;
76         unsigned email_len;
77
78         if (!split_ident_line(&ident, t, line_end - t)) {
79                 *name = substr(ident.name_begin, ident.name_end);
80
81                 email_len = ident.mail_end - ident.mail_begin;
82                 *email = xmalloc(strlen("<") + email_len + strlen(">") + 1);
83                 sprintf(*email, "<%.*s>", email_len, ident.mail_begin);
84
85                 if (ident.date_begin)
86                         *date = strtoul(ident.date_begin, NULL, 10);
87         }
88
89         if (*line_end)
90                 return line_end + 1;
91         else
92                 return line_end;
93 }
94
#ifdef NO_ICONV
/* Built without iconv: calls to reencode() expand to nothing. */
#define reencode(a, b, c)
#else
/*
 * Re-encode the string *txt from src_enc to dst_enc, in place.
 *
 * On a successful conversion the old string is freed and *txt is
 * pointed at the converted copy. The string is left untouched when it
 * is NULL, when either encoding is NULL, when both encodings compare
 * equal (case-insensitively), or when reencode_string() returns NULL.
 *
 * Returns *txt, or NULL when txt itself is NULL.
 */
static const char *reencode(char **txt, const char *src_enc, const char *dst_enc)
{
	char *converted;

	if (!txt)
		return NULL;

	if (*txt && src_enc && dst_enc && strcasecmp(src_enc, dst_enc) != 0) {
		converted = reencode_string(*txt, dst_enc, src_enc);
		if (converted) {
			free(*txt);
			*txt = converted;
		}
	}
	return *txt;
}
#endif
120
121 struct commitinfo *cgit_parse_commit(struct commit *commit)
122 {
123         struct commitinfo *ret;
124         const char *p = get_cached_commit_buffer(commit, NULL);
125         const char *t;
126
127         ret = xmalloc(sizeof(*ret));
128         ret->commit = commit;
129         ret->author = NULL;
130         ret->author_email = NULL;
131         ret->committer = NULL;
132         ret->committer_email = NULL;
133         ret->subject = NULL;
134         ret->msg = NULL;
135         ret->msg_encoding = NULL;
136
137         if (p == NULL)
138                 return ret;
139
140         if (!starts_with(p, "tree "))
141                 die("Bad commit: %s", sha1_to_hex(commit->object.sha1));
142         else
143                 p += 46; // "tree " + hex[40] + "\n"
144
145         while (starts_with(p, "parent "))
146                 p += 48; // "parent " + hex[40] + "\n"
147
148         if (p && starts_with(p, "author ")) {
149                 p = parse_user(p + 7, &ret->author, &ret->author_email,
150                         &ret->author_date);
151         }
152
153         if (p && starts_with(p, "committer ")) {
154                 p = parse_user(p + 10, &ret->committer, &ret->committer_email,
155                         &ret->committer_date);
156         }
157
158         if (p && starts_with(p, "encoding ")) {
159                 p += 9;
160                 t = strchr(p, '\n');
161                 if (t) {
162                         ret->msg_encoding = substr(p, t + 1);
163                         p = t + 1;
164                 }
165         }
166
167         /* if no special encoding is found, assume UTF-8 */
168         if (!ret->msg_encoding)
169                 ret->msg_encoding = xstrdup("UTF-8");
170
171         // skip unknown header fields
172         while (p && *p && (*p != '\n')) {
173                 p = strchr(p, '\n');
174                 if (p)
175                         p++;
176         }
177
178         // skip empty lines between headers and message
179         while (p && *p == '\n')
180                 p++;
181
182         if (!p)
183                 return ret;
184
185         t = strchr(p, '\n');
186         if (t) {
187                 ret->subject = substr(p, t);
188                 p = t + 1;
189
190                 while (p && *p == '\n') {
191                         p = strchr(p, '\n');
192                         if (p)
193                                 p++;
194                 }
195                 if (p)
196                         ret->msg = xstrdup(p);
197         } else
198                 ret->subject = xstrdup(p);
199
200         reencode(&ret->author, ret->msg_encoding, PAGE_ENCODING);
201         reencode(&ret->author_email, ret->msg_encoding, PAGE_ENCODING);
202         reencode(&ret->committer, ret->msg_encoding, PAGE_ENCODING);
203         reencode(&ret->committer_email, ret->msg_encoding, PAGE_ENCODING);
204         reencode(&ret->subject, ret->msg_encoding, PAGE_ENCODING);
205         reencode(&ret->msg, ret->msg_encoding, PAGE_ENCODING);
206
207         return ret;
208 }
209
210
211 struct taginfo *cgit_parse_tag(struct tag *tag)
212 {
213         void *data;
214         enum object_type type;
215         unsigned long size;
216         const char *p;
217         struct taginfo *ret;
218
219         data = read_sha1_file(tag->object.sha1, &type, &size);
220         if (!data || type != OBJ_TAG) {
221                 free(data);
222                 return 0;
223         }
224
225         ret = xmalloc(sizeof(*ret));
226         ret->tagger = NULL;
227         ret->tagger_email = NULL;
228         ret->tagger_date = 0;
229         ret->msg = NULL;
230
231         p = data;
232
233         while (p && *p) {
234                 if (*p == '\n')
235                         break;
236
237                 if (starts_with(p, "tagger ")) {
238                         p = parse_user(p + 7, &ret->tagger, &ret->tagger_email,
239                                 &ret->tagger_date);
240                 } else {
241                         p = strchr(p, '\n');
242                         if (p)
243                                 p++;
244                 }
245         }
246
247         // skip empty lines between headers and message
248         while (p && *p == '\n')
249                 p++;
250
251         if (p && *p)
252                 ret->msg = xstrdup(p);
253         free(data);
254         return ret;
255 }