chiark / gitweb /
Source code reorganization:
[disorder] / lib / cgi.c
CommitLineData
5b708e0c
RK
1/*
2 * This file is part of DisOrder.
3 * Copyright (C) 2004, 2005, 2007, 2008 Richard Kettlewell
4 *
5 * This program is free software; you can redistribute it and/or modify
6 * it under the terms of the GNU General Public License as published by
7 * the Free Software Foundation; either version 2 of the License, or
8 * (at your option) any later version.
9 *
10 * This program is distributed in the hope that it will be useful, but
11 * WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 * General Public License for more details.
14 *
15 * You should have received a copy of the GNU General Public License
16 * along with this program; if not, write to the Free Software
17 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307
18 * USA
19 */
20/** @file lib/cgi.c
21 * @brief CGI tools
22 */
23
05b75f8d 24#include "common.h"
5b708e0c 25
5b708e0c
RK
26#include <unistd.h>
27#include <errno.h>
5b708e0c
RK
28
29#include "cgi.h"
30#include "mem.h"
31#include "log.h"
32#include "vector.h"
33#include "hash.h"
34#include "kvp.h"
35#include "mime.h"
36#include "unicode.h"
37#include "sink.h"
38
39/** @brief Hash of arguments
 *
 * Created by cgi_init() and cgi_clear() with a value size of
 * sizeof (char *).  cgi_init() and cgi_set() store a pointer to each
 * argument's value under the argument's name; cgi_get() and cgi_thisurl()
 * read it back.
 */
40static hash *cgi_args;
41
/** @brief Get CGI arguments from a GET request's query string
 * @return Result of URL-decoding QUERY_STRING, or NULL if it is not set
 *
 * A missing QUERY_STRING is logged via error() and treated as empty.
 */
static struct kvp *cgi__init_get(void) {
  const char *query = getenv("QUERY_STRING");

  if(!query) {
    error(0, "QUERY_STRING not set, assuming empty");
    return NULL;
  }
  return kvp_urldecode(query, strlen(query));
}
51
/** @brief Read the HTTP request body
 * @param ptrp Where to store a pointer to the request body
 * @param np Where to store the body length, or NULL if not wanted
 *
 * The length is taken from CONTENT_LENGTH and exactly that many bytes are
 * read from file descriptor 0.  The buffer is allocated with room for one
 * extra byte, which is set to 0 so the body can be used as a C string.
 *
 * A missing CONTENT_LENGTH, an oversized body, a short read, a read error
 * or an embedded null character are all reported via fatal().
 */
static void cgi__input(char **ptrp, size_t *np) {
  const char *cl;
  char *q;
  size_t n, m = 0;
  ssize_t r;

  if(!(cl = getenv("CONTENT_LENGTH")))
    fatal(0, "CONTENT_LENGTH not set");
  n = atol(cl);
  /* We check for overflow and also limit the input to 16MB.  Lower
   * would probably do.  A negative CONTENT_LENGTH converts to a very
   * large size_t and so is rejected by the same test. */
  if(!(n + 1) || n > 16 * 1024 * 1024)
    fatal(0, "input is much too large");
  q = xmalloc_noptr(n + 1);
  while(m < n) {
    r = read(0, q + m, n - m);
    if(r > 0)
      m += (size_t)r;
    else if(r == 0)
      fatal(0, "unexpected end of file reading request body");
    else if(errno != EINTR)
      fatal(errno, "error reading request body");
    /* EINTR: just go round again */
  }
  if(memchr(q, 0, n))
    fatal(0, "null character in request body");
  /* The buffer holds n + 1 bytes, so the terminator belongs at index n;
   * index n + 1 would be one past the end of the allocation. */
  q[n] = 0;
  *ptrp = q;
  if(np)
    *np = n;
}
85
/** @brief Called for each part header field (see cgi__part_callback())
 * @param name Header field name
 * @param value Header field value
 * @param u Pointer to the char * that receives the form field name
 * @return 0
 *
 * Only Content-Disposition fields are examined.  For a "form-data"
 * disposition whose parameter is called "name", the parameter value is
 * stored through @p u.  A parse failure, or a second such field for the
 * same part, is reported via fatal().
 */
static int cgi__field_callback(const char *name, const char *value,
                               void *u) {
  char **fieldnamep = u;
  char *disp, *param, *paramvalue;

  /* Anything other than Content-Disposition is ignored */
  if(strcmp(name, "content-disposition") != 0)
    return 0;
  if(mime_rfc2388_content_disposition(value, &disp, &param, &paramvalue))
    fatal(0, "error parsing Content-Disposition field");
  /* We only care about form-data parts that tell us their name */
  if(strcmp(disp, "form-data") != 0
     || !param
     || strcmp(param, "name") != 0)
    return 0;
  if(*fieldnamep)
    fatal(0, "duplicate Content-Disposition field");
  *fieldnamep = paramvalue;
  return 0;
}
108
109/** @brief Called for each part (see cgi__init_multipart()) */
110static int cgi__part_callback(const char *s,
111 void *u) {
112 char *name = 0;
113 struct kvp *k, **head = u;
114
115 if(!(s = mime_parse(s, cgi__field_callback, &name)))
116 fatal(0, "error parsing part header");
117 if(!name)
118 fatal(0, "no name found");
119 k = xmalloc(sizeof *k);
120 k->next = *head;
121 k->name = name;
122 k->value = s;
123 *head = k;
124 return 0;
125}
126
127/** @brief Initialize CGI arguments from a multipart/form-data request body */
128static struct kvp *cgi__init_multipart(const char *boundary) {
129 char *q;
130 struct kvp *head = 0;
131
132 cgi__input(&q, 0);
133 if(mime_multipart(q, cgi__part_callback, boundary, &head))
134 fatal(0, "invalid multipart object");
135 return head;
136}
137
/** @brief Initialize CGI arguments from a POST request
 * @return Arguments parsed from the request body
 *
 * The body format is chosen from CONTENT_TYPE, which defaults to
 * application/x-www-form-urlencoded if unset.  multipart/form-data is
 * also supported and requires a boundary parameter.  An unparseable or
 * unrecognized content type, or a missing boundary, is reported via
 * fatal().
 */
static struct kvp *cgi__init_post(void) {
  const char *content_type = getenv("CONTENT_TYPE");
  const char *boundary;
  char *body, *type;
  size_t length;
  struct kvp *params;

  if(!content_type)
    content_type = "application/x-www-form-urlencoded";
  if(mime_content_type(content_type, &type, &params))
    fatal(0, "invalid content type '%s'", content_type);
  if(!strcmp(type, "application/x-www-form-urlencoded")) {
    cgi__input(&body, &length);
    return kvp_urldecode(body, length);
  }
  if(strcmp(type, "multipart/form-data") != 0)
    fatal(0, "unrecognized content type '%s'", type);
  if(!(boundary = kvp_get(params, "boundary")))
    fatal(0, "no boundary parameter found");
  return cgi__init_multipart(boundary);
}
160
161/** @brief Initialize CGI arguments
162 *
163 * Must be called before other cgi_ functions are used.
164 *
165 * This function can be called more than once, in which case it
166 * revisits the environment and (perhaps) standard input. This is
167 * only intended to be used for testing, actual CGI applications
168 * should call it exactly once.
169 */
170void cgi_init(void) {
171 const char *p;
172 struct kvp *k;
173
174 cgi_args = hash_new(sizeof (char *));
175 if(!(p = getenv("REQUEST_METHOD")))
176 error(0, "REQUEST_METHOD not set, assuming GET");
177 if(!p || !strcmp(p, "GET"))
178 k = cgi__init_get();
179 else if(!strcmp(p, "POST"))
180 k = cgi__init_post();
181 else
182 fatal(0, "unknown request method %s", p);
183 /* Validate the arguments and put them in a hash */
184 for(; k; k = k->next) {
185 if(!utf8_valid(k->name, strlen(k->name))
186 || !utf8_valid(k->value, strlen(k->value)))
187 error(0, "invalid UTF-8 sequence in cgi argument %s", k->name);
188 else
189 hash_add(cgi_args, k->name, &k->value, HASH_INSERT_OR_REPLACE);
190 /* We just drop bogus arguments. */
191 }
192}
193
194/** @brief Get a CGI argument by name
195 *
196 * cgi_init() must be called first. Names and values are all valid
197 * UTF-8 strings (and this is enforced at initialization time).
198 */
199const char *cgi_get(const char *name) {
200 const char **v = hash_find(cgi_args, name);
201
202 return v ? *v : NULL;
203}
204
5a7df048
RK
205/** @brief Set a CGI argument */
206void cgi_set(const char *name, const char *value) {
207 value = xstrdup(value);
208 hash_add(cgi_args, name, &value, HASH_INSERT_OR_REPLACE);
209}
210
2cc4c0ef
RK
211/** @brief Clear CGI arguments */
212void cgi_clear(void) {
213 cgi_args = hash_new(sizeof (char *));
214}
215
5b708e0c
RK
216/** @brief Add SGML-style quoting
217 * @param src String to quote (UTF-8)
218 * @return Quoted string
219 *
220 * Quotes characters for insertion into HTML output. Anything that is
221 * not a printable ASCII character will be converted to a numeric
222 * character references, as will '"', '&', '<' and '>' (since those
223 * have special meanings).
224 *
225 * Quoting everything down to ASCII means we don't care what the
226 * content encoding really is (as long as it's not anything insane
227 * like EBCDIC).
228 */
229char *cgi_sgmlquote(const char *src) {
230 uint32_t *ucs, c;
231 int n;
232 struct dynstr d[1];
233 struct sink *s;
234
235 if(!(ucs = utf8_to_utf32(src, strlen(src), 0)))
236 exit(1);
237 dynstr_init(d);
238 s = sink_dynstr(d);
239 n = 1;
240 /* format the string */
241 while((c = *ucs++)) {
242 switch(c) {
243 default:
244 if(c > 126 || c < 32) {
245 case '"':
246 case '&':
247 case '<':
248 case '>':
249 /* For simplicity we always use numeric character references
250 * even if a named reference is available. */
251 sink_printf(s, "&#%"PRIu32";", c);
252 break;
253 } else
254 sink_writec(s, (char)c);
255 }
256 }
257 dynstr_terminate(d);
258 return d->vec;
259}
260
/** @brief Write a CGI attribute
 * @param output Where to send output
 * @param name Attribute name
 * @param value Attribute value
 *
 * Writes @p name = @p value.  A non-empty value made up entirely of
 * ASCII letters and digits is written bare; anything else, including
 * the empty string, is written inside double quotes after being passed
 * through cgi_sgmlquote().
 */
void cgi_attr(struct sink *output, const char *name, const char *value) {
  /* Try to avoid needless quoting.  An empty value must still be quoted:
   * a bare "name=" is not a valid unquoted attribute value. */
  if(*value
     && !value[strspn(value, "abcdefghijklmnopqrstuvwxyz"
                             "ABCDEFGHIJKLMNOPQRSTUVWXYZ"
                             "0123456789")])
    sink_printf(output, "%s=%s", name, value);
  else
    sink_printf(output, "%s=\"%s\"", name, cgi_sgmlquote(value));
}
275
/** @brief Write an open tag
 * @param output Where to send output
 * @param name Element name
 * @param ... Attribute name/value pairs
 *
 * The name/value pair list is terminated by a single (char *)0.
 *
 * A pair whose value is a null pointer is written as the bare attribute
 * name with no "=value" part; otherwise the pair is written with
 * cgi_attr().
 */
void cgi_opentag(struct sink *output, const char *name, ...) {
  va_list ap;
  const char *n, *v;

  sink_printf(output, "<%s", name);
  va_start(ap, name);
  while((n = va_arg(ap, const char *))) {
    sink_printf(output, " ");
    v = va_arg(ap, const char *);
    if(v)
      cgi_attr(output, n, v);
    else
      /* Never use the attribute name as the format string: any '%' in
       * it would be interpreted as a conversion specification. */
      sink_printf(output, "%s", n);
  }
  va_end(ap);
  sink_printf(output, ">");
}
300
/** @brief Write a close tag
 * @param output Where to send output
 * @param name Element name
 *
 * Writes "</", the element name and ">" to @p output.
 */
void cgi_closetag(struct sink *output,
                  const char *name) {
  sink_printf(output, "</%s>", name);
}
308
309/** @brief Construct a URL
310 * @param url Base URL
311 * @param ... Name/value pairs for constructed query string
312 * @return Constructed URL
313 *
314 * The name/value pair list is terminated by a single (char *)0.
315 */
316char *cgi_makeurl(const char *url, ...) {
317 va_list ap;
318 struct kvp *kvp, *k, **kk = &kvp;
319 struct dynstr d;
320 const char *n, *v;
321
322 dynstr_init(&d);
323 dynstr_append_string(&d, url);
324 va_start(ap, url);
325 while((n = va_arg(ap, const char *))) {
326 v = va_arg(ap, const char *);
327 *kk = k = xmalloc(sizeof *k);
328 kk = &k->next;
329 k->name = n;
330 k->value = v;
331 }
332 va_end(ap);
333 *kk = 0;
334 if(kvp) {
335 dynstr_append(&d, '?');
336 dynstr_append_string(&d, kvp_urlencode(kvp, 0));
337 }
338 dynstr_terminate(&d);
339 return d.vec;
340}
341
9faa7a88
RK
342/** @brief Construct a URL from current parameters
343 * @param url Base URL
344 * @return Constructed URL
345 */
346char *cgi_thisurl(const char *url) {
347 struct dynstr d[1];
348 char **keys = hash_keys(cgi_args);
349 int n;
350
351 dynstr_init(d);
352 dynstr_append_string(d, url);
e7ce7665
RK
353 for(n = 0; keys[n]; ++n) {
354 dynstr_append(d, n ? '&' : '?');
355 dynstr_append_string(d, urlencodestring(keys[n]));
356 dynstr_append(d, '=');
2cc4c0ef 357 dynstr_append_string(d, urlencodestring(cgi_get(keys[n])));
9faa7a88
RK
358 }
359 dynstr_terminate(d);
360 return d->vec;
361}
362
5b708e0c
RK
363/*
364Local Variables:
365c-basic-offset:2
366comment-column:40
367fill-column:79
368indent-tabs-mode:nil
369End:
370*/