/*
* This file is part of DisOrder
- * Copyright (C) 2005, 2007 Richard Kettlewell
+ * Copyright (C) 2005, 2007, 2008 Richard Kettlewell
*
* This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* @brief Support for MIME and allied protocols
*/
-#include <config.h>
-#include "types.h"
+#include "common.h"
-#include <string.h>
#include <ctype.h>
-#include <stdio.h>
-
#include "mem.h"
#include "mime.h"
#include "vector.h"
}
/** @brief Match RFC2045 tspecial characters */
-static int tspecial(int c) {
+int mime_tspecial(int c) {
switch(c) {
case '(':
case ')':
}
/** @brief Match RFC2616 separator characters */
-static int http_separator(int c) {
+int mime_http_separator(int c) {
switch(c) {
case '(':
case ')':
/** @brief Test for a word character
* @param c Character to test
- * @param special tspecial() (MIME/RFC2405) or http_separator() (HTTP/RFC2616)
+ * @param special mime_tspecial() (MIME/RFC2045) or mime_http_separator() (HTTP/RFC2616)
* @return 1 if @p c is a word character, else 0
*/
static int iswordchar(int c, int (*special)(int)) {
/** @brief Parse an RFC1521/RFC2616 word
* @param s Pointer to start of word
* @param valuep Where to store value
- * @param special tspecial() (MIME/RFC2405) or http_separator() (HTTP/RFC2616)
+ * @param special mime_tspecial() (MIME/RFC2045) or mime_http_separator() (HTTP/RFC2616)
* @return Pointer just after end of word or NULL if there's no word
*
* A word is a token or a quoted-string.
*/
-static const char *parseword(const char *s, char **valuep,
- int (*special)(int)) {
+const char *mime_parse_word(const char *s, char **valuep,
+ int (*special)(int)) {
struct dynstr value[1];
int c;
/** @brief Parse an RFC1521/RFC2616 token
* @param s Pointer to start of token
* @param valuep Where to store value
- * @param special tspecial() (MIME/RFC2405) or http_separator() (HTTP/RFC2616)
+ * @param special mime_tspecial() (MIME/RFC2045) or mime_http_separator() (HTTP/RFC2616)
* @return Pointer just after end of token or NULL if there's no token
+ *
+ * Input that starts with a double quote is rejected, so a quoted-string is
+ * never accepted as a token; anything else is handed to mime_parse_word().
*/
static const char *parsetoken(const char *s, char **valuep,
int (*special)(int)) {
if(*s == '"')
return 0;
- return parseword(s, valuep, special);
+ return mime_parse_word(s, valuep, special);
}
/** @brief Parse a MIME content-type field
return -1;
if(!*s)
return -1;
- while(*s && !tspecial(*s) && !whitespace(*s))
+ while(*s && !mime_tspecial(*s) && !whitespace(*s))
dynstr_append(&type, tolower((unsigned char)*s++));
if(!(s = skipwhite(s, 1)))
return -1;
dynstr_append(&type, '/');
if(!(s = skipwhite(s, 1)))
return -1;
- while(*s && !tspecial(*s) && !whitespace(*s))
+ while(*s && !mime_tspecial(*s) && !whitespace(*s))
dynstr_append(&type, tolower((unsigned char)*s++));
if(!(s = skipwhite(s, 1)))
return -1;
return -1;
if(!*s)
return -1;
- while(*s && !tspecial(*s) && !whitespace(*s))
+ while(*s && !mime_tspecial(*s) && !whitespace(*s))
dynstr_append(&parametername, tolower((unsigned char)*s++));
if(!(s = skipwhite(s, 1)))
return -1;
return -1;
if(!(s = skipwhite(s, 1)))
return -1;
- if(!(s = parseword(s, &parametervalue, tspecial)))
+ if(!(s = mime_parse_word(s, &parametervalue, mime_tspecial)))
return -1;
if(!(s = skipwhite(s, 1)))
return -1;
while(*s && !iscrlf(s)) {
dynstr_init(&name);
dynstr_init(&value);
- while(*s && !tspecial(*s) && !whitespace(*s))
+ while(*s && !mime_tspecial(*s) && !whitespace(*s))
dynstr_append(&name, tolower((unsigned char)*s++));
if(!(s = skipwhite(s, 1)))
return 0;
int ret;
/* We must start with a boundary string */
- if(!isboundary(s, boundary, bl))
+ if(!isboundary(s, boundary, bl)) {
+ error(0, "mime_multipart: first line is not the boundary string");
return -1;
+ }
/* Keep going until we hit a final boundary */
while(!isfinal(s, boundary, bl)) {
s = strstr(s, "\r\n") + 2;
start = s;
while(!isboundary(s, boundary, bl)) {
- if(!(e = strstr(s, "\r\n")))
+ if(!(e = strstr(s, "\r\n"))) {
+ error(0, "mime_multipart: line does not end CRLF");
return -1;
+ }
s = e + 2;
}
if((ret = callback(xstrndup(start,
return -1;
if(!*s)
return -1;
- while(*s && !tspecial(*s) && !whitespace(*s))
+ while(*s && !mime_tspecial(*s) && !whitespace(*s))
dynstr_append(&disposition, tolower((unsigned char)*s++));
if(!(s = skipwhite(s, 1)))
return -1;
return -1;
if(!*s)
return -1;
- while(*s && !tspecial(*s) && !whitespace(*s))
+ while(*s && !mime_tspecial(*s) && !whitespace(*s))
dynstr_append(&parametername, tolower((unsigned char)*s++));
if(!(s = skipwhite(s, 1)))
return -1;
return -1;
if(!(s = skipwhite(s, 1)))
return -1;
- if(!(s = parseword(s, parametervaluep, tspecial)))
+ if(!(s = mime_parse_word(s, parametervaluep, mime_tspecial)))
return -1;
if(!(s = skipwhite(s, 1)))
return -1;
return d.vec;
}
+/** @brief Match cookie separator characters
+ * @param c Character to test
+ * @return 1 if @p c is a cookie separator, else 0
+ *
+ * This is a subset of the RFC2616 specials, and technically is in breach of
+ * the specification. However rejecting (in particular) slashes is
+ * unreasonably strict and has broken at least one (admittedly somewhat
+ * obscure) browser, so we're more forgiving.
+ *
+ * The characters matched are the two parentheses, comma, semicolon, equals
+ * sign, space, double quote and tab. Every other character, slashes
+ * included, is reported as a non-separator.
+ */
+static int cookie_separator(int c) {
+ switch(c) {
+ case '(':
+ case ')':
+ case ',':
+ case ';':
+ case '=': /* the only case that cookie_value_separator() leaves out */
+ case ' ':
+ case '"':
+ case '\t':
+ return 1;
+
+ default:
+ return 0;
+ }
+}
+
+/** @brief Match cookie value separator characters
+ * @param c Character to test
+ * @return 1 if @p c is a cookie value separator, else 0
+ *
+ * Same as cookie_separator() but allows for @c = in cookie values.
+ *
+ * The characters matched are the two parentheses, comma, semicolon, space,
+ * double quote and tab. The equals sign is deliberately absent from the
+ * list, so it is reported as a non-separator.
+ */
+static int cookie_value_separator(int c) {
+ switch(c) {
+ case '(':
+ case ')':
+ case ',':
+ case ';':
+ case ' ':
+ case '"':
+ case '\t':
+ return 1;
+
+ default: /* includes '=', which is matched by cookie_separator() only */
+ return 0;
+ }
+}
+
/** @brief Parse a RFC2109 Cookie: header
* @param s Header field value
* @param cd Where to store result
s = skipwhite(s, 0);
continue;
}
- if(!(s = parsetoken(s, &n, http_separator)))
+ if(!(s = parsetoken(s, &n, cookie_separator))) {
+ error(0, "parse_cookie: cannot parse attribute name");
return -1;
+ }
s = skipwhite(s, 0);
- if(*s++ != '=')
+ if(*s++ != '=') {
+ error(0, "parse_cookie: did not find expected '='");
return -1;
+ }
s = skipwhite(s, 0);
- if(!(s = parseword(s, &v, http_separator)))
+ if(!(s = mime_parse_word(s, &v, cookie_value_separator))) {
+ error(0, "parse_cookie: cannot parse value for '%s'", n);
return -1;
+ }
if(n[0] == '$') {
/* Some bit of meta-information */
if(!strcmp(n, "$Version"))
if(!force) {
/* See if we need to quote */
for(t = s; (c = (unsigned char)*t); ++t) {
- if(tspecial(c) || http_separator(c) || whitespace(c))
+ if(mime_tspecial(c) || mime_http_separator(c) || whitespace(c))
break;
}
if(*t)
* @param text Underlying UTF-8 text
* @param charsetp Where to store charset string
* @param encodingp Where to store encoding string
- * @return Encoded text (might be @ref text)
+ * @return Encoded text (might be @p text)
*/
const char *mime_encode_text(const char *text,
const char **charsetp,