X-Git-Url: http://www.chiark.greenend.org.uk/ucgi/~mdw/git/disorder/blobdiff_plain/121f51ac44276ce2744e91bc589e9dc78d3ffd3b..6ebc4527c6a103d0532c08744fb916f951018413:/lib/mime.c diff --git a/lib/mime.c b/lib/mime.c index 0e7d097..9cc54d6 100644 --- a/lib/mime.c +++ b/lib/mime.c @@ -1,34 +1,28 @@ /* * This file is part of DisOrder - * Copyright (C) 2005, 2007 Richard Kettlewell + * Copyright (C) 2005, 2007, 2008 Richard Kettlewell * - * This program is free software; you can redistribute it and/or modify + * This program is free software: you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by - * the Free Software Foundation; either version 2 of the License, or + * the Free Software Foundation, either version 3 of the License, or * (at your option) any later version. - * - * This program is distributed in the hope that it will be useful, but - * WITHOUT ANY WARRANTY; without even the implied warranty of - * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU - * General Public License for more details. - * + * + * This program is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU General Public License for more details. + * * You should have received a copy of the GNU General Public License - * along with this program; if not, write to the Free Software - * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 - * USA + * along with this program. If not, see . 
*/ /** @file lib/mime.c * @brief Support for MIME and allied protocols */ -#include -#include "types.h" +#include "common.h" -#include #include -#include - #include "mem.h" #include "mime.h" #include "vector.h" @@ -51,7 +45,7 @@ static int whitespace(int c) { } /** @brief Match RFC2045 tspecial characters */ -static int tspecial(int c) { +int mime_tspecial(int c) { switch(c) { case '(': case ')': @@ -75,7 +69,7 @@ static int tspecial(int c) { } /** @brief Match RFC2616 separator characters */ -static int http_separator(int c) { +int mime_http_separator(int c) { switch(c) { case '(': case ')': @@ -151,7 +145,7 @@ static const char *skipwhite(const char *s, int rfc822_comments) { /** @brief Test for a word character * @param c Character to test - * @param special tspecial() (MIME/RFC2405) or http_separator() (HTTP/RFC2616) + * @param special mime_tspecial() (MIME/RFC2405) or mime_http_separator() (HTTP/RFC2616) * @return 1 if @p c is a word character, else 0 */ static int iswordchar(int c, int (*special)(int)) { @@ -161,13 +155,13 @@ static int iswordchar(int c, int (*special)(int)) { /** @brief Parse an RFC1521/RFC2616 word * @param s Pointer to start of word * @param valuep Where to store value - * @param special tspecial() (MIME/RFC2405) or http_separator() (HTTP/RFC2616) + * @param special mime_tspecial() (MIME/RFC2405) or mime_http_separator() (HTTP/RFC2616) * @return Pointer just after end of word or NULL if there's no word * * A word is a token or a quoted-string. 
*/ -static const char *parseword(const char *s, char **valuep, - int (*special)(int)) { +const char *mime_parse_word(const char *s, char **valuep, + int (*special)(int)) { struct dynstr value[1]; int c; @@ -201,14 +195,14 @@ static const char *parseword(const char *s, char **valuep, /** @brief Parse an RFC1521/RFC2616 token * @param s Pointer to start of token * @param valuep Where to store value - * @param special tspecial() (MIME/RFC2405) or http_separator() (HTTP/RFC2616) + * @param special mime_tspecial() (MIME/RFC2405) or mime_http_separator() (HTTP/RFC2616) * @return Pointer just after end of token or NULL if there's no token */ static const char *parsetoken(const char *s, char **valuep, int (*special)(int)) { if(*s == '"') return 0; - return parseword(s, valuep, special); + return mime_parse_word(s, valuep, special); } /** @brief Parse a MIME content-type field @@ -231,7 +225,7 @@ int mime_content_type(const char *s, return -1; if(!*s) return -1; - while(*s && !tspecial(*s) && !whitespace(*s)) + while(*s && !mime_tspecial(*s) && !whitespace(*s)) dynstr_append(&type, tolower((unsigned char)*s++)); if(!(s = skipwhite(s, 1))) return -1; @@ -240,7 +234,7 @@ int mime_content_type(const char *s, dynstr_append(&type, '/'); if(!(s = skipwhite(s, 1))) return -1; - while(*s && !tspecial(*s) && !whitespace(*s)) + while(*s && !mime_tspecial(*s) && !whitespace(*s)) dynstr_append(&type, tolower((unsigned char)*s++)); if(!(s = skipwhite(s, 1))) return -1; @@ -252,7 +246,7 @@ int mime_content_type(const char *s, return -1; if(!*s) return -1; - while(*s && !tspecial(*s) && !whitespace(*s)) + while(*s && !mime_tspecial(*s) && !whitespace(*s)) dynstr_append(&parametername, tolower((unsigned char)*s++)); if(!(s = skipwhite(s, 1))) return -1; @@ -260,7 +254,7 @@ int mime_content_type(const char *s, return -1; if(!(s = skipwhite(s, 1))) return -1; - if(!(s = parseword(s, &parametervalue, tspecial))) + if(!(s = mime_parse_word(s, &parametervalue, mime_tspecial))) return -1; if(!(s = 
skipwhite(s, 1))) return -1; @@ -294,7 +288,7 @@ const char *mime_parse(const char *s, while(*s && !iscrlf(s)) { dynstr_init(&name); dynstr_init(&value); - while(*s && !tspecial(*s) && !whitespace(*s)) + while(*s && !mime_tspecial(*s) && !whitespace(*s)) dynstr_append(&name, tolower((unsigned char)*s++)); if(!(s = skipwhite(s, 1))) return 0; @@ -334,7 +328,7 @@ const char *mime_parse(const char *s, return mime_qp(s); if(!strcmp(cte, "7bit") || !strcmp(cte, "8bit")) return s; - error(0, "unknown content-transfer-encoding '%s'", cte); + disorder_error(0, "unknown content-transfer-encoding '%s'", cte); return 0; } return s; @@ -381,15 +375,19 @@ int mime_multipart(const char *s, int ret; /* We must start with a boundary string */ - if(!isboundary(s, boundary, bl)) + if(!isboundary(s, boundary, bl)) { + disorder_error(0, "mime_multipart: first line is not the boundary string"); return -1; + } /* Keep going until we hit a final boundary */ while(!isfinal(s, boundary, bl)) { s = strstr(s, "\r\n") + 2; start = s; while(!isboundary(s, boundary, bl)) { - if(!(e = strstr(s, "\r\n"))) + if(!(e = strstr(s, "\r\n"))) { + disorder_error(0, "mime_multipart: line does not end CRLF"); return -1; + } s = e + 2; } if((ret = callback(xstrndup(start, @@ -421,7 +419,7 @@ int mime_rfc2388_content_disposition(const char *s, return -1; if(!*s) return -1; - while(*s && !tspecial(*s) && !whitespace(*s)) + while(*s && !mime_tspecial(*s) && !whitespace(*s)) dynstr_append(&disposition, tolower((unsigned char)*s++)); if(!(s = skipwhite(s, 1))) return -1; @@ -433,7 +431,7 @@ int mime_rfc2388_content_disposition(const char *s, return -1; if(!*s) return -1; - while(*s && !tspecial(*s) && !whitespace(*s)) + while(*s && !mime_tspecial(*s) && !whitespace(*s)) dynstr_append(&parametername, tolower((unsigned char)*s++)); if(!(s = skipwhite(s, 1))) return -1; @@ -441,7 +439,7 @@ int mime_rfc2388_content_disposition(const char *s, return -1; if(!(s = skipwhite(s, 1))) return -1; - if(!(s = parseword(s, 
parametervaluep, tspecial))) + if(!(s = mime_parse_word(s, parametervaluep, mime_tspecial))) return -1; if(!(s = skipwhite(s, 1))) return -1; @@ -503,6 +501,50 @@ char *mime_qp(const char *s) { return d.vec; } +/** @brief Match cookie separator characters + * + * This is a subset of the RFC2616 specials, and technically is in breach of + * the specification. However rejecting (in particular) slashes is + * unreasonably strict and has broken at least one (admittedly somewhat + * obscure) browser, so we're more forgiving. + */ +static int cookie_separator(int c) { + switch(c) { + case '(': + case ')': + case ',': + case ';': + case '=': + case ' ': + case '"': + case '\t': + return 1; + + default: + return 0; + } +} + +/** @brief Match cookie value separator characters + * + * Same as cookie_separator() but allows for @c = in cookie values. + */ +static int cookie_value_separator(int c) { + switch(c) { + case '(': + case ')': + case ',': + case ';': + case ' ': + case '"': + case '\t': + return 1; + + default: + return 0; + } +} + /** @brief Parse a RFC2109 Cookie: header * @param s Header field value * @param cd Where to store result @@ -523,14 +565,20 @@ int parse_cookie(const char *s, s = skipwhite(s, 0); continue; } - if(!(s = parsetoken(s, &n, http_separator))) + if(!(s = parsetoken(s, &n, cookie_separator))) { + disorder_error(0, "parse_cookie: cannot parse attribute name"); return -1; + } s = skipwhite(s, 0); - if(*s++ != '=') + if(*s++ != '=') { + disorder_error(0, "parse_cookie: did not find expected '='"); return -1; + } s = skipwhite(s, 0); - if(!(s = parseword(s, &v, http_separator))) + if(!(s = mime_parse_word(s, &v, cookie_value_separator))) { + disorder_error(0, "parse_cookie: cannot parse value for '%s'", n); return -1; + } if(n[0] == '$') { /* Some bit of meta-information */ if(!strcmp(n, "$Version")) @@ -539,14 +587,14 @@ int parse_cookie(const char *s, if(cd->ncookies > 0 && cd->cookies[cd->ncookies-1].path == 0) cd->cookies[cd->ncookies-1].path = 
v; else { - error(0, "redundant $Path in Cookie: header"); + disorder_error(0, "redundant $Path in Cookie: header"); return -1; } } else if(!strcmp(n, "$Domain")) { if(cd->ncookies > 0 && cd->cookies[cd->ncookies-1].domain == 0) cd->cookies[cd->ncookies-1].domain = v; else { - error(0, "redundant $Domain in Cookie: header"); + disorder_error(0, "redundant $Domain in Cookie: header"); return -1; } } @@ -562,7 +610,7 @@ int parse_cookie(const char *s, } s = skipwhite(s, 0); if(*s && (*s != ',' && *s != ';')) { - error(0, "missing separator in Cookie: header"); + disorder_error(0, "missing separator in Cookie: header"); return -1; } } @@ -597,7 +645,7 @@ char *quote822(const char *s, int force) { if(!force) { /* See if we need to quote */ for(t = s; (c = (unsigned char)*t); ++t) { - if(tspecial(c) || http_separator(c) || whitespace(c)) + if(mime_tspecial(c) || mime_http_separator(c) || whitespace(c)) break; } if(*t) @@ -688,7 +736,7 @@ char *mime_to_qp(const char *text) { * @param text Underlying UTF-8 text * @param charsetp Where to store charset string * @param encodingp Where to store encoding string - * @return Encoded text (might be @ref text) + * @return Encoded text (might be @p text) */ const char *mime_encode_text(const char *text, const char **charsetp,