X-Git-Url: http://git.madism.org/?p=apps%2Fmadmutt.git;a=blobdiff_plain;f=lib-mime%2Frfc2231.c;fp=lib-mime%2Frfc2231.c;h=b21c4254c479a1938654a17d73cf0f275f675f66;hp=0000000000000000000000000000000000000000;hb=2a06362a155582cd59ae2ef6f0df71694a7eede3;hpb=53186676acf2c3b5509a614433eb00a2087cd4ec diff --git a/lib-mime/rfc2231.c b/lib-mime/rfc2231.c new file mode 100644 index 0000000..b21c425 --- /dev/null +++ b/lib-mime/rfc2231.c @@ -0,0 +1,379 @@ +/* + * This program is free software; you can redistribute it and/or modify + * it under the terms of the GNU General Public License as published by + * the Free Software Foundation; either version 2 of the License, or (at + * your option) any later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU + * General Public License for more details. + * + * You should have received a copy of the GNU General Public License + * along with this program; if not, write to the Free Software + * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, + * MA 02110-1301, USA. + * + * Copyright © 2006 Pierre Habouzit + */ + +/* + * Copyright notice from original mutt: + * Copyright (C) 1999-2000 Thomas Roessler + * + * This file is part of mutt-ng, see http://www.muttng.org/. + * It's licensed under the GNU General Public License, + * please see the file GPL in the top level source directory. + */ + +/* + * Yet another MIME encoding for header data. This time, it's + * parameters, specified in RFC 2231, and modeled after the + * encoding used in URLs. + * + * Additionally, continuations and encoding are mixed in an, errrm, + * interesting manner. + * + */ + +#if HAVE_CONFIG_H +# include "config.h" +#endif + +#include +#include +#include + +#include + +#include "mutt.h" +#include "charset.h" +#include "rfc2047.h" + +#include +#include +#include + +struct rfc2231_parameter { + char *attribute; + char *value; + int index; + int encoded; + struct rfc2231_parameter + *next; +}; + +static char *rfc2231_get_charset (char *, char *, size_t); +static struct rfc2231_parameter *rfc2231_new_parameter (void); +static void rfc2231_decode_one (char *, char *); +static void rfc2231_free_parameter (struct rfc2231_parameter **); +static void rfc2231_join_continuations (PARAMETER **, + struct rfc2231_parameter *); +static void rfc2231_list_insert (struct rfc2231_parameter **, + struct rfc2231_parameter *); + +static void purge_empty_parameters (PARAMETER ** headp) +{ + PARAMETER *p, *q, **last; + + for (last = headp, p = *headp; p; p = q) { + q = p->next; + if (!p->attribute || !p->value) { + *last = q; + p->next = NULL; + mutt_free_parameter (&p); + } + else + last = &p->next; + } +} + + +void rfc2231_decode_parameters (PARAMETER ** headp) +{ + PARAMETER *head = NULL; + PARAMETER **last; + PARAMETER *p, *q; + + struct rfc2231_parameter *conthead = NULL; + struct rfc2231_parameter *conttmp; + + char *s, *t; + char charset[STRING]; + + int encoded; + int index; + short dirty = 0; /* set to 1 when we may have created + * empty parameters. + */ + + if (!headp) + return; + + purge_empty_parameters (headp); + + for (last = &head, p = *headp; p; p = q) { + q = p->next; + + if (!(s = strchr (p->attribute, '*'))) { + + /* + * Using RFC 2047 encoding in MIME parameters is explicitly + * forbidden by that document. Nevertheless, it's being + * generated by some software, including certain Lotus Notes to + * Internet Gateways. So we actually decode it. + */ + + if (option (OPTRFC2047PARAMS) && p->value && strstr (p->value, "=?")) + rfc2047_decode (&p->value); + else if (!option (OPTSTRICTMIME)) { + if (ascii_strcasecmp (AssumedCharset, "us-ascii")) + mutt_convert_nonmime_string (&p->value); + } + + *last = p; + last = &p->next; + p->next = NULL; + } + else if (*(s + 1) == '\0') { + *s = '\0'; + + s = rfc2231_get_charset (p->value, charset, sizeof (charset)); + rfc2231_decode_one (p->value, s); + mutt_convert_string (&p->value, charset, Charset, M_ICONV_HOOK_FROM); + + *last = p; + last = &p->next; + p->next = NULL; + + dirty = 1; + } + else { + *s = '\0'; + s++; /* let s point to the first character of index. */ + for (t = s; *t && isdigit ((unsigned char) *t); t++); + encoded = (*t == '*'); + *t = '\0'; + + index = atoi (s); + + conttmp = rfc2231_new_parameter (); + conttmp->attribute = p->attribute; + conttmp->value = p->value; + conttmp->encoded = encoded; + conttmp->index = index; + + p->attribute = NULL; + p->value = NULL; + p_delete(&p); + + rfc2231_list_insert (&conthead, conttmp); + } + } + + if (conthead) { + rfc2231_join_continuations (last, conthead); + dirty = 1; + } + + *headp = head; + + if (dirty) + purge_empty_parameters (headp); +} + +static struct rfc2231_parameter *rfc2231_new_parameter (void) +{ + return p_new(struct rfc2231_parameter, 1); +} + +static void rfc2231_free_parameter (struct rfc2231_parameter **p) +{ + if (*p) { + p_delete(&(*p)->attribute); + p_delete(&(*p)->value); + p_delete(p); + } +} + +static char *rfc2231_get_charset (char *value, char *charset, size_t chslen) +{ + char *t, *u; + + if (!(t = strchr (value, '\''))) { + charset[0] = '\0'; + return value; + } + + *t = '\0'; + m_strcpy(charset, chslen, value); + + if ((u = strchr (t + 1, '\''))) + return u + 1; + else + return t + 1; +} + +static void rfc2231_decode_one (char *dest, char *src) +{ + char *d; + + for (d = dest; *src; src++) { + if (*src == '%' && + isxdigit ((unsigned char) *(src + 1)) && + isxdigit ((unsigned char) *(src + 2))) { + *d++ = (hexval (*(src + 1)) << 4) | (hexval (*(src + 2))); + src += 2; + } + else + *d++ = *src; + } + + *d = '\0'; +} + +/* insert parameter into an ordered list. + * + * Primary sorting key: attribute + * Secondary sorting key: index + */ + +static void rfc2231_list_insert (struct rfc2231_parameter **list, + struct rfc2231_parameter *par) +{ + struct rfc2231_parameter **last = list; + struct rfc2231_parameter *p = *list, *q; + int c; + + while (p) { + last = &p->next; + q = p; + p = p->next; + + c = m_strcmp(par->value, q->value); + if ((c > 0) || (c == 0 && par->index >= q->index)) + break; + } + + par->next = p; + *last = par; +} + +/* process continuation parameters */ + +static void rfc2231_join_continuations (PARAMETER ** head, + struct rfc2231_parameter *par) +{ + struct rfc2231_parameter *q; + + char attribute[STRING]; + char charset[STRING]; + char *value = NULL; + char *valp; + int encoded; + + size_t l, vl; + + while (par) { + value = NULL; + l = 0; + + m_strcpy(attribute, sizeof(attribute), par->attribute); + + if ((encoded = par->encoded)) + valp = rfc2231_get_charset (par->value, charset, sizeof (charset)); + else + valp = par->value; + + do { + if (encoded && par->encoded) + rfc2231_decode_one (par->value, valp); + + vl = m_strlen(par->value); + + p_realloc(&value, l + vl + 1); + strcpy (value + l, par->value); /* __STRCPY_CHECKED__ */ + l += vl; + + q = par->next; + rfc2231_free_parameter (&par); + if ((par = q)) + valp = par->value; + } while (par && !m_strcmp(par->attribute, attribute)); + + if (value) { + if (encoded) + mutt_convert_string (&value, charset, Charset, M_ICONV_HOOK_FROM); + *head = mutt_new_parameter (); + (*head)->attribute = m_strdup(attribute); + (*head)->value = value; + head = &(*head)->next; + } + } +} + +int rfc2231_encode_string (char **pd) +{ + int ext = 0, encode = 0; + char *charset, *s, *t, *e, *d = 0; + size_t slen, dlen = 0; + + /* + * A shortcut to detect pure 7bit data. + * + * This should prevent the worst when character set handling + * is flawed. + */ + + for (s = *pd; *s; s++) + if (*s & 0x80) + break; + + if (!*s) + return 0; + + if (!Charset || !SendCharset || + !(charset = mutt_choose_charset (Charset, SendCharset, + *pd, m_strlen(*pd), &d, &dlen))) { + charset = m_strdup(Charset ? Charset : "unknown-8bit"); + d = *pd; + dlen = m_strlen(d); + } + + if (!mutt_is_us_ascii (charset)) + encode = 1; + + for (s = d, slen = dlen; slen; s++, slen--) + if (*s < 0x20 || *s >= 0x7f) + encode = 1, ++ext; + else if (strchr (MimeSpecials, *s) || strchr ("*'%", *s)) + ++ext; + + if (encode) { + e = p_new(char, dlen + 2 * ext + m_strlen(charset) + 3); + sprintf (e, "%s''", charset); /* __SPRINTF_CHECKED__ */ + t = e + m_strlen(e); + for (s = d, slen = dlen; slen; s++, slen--) + if (*s < 0x20 || *s >= 0x7f || + strchr (MimeSpecials, *s) || strchr ("*'%", *s)) { + sprintf (t, "%%%02X", (unsigned char) *s); + t += 3; + } + else + *t++ = *s; + *t = '\0'; + + if (d != *pd) + p_delete(&d); + p_delete(pd); + *pd = e; + } + else if (d != *pd) { + p_delete(pd); + *pd = d; + } + + p_delete(&charset); + + return encode; +}