claws-mail/src/procmime.c
2001-04-19 12:21:46 +00:00

857 lines
19 KiB
C

/*
* Sylpheed -- a GTK+ based, lightweight, and fast e-mail client
* Copyright (C) 1999,2000 Hiroyuki Yamamoto
*
* This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation; either version 2 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program; if not, write to the Free Software
* Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
*/
#ifdef HAVE_CONFIG_H
# include "config.h"
#endif
#include "defs.h"
#include <glib.h>
#include <stdio.h>
#include <string.h>
#include <locale.h>
#include <ctype.h>
#include "intl.h"
#include "procmime.h"
#include "procheader.h"
#include "base64.h"
#include "uuencode.h"
#include "unmime.h"
#include "codeconv.h"
#include "utils.h"
#include "prefs_common.h"
#if USE_GPGME
# include "rfc2015.h"
#endif
static GHashTable *procmime_get_mime_type_table (void);
static GList *procmime_get_mime_type_list (void);
MimeInfo *procmime_mimeinfo_new(void)
{
MimeInfo *mimeinfo;
mimeinfo = g_new0(MimeInfo, 1);
mimeinfo->mime_type = MIME_UNKNOWN;
mimeinfo->encoding_type = ENC_UNKNOWN;
return mimeinfo;
}
void procmime_mimeinfo_free(MimeInfo *mimeinfo)
{
if (!mimeinfo) return;
g_free(mimeinfo->encoding);
g_free(mimeinfo->content_type);
g_free(mimeinfo->charset);
g_free(mimeinfo->name);
g_free(mimeinfo->boundary);
g_free(mimeinfo->content_disposition);
g_free(mimeinfo->filename);
#if USE_GPGME
g_free(mimeinfo->plaintextfile);
g_free(mimeinfo->sigstatus);
g_free(mimeinfo->sigstatus_full);
#endif
procmime_mimeinfo_free(mimeinfo->sub);
g_free(mimeinfo);
}
void procmime_mimeinfo_free_all(MimeInfo *mimeinfo)
{
while (mimeinfo != NULL) {
MimeInfo *next;
g_free(mimeinfo->encoding);
g_free(mimeinfo->content_type);
g_free(mimeinfo->charset);
g_free(mimeinfo->name);
g_free(mimeinfo->boundary);
g_free(mimeinfo->content_disposition);
g_free(mimeinfo->filename);
#if USE_GPGME
g_free(mimeinfo->plaintextfile);
g_free(mimeinfo->sigstatus);
g_free(mimeinfo->sigstatus_full);
#endif
procmime_mimeinfo_free_all(mimeinfo->sub);
procmime_mimeinfo_free_all(mimeinfo->children);
#if USE_GPGME
procmime_mimeinfo_free_all(mimeinfo->plaintext);
#endif
next = mimeinfo->next;
g_free(mimeinfo);
mimeinfo = next;
}
}
MimeInfo *procmime_mimeinfo_insert(MimeInfo *parent, MimeInfo *mimeinfo)
{
MimeInfo *child = parent->children;
if (!child)
parent->children = mimeinfo;
else {
while (child->next != NULL)
child = child->next;
child->next = mimeinfo;
}
mimeinfo->parent = parent;
mimeinfo->level = parent->level + 1;
return mimeinfo;
}
void procmime_mimeinfo_replace(MimeInfo *old, MimeInfo *new)
{
MimeInfo *parent = old->parent;
MimeInfo *child;
if (!parent) {
g_warning("oops: Not top message");
return;
}
if (new->next) {
g_message("oops: new child should not have a sibling");
return;
}
for (child = parent->children; child && child != old;
child = child->next)
;
if (!child) {
g_warning("oops: parent can't find it's own child");
return;
}
procmime_mimeinfo_free_all(old);
if (child == parent->children) {
new->next = parent->children->next;
parent->children = new;
} else {
new->next = child->next;
child = new;
}
}
MimeInfo *procmime_scan_message(MsgInfo *msginfo)
{
FILE *fp;
MimeInfo *mimeinfo;
g_return_val_if_fail(msginfo != NULL, NULL);
if ((fp = procmsg_open_message(msginfo)) == NULL) return NULL;
mimeinfo = procmime_scan_mime_header(fp);
if (mimeinfo) {
if (mimeinfo->mime_type != MIME_MULTIPART) {
if (fseek(fp, mimeinfo->fpos, SEEK_SET) < 0)
perror("fseek");
}
if (mimeinfo->mime_type != MIME_TEXT)
procmime_scan_multipart_message(mimeinfo, fp);
}
#if USE_GPGME
if (prefs_common.auto_check_signatures)
rfc2015_check_signature(mimeinfo, fp);
#endif
fclose(fp);
return mimeinfo;
}
void procmime_scan_multipart_message(MimeInfo *mimeinfo, FILE *fp)
{
gchar *p;
gchar *boundary;
gint boundary_len = 0;
gchar buf[BUFFSIZE];
glong fpos, prev_fpos;
gint npart;
g_return_if_fail(mimeinfo != NULL);
g_return_if_fail(mimeinfo->mime_type != MIME_TEXT);
if (mimeinfo->mime_type == MIME_MULTIPART) {
g_return_if_fail(mimeinfo->boundary != NULL);
g_return_if_fail(mimeinfo->sub == NULL);
}
g_return_if_fail(fp != NULL);
boundary = mimeinfo->boundary;
if (boundary) {
boundary_len = strlen(boundary);
/* look for first boundary */
while ((p = fgets(buf, sizeof(buf), fp)) != NULL)
if (IS_BOUNDARY(buf, boundary, boundary_len)) break;
if (!p) return;
}
if ((fpos = ftell(fp)) < 0) {
perror("ftell");
return;
}
for (npart = 0;; npart++) {
MimeInfo *partinfo;
gboolean eom = FALSE;
prev_fpos = fpos;
partinfo = procmime_scan_mime_header(fp);
if (!partinfo) break;
procmime_mimeinfo_insert(mimeinfo, partinfo);
if (partinfo->mime_type == MIME_MULTIPART) {
if (partinfo->level < 8)
procmime_scan_multipart_message(partinfo, fp);
} else if (partinfo->mime_type == MIME_MESSAGE_RFC822) {
MimeInfo *sub;
partinfo->sub = sub = procmime_scan_mime_header(fp);
if (!sub) break;
sub->level = partinfo->level + 1;
sub->parent = partinfo->parent;
sub->main = partinfo;
if (sub->mime_type == MIME_MULTIPART) {
if (sub->level < 8)
procmime_scan_multipart_message
(sub, fp);
}
}
/* look for next boundary */
buf[0] = '\0';
while ((p = fgets(buf, sizeof(buf), fp)) != NULL) {
if (IS_BOUNDARY(buf, boundary, boundary_len)) {
if (buf[2 + boundary_len] == '-' &&
buf[2 + boundary_len + 1] == '-')
eom = TRUE;
break;
}
}
if (p == NULL)
eom = TRUE; /* broken MIME message */
fpos = ftell(fp);
partinfo->size = fpos - prev_fpos - strlen(buf);
if (eom) break;
}
//g_message ("** at " __PRETTY_FUNCTION__ ":%d:", __LINE__);
}
void procmime_scan_encoding(MimeInfo *mimeinfo, const gchar *encoding)
{
gchar *buf;
Xalloca(buf, strlen(encoding) + 1, return);
strcpy(buf, encoding);
g_free(mimeinfo->encoding);
mimeinfo->encoding = g_strdup(g_strstrip(buf));
if (!strcasecmp(buf, "7bit"))
mimeinfo->encoding_type = ENC_7BIT;
else if (!strcasecmp(buf, "8bit"))
mimeinfo->encoding_type = ENC_8BIT;
else if (!strcasecmp(buf, "quoted-printable"))
mimeinfo->encoding_type = ENC_QUOTED_PRINTABLE;
else if (!strcasecmp(buf, "base64"))
mimeinfo->encoding_type = ENC_BASE64;
else if (!strcasecmp(buf, "x-uuencode"))
mimeinfo->encoding_type = ENC_X_UUENCODE;
else
mimeinfo->encoding_type = ENC_UNKNOWN;
}
void procmime_scan_content_type(MimeInfo *mimeinfo, const gchar *content_type)
{
gchar *delim, *p, *cnttype;
gchar *buf;
Xalloca(buf, strlen(content_type) + 1, return);
strcpy(buf, content_type);
g_free(mimeinfo->content_type);
g_free(mimeinfo->charset);
g_free(mimeinfo->name);
mimeinfo->content_type = NULL;
mimeinfo->charset = NULL;
mimeinfo->name = NULL;
if ((delim = strchr(buf, ';'))) *delim = '\0';
mimeinfo->content_type = cnttype = g_strdup(g_strstrip(buf));
if (!strncasecmp(cnttype, "text/html", 9))
mimeinfo->mime_type = MIME_TEXT_HTML;
else if (!strncasecmp(cnttype, "text/", 5))
mimeinfo->mime_type = MIME_TEXT;
else if (!strncasecmp(cnttype, "message/rfc822", 14))
mimeinfo->mime_type = MIME_MESSAGE_RFC822;
else if (!strncasecmp(cnttype, "message/", 8))
mimeinfo->mime_type = MIME_TEXT;
else if (!strncasecmp(cnttype, "application/octet-stream", 24))
mimeinfo->mime_type = MIME_APPLICATION_OCTET_STREAM;
else if (!strncasecmp(cnttype, "application/", 12))
mimeinfo->mime_type = MIME_APPLICATION;
else if (!strncasecmp(cnttype, "multipart/", 10))
mimeinfo->mime_type = MIME_MULTIPART;
else if (!strncasecmp(cnttype, "image/", 6))
mimeinfo->mime_type = MIME_IMAGE;
else if (!strncasecmp(cnttype, "audio/", 6))
mimeinfo->mime_type = MIME_AUDIO;
else if (!strcasecmp(cnttype, "text"))
mimeinfo->mime_type = MIME_TEXT;
else
mimeinfo->mime_type = MIME_UNKNOWN;
if (!delim) return;
p = delim + 1;
for (;;) {
gchar *eq;
gchar *attr, *value;
if ((delim = strchr(p, ';'))) *delim = '\0';
if (!(eq = strchr(p, '='))) break;
*eq = '\0';
attr = p;
g_strstrip(attr);
value = eq + 1;
g_strstrip(value);
if (*value == '"')
extract_quote(value, '"');
else {
eliminate_parenthesis(value, '(', ')');
g_strstrip(value);
}
if (*value) {
if (!strcasecmp(attr, "charset"))
mimeinfo->charset = g_strdup(value);
else if (!strcasecmp(attr, "name")) {
gchar *tmp;
size_t len;
len = strlen(value) + 1;
Xalloca(tmp, len, return);
conv_unmime_header(tmp, len, value, NULL);
mimeinfo->name = g_strdup(tmp);
} else if (!strcasecmp(attr, "boundary"))
mimeinfo->boundary = g_strdup(value);
}
if (!delim) break;
p = delim + 1;
}
if (mimeinfo->mime_type == MIME_MULTIPART && !mimeinfo->boundary)
mimeinfo->mime_type = MIME_TEXT;
}
void procmime_scan_content_disposition(MimeInfo *mimeinfo,
const gchar *content_disposition)
{
gchar *delim, *p, *dispos;
gchar *buf;
Xalloca(buf, strlen(content_disposition) + 1, return);
strcpy(buf, content_disposition);
if ((delim = strchr(buf, ';'))) *delim = '\0';
mimeinfo->content_disposition = dispos = g_strdup(g_strstrip(buf));
if (!delim) return;
p = delim + 1;
for (;;) {
gchar *eq;
gchar *attr, *value;
if ((delim = strchr(p, ';'))) *delim = '\0';
if (!(eq = strchr(p, '='))) break;
*eq = '\0';
attr = p;
g_strstrip(attr);
value = eq + 1;
g_strstrip(value);
if (*value == '"')
extract_quote(value, '"');
else {
eliminate_parenthesis(value, '(', ')');
g_strstrip(value);
}
if (*value) {
if (!strcasecmp(attr, "filename")) {
gchar *tmp;
size_t len;
len = strlen(value) + 1;
Xalloca(tmp, len, return);
conv_unmime_header(tmp, len, value, NULL);
g_free(mimeinfo->filename);
mimeinfo->filename = g_strdup(tmp);
break;
}
}
if (!delim) break;
p = delim + 1;
}
}
enum
{
H_CONTENT_TRANSFER_ENCODING = 0,
H_CONTENT_TYPE = 1,
H_CONTENT_DISPOSITION = 2
};
MimeInfo *procmime_scan_mime_header(FILE *fp)
{
static HeaderEntry hentry[] = {{"Content-Transfer-Encoding:",
NULL, FALSE},
{"Content-Type:", NULL, TRUE},
{"Content-Disposition:",
NULL, TRUE},
{NULL, NULL, FALSE}};
gchar buf[BUFFSIZE];
gint hnum;
HeaderEntry *hp;
MimeInfo *mimeinfo;
g_return_val_if_fail(fp != NULL, NULL);
mimeinfo = procmime_mimeinfo_new();
mimeinfo->mime_type = MIME_TEXT;
mimeinfo->encoding_type = ENC_7BIT;
mimeinfo->fpos = ftell(fp);
while ((hnum = procheader_get_one_field(buf, sizeof(buf), fp, hentry))
!= -1) {
hp = hentry + hnum;
if (H_CONTENT_TRANSFER_ENCODING == hnum) {
procmime_scan_encoding
(mimeinfo, buf + strlen(hp->name));
} else if (H_CONTENT_TYPE == hnum) {
procmime_scan_content_type
(mimeinfo, buf + strlen(hp->name));
} else if (H_CONTENT_DISPOSITION == hnum) {
procmime_scan_content_disposition
(mimeinfo, buf + strlen(hp->name));
}
}
if (!mimeinfo->content_type)
mimeinfo->content_type = g_strdup("text/plain");
return mimeinfo;
}
FILE *procmime_decode_content(FILE *outfp, FILE *infp, MimeInfo *mimeinfo)
{
gchar buf[BUFFSIZE];
gchar *boundary = NULL;
gint boundary_len = 0;
gboolean tmp_file = FALSE;
g_return_val_if_fail(infp != NULL, NULL);
g_return_val_if_fail(mimeinfo != NULL, NULL);
if (!outfp) {
outfp = my_tmpfile();
if (!outfp) {
perror("tmpfile");
return NULL;
}
tmp_file = TRUE;
}
if (mimeinfo->parent && mimeinfo->parent->boundary) {
boundary = mimeinfo->parent->boundary;
boundary_len = strlen(boundary);
}
if (mimeinfo->encoding_type == ENC_QUOTED_PRINTABLE) {
gboolean softline = FALSE;
while (fgets(buf, sizeof(buf), infp) != NULL &&
(!boundary ||
!IS_BOUNDARY(buf, boundary, boundary_len))) {
guchar *p = buf;
softline = DoOneQPLine(&p, FALSE, softline);
fwrite(buf, p - (guchar *)buf, 1, outfp);
}
} else if (mimeinfo->encoding_type == ENC_BASE64) {
gchar outbuf[BUFFSIZE];
gint len;
while (fgets(buf, sizeof(buf), infp) != NULL &&
(!boundary ||
!IS_BOUNDARY(buf, boundary, boundary_len))) {
len = from64tobits(outbuf, buf);
if (len < 0) {
g_warning("Bad BASE64 content\n");
break;
}
fwrite(outbuf, sizeof(gchar), len, outfp);
}
} else if (mimeinfo->encoding_type == ENC_X_UUENCODE) {
gchar outbuf[BUFFSIZE];
gint len;
gboolean flag = FALSE;
while (fgets(buf, sizeof(buf), infp) != NULL &&
(!boundary ||
!IS_BOUNDARY(buf, boundary, boundary_len))) {
if(!flag && strncmp(buf,"begin ", 6)) continue;
if (flag) {
len = fromuutobits(outbuf, buf);
if (len <= 0) {
if (len < 0)
g_warning("Bad UUENCODE content(%d)\n", len);
break;
}
fwrite(outbuf, sizeof(gchar), len, outfp);
} else
flag = TRUE;
}
} else {
while (fgets(buf, sizeof(buf), infp) != NULL &&
(!boundary ||
!IS_BOUNDARY(buf, boundary, boundary_len))) {
fputs(buf, outfp);
}
}
if (tmp_file) rewind(outfp);
return outfp;
}
gint procmime_get_part(const gchar *outfile, const gchar *infile,
MimeInfo *mimeinfo)
{
FILE *infp, *outfp;
gchar buf[BUFFSIZE];
g_return_val_if_fail(outfile != NULL, -1);
g_return_val_if_fail(infile != NULL, -1);
g_return_val_if_fail(mimeinfo != NULL, -1);
if ((infp = fopen(infile, "r")) == NULL) {
FILE_OP_ERROR(infile, "fopen");
return -1;
}
if (fseek(infp, mimeinfo->fpos, SEEK_SET) < 0) {
FILE_OP_ERROR(infile, "fseek");
fclose(infp);
return -1;
}
if ((outfp = fopen(outfile, "w")) == NULL) {
FILE_OP_ERROR(outfile, "fopen");
fclose(infp);
return -1;
}
while (fgets(buf, sizeof(buf), infp) != NULL)
if (buf[0] == '\r' || buf[0] == '\n') break;
procmime_decode_content(outfp, infp, mimeinfo);
fclose(infp);
if (fclose(outfp) == EOF) {
FILE_OP_ERROR(outfile, "fclose");
unlink(outfile);
return -1;
}
return 0;
}
FILE *procmime_get_text_part(MsgInfo *msginfo)
{
FILE *infp, *tmpfp, *outfp;
MimeInfo *mimeinfo, *partinfo = NULL;
gchar *src_codeset;
gboolean conv_fail = FALSE;
gchar buf[BUFFSIZE];
g_return_val_if_fail(msginfo != NULL, NULL);
mimeinfo = procmime_scan_message(msginfo);
if (!mimeinfo) return NULL;
if ((infp = procmsg_open_message(msginfo)) == NULL) {
procmime_mimeinfo_free_all(mimeinfo);
return NULL;
}
if (mimeinfo->mime_type == MIME_MULTIPART) {
partinfo = mimeinfo->children;
if (partinfo && partinfo->mime_type == MIME_TEXT) {
if (fseek(infp, partinfo->fpos, SEEK_SET) < 0) {
perror("fseek");
partinfo = NULL;
}
} else
partinfo = NULL;
} else if (mimeinfo->mime_type == MIME_TEXT) {
partinfo = mimeinfo;
if (fseek(infp, partinfo->fpos, SEEK_SET) < 0) {
perror("fseek");
partinfo = NULL;
}
}
if (!partinfo) {
procmime_mimeinfo_free_all(mimeinfo);
return NULL;
}
while (fgets(buf, sizeof(buf), infp) != NULL)
if (buf[0] == '\r' || buf[0] == '\n') break;
tmpfp = procmime_decode_content(NULL, infp, partinfo);
if (!tmpfp) {
procmime_mimeinfo_free_all(mimeinfo);
return NULL;
}
if ((outfp = my_tmpfile()) == NULL) {
perror("tmpfile");
fclose(tmpfp);
procmime_mimeinfo_free_all(mimeinfo);
return NULL;
}
src_codeset = prefs_common.force_charset
? prefs_common.force_charset : partinfo->charset;
while (fgets(buf, sizeof(buf), tmpfp) != NULL) {
gchar *str;
str = conv_codeset_strdup(buf, src_codeset, NULL);
if (str) {
fputs(str, outfp);
g_free(str);
} else {
conv_fail = TRUE;
fputs(buf, outfp);
}
}
if (conv_fail) g_warning(_("Code conversion failed.\n"));
fclose(tmpfp);
procmime_mimeinfo_free_all(mimeinfo);
rewind(outfp);
return outfp;
}
gchar *procmime_get_tmp_file_name(MimeInfo *mimeinfo)
{
static guint32 id = 0;
gchar *base;
gchar *filename;
gchar f_prefix[10];
g_return_val_if_fail(mimeinfo != NULL, NULL);
g_snprintf(f_prefix, sizeof(f_prefix), "%08x.", id++);
if (MIME_TEXT_HTML == mimeinfo->mime_type)
base = "mimetmp.html";
else {
base = mimeinfo->filename ? mimeinfo->filename
: mimeinfo->name ? mimeinfo->name : "mimetmp";
base = g_basename(base);
if (*base == '\0') base = "mimetmp";
}
filename = g_strconcat(get_mime_tmp_dir(), G_DIR_SEPARATOR_S,
f_prefix, base, NULL);
return filename;
}
static GList *mime_type_list = NULL;
gchar *procmime_get_mime_type(const gchar *filename)
{
static GHashTable *mime_type_table = NULL;
MimeType *mime_type;
const gchar *ext, *p;
if (!mime_type_table) {
mime_type_table = procmime_get_mime_type_table();
if (!mime_type_table) return NULL;
}
filename = g_basename(filename);
p = strrchr(filename, '.');
if (p)
ext = p + 1;
else
return NULL;
mime_type = g_hash_table_lookup(mime_type_table, ext);
if (mime_type) {
gchar *str;
str = g_strconcat(mime_type->type, "/", mime_type->sub_type,
NULL);
return str;
}
return NULL;
}
static GHashTable *procmime_get_mime_type_table(void)
{
GHashTable *table = NULL;
GList *cur;
MimeType *mime_type;
gchar **exts;
if (!mime_type_list) {
mime_type_list = procmime_get_mime_type_list();
if (!mime_type_list) return NULL;
}
table = g_hash_table_new(g_str_hash, g_str_equal);
for (cur = mime_type_list; cur != NULL; cur = cur->next) {
gint i;
mime_type = (MimeType *)cur->data;
if (!mime_type->extension) continue;
exts = g_strsplit(mime_type->extension, " ", 16);
for (i = 0; exts[i] != NULL; i++)
g_hash_table_insert(table, g_strdup(exts[i]),
mime_type);
g_strfreev(exts);
}
return table;
}
static GList *procmime_get_mime_type_list(void)
{
GList *list = NULL;
FILE *fp;
gchar buf[BUFFSIZE];
gchar *p, *delim;
MimeType *mime_type;
if ((fp = fopen("/etc/mime.types", "r")) == NULL) {
FILE_OP_ERROR("/etc/mime.types", "fopen");
return NULL;
}
while (fgets(buf, sizeof(buf), fp) != NULL) {
p = strchr(buf, '#');
if (p) *p = '\0';
g_strstrip(buf);
p = buf;
while (*p && !isspace(*p)) p++;
if (*p) {
*p = '\0';
p++;
}
delim = strchr(buf, '/');
if (delim == NULL) continue;
*delim = '\0';
mime_type = g_new(MimeType, 1);
mime_type->type = g_strdup(buf);
mime_type->sub_type = g_strdup(delim + 1);
while (*p && isspace(*p)) p++;
if (*p)
mime_type->extension = g_strdup(p);
else
mime_type->extension = NULL;
list = g_list_append(list, mime_type);
}
fclose(fp);
if (!list)
g_warning("Can't read mime.types\n");
return list;
}
EncodingType procmime_get_encoding_for_charset(const gchar *charset)
{
if (!charset)
return ENC_8BIT;
else if (!strncasecmp(charset, "ISO-2022-", 9) ||
!strcasecmp(charset, "US-ASCII"))
return ENC_7BIT;
else
return ENC_8BIT;
/* return ENC_BASE64; */
/* return ENC_QUOTED_PRINTABLE; */
}
const gchar *procmime_get_encoding_str(EncodingType encoding)
{
static const gchar *encoding_str[] = {
"7bit", "8bit", "quoted-printable", "base64", "x-uuencode",
NULL
};
if (encoding >= ENC_7BIT && encoding <= ENC_UNKNOWN)
return encoding_str[encoding];
else
return NULL;
}