message-header-encode.c revision 5b6e0b6569d5e79ddb868525063cfd04009437b4
/* Copyright (c) 2009-2014 Dovecot authors, see the included COPYING file */
#include "lib.h"
#include "str.h"
#include "base64.h"
#include "message-header-encode.h"
#define MIME_WRAPPER_LEN (strlen("=?utf-8?q?""?="))
#define MIME_MAX_LINE_LEN 76
#define IS_LWSP(c) \
((c) == ' ' || (c) == '\t' || (c) == '\n')
static bool input_idx_need_encoding(const unsigned char *input,
unsigned int i, unsigned int len)
{
/* 8bit chars */
if ((input[i] & 0x80) != 0)
return TRUE;
/* control chars */
if (input[i] < 32)
return TRUE;
/* <LWSP>=? */
if (input[i] == '=' && i+1 < len && input[i+1] == '?' &&
(i == 0 || IS_LWSP(input[i-1])))
return TRUE;
return FALSE;
}
void message_header_encode_q(const unsigned char *input, unsigned int len,
string_t *output, unsigned int first_line_len)
{
unsigned int i, line_len_left;
line_len_left = MIME_MAX_LINE_LEN - MIME_WRAPPER_LEN;
if (first_line_len >= MIME_MAX_LINE_LEN - MIME_WRAPPER_LEN - 3) {
str_append(output, "\n\t");
line_len_left--;
} else {
line_len_left -= first_line_len;
}
str_append(output, "=?utf-8?q?");
for (i = 0; i < len; i++) {
if (line_len_left < 3) {
/* if we're not at the beginning of a character,
go backwards until we are */
while ((input[i] & 0xc0) == 0x80) {
str_truncate(output, str_len(output)-3);
i--;
}
str_append(output, "?=\n\t=?utf-8?q?");
line_len_left = MIME_MAX_LINE_LEN -
MIME_WRAPPER_LEN - 1;
}
switch (input[i]) {
case ' ':
str_append_c(output, '_');
break;
case '=':
case '?':
case '_':
line_len_left -= 2;
str_printfa(output, "=%02X", input[i]);
break;
default:
if (input[i] < 32 || (input[i] & 0x80) != 0) {
line_len_left -= 2;
str_printfa(output, "=%02X", input[i]);
} else {
str_append_c(output, input[i]);
}
break;
}
line_len_left--;
}
str_append(output, "?=");
}
void message_header_encode_b(const unsigned char *input, unsigned int len,
string_t *output, unsigned int first_line_len)
{
unsigned int line_len, line_len_left, max;
line_len = first_line_len;
if (line_len >= MIME_MAX_LINE_LEN - MIME_WRAPPER_LEN) {
str_append(output, "\n\t");
line_len = 1;
}
for (;;) {
line_len_left = MIME_MAX_LINE_LEN - MIME_WRAPPER_LEN - line_len;
max = MAX_BASE64_DECODED_SIZE(line_len_left);
do {
max--;
if (max > len)
max = len;
else {
/* all of it doesn't fit. find a character where we
can split it from. */
while (max > 0 && (input[max] & 0xc0) == 0x80)
max--;
}
} while (MAX_BASE64_ENCODED_SIZE(max) > line_len_left &&
max > 0);
if (max > 0) {
str_append(output, "=?utf-8?b?");
base64_encode(input, max, output);
str_append(output, "?=");
}
input += max;
len -= max;
if (len == 0)
break;
str_append(output, "\n\t");
line_len = 1;
}
}
void message_header_encode(const char *input, string_t *output)
{
message_header_encode_data((const void *)input, strlen(input), output);
}
void message_header_encode_data(const unsigned char *input, unsigned int len,
string_t *output)
{
unsigned int i, first_idx, last_idx;
unsigned int enc_chars, enc_len, base64_len, q_len;
bool use_q;
/* find the first word that needs encoding */
for (i = 0; i < len; i++) {
if (input_idx_need_encoding(input, i, len))
break;
}
if (i == len) {
/* no encoding necessary */
str_append_data(output, input, len);
return;
}
first_idx = i;
while (first_idx > 0 && !IS_LWSP(input[first_idx-1]))
first_idx--;
/* find the last word that needs encoding */
last_idx = ++i; enc_chars = 1;
for (; i < len; i++) {
if (input_idx_need_encoding(input, i, len)) {
last_idx = i + 1;
enc_chars++;
}
}
while (last_idx < len && !IS_LWSP(input[last_idx]))
last_idx++;
/* figure out if we should use Q or B encoding. Prefer Q if it's not
too much larger. */
enc_len = last_idx - first_idx;
base64_len = MAX_BASE64_ENCODED_SIZE(enc_len);
q_len = enc_len + enc_chars*3;
use_q = q_len*2/3 <= base64_len;
/* and do it */
str_append_data(output, input, first_idx);
if (use_q) {
message_header_encode_q(input + first_idx, enc_len,
output, first_idx);
} else {
message_header_encode_b(input + first_idx, enc_len,
output, first_idx);
}
str_append_data(output, input + last_idx, len - last_idx);
}