module arsd.email; import std.net.curl; pragma(lib, "curl"); import std.base64; import std.string; import arsd.characterencodings; // SEE ALSO: std.net.curl.SMTP struct RelayInfo { string server; string username; string password; } struct MimeAttachment { string type; string filename; const(void)[] content; string id; } class EmailMessage { void setHeader(string name, string value) { headers ~= name ~ ": " ~ value; } string[] to; string[] cc; string[] bcc; string from; string replyTo; string inReplyTo; string textBody; string htmlBody; string subject; string[] headers; private bool isMime = false; private bool isHtml = false; void setTextBody(string text) { textBody = text; } void setHtmlBody(string html) { isMime = true; isHtml = true; htmlBody = html; import arsd.htmltotext; if(textBody is null) textBody = htmlToText(html); } const(MimeAttachment)[] attachments; void addAttachment(string mimeType, string filename, in void[] content, string id = null) { isMime = true; attachments ~= MimeAttachment(mimeType, filename, content, id); } // in the html, use img src="cid:ID_GIVEN_HERE" void addInlineImage(string id, string mimeType, string filename, in void[] content) { assert(isHtml); isMime = true; inlineImages ~= MimeAttachment(mimeType, filename, content, id); } const(MimeAttachment)[] inlineImages; /* we should build out the mime thingy related mixed alternate */ override string toString() { assert(!isHtml || (isHtml && isMime)); auto headers = this.headers; if(to.length) headers ~= "To: " ~ join(to, ", "); if(cc.length) headers ~= "Cc: " ~ join(cc, ", "); if(from.length) headers ~= "From: " ~ from; if(subject !is null) headers ~= "Subject: " ~ subject; if(replyTo !is null) headers ~= "Reply-To: " ~ replyTo; if(inReplyTo !is null) headers ~= "In-Reply-To: " ~ inReplyTo; if(isMime) headers ~= "MIME-Version: 1.0"; /+ if(inlineImages.length) { headers ~= "Content-Type: multipart/related; boundary=" ~ boundary; // so we put the alternative inside asthe first attachment with as seconary boundary // then we do the images } else if(attachments.length) headers ~= "Content-Type: multipart/mixed; boundary=" ~ boundary; else if(isHtml) headers ~= "Content-Type: multipart/alternative; boundary=" ~ boundary; else headers ~= "Content-Type: text/plain; charset=UTF-8"; +/ string msgContent; if(isMime) { MimeContainer top; { MimeContainer mimeMessage; if(isHtml) { auto alternative = new MimeContainer("multipart/alternative"); alternative.stuff ~= new MimeContainer("text/plain; charset=UTF-8", textBody); alternative.stuff ~= new MimeContainer("text/html; charset=UTF-8", htmlBody); mimeMessage = alternative; } else { mimeMessage = new MimeContainer("text/plain; charset=UTF-8", textBody); } top = mimeMessage; } { MimeContainer mimeRelated; if(inlineImages.length) { mimeRelated = new MimeContainer("multipart/related"); mimeRelated.stuff ~= top; top = mimeRelated; foreach(attachment; inlineImages) { auto mimeAttachment = new MimeContainer(attachment.type ~ "; name=\""~attachment.filename~"\""); mimeAttachment.headers ~= "Content-Transfer-Encoding: base64"; mimeAttachment.headers ~= "Content-ID: <" ~ attachment.id ~ ">"; mimeAttachment.content = Base64.encode(cast(const(ubyte)[]) attachment.content); mimeRelated.stuff ~= mimeAttachment; } } } { MimeContainer mimeMixed; if(attachments.length) { mimeMixed = new MimeContainer("multipart/mixed"); mimeMixed.stuff ~= top; top = mimeMixed; foreach(attachment; attachments) { auto mimeAttachment = new MimeContainer(attachment.type); mimeAttachment.headers ~= "Content-Disposition: attachment; filename=\""~attachment.filename~"\""; mimeAttachment.headers ~= "Content-Transfer-Encoding: base64"; if(attachment.id.length) mimeAttachment.headers ~= "Content-ID: <" ~ attachment.id ~ ">"; mimeAttachment.content = Base64.encode(cast(const(ubyte)[]) attachment.content); mimeMixed.stuff ~= mimeAttachment; } } } headers ~= top.contentType; msgContent = top.toMimeString(true); } else { headers ~= "Content-Type: text/plain; charset=UTF-8"; msgContent = textBody; } string msg; msg.reserve(htmlBody.length + textBody.length + 1024); foreach(header; headers) msg ~= header ~ "\r\n"; if(msg.length) // has headers msg ~= "\r\n"; msg ~= msgContent; return msg; } void send(RelayInfo mailServer = RelayInfo("smtp://localhost")) { auto smtp = SMTP(mailServer.server); smtp.verifyHost = false; smtp.verifyPeer = false; // smtp.verbose = true; if(mailServer.username.length) smtp.setAuthentication(mailServer.username, mailServer.password); const(char)[][] allRecipients = cast(const(char)[][]) (to ~ cc ~ bcc); // WTF cast smtp.mailTo(allRecipients); auto mailFrom = from; auto idx = mailFrom.indexOf("<"); if(idx != -1) mailFrom = mailFrom[idx + 1 .. $]; idx = mailFrom.indexOf(">"); if(idx != -1) mailFrom = mailFrom[0 .. idx]; smtp.mailFrom = mailFrom; smtp.message = this.toString(); smtp.perform(); } } void email(string to, string subject, string message, string from, RelayInfo mailServer = RelayInfo("smtp://localhost")) { auto msg = new EmailMessage(); msg.from = from; msg.to = [to]; msg.subject = subject; msg.textBody = message; msg.send(mailServer); } // private: import std.conv; // for reading class MimePart { string[] headers; immutable(ubyte)[] content; string textContent; MimePart[] stuff; string name; string charset; string type; string transferEncoding; string disposition; string id; string filename; MimeAttachment toMimeAttachment() { MimeAttachment att; att.type = type; att.filename = filename; att.id = id; att.content = content; return att; } this(immutable(ubyte)[][] lines, string contentType = null) { string boundary; void parseContentType(string content) { foreach(k, v; breakUpHeaderParts(content)) { switch(k) { case "root": type = v; break; case "name": name = v; break; case "charset": charset = v; break; case "boundary": boundary = v; break; default: } } } if(contentType is null) { // read headers immediately... auto copyOfLines = lines; immutable(ubyte)[] currentHeader; void commitHeader() { if(currentHeader.length == 0) return; string h = decodeEncodedWord(cast(string) currentHeader); headers ~= h; currentHeader = null; auto idx = h.indexOf(":"); if(idx != -1) { auto name = h[0 .. idx].strip.toLower; auto content = h[idx + 1 .. $].strip; switch(name) { case "content-type": parseContentType(content); break; case "content-transfer-encoding": transferEncoding = content.toLower; break; case "content-disposition": foreach(k, v; breakUpHeaderParts(content)) { switch(k) { case "root": disposition = v; break; case "filename": filename = v; break; default: } } break; case "content-id": id = content; break; default: } } } foreach(line; copyOfLines) { lines = lines[1 .. $]; if(line.length == 0) break; if(line[0] == ' ' || line[0] == '\t') currentHeader ~= (cast(string) line).stripLeft(); else { if(currentHeader.length) { commitHeader(); } currentHeader = line; } } commitHeader(); } else { parseContentType(contentType); } // if it is multipart, find the start boundary. we'll break it up and fill in stuff // otherwise, all the data that follows is just content if(boundary.length) { immutable(ubyte)[][] partLines; bool inPart; foreach(line; lines) { if(line.startsWith("--" ~ boundary)) { if(inPart) stuff ~= new MimePart(partLines); inPart = true; partLines = null; if(line == "--" ~ boundary ~ "--") break; // all done } if(inPart) { partLines ~= line; } else { content ~= line ~ '\n'; } } } else { foreach(line; lines) { content ~= line; if(transferEncoding != "base64") content ~= '\n'; } } // decode the content.. switch(transferEncoding) { case "base64": content = Base64.decode(cast(string) content); break; case "quoted-printable": content = decodeQuotedPrintable(cast(string) content); break; default: // no change needed (I hope) } if(type.indexOf("text/") == 0) { if(charset.length == 0) charset = "latin1"; textContent = convertToUtf8Lossy(content, charset); } } } string[string] breakUpHeaderParts(string headerContent) { string[string] ret; string currentName = "root"; string currentContent; bool inQuote = false; bool gettingName = false; bool ignoringSpaces = false; foreach(char c; headerContent) { if(ignoringSpaces) { if(c == ' ') continue; else ignoringSpaces = false; } if(gettingName) { if(c == '=') { gettingName = false; continue; } currentName ~= c; } if(c == '"') { inQuote = !inQuote; continue; } if(!inQuote && c == ';') { ret[currentName] = currentContent; ignoringSpaces = true; currentName = null; currentContent = null; gettingName = true; continue; } if(!gettingName) currentContent ~= c; } if(currentName.length) ret[currentName] = currentContent; return ret; } // for writing class MimeContainer { private static int sequence; immutable string _contentType; immutable string boundary; string[] headers; // NOT including content-type string content; MimeContainer[] stuff; this(string contentType, string content = null) { this._contentType = contentType; this.content = content; sequence++; if(_contentType.indexOf("multipart/") == 0) boundary = "0016e64be86203dd36047610926a" ~ to!string(sequence); } @property string contentType() { string ct = "Content-Type: "~_contentType; if(boundary.length) ct ~= "; boundary=" ~ boundary; return ct; } string toMimeString(bool isRoot = false) { string ret; if(!isRoot) { ret ~= contentType; foreach(header; headers) { ret ~= "\r\n"; ret ~= header; } ret ~= "\r\n\r\n"; } ret ~= content; foreach(idx, thing; stuff) { assert(boundary.length); ret ~= "\r\n--" ~ boundary ~ "\r\n"; ret ~= thing.toMimeString(false); } if(boundary.length) ret ~= "\r\n--" ~ boundary ~ "--"; return ret; } } import std.algorithm : startsWith; class IncomingEmailMessage { this(ref immutable(ubyte)[][] mboxLines) { enum ParseState { lookingForFrom, readingHeaders, readingBody } auto state = ParseState.lookingForFrom; string contentType; bool isMultipart; bool isHtml; immutable(ubyte)[][] mimeLines; string charset = "latin-1"; string contentTransferEncoding; string headerName; string headerContent; void commitHeader() { if(headerName is null) return; headerName = headerName.toLower(); headerContent = headerContent.strip(); headerContent = decodeEncodedWord(headerContent); if(headerName == "content-type") { contentType = headerContent; if(contentType.indexOf("multipart/") != -1) isMultipart = true; else if(contentType.indexOf("text/html") != -1) isHtml = true; auto charsetIdx = contentType.indexOf("charset="); if(charsetIdx != -1) { string cs = contentType[charsetIdx + "charset=".length .. $]; if(cs.length && cs[0] == '\"') cs = cs[1 .. $]; auto quoteIdx = cs.indexOf("\""); if(quoteIdx != -1) cs = cs[0 .. quoteIdx]; auto semicolonIdx = cs.indexOf(";"); if(semicolonIdx != -1) cs = cs[0 .. semicolonIdx]; cs = cs.strip(); if(cs.length) charset = cs.toLower(); } } else if(headerName == "from") { this.from = headerContent; } else if(headerName == "to") { this.to = headerContent; } else if(headerName == "subject") { this.subject = headerContent; } else if(headerName == "content-transfer-encoding") { contentTransferEncoding = headerContent; } headers[headerName] = headerContent; headerName = null; headerContent = null; } lineLoop: while(mboxLines.length) { // this can needlessly convert headers too, but that won't harm anything since they are 7 bit anyway auto line = convertToUtf8Lossy(mboxLines[0], charset); line = line.stripRight; final switch(state) { case ParseState.lookingForFrom: if(line.startsWith("From ")) state = ParseState.readingHeaders; break; case ParseState.readingHeaders: if(line.length == 0) { commitHeader(); state = ParseState.readingBody; } else { if(line[0] == ' ' || line[0] == '\t') { headerContent ~= " " ~ line.stripLeft(); } else { commitHeader(); auto idx = line.indexOf(":"); if(idx == -1) headerName = line; else { headerName = line[0 .. idx]; headerContent = line[idx + 1 .. $].stripLeft(); } } } break; case ParseState.readingBody: if(line.startsWith("From ")) { break lineLoop; // we're at the beginning of the next messsage } if(line.startsWith(">>From") || line.startsWith(">From")) { line = line[1 .. $]; } if(isMultipart) { mimeLines ~= mboxLines[0]; } else if(isHtml) { // html with no alternative and no attachments htmlMessageBody ~= line ~ "\n"; } else { // plain text! textMessageBody ~= line ~ "\n"; } break; } mboxLines = mboxLines[1 .. $]; } if(mimeLines.length) { auto part = new MimePart(mimeLines, contentType); deeperInTheMimeTree: switch(part.type) { case "text/html": htmlMessageBody = part.textContent; break; case "text/plain": textMessageBody = part.textContent; break; case "multipart/alternative": foreach(p; part.stuff) { if(p.type == "text/html") htmlMessageBody = p.textContent; else if(p.type == "text/plain") textMessageBody = p.textContent; } break; case "multipart/related": // the first one is the message itself // after that comes attachments that can be rendered inline if(part.stuff.length) { auto msg = part.stuff[0]; foreach(thing; part.stuff[1 .. $]) { // FIXME: should this be special? attachments ~= thing.toMimeAttachment(); } part = msg; goto deeperInTheMimeTree; } break; case "multipart/mixed": if(part.stuff.length) { auto msg = part.stuff[0]; foreach(thing; part.stuff[1 .. $]) { attachments ~= thing.toMimeAttachment(); } part = msg; goto deeperInTheMimeTree; } // FIXME: the more proper way is: // check the disposition // if none, concat it to make a text message body // if inline it is prolly an image to be concated in the other body // if attachment, it is an attachment break; case "multipart/signed": // FIXME: it would be cool to actually check the signature default: // FIXME: correctly handle more if(part.stuff.length) { part = part.stuff[0]; goto deeperInTheMimeTree; } } } else { switch(contentTransferEncoding) { case "quoted-printable": if(textMessageBody.length) textMessageBody = convertToUtf8Lossy(decodeQuotedPrintable(textMessageBody), charset); if(htmlMessageBody.length) htmlMessageBody = convertToUtf8Lossy(decodeQuotedPrintable(htmlMessageBody), charset); break; default: // nothing needed } } if(htmlMessageBody.length > 0 && textMessageBody.length == 0) { import arsd.htmltotext; textMessageBody = htmlToText(htmlMessageBody); textAutoConverted = true; } } string[string] headers; string subject; string htmlMessageBody; string textMessageBody; string from; string to; bool textAutoConverted; MimeAttachment[] attachments; } struct MboxMessages { immutable(ubyte)[][] linesRemaining; this(immutable(ubyte)[] data) { linesRemaining = splitLinesWithoutDecoding(data); popFront(); } IncomingEmailMessage currentFront; IncomingEmailMessage front() { return currentFront; } bool empty() { return currentFront is null; } void popFront() { if(linesRemaining.length) currentFront = new IncomingEmailMessage(linesRemaining); else currentFront = null; } } MboxMessages processMboxData(immutable(ubyte)[] data) { return MboxMessages(data); } immutable(ubyte)[][] splitLinesWithoutDecoding(immutable(ubyte)[] data) { immutable(ubyte)[][] ret; size_t starting = 0; bool justSaw13 = false; foreach(idx, b; data) { if(b == 13) justSaw13 = true; if(b == 10) { auto use = idx; if(justSaw13) use--; ret ~= data[starting .. use]; starting = idx + 1; } if(b != 13) justSaw13 = false; } if(starting < data.length) ret ~= data[starting .. $]; return ret; } string decodeEncodedWord(string data) { string originalData = data; auto delimiter = data.indexOf("=?"); if(delimiter == -1) return data; string ret; while(delimiter != -1) { ret ~= data[0 .. delimiter]; data = data[delimiter + 2 .. $]; string charset; string encoding; string encodedText; // FIXME: the insane things should probably throw an // exception that keeps a copy of orignal data for use later auto questionMark = data.indexOf("?"); if(questionMark == -1) return originalData; // not sane charset = data[0 .. questionMark]; data = data[questionMark + 1 .. $]; questionMark = data.indexOf("?"); if(questionMark == -1) return originalData; // not sane encoding = data[0 .. questionMark]; data = data[questionMark + 1 .. $]; questionMark = data.indexOf("?="); if(questionMark == -1) return originalData; // not sane encodedText = data[0 .. questionMark]; data = data[questionMark + 2 .. $]; delimiter = data.indexOf("=?"); if (delimiter == 1 && data[0] == ' ') { // a single space between encoded words must be ignored because it is // used to separate multiple encoded words (RFC2047 says CRLF SPACE but a most clients // just use a space) data = data[1..$]; delimiter = 0; } immutable(ubyte)[] decodedText; if(encoding == "Q") decodedText = decodeQuotedPrintable(encodedText); else if(encoding == "B") decodedText = cast(typeof(decodedText)) Base64.decode(encodedText); else return originalData; // wtf ret ~= convertToUtf8Lossy(decodedText, charset); } ret ~= data; // keep the rest since there could be trailing stuff return ret; } immutable(ubyte)[] decodeQuotedPrintable(string text) { immutable(ubyte)[] ret; int state = 0; ubyte hexByte; foreach(b; cast(immutable(ubyte)[]) text) { switch(state) { case 0: if(b == '=') { state++; hexByte = 0; } else if (b == '_') { // RFC2047 4.2.2: a _ may be used to represent a space ret ~= ' '; } else ret ~= b; break; case 1: if(b == '\n') { state = 0; continue; } goto case; case 2: int value; if(b >= '0' && b <= '9') value = b - '0'; else if(b >= 'A' && b <= 'F') value = b - 'A' + 10; else if(b >= 'a' && b <= 'f') value = b - 'a' + 10; if(state == 1) { hexByte |= value << 4; state++; } else { hexByte |= value; ret ~= hexByte; state = 0; } break; default: assert(0); } } return ret; } /+ void main() { import std.file; import std.stdio; auto data = cast(immutable(ubyte)[]) std.file.read("/home/me/test_email_data"); foreach(message; processMboxData(data)) { writeln(message.subject); writeln(message.textMessageBody); writeln("**************** END MESSSAGE **************"); } } +/