// Copyright (c) 2020 Proton Technologies AG // // This file is part of ProtonMail Bridge. // // ProtonMail Bridge is free software: you can redistribute it and/or modify // it under the terms of the GNU General Public License as published by // the Free Software Foundation, either version 3 of the License, or // (at your option) any later version. // // ProtonMail Bridge is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU General Public License for more details. // // You should have received a copy of the GNU General Public License // along with ProtonMail Bridge. If not, see . package message import ( "bytes" "fmt" "io" "mime" "net/mail" "net/textproto" "strings" "github.com/ProtonMail/proton-bridge/pkg/message/parser" pmmime "github.com/ProtonMail/proton-bridge/pkg/mime" "github.com/ProtonMail/proton-bridge/pkg/pmapi" "github.com/emersion/go-message" "github.com/jaytaylor/html2text" "github.com/pkg/errors" "github.com/sirupsen/logrus" ) func Parse(r io.Reader, key, keyName string) (m *pmapi.Message, mimeBody, plainBody string, attReaders []io.Reader, err error) { logrus.Trace("Parsing message") p, err := parser.New(r) if err != nil { err = errors.Wrap(err, "failed to create new parser") return } if err = convertForeignEncodings(p); err != nil { err = errors.Wrap(err, "failed to convert foreign encodings") return } m = pmapi.NewMessage() if err = parseMessageHeader(m, p.Root().Header); err != nil { err = errors.Wrap(err, "failed to parse message header") return } if m.Attachments, attReaders, err = collectAttachments(p); err != nil { err = errors.Wrap(err, "failed to collect attachments") return } if m.Body, plainBody, err = buildBodies(p); err != nil { err = errors.Wrap(err, "failed to build bodies") return } if m.MIMEType, err = determineMIMEType(p); err != nil { err = errors.Wrap(err, "failed to determine mime type") return } // We only attach the public key manually to the MIME body for // signed/encrypted external recipients. It's not important for it to be // collected as an attachment; that's already done when we upload the draft. if key != "" { attachPublicKey(p.Root(), key, keyName) } mimeBodyBuffer := new(bytes.Buffer) if err = p.NewWriter().Write(mimeBodyBuffer); err != nil { err = errors.Wrap(err, "failed to write out mime message") return } return m, mimeBodyBuffer.String(), plainBody, attReaders, nil } func convertForeignEncodings(p *parser.Parser) error { logrus.Trace("Converting foreign encodings") return p.NewWalker(). RegisterContentTypeHandler("text/html", func(p *parser.Part) error { if err := p.ConvertToUTF8(); err != nil { return err } return p.ConvertMetaCharset() }). RegisterContentTypeHandler("text/.*", func(p *parser.Part) error { return p.ConvertToUTF8() }). RegisterDefaultHandler(func(p *parser.Part) error { t, params, _ := p.ContentType() // multipart/alternative, for example, can contain extra charset. if params != nil && params["charset"] != "" { return p.ConvertToUTF8() } logrus.WithField("type", t).Trace("Not converting part to utf-8") return nil }). Walk() } func collectAttachments(p *parser.Parser) ([]*pmapi.Attachment, []io.Reader, error) { var ( atts []*pmapi.Attachment data []io.Reader err error ) w := p.NewWalker(). RegisterContentDispositionHandler("attachment", func(p *parser.Part) error { att, err := parseAttachment(p.Header) if err != nil { return err } atts = append(atts, att) data = append(data, bytes.NewReader(p.Body)) return nil }). RegisterContentTypeHandler("text/calendar", func(p *parser.Part) error { att, err := parseAttachment(p.Header) if err != nil { return err } atts = append(atts, att) data = append(data, bytes.NewReader(p.Body)) return nil }). RegisterContentTypeHandler("text/.*", func(p *parser.Part) error { return nil }). RegisterDefaultHandler(func(p *parser.Part) error { if len(p.Children()) > 0 { return nil } att, err := parseAttachment(p.Header) if err != nil { return err } atts = append(atts, att) data = append(data, bytes.NewReader(p.Body)) return nil }) if err = w.Walk(); err != nil { return nil, nil, err } return atts, data, nil } // buildBodies collects all text/html and text/plain parts and returns two bodies, // - a rich text body (in which html is allowed), and // - a plaintext body (in which html is converted to plaintext). // // text/html parts are converted to plaintext in order to build the plaintext body, // unless there is already a plaintext part provided via multipart/alternative, // in which case the provided alternative is chosen. func buildBodies(p *parser.Parser) (richBody, plainBody string, err error) { richParts, err := collectBodyParts(p, "text/html") if err != nil { return } plainParts, err := collectBodyParts(p, "text/plain") if err != nil { return } richBuilder, plainBuilder := strings.Builder{}, strings.Builder{} for _, richPart := range richParts { _, _ = richBuilder.Write(richPart.Body) } for _, plainPart := range plainParts { _, _ = plainBuilder.Write(getPlainBody(plainPart)) } return richBuilder.String(), plainBuilder.String(), nil } // collectBodyParts collects all body parts in the parse tree, preferring // parts of the given content type if alternatives exist. func collectBodyParts(p *parser.Parser, preferredContentType string) (parser.Parts, error) { v := p. NewVisitor(func(p *parser.Part, visit parser.Visit) (interface{}, error) { childParts, err := collectChildParts(p, visit) if err != nil { return nil, err } return joinChildParts(childParts), nil }). RegisterRule("multipart/alternative", func(p *parser.Part, visit parser.Visit) (interface{}, error) { childParts, err := collectChildParts(p, visit) if err != nil { return nil, err } return bestChoice(childParts, preferredContentType), nil }). RegisterRule("text/plain", func(p *parser.Part, visit parser.Visit) (interface{}, error) { disp, _, err := p.Header.ContentDisposition() if err != nil { disp = "" } if disp == "attachment" { return parser.Parts{}, nil } return parser.Parts{p}, nil }). RegisterRule("text/html", func(p *parser.Part, visit parser.Visit) (interface{}, error) { disp, _, err := p.Header.ContentDisposition() if err != nil { disp = "" } if disp == "attachment" { return parser.Parts{}, nil } return parser.Parts{p}, nil }) res, err := v.Visit() if err != nil { return nil, err } return res.(parser.Parts), nil } func collectChildParts(p *parser.Part, visit parser.Visit) ([]parser.Parts, error) { childParts := []parser.Parts{} for _, child := range p.Children() { res, err := visit(child) if err != nil { return nil, err } childParts = append(childParts, res.(parser.Parts)) } return childParts, nil } func joinChildParts(childParts []parser.Parts) parser.Parts { res := parser.Parts{} for _, parts := range childParts { res = append(res, parts...) } return res } func bestChoice(childParts []parser.Parts, preferredContentType string) parser.Parts { // If one of the parts has preferred content type, use that. for i := len(childParts) - 1; i >= 0; i-- { if allPartsHaveContentType(childParts[i], preferredContentType) { return childParts[i] } } // Otherwise, choose the last one. return childParts[len(childParts)-1] } func allPartsHaveContentType(parts parser.Parts, contentType string) bool { if len(parts) == 0 { return false } for _, part := range parts { t, _, err := part.ContentType() if err != nil { return false } if t != contentType { return false } } return true } func determineMIMEType(p *parser.Parser) (string, error) { var isHTML bool w := p.NewWalker(). RegisterContentTypeHandler("text/html", func(p *parser.Part) (err error) { isHTML = true return }) if err := w.Walk(); err != nil { return "", err } if isHTML { return "text/html", nil } return "text/plain", nil } // getPlainBody returns the body of the given part, converting html to // plaintext where possible. func getPlainBody(part *parser.Part) []byte { contentType, _, err := part.ContentType() if err != nil { return part.Body } switch contentType { case "text/html": text, err := html2text.FromReader(bytes.NewReader(part.Body)) if err != nil { return part.Body } return []byte(text) default: return part.Body } } func attachPublicKey(p *parser.Part, key, keyName string) { h := message.Header{} h.Set("Content-Type", fmt.Sprintf(`application/pgp-keys; name="%v.asc"; filename="%v.asc"`, keyName, keyName)) h.Set("Content-Disposition", fmt.Sprintf(`attachment; name="%v.asc"; filename="%v.asc"`, keyName, keyName)) h.Set("Content-Transfer-Encoding", "base64") p.AddChild(&parser.Part{ Header: h, Body: []byte(key), }) } // NOTE: We should use our own ParseAddressList here. func parseMessageHeader(m *pmapi.Message, h message.Header) error { // nolint[funlen] mimeHeader, err := toMailHeader(h) if err != nil { return err } m.Header = mimeHeader if err := forEachDecodedHeaderField(h, func(key, val string) error { switch strings.ToLower(key) { case "subject": m.Subject = val case "from": sender, err := parseAddressList(val) if err != nil { return err } if len(sender) > 0 { m.Sender = sender[0] } case "to": toList, err := parseAddressList(val) if err != nil { return err } m.ToList = toList case "reply-to": replyTos, err := parseAddressList(val) if err != nil { return err } m.ReplyTos = replyTos case "cc": ccList, err := parseAddressList(val) if err != nil { return err } m.CCList = ccList case "bcc": bccList, err := parseAddressList(val) if err != nil { return err } m.BCCList = bccList case "date": date, err := mail.ParseDate(val) if err != nil { return err } m.Time = date.Unix() } return nil }); err != nil { return err } return nil } func parseAttachment(h message.Header) (*pmapi.Attachment, error) { att := &pmapi.Attachment{} mimeHeader, err := toMIMEHeader(h) if err != nil { return nil, err } att.Header = mimeHeader mimeType, _, err := h.ContentType() if err != nil { return nil, err } att.MIMEType = mimeType _, dispParams, dispErr := h.ContentDisposition() if dispErr != nil { ext, err := mime.ExtensionsByType(att.MIMEType) if err != nil { return nil, err } if len(ext) > 0 { att.Name = "attachment" + ext[0] } } else { att.Name = dispParams["filename"] if att.Name == "" { att.Name = "attachment.bin" } } att.ContentID = strings.Trim(h.Get("Content-Id"), " <>") return att, nil } func forEachDecodedHeaderField(h message.Header, fn func(string, string) error) error { fields := h.Fields() for fields.Next() { text, err := fields.Text() if err != nil { if !message.IsUnknownCharset(err) { return err } if text, err = pmmime.DecodeHeader(fields.Value()); err != nil { return err } } if err := fn(fields.Key(), text); err != nil { return err } } return nil } func toMailHeader(h message.Header) (mail.Header, error) { mimeHeader := make(mail.Header) if err := forEachDecodedHeaderField(h, func(key, val string) error { mimeHeader[key] = []string{val} return nil }); err != nil { return nil, err } return mimeHeader, nil } func toMIMEHeader(h message.Header) (textproto.MIMEHeader, error) { mimeHeader := make(textproto.MIMEHeader) if err := forEachDecodedHeaderField(h, func(key, val string) error { mimeHeader[key] = []string{val} return nil }); err != nil { return nil, err } return mimeHeader, nil }