// Copyright 2012 The Go Authors. All rights reserved. // Use of this source code is governed by a BSD-style // license that can be found in the LICENSE file. // Package quotedprintable implements quoted-printable encoding as specified by // RFC 2045. package quotedprintable import ( "bufio" "bytes" "fmt" "io" ) // Reader is a quoted-printable decoder. type Reader struct { br *bufio.Reader rerr error // last read error line []byte // to be consumed before more of br } // NewReader returns a quoted-printable reader, decoding from r. func NewReader(r io.Reader) *Reader { return &Reader{ br: bufio.NewReader(r), } } func fromHex(b byte) (byte, error) { switch { case b >= '0' && b <= '9': return b - '0', nil case b >= 'A' && b <= 'F': return b - 'A' + 10, nil // Accept badly encoded bytes. case b >= 'a' && b <= 'f': return b - 'a' + 10, nil } return 0, fmt.Errorf("quotedprintable: invalid hex byte 0x%02x", b) } func readHexByte(v []byte) (b byte, err error) { if len(v) < 2 { return 0, io.ErrUnexpectedEOF } var hb, lb byte if hb, err = fromHex(v[0]); err != nil { return 0, err } if lb, err = fromHex(v[1]); err != nil { return 0, err } return hb<<4 | lb, nil } func isQPDiscardWhitespace(r rune) bool { switch r { case '\n', '\r', ' ', '\t': return true } return false } var ( crlf = []byte("\r\n") lf = []byte("\n") softSuffix = []byte("=") ) // Read reads and decodes quoted-printable data from the underlying reader. func (r *Reader) Read(p []byte) (n int, err error) { // Deviations from RFC 2045: // 1. in addition to "=\r\n", "=\n" is also treated as soft line break. // 2. it will pass through a '\r' or '\n' not preceded by '=', consistent // with other broken QP encoders & decoders. // 3. it accepts soft line-break (=) at end of message (issue 15486); i.e. // the final byte read from the underlying reader is allowed to be '=', // and it will be silently ignored. // 4. it takes = as literal = if not followed by two hex digits // but not at end of line (issue 13219). for len(p) > 0 { if len(r.line) == 0 { if r.rerr != nil { return n, r.rerr } r.line, r.rerr = r.br.ReadSlice('\n') // Does the line end in CRLF instead of just LF? hasLF := bytes.HasSuffix(r.line, lf) hasCR := bytes.HasSuffix(r.line, crlf) wholeLine := r.line r.line = bytes.TrimRightFunc(wholeLine, isQPDiscardWhitespace) if bytes.HasSuffix(r.line, softSuffix) { rightStripped := wholeLine[len(r.line):] r.line = r.line[:len(r.line)-1] if !bytes.HasPrefix(rightStripped, lf) && !bytes.HasPrefix(rightStripped, crlf) && !(len(rightStripped) == 0 && len(r.line) > 0 && r.rerr == io.EOF) { r.rerr = fmt.Errorf("quotedprintable: invalid bytes after =: %q", rightStripped) } } else if hasLF { if hasCR { r.line = append(r.line, '\r', '\n') } else { r.line = append(r.line, '\n') } } continue } b := r.line[0] switch { case b == '=': b, err = readHexByte(r.line[1:]) if err != nil { if len(r.line) >= 2 && r.line[1] != '\r' && r.line[1] != '\n' { // Take the = as a literal =. b = '=' break } return n, err } r.line = r.line[2:] // 2 of the 3; other 1 is done below case b == '\t' || b == '\r' || b == '\n': break case b >= 0x80: // As an extension to RFC 2045, we accept // values >= 0x80 without complaint. Issue 22597. break case b < ' ' || b > '~': return n, fmt.Errorf("quotedprintable: invalid unescaped byte 0x%02x in body", b) } p[0] = b p = p[1:] r.line = r.line[1:] n++ } return n, nil }