Commit 27d0a731 authored by Brad Fitzpatrick

mime/multipart: fix regression from previous ReadSlice change

The previous change, which made multipart use ReadSlice out of
paranoia, broke multipart's handling of long lines in part
bodies.

We should only be paranoid about long lines in the header
sections.

Fixes http://code.google.com/p/camlistore/issues/detail?id=4

R=adg
CC=golang-dev
https://golang.org/cl/4432083
parent cb375ffb
...@@ -15,13 +15,13 @@ package multipart ...@@ -15,13 +15,13 @@ package multipart
import ( import (
"bufio" "bufio"
"bytes" "bytes"
"fmt"
"io" "io"
"io/ioutil" "io/ioutil"
"mime" "mime"
"net/textproto" "net/textproto"
"os" "os"
"regexp" "regexp"
"strings"
) )
var headerRegexp *regexp.Regexp = regexp.MustCompile("^([a-zA-Z0-9\\-]+): *([^\r\n]+)") var headerRegexp *regexp.Regexp = regexp.MustCompile("^([a-zA-Z0-9\\-]+): *([^\r\n]+)")
...@@ -79,25 +79,28 @@ func (p *Part) FormName() string { ...@@ -79,25 +79,28 @@ func (p *Part) FormName() string {
// NewReader creates a new multipart Reader reading from r using the // NewReader creates a new multipart Reader reading from r using the
// given MIME boundary. // given MIME boundary.
func NewReader(reader io.Reader, boundary string) Reader { func NewReader(reader io.Reader, boundary string) Reader {
b := []byte("\r\n--" + boundary + "--")
return &multiReader{ return &multiReader{
boundary: boundary, bufReader: bufio.NewReader(reader),
dashBoundary: "--" + boundary,
endLine: "--" + boundary + "--", nlDashBoundary: b[:len(b)-2],
bufReader: bufio.NewReader(reader), dashBoundaryDash: b[2:],
dashBoundary: b[2 : len(b)-2],
} }
} }
// Implementation .... // Implementation ....
func newPart(mr *multiReader) (bp *Part, err os.Error) { func newPart(mr *multiReader) (*Part, os.Error) {
bp = new(Part) bp := &Part{
bp.Header = make(map[string][]string) Header: make(map[string][]string),
bp.mr = mr mr: mr,
bp.buffer = new(bytes.Buffer) buffer: new(bytes.Buffer),
if err = bp.populateHeaders(); err != nil {
bp = nil
} }
return if err := bp.populateHeaders(); err != nil {
return nil, err
}
return bp, nil
} }
func (bp *Part) populateHeaders() os.Error { func (bp *Part) populateHeaders() os.Error {
...@@ -122,44 +125,49 @@ func (bp *Part) populateHeaders() os.Error { ...@@ -122,44 +125,49 @@ func (bp *Part) populateHeaders() os.Error {
// Read reads the body of a part, after its headers and before the // Read reads the body of a part, after its headers and before the
// next part (if any) begins. // next part (if any) begins.
func (bp *Part) Read(p []byte) (n int, err os.Error) { func (bp *Part) Read(p []byte) (n int, err os.Error) {
for { if bp.buffer.Len() >= len(p) {
if bp.buffer.Len() >= len(p) { // Internal buffer of unconsumed data is large enough for
// Internal buffer of unconsumed data is large enough for // the read request. No need to parse more at the moment.
// the read request. No need to parse more at the moment. return bp.buffer.Read(p)
break }
} peek, err := bp.mr.bufReader.Peek(4096) // TODO(bradfitz): add buffer size accessor
if !bp.mr.ensureBufferedLine() { unexpectedEof := err == os.EOF
return 0, io.ErrUnexpectedEOF if err != nil && !unexpectedEof {
} return 0, fmt.Errorf("multipart: Part Read: %v", err)
if bp.mr.bufferedLineIsBoundary() { }
// Don't consume this line if peek == nil {
break panic("nil peek buf")
} }
// Write all of this line, except the final CRLF // Search the peek buffer for "\r\n--boundary". If found,
s := *bp.mr.bufferedLine // consume everything up to the boundary. If not, consume only
if strings.HasSuffix(s, "\r\n") { // as much of the peek buffer as cannot hold the boundary
bp.mr.consumeLine() // string.
if !bp.mr.ensureBufferedLine() { nCopy := 0
return 0, io.ErrUnexpectedEOF foundBoundary := false
} if idx := bytes.Index(peek, bp.mr.nlDashBoundary); idx != -1 {
if bp.mr.bufferedLineIsBoundary() { nCopy = idx
// The final \r\n isn't ours. It logically belongs foundBoundary = true
// to the boundary line which follows. } else if safeCount := len(peek) - len(bp.mr.nlDashBoundary); safeCount > 0 {
bp.buffer.WriteString(s[0 : len(s)-2]) nCopy = safeCount
} else { } else if unexpectedEof {
bp.buffer.WriteString(s) // If we've run out of peek buffer and the boundary
} // wasn't found (and can't possibly fit), we must have
break // hit the end of the file unexpectedly.
} return 0, io.ErrUnexpectedEOF
if strings.HasSuffix(s, "\n") { }
bp.buffer.WriteString(s) if nCopy > 0 {
bp.mr.consumeLine() if _, err := io.Copyn(bp.buffer, bp.mr.bufReader, int64(nCopy)); err != nil {
continue return 0, err
} }
return 0, os.NewError("multipart parse error during Read; unexpected line: " + s)
} }
return bp.buffer.Read(p) n, err = bp.buffer.Read(p)
if err == os.EOF && !foundBoundary {
// If the boundary hasn't been reached there's more to
// read, so don't pass through an EOF from the buffer
err = nil
}
return
} }
func (bp *Part) Close() os.Error { func (bp *Part) Close() os.Error {
...@@ -168,46 +176,12 @@ func (bp *Part) Close() os.Error { ...@@ -168,46 +176,12 @@ func (bp *Part) Close() os.Error {
} }
type multiReader struct { type multiReader struct {
boundary string bufReader *bufio.Reader
dashBoundary string // --boundary
endLine string // --boundary--
bufferedLine *string
bufReader *bufio.Reader
currentPart *Part currentPart *Part
partsRead int partsRead int
}
func (mr *multiReader) eof() bool { nlDashBoundary, dashBoundaryDash, dashBoundary []byte
return mr.bufferedLine == nil &&
!mr.readLine()
}
func (mr *multiReader) readLine() bool {
lineBytes, err := mr.bufReader.ReadSlice('\n')
if err != nil {
// TODO: care about err being EOF or not?
return false
}
line := string(lineBytes)
mr.bufferedLine = &line
return true
}
func (mr *multiReader) bufferedLineIsBoundary() bool {
return strings.HasPrefix(*mr.bufferedLine, mr.dashBoundary)
}
func (mr *multiReader) ensureBufferedLine() bool {
if mr.bufferedLine == nil {
return mr.readLine()
}
return true
}
func (mr *multiReader) consumeLine() {
mr.bufferedLine = nil
} }
func (mr *multiReader) NextPart() (*Part, os.Error) { func (mr *multiReader) NextPart() (*Part, os.Error) {
...@@ -215,13 +189,14 @@ func (mr *multiReader) NextPart() (*Part, os.Error) { ...@@ -215,13 +189,14 @@ func (mr *multiReader) NextPart() (*Part, os.Error) {
mr.currentPart.Close() mr.currentPart.Close()
} }
expectNewPart := false
for { for {
if mr.eof() { line, err := mr.bufReader.ReadSlice('\n')
return nil, io.ErrUnexpectedEOF if err != nil {
return nil, fmt.Errorf("multipart: NextPart: %v", err)
} }
if isBoundaryDelimiterLine(*mr.bufferedLine, mr.dashBoundary) { if mr.isBoundaryDelimiterLine(line) {
mr.consumeLine()
mr.partsRead++ mr.partsRead++
bp, err := newPart(mr) bp, err := newPart(mr)
if err != nil { if err != nil {
...@@ -231,55 +206,67 @@ func (mr *multiReader) NextPart() (*Part, os.Error) { ...@@ -231,55 +206,67 @@ func (mr *multiReader) NextPart() (*Part, os.Error) {
return bp, nil return bp, nil
} }
if hasPrefixThenNewline(*mr.bufferedLine, mr.endLine) { if hasPrefixThenNewline(line, mr.dashBoundaryDash) {
mr.consumeLine()
// Expected EOF (no error) // Expected EOF (no error)
// TODO(bradfitz): should return an os.EOF error here, not using nil for errors
return nil, nil return nil, nil
} }
if expectNewPart {
return nil, fmt.Errorf("multipart: expecting a new Part; got line %q", string(line))
}
if mr.partsRead == 0 { if mr.partsRead == 0 {
// skip line // skip line
mr.consumeLine()
continue continue
} }
return nil, os.NewError("Unexpected line in Next().") if bytes.Equal(line, []byte("\r\n")) {
// Consume the "\r\n" separator between the
// body of the previous part and the boundary
// line we now expect will follow. (either a
// new part or the end boundary)
expectNewPart = true
continue
}
return nil, fmt.Errorf("multipart: unexpected line in Next(): %q", line)
} }
panic("unreachable") panic("unreachable")
} }
func isBoundaryDelimiterLine(line, dashPrefix string) bool { func (mr *multiReader) isBoundaryDelimiterLine(line []byte) bool {
// http://tools.ietf.org/html/rfc2046#section-5.1 // http://tools.ietf.org/html/rfc2046#section-5.1
// The boundary delimiter line is then defined as a line // The boundary delimiter line is then defined as a line
// consisting entirely of two hyphen characters ("-", // consisting entirely of two hyphen characters ("-",
// decimal value 45) followed by the boundary parameter // decimal value 45) followed by the boundary parameter
// value from the Content-Type header field, optional linear // value from the Content-Type header field, optional linear
// whitespace, and a terminating CRLF. // whitespace, and a terminating CRLF.
if !strings.HasPrefix(line, dashPrefix) { if !bytes.HasPrefix(line, mr.dashBoundary) {
return false return false
} }
if strings.HasSuffix(line, "\r\n") { if bytes.HasSuffix(line, []byte("\r\n")) {
return onlyHorizontalWhitespace(line[len(dashPrefix) : len(line)-2]) return onlyHorizontalWhitespace(line[len(mr.dashBoundary) : len(line)-2])
} }
// Violate the spec and also support newlines without the // Violate the spec and also support newlines without the
// carriage return... // carriage return...
if strings.HasSuffix(line, "\n") { if bytes.HasSuffix(line, []byte("\n")) {
return onlyHorizontalWhitespace(line[len(dashPrefix) : len(line)-1]) return onlyHorizontalWhitespace(line[len(mr.dashBoundary) : len(line)-1])
} }
return false return false
} }
func onlyHorizontalWhitespace(s string) bool { func onlyHorizontalWhitespace(s []byte) bool {
for i := 0; i < len(s); i++ { for _, b := range s {
if s[i] != ' ' && s[i] != '\t' { if b != ' ' && b != '\t' {
return false return false
} }
} }
return true return true
} }
func hasPrefixThenNewline(s, prefix string) bool { func hasPrefixThenNewline(s, prefix []byte) bool {
return strings.HasPrefix(s, prefix) && return bytes.HasPrefix(s, prefix) &&
(len(s) == len(prefix)+1 && strings.HasSuffix(s, "\n") || (len(s) == len(prefix)+1 && s[len(s)-1] == '\n' ||
len(s) == len(prefix)+2 && strings.HasSuffix(s, "\r\n")) len(s) == len(prefix)+2 && bytes.HasSuffix(s, []byte("\r\n")))
} }
...@@ -8,38 +8,37 @@ import ( ...@@ -8,38 +8,37 @@ import (
"bytes" "bytes"
"fmt" "fmt"
"io" "io"
"io/ioutil"
"json" "json"
"os" "os"
"regexp"
"strings" "strings"
"testing" "testing"
) )
func TestHorizontalWhitespace(t *testing.T) { func TestHorizontalWhitespace(t *testing.T) {
if !onlyHorizontalWhitespace(" \t") { if !onlyHorizontalWhitespace([]byte(" \t")) {
t.Error("expected pass") t.Error("expected pass")
} }
if onlyHorizontalWhitespace("foo bar") { if onlyHorizontalWhitespace([]byte("foo bar")) {
t.Error("expected failure") t.Error("expected failure")
} }
} }
func TestBoundaryLine(t *testing.T) { func TestBoundaryLine(t *testing.T) {
boundary := "myBoundary" mr := NewReader(strings.NewReader(""), "myBoundary").(*multiReader)
prefix := "--" + boundary if !mr.isBoundaryDelimiterLine([]byte("--myBoundary\r\n")) {
if !isBoundaryDelimiterLine("--myBoundary\r\n", prefix) {
t.Error("expected") t.Error("expected")
} }
if !isBoundaryDelimiterLine("--myBoundary \r\n", prefix) { if !mr.isBoundaryDelimiterLine([]byte("--myBoundary \r\n")) {
t.Error("expected") t.Error("expected")
} }
if !isBoundaryDelimiterLine("--myBoundary \n", prefix) { if !mr.isBoundaryDelimiterLine([]byte("--myBoundary \n")) {
t.Error("expected") t.Error("expected")
} }
if isBoundaryDelimiterLine("--myBoundary bogus \n", prefix) { if mr.isBoundaryDelimiterLine([]byte("--myBoundary bogus \n")) {
t.Error("expected fail") t.Error("expected fail")
} }
if isBoundaryDelimiterLine("--myBoundary bogus--", prefix) { if mr.isBoundaryDelimiterLine([]byte("--myBoundary bogus--")) {
t.Error("expected fail") t.Error("expected fail")
} }
} }
...@@ -79,7 +78,9 @@ func TestFormName(t *testing.T) { ...@@ -79,7 +78,9 @@ func TestFormName(t *testing.T) {
} }
} }
func TestMultipart(t *testing.T) { var longLine = strings.Repeat("\n\n\r\r\r\n\r\000", (1<<20)/8)
func testMultipartBody() string {
testBody := ` testBody := `
This is a multi-part message. This line is ignored. This is a multi-part message. This line is ignored.
--MyBoundary --MyBoundary
...@@ -90,6 +91,10 @@ foo-bar: baz ...@@ -90,6 +91,10 @@ foo-bar: baz
My value My value
The end. The end.
--MyBoundary --MyBoundary
name: bigsection
[longline]
--MyBoundary
Header1: value1b Header1: value1b
HEADER2: value2b HEADER2: value2b
foo-bar: bazb foo-bar: bazb
...@@ -102,11 +107,26 @@ Line 3 ends in a newline, but just one. ...@@ -102,11 +107,26 @@ Line 3 ends in a newline, but just one.
never read data never read data
--MyBoundary-- --MyBoundary--
useless trailer
` `
testBody = regexp.MustCompile("\n").ReplaceAllString(testBody, "\r\n") testBody = strings.Replace(testBody, "\n", "\r\n", -1)
bodyReader := strings.NewReader(testBody) return strings.Replace(testBody, "[longline]", longLine, 1)
}
func TestMultipart(t *testing.T) {
bodyReader := strings.NewReader(testMultipartBody())
testMultipart(t, bodyReader)
}
func TestMultipartSlowInput(t *testing.T) {
bodyReader := strings.NewReader(testMultipartBody())
testMultipart(t, &slowReader{bodyReader})
}
reader := NewReader(bodyReader, "MyBoundary") func testMultipart(t *testing.T, r io.Reader) {
reader := NewReader(r, "MyBoundary")
buf := new(bytes.Buffer) buf := new(bytes.Buffer)
// Part1 // Part1
...@@ -125,38 +145,64 @@ never read data ...@@ -125,38 +145,64 @@ never read data
t.Error("Expected Foo-Bar: baz") t.Error("Expected Foo-Bar: baz")
} }
buf.Reset() buf.Reset()
io.Copy(buf, part) if _, err := io.Copy(buf, part); err != nil {
t.Errorf("part 1 copy: %v", err)
}
expectEq(t, "My value\r\nThe end.", expectEq(t, "My value\r\nThe end.",
buf.String(), "Value of first part") buf.String(), "Value of first part")
// Part2 // Part2
part, err = reader.NextPart() part, err = reader.NextPart()
if err != nil {
t.Fatalf("Expected part2; got: %v", err)
return
}
if e, g := "bigsection", part.Header.Get("name"); e != g {
t.Errorf("part2's name header: expected %q, got %q", e, g)
}
buf.Reset()
if _, err := io.Copy(buf, part); err != nil {
t.Errorf("part 2 copy: %v", err)
}
s := buf.String()
if len(s) != len(longLine) {
t.Errorf("part2 body expected long line of length %d; got length %d",
len(longLine), len(s))
}
if s != longLine {
t.Errorf("part2 long body didn't match")
}
// Part3
part, err = reader.NextPart()
if part == nil || err != nil { if part == nil || err != nil {
t.Error("Expected part2") t.Error("Expected part3")
return return
} }
if part.Header.Get("foo-bar") != "bazb" { if part.Header.Get("foo-bar") != "bazb" {
t.Error("Expected foo-bar: bazb") t.Error("Expected foo-bar: bazb")
} }
buf.Reset() buf.Reset()
io.Copy(buf, part) if _, err := io.Copy(buf, part); err != nil {
t.Errorf("part 3 copy: %v", err)
}
expectEq(t, "Line 1\r\nLine 2\r\nLine 3 ends in a newline, but just one.\r\n", expectEq(t, "Line 1\r\nLine 2\r\nLine 3 ends in a newline, but just one.\r\n",
buf.String(), "Value of second part") buf.String(), "body of part 3")
// Part3 // Part4
part, err = reader.NextPart() part, err = reader.NextPart()
if part == nil || err != nil { if part == nil || err != nil {
t.Error("Expected part3 without errors") t.Error("Expected part 4 without errors")
return return
} }
// Non-existent part4 // Non-existent part5
part, err = reader.NextPart() part, err = reader.NextPart()
if part != nil { if part != nil {
t.Error("Didn't expect a third part.") t.Error("Didn't expect a fifth part.")
} }
if err != nil { if err != nil {
t.Errorf("Unexpected error getting third part: %v", err) t.Errorf("Unexpected error getting fifth part: %v", err)
} }
} }
...@@ -237,3 +283,36 @@ func TestLineLimit(t *testing.T) { ...@@ -237,3 +283,36 @@ func TestLineLimit(t *testing.T) {
t.Errorf("expected to read < %d bytes; read %d", maxReadThreshold, mr.n) t.Errorf("expected to read < %d bytes; read %d", maxReadThreshold, mr.n)
} }
} }
func TestMultipartTruncated(t *testing.T) {
testBody := `
This is a multi-part message. This line is ignored.
--MyBoundary
foo-bar: baz
Oh no, premature EOF!
`
body := strings.Replace(testBody, "\n", "\r\n", -1)
bodyReader := strings.NewReader(body)
r := NewReader(bodyReader, "MyBoundary")
part, err := r.NextPart()
if err != nil {
t.Fatalf("didn't get a part")
}
_, err = io.Copy(ioutil.Discard, part)
if err != io.ErrUnexpectedEOF {
t.Fatalf("expected error io.ErrUnexpectedEOF; got %v", err)
}
}
type slowReader struct {
r io.Reader
}
func (s *slowReader) Read(p []byte) (int, os.Error) {
if len(p) == 0 {
return s.r.Read(p)
}
return s.r.Read(p[:1])
}
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment