rlp: check top-level value sizes against input limit

This is a preliminary fix for #420 (SEC-18 RLP decoder unsafe
allocation). If a sane input limit is set on the rlp.Stream,
it should no longer be possible to cause huge []byte allocations.
This commit is contained in:
Felix Lange 2015-03-23 15:02:55 +01:00
parent 4020258801
commit c35f4fd0bd
2 changed files with 171 additions and 56 deletions

View File

@ -9,6 +9,7 @@ import (
"io" "io"
"math/big" "math/big"
"reflect" "reflect"
"strings"
) )
var ( var (
@ -70,14 +71,22 @@ type Decoder interface {
// Non-empty interface types are not supported, nor are booleans, // Non-empty interface types are not supported, nor are booleans,
// signed integers, floating point numbers, maps, channels and // signed integers, floating point numbers, maps, channels and
// functions. // functions.
//
// Note that Decode does not set an input limit for all readers
// and may be vulnerable to panics cause by huge value sizes. If
// you need an input limit, use
//
// NewStream(r, limit).Decode(val)
func Decode(r io.Reader, val interface{}) error { func Decode(r io.Reader, val interface{}) error {
return NewStream(r).Decode(val) // TODO: this could use a Stream from a pool.
return NewStream(r, 0).Decode(val)
} }
// DecodeBytes parses RLP data from b into val. // DecodeBytes parses RLP data from b into val.
// Please see the documentation of Decode for the decoding rules. // Please see the documentation of Decode for the decoding rules.
func DecodeBytes(b []byte, val interface{}) error { func DecodeBytes(b []byte, val interface{}) error {
return NewStream(bytes.NewReader(b)).Decode(val) // TODO: this could use a Stream from a pool.
return NewStream(bytes.NewReader(b), uint64(len(b))).Decode(val)
} }
type decodeError struct { type decodeError struct {
@ -470,10 +479,12 @@ var (
ErrExpectedList = errors.New("rlp: expected List") ErrExpectedList = errors.New("rlp: expected List")
ErrCanonInt = errors.New("rlp: expected Int") ErrCanonInt = errors.New("rlp: expected Int")
ErrElemTooLarge = errors.New("rlp: element is larger than containing list") ErrElemTooLarge = errors.New("rlp: element is larger than containing list")
ErrValueTooLarge = errors.New("rlp: value size exceeds available input length")
// internal errors // internal errors
errNotInList = errors.New("rlp: call of ListEnd outside of any list") errNotInList = errors.New("rlp: call of ListEnd outside of any list")
errNotAtEOL = errors.New("rlp: call of ListEnd not positioned at EOL") errNotAtEOL = errors.New("rlp: call of ListEnd not positioned at EOL")
errUintOverflow = errors.New("rlp: uint overflow")
) )
// ByteReader must be implemented by any input reader for a Stream. It // ByteReader must be implemented by any input reader for a Stream. It
@ -496,7 +507,13 @@ type ByteReader interface {
// //
// Stream is not safe for concurrent use. // Stream is not safe for concurrent use.
type Stream struct { type Stream struct {
r ByteReader r ByteReader
// number of bytes remaining to be read from r.
remaining uint64
limited bool
// auxiliary buffer for integer decoding
uintbuf []byte uintbuf []byte
kind Kind // kind of value ahead kind Kind // kind of value ahead
@ -507,12 +524,26 @@ type Stream struct {
type listpos struct{ pos, size uint64 } type listpos struct{ pos, size uint64 }
// NewStream creates a new stream reading from r. // NewStream creates a new decoding stream reading from r.
// If r does not implement ByteReader, the Stream will //
// introduce its own buffering. // If r implements the ByteReader interface, Stream will
func NewStream(r io.Reader) *Stream { // not introduce any buffering.
//
// For non-toplevel values, Stream returns ErrElemTooLarge
// for values that do not fit into the enclosing list.
//
// Stream supports an optional input limit. If a limit is set, the
// size of any toplevel value will be checked against the remaining
// input length. Stream operations that encounter a value exceeding
// the remaining input length will return ErrValueTooLarge. The limit
// can be set by passing a non-zero value for inputLimit.
//
// If r is a bytes.Reader or strings.Reader, the input limit is set to
// the length of r's underlying data unless an explicit limit is
// provided.
func NewStream(r io.Reader, inputLimit uint64) *Stream {
s := new(Stream) s := new(Stream)
s.Reset(r) s.Reset(r, inputLimit)
return s return s
} }
@ -520,7 +551,7 @@ func NewStream(r io.Reader) *Stream {
// at an encoded list of the given length. // at an encoded list of the given length.
func NewListStream(r io.Reader, len uint64) *Stream { func NewListStream(r io.Reader, len uint64) *Stream {
s := new(Stream) s := new(Stream)
s.Reset(r) s.Reset(r, len)
s.kind = List s.kind = List
s.size = len s.size = len
return s return s
@ -574,8 +605,6 @@ func (s *Stream) Raw() ([]byte, error) {
return buf, nil return buf, nil
} }
var errUintOverflow = errors.New("rlp: uint overflow")
// Uint reads an RLP string of up to 8 bytes and returns its contents // Uint reads an RLP string of up to 8 bytes and returns its contents
// as an unsigned integer. If the input does not contain an RLP string, the // as an unsigned integer. If the input does not contain an RLP string, the
// returned error will be ErrExpectedString. // returned error will be ErrExpectedString.
@ -667,14 +696,36 @@ func (s *Stream) Decode(val interface{}) error {
} }
// Reset discards any information about the current decoding context // Reset discards any information about the current decoding context
// and starts reading from r. If r does not also implement ByteReader, // and starts reading from r. This method is meant to facilitate reuse
// Stream will do its own buffering. // of a preallocated Stream across many decoding operations.
func (s *Stream) Reset(r io.Reader) { //
// If r does not also implement ByteReader, Stream will do its own
// buffering.
func (s *Stream) Reset(r io.Reader, inputLimit uint64) {
if inputLimit > 0 {
s.remaining = inputLimit
s.limited = true
} else {
// Attempt to automatically discover
// the limit when reading from a byte slice.
switch br := r.(type) {
case *bytes.Reader:
s.remaining = uint64(br.Len())
s.limited = true
case *strings.Reader:
s.remaining = uint64(br.Len())
s.limited = true
default:
s.limited = false
}
}
// Wrap r with a buffer if it doesn't have one.
bufr, ok := r.(ByteReader) bufr, ok := r.(ByteReader)
if !ok { if !ok {
bufr = bufio.NewReader(r) bufr = bufio.NewReader(r)
} }
s.r = bufr s.r = bufr
// Reset the decoding context.
s.stack = s.stack[:0] s.stack = s.stack[:0]
s.size = 0 s.size = 0
s.kind = -1 s.kind = -1
@ -700,6 +751,8 @@ func (s *Stream) Kind() (kind Kind, size uint64, err error) {
tos = &s.stack[len(s.stack)-1] tos = &s.stack[len(s.stack)-1]
} }
if s.kind < 0 { if s.kind < 0 {
// don't read further if we're at the end of the
// innermost list.
if tos != nil && tos.pos == tos.size { if tos != nil && tos.pos == tos.size {
return 0, 0, EOL return 0, 0, EOL
} }
@ -709,8 +762,19 @@ func (s *Stream) Kind() (kind Kind, size uint64, err error) {
} }
s.kind, s.size = kind, size s.kind, s.size = kind, size
} }
if tos != nil && tos.pos+s.size > tos.size { // Make sure size is reasonable. This is done always
return 0, 0, ErrElemTooLarge // so Kind returns the same error when called multiple times.
if tos == nil {
// At toplevel, check that the value is smaller
// than the remaining input length.
if s.limited && s.size > s.remaining {
return 0, 0, ErrValueTooLarge
}
} else {
// Inside a list, check that the value doesn't overflow the list.
if tos.pos+s.size > tos.size {
return 0, 0, ErrElemTooLarge
}
} }
return s.kind, s.size, nil return s.kind, s.size, nil
} }
@ -778,6 +842,9 @@ func (s *Stream) readUint(size byte) (uint64, error) {
} }
func (s *Stream) readFull(buf []byte) (err error) { func (s *Stream) readFull(buf []byte) (err error) {
if s.limited && s.remaining < uint64(len(buf)) {
return ErrValueTooLarge
}
s.willRead(uint64(len(buf))) s.willRead(uint64(len(buf)))
var nn, n int var nn, n int
for n < len(buf) && err == nil { for n < len(buf) && err == nil {
@ -791,6 +858,9 @@ func (s *Stream) readFull(buf []byte) (err error) {
} }
func (s *Stream) readByte() (byte, error) { func (s *Stream) readByte() (byte, error) {
if s.limited && s.remaining == 0 {
return 0, io.EOF
}
s.willRead(1) s.willRead(1)
b, err := s.r.ReadByte() b, err := s.r.ReadByte()
if len(s.stack) > 0 && err == io.EOF { if len(s.stack) > 0 && err == io.EOF {
@ -801,6 +871,9 @@ func (s *Stream) readByte() (byte, error) {
func (s *Stream) willRead(n uint64) { func (s *Stream) willRead(n uint64) {
s.kind = -1 // rearm Kind s.kind = -1 // rearm Kind
if s.limited {
s.remaining -= n
}
if len(s.stack) > 0 { if len(s.stack) > 0 {
s.stack[len(s.stack)-1].pos += n s.stack[len(s.stack)-1].pos += n
} }

View File

@ -36,7 +36,8 @@ func TestStreamKind(t *testing.T) {
} }
for i, test := range tests { for i, test := range tests {
s := NewStream(bytes.NewReader(unhex(test.input))) // using plainReader to inhibit input limit errors.
s := NewStream(newPlainReader(unhex(test.input)), 0)
kind, len, err := s.Kind() kind, len, err := s.Kind()
if err != nil { if err != nil {
t.Errorf("test %d: Kind returned error: %v", i, err) t.Errorf("test %d: Kind returned error: %v", i, err)
@ -70,29 +71,63 @@ func TestNewListStream(t *testing.T) {
} }
func TestStreamErrors(t *testing.T) { func TestStreamErrors(t *testing.T) {
withoutInputLimit := func(b []byte) *Stream {
return NewStream(newPlainReader(b), 0)
}
withCustomInputLimit := func(limit uint64) func([]byte) *Stream {
return func(b []byte) *Stream {
return NewStream(bytes.NewReader(b), limit)
}
}
type calls []string type calls []string
tests := []struct { tests := []struct {
string string
calls calls
newStream func([]byte) *Stream // uses bytes.Reader if nil
error error
}{ }{
{"", calls{"Kind"}, io.EOF}, {"C0", calls{"Bytes"}, nil, ErrExpectedString},
{"", calls{"List"}, io.EOF}, {"C0", calls{"Uint"}, nil, ErrExpectedString},
{"", calls{"Uint"}, io.EOF}, {"89000000000000000001", calls{"Uint"}, nil, errUintOverflow},
{"C0", calls{"Bytes"}, ErrExpectedString}, {"00", calls{"List"}, nil, ErrExpectedList},
{"C0", calls{"Uint"}, ErrExpectedString}, {"80", calls{"List"}, nil, ErrExpectedList},
{"81", calls{"Bytes"}, io.ErrUnexpectedEOF}, {"C0", calls{"List", "Uint"}, nil, EOL},
{"81", calls{"Uint"}, io.ErrUnexpectedEOF}, {"C8C9010101010101010101", calls{"List", "Kind"}, nil, ErrElemTooLarge},
{"BFFFFFFFFFFFFFFF", calls{"Bytes"}, io.ErrUnexpectedEOF}, {"C3C2010201", calls{"List", "List", "Uint", "Uint", "ListEnd", "Uint"}, nil, EOL},
{"89000000000000000001", calls{"Uint"}, errUintOverflow}, {"00", calls{"ListEnd"}, nil, errNotInList},
{"00", calls{"List"}, ErrExpectedList}, {"C401020304", calls{"List", "Uint", "ListEnd"}, nil, errNotAtEOL},
{"80", calls{"List"}, ErrExpectedList},
{"C0", calls{"List", "Uint"}, EOL}, // Expected EOF
{"C801", calls{"List", "Uint", "Uint"}, io.ErrUnexpectedEOF}, {"", calls{"Kind"}, nil, io.EOF},
{"C8C9", calls{"List", "Kind"}, ErrElemTooLarge}, {"", calls{"Uint"}, nil, io.EOF},
{"C3C2010201", calls{"List", "List", "Uint", "Uint", "ListEnd", "Uint"}, EOL}, {"", calls{"List"}, nil, io.EOF},
{"00", calls{"ListEnd"}, errNotInList}, {"8105", calls{"Uint", "Uint"}, nil, io.EOF},
{"C40102", calls{"List", "Uint", "ListEnd"}, errNotAtEOL}, {"C0", calls{"List", "ListEnd", "List"}, nil, io.EOF},
// Input limit errors.
{"81", calls{"Bytes"}, nil, ErrValueTooLarge},
{"81", calls{"Uint"}, nil, ErrValueTooLarge},
{"81", calls{"Raw"}, nil, ErrValueTooLarge},
{"BFFFFFFFFFFFFFFFFFFF", calls{"Bytes"}, nil, ErrValueTooLarge},
{"C801", calls{"List"}, nil, ErrValueTooLarge},
// Test for input limit overflow. Since we are counting the limit
// down toward zero in Stream.remaining, reading too far can overflow
// remaining to a large value, effectively disabling the limit.
{"C40102030401", calls{"Raw", "Uint"}, withCustomInputLimit(5), io.EOF},
{"C4010203048102", calls{"Raw", "Uint"}, withCustomInputLimit(6), ErrValueTooLarge},
// Check that the same calls are fine without a limit.
{"C40102030401", calls{"Raw", "Uint"}, withoutInputLimit, nil},
{"C4010203048102", calls{"Raw", "Uint"}, withoutInputLimit, nil},
// Unexpected EOF. This only happens when there is
// no input limit, so the reader needs to be 'dumbed down'.
{"81", calls{"Bytes"}, withoutInputLimit, io.ErrUnexpectedEOF},
{"81", calls{"Uint"}, withoutInputLimit, io.ErrUnexpectedEOF},
{"BFFFFFFFFFFFFFFF", calls{"Bytes"}, withoutInputLimit, io.ErrUnexpectedEOF},
{"C801", calls{"List", "Uint", "Uint"}, withoutInputLimit, io.ErrUnexpectedEOF},
// This test verifies that the input position is advanced // This test verifies that the input position is advanced
// correctly when calling Bytes for empty strings. Kind can be called // correctly when calling Bytes for empty strings. Kind can be called
@ -109,12 +144,15 @@ func TestStreamErrors(t *testing.T) {
"Bytes", // past final element "Bytes", // past final element
"Bytes", // this one should fail "Bytes", // this one should fail
}, EOL}, }, nil, EOL},
} }
testfor: testfor:
for i, test := range tests { for i, test := range tests {
s := NewStream(bytes.NewReader(unhex(test.string))) if test.newStream == nil {
test.newStream = func(b []byte) *Stream { return NewStream(bytes.NewReader(b), 0) }
}
s := test.newStream(unhex(test.string))
rs := reflect.ValueOf(s) rs := reflect.ValueOf(s)
for j, call := range test.calls { for j, call := range test.calls {
fval := rs.MethodByName(call) fval := rs.MethodByName(call)
@ -124,8 +162,12 @@ testfor:
err = lastret.(error).Error() err = lastret.(error).Error()
} }
if j == len(test.calls)-1 { if j == len(test.calls)-1 {
if err != test.error.Error() { want := "<nil>"
t.Errorf("test %d: last call (%s) error mismatch\ngot: %s\nwant: %v", if test.error != nil {
want = test.error.Error()
}
if err != want {
t.Errorf("test %d: last call (%s) error mismatch\ngot: %s\nwant: %s",
i, call, err, test.error) i, call, err, test.error)
} }
} else if err != "<nil>" { } else if err != "<nil>" {
@ -137,7 +179,7 @@ testfor:
} }
func TestStreamList(t *testing.T) { func TestStreamList(t *testing.T) {
s := NewStream(bytes.NewReader(unhex("C80102030405060708"))) s := NewStream(bytes.NewReader(unhex("C80102030405060708")), 0)
len, err := s.List() len, err := s.List()
if err != nil { if err != nil {
@ -166,7 +208,7 @@ func TestStreamList(t *testing.T) {
} }
func TestStreamRaw(t *testing.T) { func TestStreamRaw(t *testing.T) {
s := NewStream(bytes.NewReader(unhex("C58401010101"))) s := NewStream(bytes.NewReader(unhex("C58401010101")), 0)
s.List() s.List()
want := unhex("8401010101") want := unhex("8401010101")
@ -284,11 +326,6 @@ var decodeTests = []decodeTest{
ptr: new([5]byte), ptr: new([5]byte),
error: "rlp: input string too long for [5]uint8", error: "rlp: input string too long for [5]uint8",
}, },
{
input: "850101",
ptr: new([5]byte),
error: io.ErrUnexpectedEOF.Error(),
},
// byte array reuse (should be zeroed) // byte array reuse (should be zeroed)
{input: "850102030405", ptr: &sharedByteArray, value: [5]byte{1, 2, 3, 4, 5}}, {input: "850102030405", ptr: &sharedByteArray, value: [5]byte{1, 2, 3, 4, 5}},
@ -401,11 +438,17 @@ func TestDecodeWithByteReader(t *testing.T) {
}) })
} }
// dumbReader reads from a byte slice but does not // plainReader reads from a byte slice but does not
// implement ReadByte. // implement ReadByte. It is also not recognized by the
type dumbReader []byte // size validation. This is useful to test how the decoder
// behaves on a non-buffered input stream.
type plainReader []byte
func (r *dumbReader) Read(buf []byte) (n int, err error) { func newPlainReader(b []byte) io.Reader {
return (*plainReader)(&b)
}
func (r *plainReader) Read(buf []byte) (n int, err error) {
if len(*r) == 0 { if len(*r) == 0 {
return 0, io.EOF return 0, io.EOF
} }
@ -416,15 +459,14 @@ func (r *dumbReader) Read(buf []byte) (n int, err error) {
func TestDecodeWithNonByteReader(t *testing.T) { func TestDecodeWithNonByteReader(t *testing.T) {
runTests(t, func(input []byte, into interface{}) error { runTests(t, func(input []byte, into interface{}) error {
r := dumbReader(input) return Decode(newPlainReader(input), into)
return Decode(&r, into)
}) })
} }
func TestDecodeStreamReset(t *testing.T) { func TestDecodeStreamReset(t *testing.T) {
s := NewStream(nil) s := NewStream(nil, 0)
runTests(t, func(input []byte, into interface{}) error { runTests(t, func(input []byte, into interface{}) error {
s.Reset(bytes.NewReader(input)) s.Reset(bytes.NewReader(input), 0)
return s.Decode(into) return s.Decode(into)
}) })
} }
@ -518,7 +560,7 @@ func ExampleDecode() {
func ExampleStream() { func ExampleStream() {
input, _ := hex.DecodeString("C90A1486666F6F626172") input, _ := hex.DecodeString("C90A1486666F6F626172")
s := NewStream(bytes.NewReader(input)) s := NewStream(bytes.NewReader(input), 0)
// Check what kind of value lies ahead // Check what kind of value lies ahead
kind, size, _ := s.Kind() kind, size, _ := s.Kind()