Skip to content

Commit

Permalink
feat: add max byte slice size config (#273)
Browse files Browse the repository at this point in the history
  • Loading branch information
nrwiersma authored Jul 16, 2023
1 parent 3abfe1e commit b4a402f
Show file tree
Hide file tree
Showing 4 changed files with 55 additions and 1 deletion.
7 changes: 7 additions & 0 deletions README.md
Original file line number Diff line number Diff line change
Expand Up @@ -125,11 +125,18 @@ encoding and decoding.
Enums may also implement `TextMarshaler` and `TextUnmarshaler`, and must resolve to valid symbols in the given enum schema.

##### Identical Underlying Types

One type can be [ConvertibleTo](https://go.dev/ref/spec#Conversions) another type if they have identical underlying types.
A non-native type is allowed be used if it can be convertible to *time.Time*, *big.Rat* or *avro.LogicalDuration* for the particular of *LogicalTypes*.

Ex.: `type Timestamp time.Time`

##### Untrusted Input With Bytes and Strings

For security reasons, the configuration `Config.MaxByteSliceSize` restricts the maximum size of `bytes` and `string` types created
by the `Reader`. The default maximum size is `1MiB` and is configurable. This is required to stop untrusted input from consuming all memory and
crashing the application. Should this not be need, setting a negative number will disable the behaviour.

### Recursive Structs

At this moment recursive structs are not supported. It is planned for the future.
Expand Down
14 changes: 14 additions & 0 deletions config.go
Original file line number Diff line number Diff line change
Expand Up @@ -8,6 +8,8 @@ import (
"github.com/modern-go/reflect2"
)

const maxByteSliceSize = 1024 * 1024

// DefaultConfig is the default API.
var DefaultConfig = Config{}.Freeze()

Expand Down Expand Up @@ -43,6 +45,10 @@ type Config struct {
// Disable caching layer for encoders and decoders, forcing them to get rebuilt on every
// call to Marshal() and Unmarshal()
DisableCaching bool

// MaxByteSliceSize is the maximum size of `bytes` or `string` types the Reader will create, defaulting to 1MiB.
// If this size is exceeded, the Reader returns an error. This can be disabled by setting a negative number.
MaxByteSliceSize int
}

// Freeze makes the configuration immutable.
Expand Down Expand Up @@ -252,3 +258,11 @@ func (c *frozenConfig) getBlockLength() int {
}
return blockSize
}

func (c *frozenConfig) getMaxByteSliceSize() int {
size := c.config.MaxByteSliceSize
if size == 0 {
return maxByteSliceSize
}
return size
}
9 changes: 8 additions & 1 deletion reader.go
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,7 @@ import (
"errors"
"fmt"
"io"
"strings"
"unsafe"
)

Expand Down Expand Up @@ -216,12 +217,18 @@ func (r *Reader) ReadString() string {
func (r *Reader) readBytes(op string) []byte {
size := int(r.ReadLong())
if size < 0 {
r.ReportError("ReadString", "invalid "+op+" length")
fnName := "Read" + strings.ToTitle(op)
r.ReportError(fnName, "invalid "+op+" length")
return nil
}
if size == 0 {
return []byte{}
}
if max := r.cfg.getMaxByteSliceSize(); max > 0 && size > max {
fnName := "Read" + strings.ToTitle(op)
r.ReportError(fnName, "size is greater than `Config.MaxByteSliceSize`")
return nil
}

// The bytes are entirely in the buffer and of a reasonable size.
// Use the byte slab.
Expand Down
26 changes: 26 additions & 0 deletions reader_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -507,6 +507,19 @@ func TestReader_ReadBytes(t *testing.T) {
}
}

func TestReader_ReadBytesLargerThanMaxByteSliceSize(t *testing.T) {
data := []byte{
246, 255, 255, 255, 255, 10, 255, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32,
32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32,
32, 32, 32, 32, 32, 32, 32,
}
r := avro.NewReader(bytes.NewReader(data), 4)

_ = r.ReadBytes()

assert.Error(t, r.Error)
}

func TestReader_ReadString(t *testing.T) {
tests := []struct {
data []byte
Expand Down Expand Up @@ -583,6 +596,19 @@ func TestReader_ReadString(t *testing.T) {
}
}

func TestReader_ReadStringLargerThanMaxByteSliceSize(t *testing.T) {
data := []byte{
246, 255, 255, 255, 255, 10, 255, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32,
32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32,
32, 32, 32, 32, 32, 32, 32,
}
r := avro.NewReader(bytes.NewReader(data), 4)

_ = r.ReadString()

assert.Error(t, r.Error)
}

func TestReader_ReadStringFastPathIsntBoundToBuffer(t *testing.T) {
data := []byte{0x06, 0x66, 0x6F, 0x6F, 0x08, 0x61, 0x76, 0x72, 0x6F}
r := avro.NewReader(bytes.NewReader(data), 4)
Expand Down

0 comments on commit b4a402f

Please sign in to comment.