FedP2P/bencode/decode.go

641 lines
12 KiB
Go
Raw Normal View History

2012-06-20 21:21:32 +08:00
package bencode
import (
"bytes"
"errors"
"fmt"
"io"
"math/big"
"reflect"
"runtime"
"strconv"
"strings"
)
2012-06-20 21:21:32 +08:00
type Decoder struct {
r interface {
io.ByteScanner
io.Reader
}
2017-11-05 12:45:30 +08:00
// Sum of bytes used to Decode values.
2017-11-05 12:42:37 +08:00
Offset int64
2012-06-20 21:21:32 +08:00
buf bytes.Buffer
}
func (d *Decoder) Decode(v interface{}) (err error) {
2012-06-20 21:34:10 +08:00
defer func() {
if err != nil {
return
}
r := recover()
_, ok := r.(runtime.Error)
if ok {
panic(r)
}
err, ok = r.(error)
if !ok && r != nil {
panic(r)
2012-06-20 21:34:10 +08:00
}
}()
2012-06-20 21:21:32 +08:00
pv := reflect.ValueOf(v)
if pv.Kind() != reflect.Ptr || pv.IsNil() {
return &UnmarshalInvalidArgError{reflect.TypeOf(v)}
}
ok, err := d.parseValue(pv.Elem())
if err != nil {
return
}
if !ok {
2017-11-05 12:42:37 +08:00
d.throwSyntaxError(d.Offset-1, errors.New("unexpected 'e'"))
}
return
2012-06-20 21:21:32 +08:00
}
func checkForUnexpectedEOF(err error, offset int64) {
2012-06-20 21:21:32 +08:00
if err == io.EOF {
panic(&SyntaxError{
Offset: offset,
What: io.ErrUnexpectedEOF,
2012-06-20 21:21:32 +08:00
})
}
}
func (d *Decoder) readByte() byte {
b, err := d.r.ReadByte()
2012-06-20 21:21:32 +08:00
if err != nil {
2017-11-05 12:42:37 +08:00
checkForUnexpectedEOF(err, d.Offset)
2012-06-20 21:21:32 +08:00
panic(err)
}
2017-11-05 12:42:37 +08:00
d.Offset++
2012-06-20 21:21:32 +08:00
return b
}
// reads data writing it to 'd.buf' until 'sep' byte is encountered, 'sep' byte
// is consumed, but not included into the 'd.buf'
func (d *Decoder) readUntil(sep byte) {
2012-06-20 21:21:32 +08:00
for {
b := d.readByte()
2012-06-20 21:21:32 +08:00
if b == sep {
return
}
d.buf.WriteByte(b)
}
}
func checkForIntParseError(err error, offset int64) {
2012-06-20 21:21:32 +08:00
if err != nil {
panic(&SyntaxError{
Offset: offset,
What: err,
2012-06-20 21:21:32 +08:00
})
}
}
func (d *Decoder) throwSyntaxError(offset int64, err error) {
panic(&SyntaxError{
Offset: offset,
What: err,
})
}
2012-06-20 21:21:32 +08:00
// called when 'i' was consumed
2016-08-26 12:51:38 +08:00
func (d *Decoder) parseInt(v reflect.Value) {
2017-11-05 12:42:37 +08:00
start := d.Offset - 1
d.readUntil('e')
2012-06-20 21:21:32 +08:00
if d.buf.Len() == 0 {
panic(&SyntaxError{
Offset: start,
What: errors.New("empty integer value"),
2012-06-20 21:21:32 +08:00
})
}
2015-08-23 15:51:24 +08:00
s := d.buf.String()
2012-06-20 21:21:32 +08:00
switch v.Kind() {
case reflect.Int, reflect.Int8, reflect.Int16, reflect.Int32, reflect.Int64:
2015-08-23 15:51:24 +08:00
n, err := strconv.ParseInt(s, 10, 64)
checkForIntParseError(err, start)
2012-06-20 21:21:32 +08:00
if v.OverflowInt(n) {
panic(&UnmarshalTypeError{
2015-08-23 15:51:24 +08:00
Value: "integer " + s,
2012-06-20 21:21:32 +08:00
Type: v.Type(),
})
}
v.SetInt(n)
case reflect.Uint, reflect.Uint8, reflect.Uint16, reflect.Uint32, reflect.Uint64:
2015-08-23 15:51:24 +08:00
n, err := strconv.ParseUint(s, 10, 64)
checkForIntParseError(err, start)
2012-06-20 21:21:32 +08:00
if v.OverflowUint(n) {
panic(&UnmarshalTypeError{
2015-08-23 15:51:24 +08:00
Value: "integer " + s,
2012-06-20 21:21:32 +08:00
Type: v.Type(),
})
}
v.SetUint(n)
case reflect.Bool:
2015-08-23 15:51:24 +08:00
v.SetBool(s != "0")
2012-06-20 21:21:32 +08:00
default:
panic(&UnmarshalTypeError{
2015-08-23 15:51:24 +08:00
Value: "integer " + s,
2012-06-20 21:21:32 +08:00
Type: v.Type(),
})
}
d.buf.Reset()
}
func (d *Decoder) parseString(v reflect.Value) error {
2017-11-05 12:42:37 +08:00
start := d.Offset - 1
2012-06-20 21:21:32 +08:00
// read the string length first
d.readUntil(':')
2012-06-20 21:21:32 +08:00
length, err := strconv.ParseInt(d.buf.String(), 10, 64)
checkForIntParseError(err, start)
2012-06-20 21:21:32 +08:00
d.buf.Reset()
n, err := io.CopyN(&d.buf, d.r, length)
2017-11-05 12:42:37 +08:00
d.Offset += n
2012-06-20 21:21:32 +08:00
if err != nil {
2017-11-05 12:42:37 +08:00
checkForUnexpectedEOF(err, d.Offset)
2012-06-20 21:21:32 +08:00
panic(&SyntaxError{
2017-11-05 12:42:37 +08:00
Offset: d.Offset,
What: errors.New("unexpected I/O error: " + err.Error()),
2012-06-20 21:21:32 +08:00
})
}
switch v.Kind() {
case reflect.String:
v.SetString(d.buf.String())
case reflect.Slice:
if v.Type().Elem().Kind() != reflect.Uint8 {
panic(&UnmarshalTypeError{
Value: "string",
Type: v.Type(),
})
}
v.SetBytes(append([]byte(nil), d.buf.Bytes()...))
2012-06-20 21:21:32 +08:00
default:
return &UnmarshalTypeError{
2012-06-20 21:21:32 +08:00
Value: "string",
Type: v.Type(),
}
2012-06-20 21:21:32 +08:00
}
d.buf.Reset()
return nil
2012-06-20 21:21:32 +08:00
}
// Info for parsing a dict value.
type dictField struct {
Value reflect.Value // Storage for the parsed value.
// True if field value should be parsed into Value. If false, the value
// should be parsed and discarded.
Ok bool
Set func() // Call this after parsing into Value.
IgnoreUnmarshalTypeError bool
}
// Returns specifics for parsing a dict field value.
func getDictField(dict reflect.Value, key string) dictField {
// get valuev as a map value or as a struct field
switch dict.Kind() {
case reflect.Map:
value := reflect.New(dict.Type().Elem()).Elem()
return dictField{
Value: value,
Ok: true,
Set: func() {
// Assigns the value into the map.
dict.SetMapIndex(reflect.ValueOf(key), value)
},
}
case reflect.Struct:
sf, ok := getStructFieldForKey(dict.Type(), key)
if !ok {
return dictField{}
}
if sf.PkgPath != "" {
panic(&UnmarshalFieldError{
Key: key,
Type: dict.Type(),
Field: sf,
})
}
return dictField{
Value: dict.FieldByIndex(sf.Index),
Ok: true,
Set: func() {},
IgnoreUnmarshalTypeError: getTag(sf.Tag).IgnoreUnmarshalTypeError(),
}
default:
panic(dict.Kind())
}
}
func getStructFieldForKey(struct_ reflect.Type, key string) (f reflect.StructField, ok bool) {
for i, n := 0, struct_.NumField(); i < n; i++ {
f = struct_.Field(i)
tag := f.Tag.Get("bencode")
if tag == "-" {
continue
}
if f.Anonymous {
continue
}
if parseTag(tag).Key() == key {
ok = true
break
}
if f.Name == key {
ok = true
break
}
if strings.EqualFold(f.Name, key) {
ok = true
break
}
}
return
}
func (d *Decoder) parseDict(v reflect.Value) error {
2012-06-20 21:21:32 +08:00
switch v.Kind() {
case reflect.Map:
t := v.Type()
if t.Key().Kind() != reflect.String {
panic(&UnmarshalTypeError{
Value: "object",
Type: t,
})
}
if v.IsNil() {
v.Set(reflect.MakeMap(t))
}
case reflect.Struct:
default:
panic(&UnmarshalTypeError{
Value: "object",
Type: v.Type(),
})
}
// so, at this point 'd' byte was consumed, let's just read key/value
// pairs one by one
for {
var keyStr string
keyValue := reflect.ValueOf(&keyStr).Elem()
ok, err := d.parseValue(keyValue)
if err != nil {
return fmt.Errorf("error parsing dict key: %s", err)
}
if !ok {
return nil
2012-06-20 21:21:32 +08:00
}
df := getDictField(v, keyStr)
2012-06-20 21:21:32 +08:00
// now we need to actually parse it
if df.Ok {
// log.Printf("parsing ok struct field for key %q", keyStr)
ok, err = d.parseValue(df.Value)
} else {
// Discard the value, there's nowhere to put it.
var if_ interface{}
if_, ok = d.parseValueInterface()
if if_ == nil {
err = fmt.Errorf("error parsing value for key %q", keyStr)
2012-06-20 21:21:32 +08:00
}
}
if err != nil {
if _, ok := err.(*UnmarshalTypeError); !ok || !df.IgnoreUnmarshalTypeError {
return fmt.Errorf("parsing value for key %q: %s", keyStr, err)
}
}
if !ok {
return fmt.Errorf("missing value for key %q", keyStr)
2012-06-20 21:21:32 +08:00
}
if df.Ok {
df.Set()
2012-06-20 21:21:32 +08:00
}
}
}
func (d *Decoder) parseList(v reflect.Value) error {
2012-06-20 21:21:32 +08:00
switch v.Kind() {
case reflect.Array, reflect.Slice:
default:
panic(&UnmarshalTypeError{
Value: "array",
Type: v.Type(),
})
}
i := 0
for ; ; i++ {
2012-06-20 21:21:32 +08:00
if v.Kind() == reflect.Slice && i >= v.Len() {
v.Set(reflect.Append(v, reflect.Zero(v.Type().Elem())))
}
if i < v.Len() {
ok, err := d.parseValue(v.Index(i))
if err != nil {
return err
}
if !ok {
break
}
2012-06-20 21:21:32 +08:00
} else {
_, ok := d.parseValueInterface()
if !ok {
break
}
2012-06-20 21:21:32 +08:00
}
}
if i < v.Len() {
if v.Kind() == reflect.Array {
z := reflect.Zero(v.Type().Elem())
for n := v.Len(); i < n; i++ {
v.Index(i).Set(z)
}
} else {
v.SetLen(i)
}
}
if i == 0 && v.Kind() == reflect.Slice {
v.Set(reflect.MakeSlice(v.Type(), 0, 0))
}
return nil
2012-06-20 21:21:32 +08:00
}
func (d *Decoder) readOneValue() bool {
b, err := d.r.ReadByte()
if err != nil {
panic(err)
}
if b == 'e' {
d.r.UnreadByte()
return false
} else {
2017-11-05 12:42:37 +08:00
d.Offset++
d.buf.WriteByte(b)
}
switch b {
case 'd', 'l':
// read until there is nothing to read
for d.readOneValue() {
}
// consume 'e' as well
b = d.readByte()
d.buf.WriteByte(b)
case 'i':
d.readUntil('e')
d.buf.WriteString("e")
default:
if b >= '0' && b <= '9' {
start := d.buf.Len() - 1
d.readUntil(':')
length, err := strconv.ParseInt(d.buf.String()[start:], 10, 64)
2017-11-05 12:42:37 +08:00
checkForIntParseError(err, d.Offset-1)
d.buf.WriteString(":")
n, err := io.CopyN(&d.buf, d.r, length)
2017-11-05 12:42:37 +08:00
d.Offset += n
if err != nil {
2017-11-05 12:42:37 +08:00
checkForUnexpectedEOF(err, d.Offset)
panic(&SyntaxError{
2017-11-05 12:42:37 +08:00
Offset: d.Offset,
What: errors.New("unexpected I/O error: " + err.Error()),
})
}
break
}
2017-11-05 12:42:37 +08:00
d.raiseUnknownValueType(b, d.Offset-1)
}
return true
}
func (d *Decoder) parseUnmarshaler(v reflect.Value) bool {
m, ok := v.Interface().(Unmarshaler)
if !ok {
// T doesn't work, try *T
if v.Kind() != reflect.Ptr && v.CanAddr() {
m, ok = v.Addr().Interface().(Unmarshaler)
if ok {
v = v.Addr()
}
}
}
if ok && (v.Kind() != reflect.Ptr || !v.IsNil()) {
if d.readOneValue() {
err := m.UnmarshalBencode(d.buf.Bytes())
d.buf.Reset()
if err != nil {
panic(&UnmarshalerError{v.Type(), err})
}
return true
}
d.buf.Reset()
}
return false
}
// Returns true if there was a value and it's now stored in 'v', otherwise
// there was an end symbol ("e") and no value was stored.
func (d *Decoder) parseValue(v reflect.Value) (bool, error) {
// we support one level of indirection at the moment
if v.Kind() == reflect.Ptr {
2012-06-20 21:21:32 +08:00
// if the pointer is nil, allocate a new element of the type it
// points to
if v.IsNil() {
v.Set(reflect.New(v.Type().Elem()))
2012-06-20 21:21:32 +08:00
}
v = v.Elem()
}
if d.parseUnmarshaler(v) {
return true, nil
2012-06-20 21:21:32 +08:00
}
// common case: interface{}
if v.Kind() == reflect.Interface && v.NumMethod() == 0 {
iface, _ := d.parseValueInterface()
2012-06-20 21:21:32 +08:00
v.Set(reflect.ValueOf(iface))
return true, nil
2012-06-20 21:21:32 +08:00
}
b, err := d.r.ReadByte()
2012-06-20 21:21:32 +08:00
if err != nil {
panic(err)
}
2017-11-05 12:42:37 +08:00
d.Offset++
2012-06-20 21:21:32 +08:00
switch b {
case 'e':
return false, nil
2012-06-20 21:21:32 +08:00
case 'd':
return true, d.parseDict(v)
2012-06-20 21:21:32 +08:00
case 'l':
return true, d.parseList(v)
2012-06-20 21:21:32 +08:00
case 'i':
2016-08-26 12:51:38 +08:00
d.parseInt(v)
return true, nil
2012-06-20 21:21:32 +08:00
default:
if b >= '0' && b <= '9' {
// string
// append first digit of the length to the buffer
d.buf.WriteByte(b)
return true, d.parseString(v)
2012-06-20 21:21:32 +08:00
}
2017-11-05 12:42:37 +08:00
d.raiseUnknownValueType(b, d.Offset-1)
2012-06-20 21:21:32 +08:00
}
panic("unreachable")
2012-06-20 21:21:32 +08:00
}
// An unknown bencode type character was encountered.
func (d *Decoder) raiseUnknownValueType(b byte, offset int64) {
panic(&SyntaxError{
Offset: offset,
What: fmt.Errorf("unknown value type %+q", b),
})
}
func (d *Decoder) parseValueInterface() (interface{}, bool) {
b, err := d.r.ReadByte()
2012-06-20 21:21:32 +08:00
if err != nil {
panic(err)
}
2017-11-05 12:42:37 +08:00
d.Offset++
2012-06-20 21:21:32 +08:00
switch b {
case 'e':
return nil, false
case 'd':
return d.parseDictInterface(), true
2012-06-20 21:21:32 +08:00
case 'l':
return d.parseListInterface(), true
2012-06-20 21:21:32 +08:00
case 'i':
return d.parseIntInterface(), true
2012-06-20 21:21:32 +08:00
default:
if b >= '0' && b <= '9' {
// string
// append first digit of the length to the buffer
d.buf.WriteByte(b)
return d.parseStringInterface(), true
2012-06-20 21:21:32 +08:00
}
2017-11-05 12:42:37 +08:00
d.raiseUnknownValueType(b, d.Offset-1)
panic("unreachable")
2012-06-20 21:21:32 +08:00
}
}
func (d *Decoder) parseIntInterface() (ret interface{}) {
2017-11-05 12:42:37 +08:00
start := d.Offset - 1
d.readUntil('e')
2012-06-20 21:21:32 +08:00
if d.buf.Len() == 0 {
panic(&SyntaxError{
Offset: start,
What: errors.New("empty integer value"),
2012-06-20 21:21:32 +08:00
})
}
n, err := strconv.ParseInt(d.buf.String(), 10, 64)
if ne, ok := err.(*strconv.NumError); ok && ne.Err == strconv.ErrRange {
i := new(big.Int)
_, ok := i.SetString(d.buf.String(), 10)
if !ok {
panic(&SyntaxError{
Offset: start,
What: errors.New("failed to parse integer"),
})
}
ret = i
} else {
checkForIntParseError(err, start)
ret = n
}
2012-06-20 21:21:32 +08:00
d.buf.Reset()
return
2012-06-20 21:21:32 +08:00
}
func (d *Decoder) parseStringInterface() interface{} {
2017-11-05 12:42:37 +08:00
start := d.Offset - 1
2012-06-20 21:21:32 +08:00
// read the string length first
d.readUntil(':')
2012-06-20 21:21:32 +08:00
length, err := strconv.ParseInt(d.buf.String(), 10, 64)
checkForIntParseError(err, start)
2012-06-20 21:21:32 +08:00
d.buf.Reset()
n, err := io.CopyN(&d.buf, d.r, length)
2017-11-05 12:42:37 +08:00
d.Offset += n
2012-06-20 21:21:32 +08:00
if err != nil {
2017-11-05 12:42:37 +08:00
checkForUnexpectedEOF(err, d.Offset)
2012-06-20 21:21:32 +08:00
panic(&SyntaxError{
2017-11-05 12:42:37 +08:00
Offset: d.Offset,
What: errors.New("unexpected I/O error: " + err.Error()),
2012-06-20 21:21:32 +08:00
})
}
s := d.buf.String()
d.buf.Reset()
return s
}
func (d *Decoder) parseDictInterface() interface{} {
2012-06-20 21:21:32 +08:00
dict := make(map[string]interface{})
for {
keyi, ok := d.parseValueInterface()
2012-06-20 21:21:32 +08:00
if !ok {
break
}
key, ok := keyi.(string)
if !ok {
panic(&SyntaxError{
2017-11-05 12:42:37 +08:00
Offset: d.Offset,
What: errors.New("non-string key in a dict"),
2012-06-20 21:21:32 +08:00
})
}
valuei, ok := d.parseValueInterface()
2012-06-20 21:21:32 +08:00
if !ok {
break
2012-06-20 21:21:32 +08:00
}
dict[key] = valuei
}
return dict
}
func (d *Decoder) parseListInterface() interface{} {
2012-06-20 21:21:32 +08:00
var list []interface{}
for {
valuei, ok := d.parseValueInterface()
2012-06-20 21:21:32 +08:00
if !ok {
break
}
list = append(list, valuei)
}
if list == nil {
list = make([]interface{}, 0, 0)
}
2012-06-20 21:21:32 +08:00
return list
}