// // Besides, jsoniter.Iterator provides a different set of interfaces // iterating given bytes/string/reader // and yielding parsed elements one by one. // This set of interfaces reads input as required and gives // better performance. package jsoniter import ( "fmt" "io" ) type ValueType int const ( Invalid ValueType = iota String Number Nil Bool Array Object ) var hexDigits []byte var valueTypes []ValueType func init() { hexDigits = make([]byte, 256) for i := 0; i < len(hexDigits); i++ { hexDigits[i] = 255 } for i := '0'; i <= '9'; i++ { hexDigits[i] = byte(i - '0') } for i := 'a'; i <= 'f'; i++ { hexDigits[i] = byte((i - 'a') + 10) } for i := 'A'; i <= 'F'; i++ { hexDigits[i] = byte((i - 'A') + 10) } valueTypes = make([]ValueType, 256) for i := 0; i < len(valueTypes); i++ { valueTypes[i] = Invalid } valueTypes['"'] = String valueTypes['-'] = Number valueTypes['0'] = Number valueTypes['1'] = Number valueTypes['2'] = Number valueTypes['3'] = Number valueTypes['4'] = Number valueTypes['5'] = Number valueTypes['6'] = Number valueTypes['7'] = Number valueTypes['8'] = Number valueTypes['9'] = Number valueTypes['t'] = Bool valueTypes['f'] = Bool valueTypes['n'] = Nil valueTypes['['] = Array valueTypes['{'] = Object } // Iterator is a fast and flexible JSON parser type Iterator struct { cfg *frozenConfig reader io.Reader buf []byte head int tail int captureStartedAt int captured []byte Error error } // Create creates an empty Iterator instance func NewIterator(cfg *frozenConfig) *Iterator { return &Iterator{ cfg: cfg, reader: nil, buf: nil, head: 0, tail: 0, } } // Parse parses a json buffer in io.Reader into an Iterator instance func Parse(cfg *frozenConfig, reader io.Reader, bufSize int) *Iterator { return &Iterator{ cfg: cfg, reader: reader, buf: make([]byte, bufSize), head: 0, tail: 0, } } // ParseBytes parses a json byte slice into an Iterator instance func ParseBytes(cfg *frozenConfig, input []byte) *Iterator { return &Iterator{ cfg: cfg, reader: nil, buf: input, head: 0, tail: len(input), } } // ParseString parses a json string into an Iterator instance func ParseString(cfg *frozenConfig, input string) *Iterator { return ParseBytes(cfg, []byte(input)) } func (iter *Iterator) Config() *frozenConfig { return iter.cfg } // Reset can reset an Iterator instance for another json buffer in io.Reader func (iter *Iterator) Reset(reader io.Reader) *Iterator { iter.reader = reader iter.head = 0 iter.tail = 0 return iter } // ResetBytes can reset an Iterator instance for another json byte slice func (iter *Iterator) ResetBytes(input []byte) *Iterator { iter.reader = nil iter.buf = input iter.head = 0 iter.tail = len(input) return iter } // WhatIsNext gets ValueType of relatively next json object func (iter *Iterator) WhatIsNext() ValueType { valueType := valueTypes[iter.nextToken()] iter.unreadByte() return valueType } func (iter *Iterator) skipWhitespacesWithoutLoadMore() bool { for i := iter.head; i < iter.tail; i++ { c := iter.buf[i] switch c { case ' ', '\n', '\t', '\r': continue } iter.head = i return false } return true } func (iter *Iterator) isObjectEnd() bool { c := iter.nextToken() if c == ',' { return false } if c == '}' { return true } iter.ReportError("isObjectEnd", "object ended prematurely") return true } func (iter *Iterator) nextToken() byte { // a variation of skip whitespaces, returning the next non-whitespace token for { for i := iter.head; i < iter.tail; i++ { c := iter.buf[i] switch c { case ' ', '\n', '\t', '\r': continue } iter.head = i + 1 return c } if !iter.loadMore() { return 0 } } } func (iter *Iterator) ReportError(operation string, msg string) { if iter.Error != nil { if iter.Error != io.EOF { return } } peekStart := iter.head - 10 if peekStart < 0 { peekStart = 0 } iter.Error = fmt.Errorf("%s: %s, parsing %v ...%s... at %s", operation, msg, iter.head, string(iter.buf[peekStart:iter.head]), string(iter.buf[0:iter.tail])) } // CurrentBuffer gets current buffer as string func (iter *Iterator) CurrentBuffer() string { peekStart := iter.head - 10 if peekStart < 0 { peekStart = 0 } return fmt.Sprintf("parsing %v ...|%s|... at %s", iter.head, string(iter.buf[peekStart:iter.head]), string(iter.buf[0:iter.tail])) } func (iter *Iterator) readByte() (ret byte) { if iter.head == iter.tail { if iter.loadMore() { ret = iter.buf[iter.head] iter.head++ return ret } return 0 } ret = iter.buf[iter.head] iter.head++ return ret } func (iter *Iterator) loadMore() bool { if iter.reader == nil { if iter.Error == nil { iter.head = iter.tail iter.Error = io.EOF } return false } if iter.captureStartedAt != -1 { iter.captured = append(iter.captured, iter.buf[iter.captureStartedAt:iter.tail]...) iter.captureStartedAt = 0 } for { n, err := iter.reader.Read(iter.buf) if n == 0 { if err != nil { if iter.Error == nil { iter.Error = err } return false } } else { iter.head = 0 iter.tail = n return true } } } func (iter *Iterator) unreadByte() { if iter.head == 0 { iter.ReportError("unreadByte", "unread too many bytes") return } iter.head-- return } func (iter *Iterator) Read() interface{} { valueType := iter.WhatIsNext() switch valueType { case String: return iter.ReadString() case Number: return iter.ReadFloat64() case Nil: iter.skipFixedBytes(4) // null return nil case Bool: return iter.ReadBool() case Array: arr := []interface{}{} iter.ReadArrayCB(func(iter *Iterator) bool { arr = append(arr, iter.Read()) return true }) return arr case Object: obj := map[string]interface{}{} iter.ReadObjectCB(func(Iter *Iterator, field string) bool { obj[field] = iter.Read() return true }) return obj default: iter.ReportError("Read", fmt.Sprintf("unexpected value type: %v", valueType)) return nil } }