From fca4b8e2f6fa519fd004896a13b340367f5fb938 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E4=B8=96=E7=95=8C?= Date: Mon, 27 May 2024 21:42:00 +0800 Subject: [PATCH] contentjson: Add support for tailing comma --- common/json/internal/contextjson/scanner.go | 4 +- common/json/internal/contextjson/stream.go | 47 +++++++++++++++++++-- 2 files changed, 46 insertions(+), 5 deletions(-) diff --git a/common/json/internal/contextjson/scanner.go b/common/json/internal/contextjson/scanner.go index 4c43f5f9..c0017116 100644 --- a/common/json/internal/contextjson/scanner.go +++ b/common/json/internal/contextjson/scanner.go @@ -300,7 +300,7 @@ func stateEndValue(s *scanner, c byte) int { case parseObjectValue: if c == ',' { s.parseState[n-1] = parseObjectKey - s.step = stateBeginString + s.step = stateBeginStringOrEmpty return scanObjectValue } if c == '}' { @@ -310,7 +310,7 @@ func stateEndValue(s *scanner, c byte) int { return s.error(c, "after object key:value pair") case parseArrayValue: if c == ',' { - s.step = stateBeginValue + s.step = stateBeginValueOrEmpty return scanArrayValue } if c == ']' { diff --git a/common/json/internal/contextjson/stream.go b/common/json/internal/contextjson/stream.go index 1cf37c56..a670ab14 100644 --- a/common/json/internal/contextjson/stream.go +++ b/common/json/internal/contextjson/stream.go @@ -153,6 +153,10 @@ func (dec *Decoder) refill() error { dec.scanp = 0 } + return dec.refill0() +} + +func (dec *Decoder) refill0() error { // Grow buffer if not large enough. const minRead = 512 if cap(dec.buf)-len(dec.buf) < minRead { @@ -402,7 +406,7 @@ func (dec *Decoder) Token() (Token, error) { return Delim('{'), nil case '}': - if dec.tokenState != tokenObjectStart && dec.tokenState != tokenObjectComma { + if dec.tokenState != tokenObjectStart && dec.tokenState != tokenObjectComma && dec.tokenState != tokenObjectKey { return dec.tokenError(c) } dec.scanp++ @@ -410,7 +414,6 @@ func (dec *Decoder) Token() (Token, error) { dec.tokenStack = dec.tokenStack[:len(dec.tokenStack)-1] dec.tokenValueEnd() return Delim('}'), nil - case ':': if dec.tokenState != tokenObjectColon { return dec.tokenError(c) @@ -483,7 +486,26 @@ func (dec *Decoder) tokenError(c byte) (Token, error) { // current array or object being parsed. func (dec *Decoder) More() bool { c, err := dec.peek() - return err == nil && c != ']' && c != '}' + // return err == nil && c != ']' && c != '}' + if err != nil { + return false + } + if c == ']' || c == '}' { + return false + } + if c == ',' { + scanp := dec.scanp + dec.scanp++ + c, err = dec.peekNoRefill() + dec.scanp = scanp + if err != nil { + return false + } + if c == ']' || c == '}' { + return false + } + } + return true } func (dec *Decoder) peek() (byte, error) { @@ -505,6 +527,25 @@ func (dec *Decoder) peek() (byte, error) { } } +func (dec *Decoder) peekNoRefill() (byte, error) { + var err error + for { + for i := dec.scanp; i < len(dec.buf); i++ { + c := dec.buf[i] + if isSpace(c) { + continue + } + dec.scanp = i + return c, nil + } + // buffer has been scanned, now report any error + if err != nil { + return 0, err + } + err = dec.refill0() + } +} + // InputOffset returns the input stream byte offset of the current decoder position. // The offset gives the location of the end of the most recently returned token // and the beginning of the next token.