internal/encoding/json: improve decoding of JSON numbers for floats Per Joe's suggestion, remove producing numberParts when parsing a JSON number to produce corresponding Value. This saves having to store it inside Value as well. Only produce numberParts for calls to Value.{Int,Uint} call. numberParts is only used for producing integers and removing the logic to produce numberParts improves overall decoding speed for floats, and shows no change for integers. name old time/op new time/op delta Float-4 559ns ± 0% 288ns ± 0% ~ (p=1.000 n=1+1) Int-4 471ns ± 0% 466ns ± 0% ~ (p=1.000 n=1+1) Change-Id: I21bf304ca67dda8d41a4ea0022dcbefd51058c1c Reviewed-on: https://go-review.googlesource.com/c/protobuf/+/168781 Reviewed-by: Joe Tsai <thebrokentoaster@gmail.com>

commit: a3421952acf1d6b060d2dd251463b1946732d6bb [log] [tgz]
author: Herbie Ong <herbie@google.com> Thu Mar 21 18:12:26 2019 -0700
committer: Herbie Ong <herbie@google.com> Sat Mar 23 22:02:55 2019 +0000
tree: f459bb6bcc51752b7f96776c0361357bf4e117c2
parent: f503c300f70e2aa8ab0749f0ea90f836f275f4a1 [diff]
diff --git a/internal/encoding/json/bench_test.go b/internal/encoding/json/bench_test.go
new file mode 100644
index 0000000..4db8af9
--- /dev/null
+++ b/internal/encoding/json/bench_test.go

@@ -0,0 +1,41 @@
+// Copyright 2019 The Go Authors. All rights reserved.
+// Use of this source code is governed by a BSD-style
+// license that can be found in the LICENSE file.
+
+package json_test
+
+import (
+	"testing"
+
+	"github.com/golang/protobuf/v2/internal/encoding/json"
+)
+
+func BenchmarkFloat(b *testing.B) {
+	input := []byte("1.797693134862315708145274237317043567981e+308")
+	for i := 0; i < b.N; i++ {
+		dec := json.NewDecoder(input)
+		val, err := dec.Read()
+		if err != nil {
+			b.Fatal(err)
+		}
+		_, err = val.Float(64)
+		if err != nil {
+			b.Fatal(err)
+		}
+	}
+}
+
+func BenchmarkInt(b *testing.B) {
+	input := []byte("922337203.6854775807e+10")
+	for i := 0; i < b.N; i++ {
+		dec := json.NewDecoder(input)
+		val, err := dec.Read()
+		if err != nil {
+			b.Fatal(err)
+		}
+		_, err = val.Int(64)
+		if err != nil {
+			b.Fatal(err)
+		}
+	}
+}

diff --git a/internal/encoding/json/decode.go b/internal/encoding/json/decode.go
index 452e873..ddf3a68 100644
--- a/internal/encoding/json/decode.go
+++ b/internal/encoding/json/decode.go

@@ -182,11 +182,11 @@
 		}
 
 	case '-', '0', '1', '2', '3', '4', '5', '6', '7', '8', '9':
-		num, n := parseNumber(in)
-		if num == nil {
+		n, ok := consumeNumber(in)
+		if !ok {
 			return Value{}, 0, d.newSyntaxError("invalid number %s", errRegexp.Find(in))
 		}
-		return d.newValue(Number, in[:n], num), n, nil
+		return d.newValue(Number, in[:n], nil), n, nil
 
 	case '"':
 		var nerr errors.NonFatal
@@ -308,7 +308,6 @@
 	typ    Type
 	// value will be set to the following Go type based on the type field:
 	//    Bool   => bool
-	//    Number => *numberParts
 	//    String => string
 	//    Name   => string
 	// It will be nil if none of the above.
@@ -414,8 +413,11 @@
 	if v.typ != Number {
 		return "", v.newError("%s is not a number", v.input)
 	}
-	pnum := v.value.(*numberParts)
-	num, ok := normalizeToIntString(pnum)
+	parts, ok := parseNumber(v.input)
+	if !ok {
+		return "", v.newError("%s is not a number", v.input)
+	}
+	num, ok := normalizeToIntString(parts)
 	if !ok {
 		return "", v.newError("cannot convert %s to integer", v.input)
 	}

diff --git a/internal/encoding/json/number.go b/internal/encoding/json/number.go
index 6b3ed86..75f6a3a 100644
--- a/internal/encoding/json/number.go
+++ b/internal/encoding/json/number.go

@@ -41,70 +41,50 @@
 	return out
 }
 
-// numberParts is the result of parsing out a valid JSON number. It contains
-// the parts of a number. The parts are used for integer conversion.
-type numberParts struct {
-	neg  bool
-	intp []byte
-	frac []byte
-	exp  []byte
-}
-
-// parseNumber returns a numberParts instance if it is able to read a JSON
-// number from the given []byte. It also returns the number of bytes read.
-// Parsing logic follows the definition in
+// consumeNumber reads the given []byte for a valid JSON number. If it is valid,
+// it returns the number of bytes.  Parsing logic follows the definition in
 // https://tools.ietf.org/html/rfc7159#section-6, and is based off
 // encoding/json.isValidNumber function.
-func parseNumber(input []byte) (*numberParts, int) {
+func consumeNumber(input []byte) (int, bool) {
 	var n int
-	var neg bool
-	var intp []byte
-	var frac []byte
-	var exp []byte
 
 	s := input
 	if len(s) == 0 {
-		return nil, 0
+		return 0, false
 	}
 
 	// Optional -
 	if s[0] == '-' {
-		neg = true
 		s = s[1:]
 		n++
 		if len(s) == 0 {
-			return nil, 0
+			return 0, false
 		}
 	}
 
 	// Digits
 	switch {
 	case s[0] == '0':
-		// Skip first 0 and no need to store.
 		s = s[1:]
 		n++
 
 	case '1' <= s[0] && s[0] <= '9':
-		intp = append(intp, s[0])
 		s = s[1:]
 		n++
 		for len(s) > 0 && '0' <= s[0] && s[0] <= '9' {
-			intp = append(intp, s[0])
 			s = s[1:]
 			n++
 		}
 
 	default:
-		return nil, 0
+		return 0, false
 	}
 
 	// . followed by 1 or more digits.
 	if len(s) >= 2 && s[0] == '.' && '0' <= s[1] && s[1] <= '9' {
-		frac = append(frac, s[1])
 		s = s[2:]
 		n += 2
 		for len(s) > 0 && '0' <= s[0] && s[0] <= '9' {
-			frac = append(frac, s[0])
 			s = s[1:]
 			n++
 		}
@@ -116,15 +96,13 @@
 		s = s[1:]
 		n++
 		if s[0] == '+' || s[0] == '-' {
-			exp = append(exp, s[0])
 			s = s[1:]
 			n++
 			if len(s) == 0 {
-				return nil, 0
+				return 0, false
 			}
 		}
 		for len(s) > 0 && '0' <= s[0] && s[0] <= '9' {
-			exp = append(exp, s[0])
 			s = s[1:]
 			n++
 		}
@@ -132,21 +110,101 @@
 
 	// Check that next byte is a delimiter or it is at the end.
 	if n < len(input) && isNotDelim(input[n]) {
-		return nil, 0
+		return 0, false
 	}
 
-	return &numberParts{
+	return n, true
+}
+
+// numberParts is the result of parsing out a valid JSON number. It contains
+// the parts of a number. The parts are used for integer conversion.
+type numberParts struct {
+	neg  bool
+	intp []byte
+	frac []byte
+	exp  []byte
+}
+
+// parseNumber constructs numberParts from given []byte. The logic here is
+// similar to consumeNumber above with the difference of having to construct
+// numberParts.
+func parseNumber(input []byte) (numberParts, bool) {
+	var neg bool
+	var intp []byte
+	var frac []byte
+	var exp []byte
+
+	s := input
+	if len(s) == 0 {
+		return numberParts{}, false
+	}
+
+	// Optional -
+	if s[0] == '-' {
+		neg = true
+		s = s[1:]
+		if len(s) == 0 {
+			return numberParts{}, false
+		}
+	}
+
+	// Digits
+	switch {
+	case s[0] == '0':
+		// Skip first 0 and no need to store.
+		s = s[1:]
+
+	case '1' <= s[0] && s[0] <= '9':
+		intp = append(intp, s[0])
+		s = s[1:]
+		for len(s) > 0 && '0' <= s[0] && s[0] <= '9' {
+			intp = append(intp, s[0])
+			s = s[1:]
+		}
+
+	default:
+		return numberParts{}, false
+	}
+
+	// . followed by 1 or more digits.
+	if len(s) >= 2 && s[0] == '.' && '0' <= s[1] && s[1] <= '9' {
+		frac = append(frac, s[1])
+		s = s[2:]
+		for len(s) > 0 && '0' <= s[0] && s[0] <= '9' {
+			frac = append(frac, s[0])
+			s = s[1:]
+		}
+	}
+
+	// e or E followed by an optional - or + and
+	// 1 or more digits.
+	if len(s) >= 2 && (s[0] == 'e' || s[0] == 'E') {
+		s = s[1:]
+		if s[0] == '+' || s[0] == '-' {
+			exp = append(exp, s[0])
+			s = s[1:]
+			if len(s) == 0 {
+				return numberParts{}, false
+			}
+		}
+		for len(s) > 0 && '0' <= s[0] && s[0] <= '9' {
+			exp = append(exp, s[0])
+			s = s[1:]
+		}
+	}
+
+	return numberParts{
 		neg:  neg,
 		intp: intp,
 		frac: bytes.TrimRight(frac, "0"), // Remove unnecessary 0s to the right.
 		exp:  exp,
-	}, n
+	}, true
 }
 
 // normalizeToIntString returns an integer string in normal form without the
 // E-notation for given numberParts. It will return false if it is not an
 // integer or if the exponent exceeds than max/min int value.
-func normalizeToIntString(n *numberParts) (string, bool) {
+func normalizeToIntString(n numberParts) (string, bool) {
 	num := n.intp
 	intpSize := len(num)
 	fracSize := len(n.frac)
commit	a3421952acf1d6b060d2dd251463b1946732d6bb	[log] [tgz]
author	Herbie Ong <herbie@google.com>	Thu Mar 21 18:12:26 2019 -0700
committer	Herbie Ong <herbie@google.com>	Sat Mar 23 22:02:55 2019 +0000
tree	f459bb6bcc51752b7f96776c0361357bf4e117c2
parent	f503c300f70e2aa8ab0749f0ea90f836f275f4a1 [diff]