fmt: make recursive scan more efficient.

Detect when scan is being called recursively and re-use the same scan state. On my machine, for a recursion-heavy benchmark, this results in 44x speed up. This does impose a 4% penalty on the non-recursive case, which can be removed by heap-allocating the saved state, at 40% performance penalty on the recursive case. Either way is fine with me. R=r CC=golang-dev https://golang.org/cl/4253049
2024-11-25 01:57:56 -07:00 · 2011-03-03 10:43:29 -08:00 · 2011-03-03 10:43:29 -08:00 · 5bd284e868
commit 5bd284e868
parent e46acb091f
2 changed files with 173 additions and 25 deletions
--- a/src/pkg/fmt/scan.go
+++ b/src/pkg/fmt/scan.go
@ -103,18 +103,18 @@ func Sscanf(str string, format string, a ...interface{}) (n int, err os.Error) {
 // returns the number of items successfully scanned.  If that is less
 // than the number of arguments, err will report why.
 func Fscan(r io.Reader, a ...interface{}) (n int, err os.Error) {
-	s := newScanState(r, true, false)
+	s, old := newScanState(r, true, false)
 	n, err = s.doScan(a)
-	s.free()
+	s.free(old)
 	return
 }
 // Fscanln is similar to Fscan, but stops scanning at a newline and
 // after the final item there must be a newline or EOF.
 func Fscanln(r io.Reader, a ...interface{}) (n int, err os.Error) {
-	s := newScanState(r, false, true)
+	s, old := newScanState(r, false, true)
 	n, err = s.doScan(a)
-	s.free()
+	s.free(old)
 	return
 }
@ -122,9 +122,9 @@ func Fscanln(r io.Reader, a ...interface{}) (n int, err os.Error) {
 // values into successive arguments as determined by the format.  It
 // returns the number of items successfully parsed.
 func Fscanf(r io.Reader, format string, a ...interface{}) (n int, err os.Error) {
-	s := newScanState(r, false, false)
+	s, old := newScanState(r, false, false)
 	n, err = s.doScanf(format, a)
-	s.free()
+	s.free(old)
 	return
 }
@ -138,15 +138,24 @@ const EOF = -1
 // ss is the internal implementation of ScanState.
 type ss struct {
-	rr        io.RuneReader // where to read input
+	rr       io.RuneReader // where to read input
-	buf       bytes.Buffer  // token accumulator
+	buf      bytes.Buffer  // token accumulator
-	nlIsSpace bool          // whether newline counts as white space
+	peekRune int           // one-rune lookahead
-	nlIsEnd   bool          // whether newline terminates scan
+	prevRune int           // last rune returned by ReadRune
-	peekRune  int           // one-rune lookahead
+	count    int           // runes consumed so far.
-	prevRune  int           // last rune returned by ReadRune
+	atEOF    bool          // already read EOF
-	atEOF     bool          // already read EOF
+	ssave
-	maxWid    int           // max width of field, in runes
+}
-	wid       int           // width consumed so far; used in accept()
+
 // ssave holds the parts of ss that need to be
 // saved and restored on recursive scans.
 type ssave struct {
 	validSave  bool // is or was a part of an actual ss.
 	nlIsEnd    bool // whether newline terminates scan
 	nlIsSpace  bool // whether newline counts as white space
 	fieldLimit int  // max value of ss.count for this field; fieldLimit <= limit
 	limit      int  // max value of ss.count.
 	maxWid     int  // width of this field.
 }
 // The Read method is only in ScanState so that ScanState
@ -158,21 +167,21 @@ func (s *ss) Read(buf []byte) (n int, err os.Error) {
 func (s *ss) ReadRune() (rune int, size int, err os.Error) {
 	if s.peekRune >= 0 {
-		s.wid++
+		s.count++
 		rune = s.peekRune
 		size = utf8.RuneLen(rune)
 		s.prevRune = rune
 		s.peekRune = -1
 		return
 	}
-	if s.atEOF || s.nlIsEnd && s.prevRune == '\n' || s.wid >= s.maxWid {
+	if s.atEOF || s.nlIsEnd && s.prevRune == '\n' || s.count >= s.fieldLimit {
 		err = os.EOF
 		return
 	}
 	rune, size, err = s.rr.ReadRune()
 	if err == nil {
-		s.wid++
+		s.count++
 		s.prevRune = rune
 	} else if err == os.EOF {
 		s.atEOF = true
@ -217,7 +226,7 @@ func (s *ss) UnreadRune() os.Error {
 	} else {
 		s.peekRune = s.prevRune
 	}
-	s.wid--
+	s.count--
 	return nil
 }
@ -305,8 +314,19 @@ func (r *readRune) ReadRune() (rune int, size int, err os.Error) {
 var ssFree = newCache(func() interface{} { return new(ss) })
 // Allocate a new ss struct or grab a cached one.
-func newScanState(r io.Reader, nlIsSpace, nlIsEnd bool) *ss {
+func newScanState(r io.Reader, nlIsSpace, nlIsEnd bool) (s *ss, old ssave) {
-	s := ssFree.get().(*ss)
+	// If the reader is a *ss, then we've got a recursive
 	// call to Scan, so re-use the scan state.
 	s, ok := r.(*ss)
 	if ok {
 		old = s.ssave
 		s.limit = s.fieldLimit
 		s.nlIsEnd = nlIsEnd || s.nlIsEnd
 		s.nlIsSpace = nlIsSpace
 		return
 	}
 	s = ssFree.get().(*ss)
 	if rr, ok := r.(io.RuneReader); ok {
 		s.rr = rr
 	} else {
@ -317,12 +337,20 @@ func newScanState(r io.Reader, nlIsSpace, nlIsEnd bool) *ss {
 	s.prevRune = -1
 	s.peekRune = -1
 	s.atEOF = false
 	s.limit = hugeWid
 	s.fieldLimit = hugeWid
 	s.maxWid = hugeWid
-	return s
+	s.validSave = true
 	return
 }
 // Save used ss structs in ssFree; avoid an allocation per invocation.
-func (s *ss) free() {
+func (s *ss) free(old ssave) {
 	// If it was used recursively, just restore the old state.
 	if old.validSave {
 		s.ssave = old
 		return
 	}
 	// Don't hold on to ss structs with large buffers.
 	if cap(s.buf.Bytes()) > 1024 {
 		return
@ -1014,7 +1042,10 @@ func (s *ss) doScanf(format string, a []interface{}) (numProcessed int, err os.E
 		if !widPresent {
 			s.maxWid = hugeWid
 		}
-		s.wid = 0
+		s.fieldLimit = s.limit
 		if f := s.count + s.maxWid; f < s.fieldLimit {
 			s.fieldLimit = f
 		}
 		c, w := utf8.DecodeRuneInString(format[i:])
 		i += w
@ -1027,7 +1058,7 @@ func (s *ss) doScanf(format string, a []interface{}) (numProcessed int, err os.E
 		s.scanOne(c, field)
 		numProcessed++
-		s.maxWid = hugeWid
+		s.fieldLimit = s.limit
 	}
 	if numProcessed < len(a) {
 		s.errorString("too many operands")
--- a/src/pkg/fmt/scan_test.go
+++ b/src/pkg/fmt/scan_test.go
@ -6,6 +6,7 @@ package fmt_test
 import (
 	"bufio"
 	"bytes"
 	. "fmt"
 	"io"
 	"math"
@ -745,3 +746,119 @@ func TestMultiLine(t *testing.T) {
 		t.Errorf("Sscanln: expected io.ErrUnexpectedEOF (ha!); got %s", err)
 	}
 }
 // RecursiveInt accepts an string matching %d.%d.%d....
 // and parses it into a linked list.
 // It allows us to benchmark recursive descent style scanners.
 type RecursiveInt struct {
 	i    int
 	next *RecursiveInt
 }
 func (r *RecursiveInt) Scan(state ScanState, verb int) (err os.Error) {
 	_, err = Fscan(state, &r.i)
 	if err != nil {
 		return
 	}
 	next := new(RecursiveInt)
 	_, err = Fscanf(state, ".%v", next)
 	if err != nil {
 		if err == os.ErrorString("input does not match format") || err == io.ErrUnexpectedEOF {
 			err = nil
 		}
 		return
 	}
 	r.next = next
 	return
 }
 // Perform the same scanning task as RecursiveInt.Scan
 // but without recurring through scanner, so we can compare
 // performance more directly.
 func scanInts(r *RecursiveInt, b *bytes.Buffer) (err os.Error) {
 	r.next = nil
 	_, err = Fscan(b, &r.i)
 	if err != nil {
 		return
 	}
 	var c int
 	c, _, err = b.ReadRune()
 	if err != nil {
 		if err == os.EOF {
 			err = nil
 		}
 		return
 	}
 	if c != '.' {
 		return
 	}
 	next := new(RecursiveInt)
 	err = scanInts(next, b)
 	if err == nil {
 		r.next = next
 	}
 	return
 }
 func makeInts(n int) []byte {
 	var buf bytes.Buffer
 	Fprintf(&buf, "1")
 	for i := 1; i < n; i++ {
 		Fprintf(&buf, ".%d", i+1)
 	}
 	return buf.Bytes()
 }
 func TestScanInts(t *testing.T) {
 	testScanInts(t, scanInts)
 	testScanInts(t, func(r *RecursiveInt, b *bytes.Buffer) (err os.Error) {
 		_, err = Fscan(b, r)
 		return
 	})
 }
 const intCount = 1000
 func testScanInts(t *testing.T, scan func(*RecursiveInt, *bytes.Buffer) os.Error) {
 	r := new(RecursiveInt)
 	ints := makeInts(intCount)
 	buf := bytes.NewBuffer(ints)
 	err := scan(r, buf)
 	if err != nil {
 		t.Error("unexpected error", err)
 	}
 	i := 1
 	for ; r != nil; r = r.next {
 		if r.i != i {
 			t.Fatal("bad scan: expected %d got %d", i, r.i)
 		}
 		i++
 	}
 	if i-1 != intCount {
 		t.Fatal("bad scan count: expected %d got %d", intCount, i-1)
 	}
 }
 func BenchmarkScanInts(b *testing.B) {
 	b.ResetTimer()
 	ints := makeInts(intCount)
 	var r RecursiveInt
 	for i := b.N - 1; i >= 0; i-- {
 		buf := bytes.NewBuffer(ints)
 		b.StartTimer()
 		scanInts(&r, buf)
 		b.StopTimer()
 	}
 }
 func BenchmarkScanRecursiveInt(b *testing.B) {
 	b.ResetTimer()
 	ints := makeInts(intCount)
 	var r RecursiveInt
 	for i := b.N - 1; i >= 0; i-- {
 		buf := bytes.NewBuffer(ints)
 		b.StartTimer()
 		Fscan(buf, &r)
 		b.StopTimer()
 	}
 }