go/src/runtime/gc_test.go

// Copyright 2011 The Go Authors. All rights reserved.
// Use of this source code is governed by a BSD-style
// license that can be found in the LICENSE file.

package runtime_test

import (
	"fmt"
	"os"
	"reflect"
	"runtime"
	"runtime/debug"
	"sort"
	"sync"
	"sync/atomic"
	"testing"
	"time"
	"unsafe"
)

// TestGcSys runs the "GCSys" entry of the "testprog" test program through
// runTestProg and requires its output to be exactly "OK\n". The test is
// skipped when the environment sets GOGC=off.
func TestGcSys(t *testing.T) {
	if gogc := os.Getenv("GOGC"); gogc == "off" {
		t.Skip("skipping test; GOGC=off in environment")
	}
	const want = "OK\n"
	if got := runTestProg(t, "testprog", "GCSys"); got != want {
		t.Fatalf("expected %q, but got %q", want, got)
	}
}

// TestGcDeepNesting stores a pointer in the innermost slot of a ten-level
// nested array type and checks that the pointed-to value is still intact
// after a forced garbage collection.
func TestGcDeepNesting(t *testing.T) {
	type T [2][2][2][2][2][2][2][2][2][2]*int
	a := new(T)

	// Logging the address defeats escape analysis, so new(T) is
	// allocated on the heap rather than on the stack.
	t.Logf("%p", a)

	slot := &a[0][0][0][0][0][0][0][0][0][0]
	*slot = new(int)
	**slot = 13
	runtime.GC()
	if **slot != 13 {
		t.Fail()
	}
}

// TestGcMapIndirection fills a map whose keys and values are large
// (256-int) structs while the GC percentage is set to 1, restoring the
// previous GC percentage when it returns.
func TestGcMapIndirection(t *testing.T) {
	prev := debug.SetGCPercent(1)
	defer debug.SetGCPercent(prev)

	runtime.GC()

	type T struct {
		a [256]int
	}
	m := make(map[T]T)
	for n := 0; n < 2000; n++ {
		key := T{}
		key.a[0] = n
		m[key] = T{}
	}
}

// TestGcArraySlice builds a ten-node linked list in which every node also
// holds a slice of the previous node's embedded one-byte array. A GC is
// forced after each insertion, and the list is then walked to verify that
// no node's array contents changed.
func TestGcArraySlice(t *testing.T) {
	type X struct {
		buf     [1]byte
		nextbuf []byte
		next    *X
	}
	var head *X
	for n := 0; n < 10; n++ {
		node := &X{next: head}
		node.buf[0] = 42
		if head != nil {
			// The slice points at an array embedded inside another node.
			node.nextbuf = head.buf[:]
		}
		head = node
		runtime.GC()
	}
	for cur := head; cur != nil; cur = cur.next {
		if cur.buf[0] != 42 {
			t.Fatal("corrupted heap")
		}
	}
}

// TestGcRescan builds a ten-node list of Y values, each embedding an X that
// holds a channel and a pointer to the previous node's embedded X. A GC is
// forced after each insertion, and the list is then walked to verify that
// every node's *int still reads 42.
func TestGcRescan(t *testing.T) {
	type X struct {
		c     chan error
		nextx *X
	}
	type Y struct {
		X
		nexty *Y
		p     *int
	}
	var head *Y
	for n := 0; n < 10; n++ {
		node := &Y{nexty: head}
		node.c = make(chan error)
		if head != nil {
			// Interior pointer into the previous node.
			node.nextx = &head.X
		}
		node.p = new(int)
		*node.p = 42
		head = node
		runtime.GC()
	}
	for cur := head; cur != nil; cur = cur.nexty {
		if *cur.p != 42 {
			t.Fatal("corrupted heap")
		}
	}
}

// TestGcLastTime forces a GC and requires MemStats.LastGC to lie between
// Unix-nanosecond wall-clock readings taken immediately before and after
// it. The most recent pause duration is examined too, but unusual values
// are only logged, never treated as failures.
func TestGcLastTime(t *testing.T) {
	var ms runtime.MemStats
	before := time.Now().UnixNano()
	runtime.GC()
	after := time.Now().UnixNano()
	runtime.ReadMemStats(&ms)

	if last := int64(ms.LastGC); last < before || last > after {
		t.Fatalf("bad last GC time: got %v, want [%v, %v]", last, before, after)
	}

	// The most recent pause is stored at PauseNs[(NumGC+255)%256].
	// Due to timer granularity, pause can actually be 0 on windows
	// or on virtualized environments.
	switch pause := ms.PauseNs[(ms.NumGC+255)%256]; {
	case pause == 0:
		t.Logf("last GC pause was 0")
	case pause > 10e9:
		t.Logf("bad last GC pause: got %v, want [0, 10e9]", pause)
	}
}

// hugeSink is a package-level variable that TestHugeGCInfo and
// BenchmarkReadMemStats store values into.
var hugeSink interface{}

// TestHugeGCInfo makes the compiler process several enormous array and
// struct types, with both pointer (*byte) and non-pointer (uintptr)
// elements.
func TestHugeGCInfo(t *testing.T) {
	// The test ensures that compiler can chew these huge types even on weakest machines.
	// The types are not allocated at runtime.
	// The allocations sit behind a hugeSink != nil guard, so they only
	// execute if something has already stored a value in hugeSink.
	if hugeSink != nil {
		// 400MB on 32 bits, 4TB on 64-bits.
		const n = (400 << 20) + (unsafe.Sizeof(uintptr(0))-4)<<40
		hugeSink = new([n]*byte)
		hugeSink = new([n]uintptr)
		hugeSink = new(struct {
			x float64
			y [n]*byte
			z []string
		})
		hugeSink = new(struct {
			x float64
			y [n]uintptr
			z []string
		})
	}
}

// TestPeriodicGC sets the forced-GC period to zero and then polls MemStats
// until at least two additional GC cycles have been counted, failing if
// that does not happen within 200 polls of 5ms each. The original period is
// restored before the result is checked. Skipped on wasm.
func TestPeriodicGC(t *testing.T) {
	if runtime.GOARCH == "wasm" {
		t.Skip("no sysmon on wasm yet")
	}

	// Finish any collection already in progress before taking the baseline.
	runtime.GC()

	var before, after runtime.MemStats
	runtime.ReadMemStats(&before)

	// A zero period makes the periodic GC run continuously.
	saved := *runtime.ForceGCPeriod
	*runtime.ForceGCPeriod = 0

	// On a heavily loaded system the periodic GCs may be delayed, so
	// return as soon as enough have been seen but allow plenty of slack
	// otherwise.
	const want = 2
	var numGCs uint32
	for polls := 0; polls < 200; polls++ {
		if numGCs >= want {
			break
		}
		time.Sleep(5 * time.Millisecond)

		// Count the GCs completed since the baseline.
		runtime.ReadMemStats(&after)
		numGCs = after.NumGC - before.NumGC
	}
	*runtime.ForceGCPeriod = saved

	if numGCs < want {
		t.Fatalf("no periodic GC: got %v GCs, want >= 2", numGCs)
	}
}

// BenchmarkSetTypePtr runs benchSetType on a pointer to a single *byte.
func BenchmarkSetTypePtr(b *testing.B) {
	benchSetType(b, new(*byte))
}

// BenchmarkSetTypePtr8 runs benchSetType on a pointer to an array of 8 *byte.
func BenchmarkSetTypePtr8(b *testing.B) {
	benchSetType(b, new([8]*byte))
}

// BenchmarkSetTypePtr16 runs benchSetType on a pointer to an array of 16 *byte.
func BenchmarkSetTypePtr16(b *testing.B) {
	benchSetType(b, new([16]*byte))
}

// BenchmarkSetTypePtr32 runs benchSetType on a pointer to an array of 32 *byte.
func BenchmarkSetTypePtr32(b *testing.B) {
	benchSetType(b, new([32]*byte))
}

// BenchmarkSetTypePtr64 runs benchSetType on a pointer to an array of 64 *byte.
func BenchmarkSetTypePtr64(b *testing.B) {
	benchSetType(b, new([64]*byte))
}

// BenchmarkSetTypePtr126 runs benchSetType on a pointer to an array of 126 *byte.
func BenchmarkSetTypePtr126(b *testing.B) {
	benchSetType(b, new([126]*byte))
}

// BenchmarkSetTypePtr128 runs benchSetType on a pointer to an array of 128 *byte.
func BenchmarkSetTypePtr128(b *testing.B) {
	benchSetType(b, new([128]*byte))
}

// BenchmarkSetTypePtrSlice runs benchSetType on a slice of 1024 *byte.
func BenchmarkSetTypePtrSlice(b *testing.B) {
	benchSetType(b, make([]*byte, 1<<10))
}

// Node1 is a benchSetType payload: a one-element uintptr array followed by
// two pointer fields.
type Node1 struct {
	Value       [1]uintptr
	Left, Right *byte
}

// BenchmarkSetTypeNode1 runs benchSetType on a pointer to a single Node1.
func BenchmarkSetTypeNode1(b *testing.B) {
	benchSetType(b, new(Node1))
}

// BenchmarkSetTypeNode1Slice runs benchSetType on a slice of 32 Node1 values.
func BenchmarkSetTypeNode1Slice(b *testing.B) {
	benchSetType(b, make([]Node1, 32))
}

// Node8 is a benchSetType payload: an 8-element uintptr array followed by
// two pointer fields.
type Node8 struct {
	Value       [8]uintptr
	Left, Right *byte
}

// BenchmarkSetTypeNode8 runs benchSetType on a pointer to a single Node8.
func BenchmarkSetTypeNode8(b *testing.B) {
	benchSetType(b, new(Node8))
}

// BenchmarkSetTypeNode8Slice runs benchSetType on a slice of 32 Node8 values.
func BenchmarkSetTypeNode8Slice(b *testing.B) {
	benchSetType(b, make([]Node8, 32))
}

// Node64 is a benchSetType payload: a 64-element uintptr array followed by
// two pointer fields.
type Node64 struct {
	Value       [64]uintptr
	Left, Right *byte
}

// BenchmarkSetTypeNode64 runs benchSetType on a pointer to a single Node64.
func BenchmarkSetTypeNode64(b *testing.B) {
	benchSetType(b, new(Node64))
}

// BenchmarkSetTypeNode64Slice runs benchSetType on a slice of 32 Node64 values.
func BenchmarkSetTypeNode64Slice(b *testing.B) {
	benchSetType(b, make([]Node64, 32))
}

// Node64Dead has the same fields as Node64 in the opposite order: the two
// pointer fields come first and the 64-element uintptr array follows.
// NOTE(review): "Dead" presumably refers to the pointer-free tail after the
// last pointer field — confirm.
type Node64Dead struct {
	Left, Right *byte
	Value       [64]uintptr
}

// BenchmarkSetTypeNode64Dead runs benchSetType on a pointer to a single
// Node64Dead.
func BenchmarkSetTypeNode64Dead(b *testing.B) {
	benchSetType(b, new(Node64Dead))
}

// BenchmarkSetTypeNode64DeadSlice runs benchSetType on a slice of 32
// Node64Dead values.
func BenchmarkSetTypeNode64DeadSlice(b *testing.B) {
	benchSetType(b, make([]Node64Dead, 32))
}

// Node124 is a benchSetType payload: a 124-element uintptr array followed
// by two pointer fields.
type Node124 struct {
	Value       [124]uintptr
	Left, Right *byte
}

// BenchmarkSetTypeNode124 runs benchSetType on a pointer to a single Node124.
func BenchmarkSetTypeNode124(b *testing.B) {
	benchSetType(b, new(Node124))
}

// BenchmarkSetTypeNode124Slice runs benchSetType on a slice of 32 Node124 values.
func BenchmarkSetTypeNode124Slice(b *testing.B) {
	benchSetType(b, make([]Node124, 32))
}

// Node126 is a benchSetType payload: a 126-element uintptr array followed
// by two pointer fields.
type Node126 struct {
	Value       [126]uintptr
	Left, Right *byte
}

// BenchmarkSetTypeNode126 runs benchSetType on a pointer to a single Node126.
func BenchmarkSetTypeNode126(b *testing.B) {
	benchSetType(b, new(Node126))
}

// BenchmarkSetTypeNode126Slice runs benchSetType on a slice of 32 Node126 values.
func BenchmarkSetTypeNode126Slice(b *testing.B) {
	benchSetType(b, make([]Node126, 32))
}

// Node128 is a benchSetType payload: a 128-element uintptr array followed
// by two pointer fields.
type Node128 struct {
	Value       [128]uintptr
	Left, Right *byte
}

// BenchmarkSetTypeNode128 runs benchSetType on a pointer to a single Node128.
func BenchmarkSetTypeNode128(b *testing.B) {
	benchSetType(b, new(Node128))
}

// BenchmarkSetTypeNode128Slice runs benchSetType on a slice of 32 Node128 values.
func BenchmarkSetTypeNode128Slice(b *testing.B) {
	benchSetType(b, make([]Node128, 32))
}

// Node130 is a benchSetType payload: a 130-element uintptr array followed
// by two pointer fields.
type Node130 struct {
	Value       [130]uintptr
	Left, Right *byte
}

// BenchmarkSetTypeNode130 runs benchSetType on a pointer to a single Node130.
func BenchmarkSetTypeNode130(b *testing.B) {
	benchSetType(b, new(Node130))
}

// BenchmarkSetTypeNode130Slice runs benchSetType on a slice of 32 Node130 values.
func BenchmarkSetTypeNode130Slice(b *testing.B) {
	benchSetType(b, make([]Node130, 32))
}

// Node1024 is a benchSetType payload: a 1024-element uintptr array followed
// by two pointer fields.
type Node1024 struct {
	Value       [1024]uintptr
	Left, Right *byte
}

// BenchmarkSetTypeNode1024 runs benchSetType on a pointer to a single Node1024.
func BenchmarkSetTypeNode1024(b *testing.B) {
	benchSetType(b, new(Node1024))
}

// BenchmarkSetTypeNode1024Slice runs benchSetType on a slice of 32 Node1024 values.
func BenchmarkSetTypeNode1024Slice(b *testing.B) {
	benchSetType(b, make([]Node1024, 32))
}

// benchSetType is the shared driver for the BenchmarkSetType* benchmarks.
// It reports the per-iteration byte count from x's type (element size for a
// pointer, element size times length for a slice; nothing for other kinds),
// resets the timer, and hands b.N and x to runtime.BenchSetType.
func benchSetType(b *testing.B, x interface{}) {
	val := reflect.ValueOf(x)
	typ := val.Type()
	if kind := typ.Kind(); kind == reflect.Ptr {
		b.SetBytes(int64(typ.Elem().Size()))
	} else if kind == reflect.Slice {
		elemSize := int64(typ.Elem().Size())
		b.SetBytes(elemSize * int64(val.Len()))
	}
	b.ResetTimer()
	runtime.BenchSetType(b.N, x)
}

// BenchmarkAllocation starts GOMAXPROCS goroutines that share b.N work
// items; each item is a burst of 1000 allocations of a two-pointer struct.
// The work channel is pre-filled with b.N true values followed by one false
// per goroutine, so each goroutine exits on the first false it receives and
// then sends on result.
func BenchmarkAllocation(b *testing.B) {
	type T struct {
		x, y *byte
	}
	workers := runtime.GOMAXPROCS(0)
	work := make(chan bool, b.N+workers)
	result := make(chan *T)

	// Queue the work items, then one stop marker per worker.
	for n := b.N; n > 0; n-- {
		work <- true
	}
	for w := 0; w < workers; w++ {
		work <- false
	}

	for w := 0; w < workers; w++ {
		go func() {
			var last *T
			for {
				if more := <-work; !more {
					break
				}
				for k := 0; k < 1000; k++ {
					last = &T{}
				}
			}
			// Sending the last allocation keeps it observable.
			result <- last
		}()
	}

	// Wait for every worker to finish.
	for w := 0; w < workers; w++ {
		<-result
	}
}

// TestPrintGC runs 10000 function calls that each defer the builtin print
// while a background goroutine forces garbage collections in a tight loop.
// GOMAXPROCS is raised to 2 for the duration and restored on return. The
// test is skipped in short mode.
func TestPrintGC(t *testing.T) {
	if testing.Short() {
		t.Skip("Skipping in short mode")
	}
	prevProcs := runtime.GOMAXPROCS(2)
	defer runtime.GOMAXPROCS(prevProcs)

	stop := make(chan bool)
	go func() {
		// Keep collecting until stop is closed.
		for {
			select {
			case <-stop:
				return
			default:
			}
			runtime.GC()
		}
	}()
	for n := 0; n < 1e4; n++ {
		func() {
			defer print("")
		}()
	}
	close(stop)
}

// testTypeSwitch uses a type switch to return x as an error when its dynamic
// type implements error, and nil otherwise (including when x itself is nil).
func testTypeSwitch(x interface{}) error {
	switch v := x.(type) {
	case error:
		return v
	default:
		return nil
	}
}

// testAssert uses a comma-ok type assertion to return x as an error when its
// dynamic type implements error, and nil otherwise.
func testAssert(x interface{}) error {
	err, isErr := x.(error)
	if !isErr {
		return nil
	}
	return err
}

// testAssertVar is the var-declaration form of testAssert: the comma-ok type
// assertion initializes a var statement instead of a short declaration. It
// returns x as an error when x implements error, and nil otherwise.
func testAssertVar(x interface{}) error {
	var err, isErr = x.(error)
	if !isErr {
		return nil
	}
	return err
}

// a records whether testIfaceEqual has seen the value "abc".
var a bool

// testIfaceEqual sets the package-level a to true when x equals the string
// "abc"; any other value leaves a untouched. It is kept out of line so the
// interface comparison is not folded into the caller.
//
//go:noinline
func testIfaceEqual(x interface{}) {
	if x != "abc" {
		return
	}
	a = true
}

// TestPageAccounting allocates 64 MiB in 64 KiB blocks and then requires
// both values returned by runtime.CountPagesInUse to agree.
func TestPageAccounting(t *testing.T) {
	// Grow the heap in small increments. This used to drop the
	// pages-in-use count below zero because of a rounding
	// mismatch (golang.org/issue/15022).
	const (
		blockSize = 64 << 10
		totalSize = 64 << 20
	)
	blocks := make([]*[blockSize]byte, totalSize/blockSize)
	for idx := range blocks {
		blocks[idx] = new([blockSize]byte)
	}

	// The running page count must match a direct count.
	if pagesInUse, counted := runtime.CountPagesInUse(); pagesInUse != counted {
		t.Fatalf("mheap_.pagesInUse is %d, but direct count is %d", pagesInUse, counted)
	}
}

// TestReadMemStats compares the two results of runtime.ReadMemStatsSlow.
// When they differ, every differing field is logged via logDiff and the
// test fails.
func TestReadMemStats(t *testing.T) {
	base, slow := runtime.ReadMemStatsSlow()
	if base == slow {
		return
	}
	logDiff(t, "MemStats", reflect.ValueOf(base), reflect.ValueOf(slow))
	t.Fatal("memstats mismatch")
}

// logDiff walks got and want in parallel and logs, via t.Logf, every leaf
// value at which they differ. prefix is the path printed in front of each
// message; it is extended with "[i]" for array/slice elements and ".Name"
// for struct fields as the walk descends.
//
// got and want are expected to have the same type; only got's type is
// inspected. Arrays and slices of different lengths are reported by length
// and not descended into. Maps are not supported and abort the test with
// t.Fatal. Leaf values are compared through Interface(), so struct fields
// must be exported.
func logDiff(t *testing.T, prefix string, got, want reflect.Value) {
	typ := got.Type()
	switch typ.Kind() {
	case reflect.Array, reflect.Slice:
		if got.Len() != want.Len() {
			// Log the lengths themselves: the message is labelled
			// len(prefix), so printing the full values would be
			// misleading.
			t.Logf("len(%s): got %v, want %v", prefix, got.Len(), want.Len())
			return
		}
		for i := 0; i < got.Len(); i++ {
			logDiff(t, fmt.Sprintf("%s[%d]", prefix, i), got.Index(i), want.Index(i))
		}
	case reflect.Struct:
		for i := 0; i < typ.NumField(); i++ {
			gf, wf := got.Field(i), want.Field(i)
			logDiff(t, prefix+"."+typ.Field(i).Name, gf, wf)
		}
	case reflect.Map:
		t.Fatal("not implemented: logDiff for map")
	default:
		if got.Interface() != want.Interface() {
			t.Logf("%s: got %v, want %v", prefix, got, want)
		}
	}
}

// BenchmarkReadMemStats times runtime.ReadMemStats while roughly 100 MiB of
// 1 KiB arrays is kept reachable through hugeSink. hugeSink is cleared
// again once the timed loop finishes.
func BenchmarkReadMemStats(b *testing.B) {
	const (
		heapSize  = 100 << 20
		chunkSize = 1024
	)
	live := make([]*[chunkSize]byte, heapSize/chunkSize)
	for idx := range live {
		live[idx] = new([chunkSize]byte)
	}
	hugeSink = live

	var ms runtime.MemStats
	b.ResetTimer()
	for n := b.N; n > 0; n-- {
		runtime.ReadMemStats(&ms)
	}

	hugeSink = nil
}

// BenchmarkReadMemStatsLatency measures the latency of individual
// runtime.ReadMemStats calls while GOMAXPROCS-1 background goroutines
// continuously build large pointer-heavy trees. It reports the 50th, 90th
// and 99th percentile latencies as custom metrics and zeroes out the
// default per-op metrics. It is skipped when GOMAXPROCS is 1.
func BenchmarkReadMemStatsLatency(b *testing.B) {
	// We'll apply load to the runtime with maxProcs-1 goroutines
	// and use one more to actually benchmark. It doesn't make sense
	// to try to run this test with only 1 P (that's what
	// BenchmarkReadMemStats is for).
	maxProcs := runtime.GOMAXPROCS(-1)
	if maxProcs == 1 {
		b.Skip("This benchmark can only be run with GOMAXPROCS > 1")
	}

	// Code to build a big tree with lots of pointers.
	type node struct {
		children [16]*node
	}
	// buildTree returns a tree with 16 children per node and depth+1
	// levels of nodes.
	var buildTree func(depth int) *node
	buildTree = func(depth int) *node {
		tree := new(node)
		if depth != 0 {
			for i := range tree.children {
				tree.children[i] = buildTree(depth - 1)
			}
		}
		return tree
	}

	// Keep the GC busy by continuously generating large trees.
	done := make(chan struct{})
	var wg sync.WaitGroup
	for i := 0; i < maxProcs-1; i++ {
		wg.Add(1)
		go func() {
			defer wg.Done()
			var hold *node
		loop:
			for {
				hold = buildTree(5)
				// Non-blocking check for the stop signal after each tree.
				select {
				case <-done:
					break loop
				default:
				}
			}
			runtime.KeepAlive(hold)
		}()
	}

	// Recorded ReadMemStats latencies, one per benchmark iteration.
	latencies := make([]time.Duration, 0, 1024)

	// Run b.N iterations, each timing a single ReadMemStats call.
	b.ResetTimer()
	var ms runtime.MemStats
	for i := 0; i < b.N; i++ {
		// Sleep for a bit, otherwise we're just going to keep
		// stopping the world and no one will get to do anything.
		time.Sleep(100 * time.Millisecond)
		start := time.Now()
		runtime.ReadMemStats(&ms)
		latencies = append(latencies, time.Now().Sub(start))
	}
	close(done)
	// Make sure to stop the timer before we wait! The goroutines above
	// are very heavy-weight and not easy to stop, so we could end up
	// confusing the benchmarking framework for small b.N.
	b.StopTimer()
	wg.Wait()

	// Disable the default */op metrics.
	// ns/op doesn't mean anything because it's an average, but we
	// have a sleep in our b.N loop above which skews this significantly.
	b.ReportMetric(0, "ns/op")
	b.ReportMetric(0, "B/op")
	b.ReportMetric(0, "allocs/op")

	// Sort latencies then report percentiles.
	sort.Slice(latencies, func(i, j int) bool {
		return latencies[i] < latencies[j]
	})
	b.ReportMetric(float64(latencies[len(latencies)*50/100]), "p50-ns")
	b.ReportMetric(float64(latencies[len(latencies)*90/100]), "p90-ns")
	b.ReportMetric(float64(latencies[len(latencies)*99/100]), "p99-ns")
}

// TestUserForcedGC verifies that an explicit runtime.GC() call runs a
// collection even when automatic GC is disabled (GC percent -1, i.e.
// GOGC=off), and that the collection is counted in both NumGC and
// NumForcedGC. The previous GC percent is restored on return.
func TestUserForcedGC(t *testing.T) {
	prev := debug.SetGCPercent(-1)
	defer debug.SetGCPercent(prev)

	var before, after runtime.MemStats
	runtime.ReadMemStats(&before)
	runtime.GC()
	runtime.ReadMemStats(&after)

	if after.NumGC == before.NumGC {
		t.Fatalf("runtime.GC() did not trigger GC")
	}
	if after.NumForcedGC == before.NumForcedGC {
		t.Fatalf("runtime.GC() was not accounted in NumForcedGC")
	}
}

// writeBarrierBenchmark times f while a background goroutine calls
// runtime.GC() in a loop. The timer is reset immediately before f and
// stopped immediately after it; the background goroutine is then told to
// stop and is waited for before the function returns.
func writeBarrierBenchmark(b *testing.B, f func()) {
	runtime.GC()
	var ms runtime.MemStats
	runtime.ReadMemStats(&ms)
	//b.Logf("heap size: %d MB", ms.HeapAlloc>>20)

	// Keep GC running continuously during the benchmark, which in
	// turn keeps the write barrier on continuously.
	var stop uint32
	done := make(chan bool)
	go func() {
		defer close(done)
		for {
			if atomic.LoadUint32(&stop) != 0 {
				return
			}
			runtime.GC()
		}
	}()
	// On return, raise the stop flag and wait for the GC loop to exit.
	defer func() {
		atomic.StoreUint32(&stop, 1)
		<-done
	}()

	b.ResetTimer()
	f()
	b.StopTimer()
}

// BenchmarkWriteBarrier measures pointer writes performed while the GC is
// kept running by writeBarrierBenchmark. It builds a complete binary tree
// and then repeatedly swaps the children of nodes along a depth-first walk,
// restarting from the root whenever the walk finishes. It is skipped when
// GOMAXPROCS is below 2.
func BenchmarkWriteBarrier(b *testing.B) {
	if runtime.GOMAXPROCS(-1) < 2 {
		// We don't want GC to take our time.
		b.Skip("need GOMAXPROCS >= 2")
	}

	// Construct a large tree both so the GC runs for a while and
	// so we have a data structure to manipulate the pointers of.
	type node struct {
		l, r *node
	}
	var wbRoots []*node
	// mkTree returns a complete binary tree with the given number of
	// levels; level 0 is the nil tree.
	var mkTree func(level int) *node
	mkTree = func(level int) *node {
		if level == 0 {
			return nil
		}
		n := &node{mkTree(level - 1), mkTree(level - 1)}
		if level == 10 {
			// Seed GC with enough early pointers so it
			// doesn't start termination barriers when it
			// only has the top of the tree.
			wbRoots = append(wbRoots, n)
		}
		return n
	}
	const depth = 22 // 64 MB
	// Build the tree with the same constant that sizes the traversal
	// stack below, so the two can never drift apart.
	root := mkTree(depth)

	writeBarrierBenchmark(b, func() {
		// stack holds the current root-to-node path; a tree with depth
		// levels never needs more than depth entries.
		var stack [depth]*node
		tos := -1

		// There are two write barriers per iteration, so i+=2.
		for i := 0; i < b.N; i += 2 {
			if tos == -1 {
				// The previous walk finished (or this is the first
				// iteration); start again from the root.
				stack[0] = root
				tos = 0
			}

			// Perform one step of reversing the tree.
			n := stack[tos]
			if n.l == nil {
				// Bottom-level node: pop it.
				tos--
			} else {
				n.l, n.r = n.r, n.l
				stack[tos] = n.l
				stack[tos+1] = n.r
				tos++
			}

			if i%(1<<12) == 0 {
				// Avoid non-preemptible loops (see issue #10958).
				runtime.Gosched()
			}
		}
	})

	runtime.KeepAlive(wbRoots)
}

// BenchmarkBulkWriteBarrier measures bulk pointer copies performed while
// the GC is kept running by writeBarrierBenchmark. It allocates about
// 64 MiB of 16-pointer objects and then rotates successive 1024-element
// windows of the pointer slice by one position using copy. It is skipped
// when GOMAXPROCS is below 2.
func BenchmarkBulkWriteBarrier(b *testing.B) {
	if runtime.GOMAXPROCS(-1) < 2 {
		// We don't want GC to take our time.
		b.Skip("need GOMAXPROCS >= 2")
	}

	// Construct a large set of objects we can copy around.
	const heapSize = 64 << 20
	type obj [16]*byte
	ptrs := make([]*obj, heapSize/unsafe.Sizeof(obj{}))
	for idx := range ptrs {
		ptrs[idx] = new(obj)
	}

	rotate := func() {
		const blockSize = 1024
		pos := 0
		for done := 0; done < b.N; done += blockSize {
			// Rotate the current window left by one element.
			window := ptrs[pos : pos+blockSize]
			head := window[0]
			copy(window, window[1:])
			window[blockSize-1] = head

			// Move to the next window, wrapping to the start when a
			// full window no longer fits.
			if pos += blockSize; pos+blockSize > len(ptrs) {
				pos = 0
			}

			runtime.Gosched()
		}
	}
	writeBarrierBenchmark(b, rotate)

	runtime.KeepAlive(ptrs)
}

// BenchmarkScanStackNoLocals times pairs of runtime.GC() calls while ten
// goroutines sit blocked at the bottom of a 100000-frame countpwg
// recursion. Only the two GC calls of each iteration are inside the timed
// region. The parked goroutines are released by closing teardown.
func BenchmarkScanStackNoLocals(b *testing.B) {
	const (
		goroutines = 10
		frames     = 100000
	)
	var ready sync.WaitGroup
	teardown := make(chan bool)
	ready.Add(goroutines)
	for g := 0; g < goroutines; g++ {
		go func() {
			remaining := frames
			countpwg(&remaining, &ready, teardown)
		}()
	}
	// Wait until every goroutine has reached the bottom of its recursion.
	ready.Wait()

	b.ResetTimer()
	for n := b.N; n > 0; n-- {
		b.StartTimer()
		runtime.GC()
		runtime.GC()
		b.StopTimer()
	}
	close(teardown)
}

// countpwg recurses, decrementing *n once per frame, until *n reaches zero.
// The innermost frame then calls ready.Done() and blocks until a receive on
// teardown completes, after which the whole recursion unwinds.
func countpwg(n *int, ready *sync.WaitGroup, teardown chan bool) {
	if *n != 0 {
		*n--
		countpwg(n, ready, teardown)
		return
	}
	ready.Done()
	<-teardown
}
-												pkg: Add & fix Copyright of "hand generated" files

R=golang-dev, r
CC=golang-dev
https://golang.org/cl/5554064

											
										
										
											2012-01-19 11:14:56 -07:00
+								// Copyright 2011 The Go Authors. All rights reserved.
 								// Use of this source code is governed by a BSD-style
 								// license that can be found in the LICENSE file.
-												runtime: fix memory leak in parallel garbage collector

The work buffer management used by the garbage
collector during parallel collections leaks buffers.
This CL tests for and fixes the leak.

R=golang-dev, dvyukov, r
CC=golang-dev
https://golang.org/cl/5254059

											
										
										
											2011-10-12 11:23:34 -06:00
+								package runtime_test
 								import (
-												runtime: make ReadMemStats STW for < 25µs

Currently ReadMemStats stops the world for ~1.7 ms/GB of heap because
it collects statistics from every single span. For large heaps, this
can be quite costly. This is particularly unfortunate because many
production infrastructures call this function regularly to collect and
report statistics.

Fix this by tracking the necessary cumulative statistics in the
mcaches. ReadMemStats still has to stop the world to stabilize these
statistics, but there are only O(GOMAXPROCS) mcaches to collect
statistics from, so this pause is only 25µs even at GOMAXPROCS=100.

Fixes #13613.

Change-Id: I3c0a4e14833f4760dab675efc1916e73b4c0032a
Reviewed-on: https://go-review.googlesource.com/34937
Run-TryBot: Austin Clements <austin@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Rick Hudson <rlh@golang.org>

											
										
										
											2017-01-03 10:15:55 -07:00
+									"fmt"
-												runtime: better error from TestGcSys when gc is disabled

R=golang-dev, bradfitz
CC=golang-dev
https://golang.org/cl/7390047

											
										
										
											2013-02-21 11:30:31 -07:00
+									"os"
-												runtime: add benchmark of heapBitsSetType

There was an old benchmark that measured this indirectly
via allocation, but I don't understand how to factor out the
allocation cost when interpreting the numbers.

Replace with a benchmark that only calls heapBitsSetType,
that does not allocate. This was not possible when the
benchmark was first written, because heapBitsSetType had
not been factored out of mallocgc.

Change-Id: I30f0f02362efab3465a50769398be859832e6640
Reviewed-on: https://go-review.googlesource.com/9701
Reviewed-by: Austin Clements <austin@google.com>

											
										
										
											2015-05-02 20:59:35 -06:00
+									"reflect"
-												runtime: fix memory leak in parallel garbage collector

The work buffer management used by the garbage
collector during parallel collections leaks buffers.
This CL tests for and fixes the leak.

R=golang-dev, dvyukov, r
CC=golang-dev
https://golang.org/cl/5254059

											
										
										
											2011-10-12 11:23:34 -06:00
+									"runtime"
-												runtime: prevent garbage collection during hashmap insertion

Inserting a key-value pair into a hashmap storing keys or values
indirectly can cause the garbage collector to find the hashmap in
an inconsistent state.

Fixes #5074.

R=golang-dev, minux.ma, rsc
CC=golang-dev
https://golang.org/cl/7913043

											
										
										
											2013-03-19 15:17:39 -06:00
+									"runtime/debug"
-												runtime: add ReadMemStats latency benchmark

This change adds a benchmark to the runtime which measures ReadMemStats
latencies. It generates allocations with lots of pointers to keep the GC
busy while hitting ReadMemStats and measuring the time it takes to
complete.

Updates #19812.

Change-Id: I7a76aaf497ba5324d3c7a7b3df32461b3e6c3ac8
Reviewed-on: https://go-review.googlesource.com/c/go/+/220177
Run-TryBot: Michael Knyszek <mknyszek@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Austin Clements <austin@google.com>
Reviewed-by: Emmanuel Odeke <emm.odeke@gmail.com>

											
										
										
											2020-02-19 13:54:25 -07:00
+									"sort"
-												runtime: add BenchmarkScanStack

There are many possible stack scanning benchmarks,
but this one is at least a start.

cpuprofiling shows about 75% of CPU in func scanstack.

Change-Id: I906b0493966f2165c1920636c4e057d16d6447e0
Reviewed-on: https://go-review.googlesource.com/105535
Run-TryBot: Josh Bleecher Snyder <josharian@gmail.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Austin Clements <austin@google.com>

											
										
										
											2018-04-06 18:44:26 -06:00
+									"sync"
-												runtime: add benchmark for write barriers

For #22460.

Change-Id: I798f26d45bbe1efd16b632e201413cb26cb3e6c7
Reviewed-on: https://go-review.googlesource.com/73811
Run-TryBot: Austin Clements <austin@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Rick Hudson <rlh@golang.org>

											
										
										
											2017-10-24 09:56:00 -06:00
+									"sync/atomic"
-												runtime: fix memory leak in parallel garbage collector

The work buffer management used by the garbage
collector during parallel collections leaks buffers.
This CL tests for and fixes the leak.

R=golang-dev, dvyukov, r
CC=golang-dev
https://golang.org/cl/5254059

											
										
										
											2011-10-12 11:23:34 -06:00
+									"testing"
-												runtime: make MemStats.LastGC Unix time again
The monotonic clock patch changed all runtime times
to abstract monotonic time. As a result, user-visible
MemStats.LastGC became monotonic time as well.
Restore Unix time for LastGC.

This is the simplest way to expose time.now to runtime that I found.
Another option would be to change time.now to C called
int64 runtime.unixnanotime() and then express time.now in terms of it.
But this would require to introduce 2 64-bit divisions into time.now.
Another option would be to change time.now to C called
void runtime.unixnanotime1(struct {int64 sec, int32 nsec} *now)
and then express both time.now and runtime.unixnanotime in terms of it.

Fixes #7852.

LGTM=minux.ma, iant
R=minux.ma, rsc, iant
CC=golang-codereviews
https://golang.org/cl/93720045

											
										
										
											2014-05-02 10:32:42 -06:00
+									"time"
-												runtime: simpler and faster GC

Implement the design described in:
https://docs.google.com/document/d/1v4Oqa0WwHunqlb8C3ObL_uNQw3DfSY-ztoA-4wWbKcg/pub

Summary of the changes:
GC uses "2-bits per word" pointer type info embed directly into bitmap.
Scanning of stacks/data/heap is unified.
The old spans types go away.
Compiler generates "sparse" 4-bits type info for GC (directly for GC bitmap).
Linker generates "dense" 2-bits type info for data/bss (the same as stacks use).

Summary of results:
-1680 lines of code total (-1000+ in mgc0.c only)
-25% memory consumption
-3-7% binary size
-15% GC pause reduction
-7% run time reduction

LGTM=khr
R=golang-codereviews, rsc, christoph, khr
CC=golang-codereviews, rlh
https://golang.org/cl/106260045

											
										
										
											2014-07-29 01:01:02 -06:00
+									"unsafe"
-												runtime: fix memory leak in parallel garbage collector

The work buffer management used by the garbage
collector during parallel collections leaks buffers.
This CL tests for and fixes the leak.

R=golang-dev, dvyukov, r
CC=golang-dev
https://golang.org/cl/5254059

											
										
										
											2011-10-12 11:23:34 -06:00
+								)
 								func TestGcSys(t *testing.T) {
-												runtime: better error from TestGcSys when gc is disabled

R=golang-dev, bradfitz
CC=golang-dev
https://golang.org/cl/7390047

											
										
										
											2013-02-21 11:30:31 -07:00
+									if os.Getenv("GOGC") == "off" {
-												runtime: TestGcSys: if GOGC=off, skip instead of failing

R=golang-dev, bradfitz
CC=golang-dev
https://golang.org/cl/8201043

											
										
										
											2013-03-30 16:10:53 -06:00
+										t.Skip("skipping test; GOGC=off in environment")
-												runtime: better error from TestGcSys when gc is disabled

R=golang-dev, bradfitz
CC=golang-dev
https://golang.org/cl/7390047

											
										
										
											2013-02-21 11:30:31 -07:00
+									}
-												runtime: move test programs out of source code, coalesce

Now there are just three programs to compile instead of many,
and repeated tests can reuse the compilation result instead of
rebuilding it.

Combined, these changes reduce the time spent testing runtime
during all.bash on my laptop from about 60 to about 30 seconds.
(All.bash itself runs in 5½ minutes.)

For #10571.

Change-Id: Ie2c1798b847f1a635a860d11dcdab14375319ae9
Reviewed-on: https://go-review.googlesource.com/18085
Reviewed-by: Austin Clements <austin@google.com>
Run-TryBot: Austin Clements <austin@google.com>

											
										
										
											2015-12-21 08:29:21 -07:00
+									got := runTestProg(t, "testprog", "GCSys")
-												runtime: move TestGcSys into a separate process
Fixes #4904.
The problem was that when the test runs the heap had grown to ~100MB,
so GC allows it to grow to 200MB, and so the test fails.
Moving the test to a separate process makes it much more isolated and stable.

R=golang-dev, minux.ma
CC=golang-dev
https://golang.org/cl/7441046

											
										
										
											2013-03-01 23:36:06 -07:00
+									want := "OK\n"
 									if got != want {
 										t.Fatalf("expected %q, but got %q", want, got)
 									}
 								}
-												gc: generate garbage collection info for types

R=rsc, nigeltao, minux.ma
CC=golang-dev
https://golang.org/cl/6290043

											
										
										
											2012-09-12 10:08:27 -06:00
+								func TestGcDeepNesting(t *testing.T) {
 									type T [2][2][2][2][2][2][2][2][2][2]*int
 									a := new(T)
 									// Prevent the compiler from applying escape analysis.
 									// This makes sure new(T) is allocated on heap, not on the stack.
 									t.Logf("%p", a)
 									a[0][0][0][0][0][0][0][0][0][0] = new(int)
 									*a[0][0][0][0][0][0][0][0][0][0] = 13
 									runtime.GC()
 									if *a[0][0][0][0][0][0][0][0][0][0] != 13 {
 										t.Fail()
 									}
 								}
-												runtime: prevent garbage collection during hashmap insertion

Inserting a key-value pair into a hashmap storing keys or values
indirectly can cause the garbage collector to find the hashmap in
an inconsistent	state.

Fixes #5074.

R=golang-dev, minux.ma, rsc
CC=golang-dev
https://golang.org/cl/7913043

											
										
										
											2013-03-19 15:17:39 -06:00
-												runtime: rename the TestGcHashmapIndirection to TestGcMapIndirection

There was still the word 'Hashmap' in gc_test.go, so I renamed it to just 'Map'

Previous renaming commit: https://golang.org/cl/90336

Change-Id: I5b0e5c2229d1c30937c7216247f4533effb81ce7
Reviewed-on: https://go-review.googlesource.com/96675
Reviewed-by: Brad Fitzpatrick <bradfitz@golang.org>

											
										
										
											2018-02-23 06:44:10 -07:00
+								func TestGcMapIndirection(t *testing.T) {
-												runtime: prevent garbage collection during hashmap insertion

Inserting a key-value pair into a hashmap storing keys or values
indirectly can cause the garbage collector to find the hashmap in
an inconsistent	state.

Fixes #5074.

R=golang-dev, minux.ma, rsc
CC=golang-dev
https://golang.org/cl/7913043

											
										
										
											2013-03-19 15:17:39 -06:00
+									defer debug.SetGCPercent(debug.SetGCPercent(1))
 									runtime.GC()
 									type T struct {
 										a [256]int
 									}
 									m := make(map[T]T)
 									for i := 0; i < 2000; i++ {
 										var a T
 										a.a[0] = i
 										m[a] = T{}
 									}
 								}
-												runtime: fix GC scanning of slices
If a slice points to an array embedded in a struct,
the whole struct can be incorrectly scanned as the slice buffer.
Fixes #5443.

R=cshapiro, iant, r, cshapiro, minux.ma
CC=bradfitz, gobot, golang-dev
https://golang.org/cl/9372044

											
										
										
											2013-05-15 13:50:32 -06:00
 								func TestGcArraySlice(t *testing.T) {
 									type X struct {
 										buf     [1]byte
 										nextbuf []byte
 										next    *X
 									}
 									var head *X
 									for i := 0; i < 10; i++ {
 										p := &X{}
 										p.buf[0] = 42
 										p.next = head
 										if head != nil {
 											p.nextbuf = head.buf[:]
 										}
 										head = p
 										runtime.GC()
 									}
 									for p := head; p != nil; p = p.next {
 										if p.buf[0] != 42 {
 											t.Fatal("corrupted heap")
 										}
 									}
 								}
-												runtime: fix heap corruption during GC
The 'n' variable is used during rescan initiation in the GC_END case,
but it's overwritten with the chan capacity in the GC_CHAN case.
As a result, rescan is done with the wrong object size.
Fixes #5554.

R=golang-dev, khr
CC=golang-dev
https://golang.org/cl/9831043

											
										
										
											2013-05-28 09:17:47 -06:00
 								func TestGcRescan(t *testing.T) {
 									type X struct {
 										c     chan error
 										nextx *X
 									}
 									type Y struct {
 										X
 										nexty *Y
 										p     *int
 									}
 									var head *Y
 									for i := 0; i < 10; i++ {
 										p := &Y{}
 										p.c = make(chan error)
-												tests: remove two misuses of nil pointers

R=golang-dev, bradfitz
CC=golang-dev
https://golang.org/cl/12858044

											
										
										
											2013-08-15 09:51:04 -06:00
+										if head != nil {
 											p.nextx = &head.X
 										}
-												runtime: fix heap corruption during GC
The 'n' variable is used during rescan initiation in GC_END case,
but it's overwritten with chan capacity in GC_CHAN case.
As the result rescan is done with the wrong object size.
Fixes #5554.

R=golang-dev, khr
CC=golang-dev
https://golang.org/cl/9831043

											
										
										
											2013-05-28 09:17:47 -06:00
+										p.nexty = head
 										p.p = new(int)
 										*p.p = 42
 										head = p
 										runtime.GC()
 									}
 									for p := head; p != nil; p = p.nexty {
 										if *p.p != 42 {
 											t.Fatal("corrupted heap")
 										}
 									}
 								}
-												runtime: get rid of the settype buffer and lock.

MCaches now hold an MSpan for each sizeclass which they have
exclusive access to allocate from, so no lock is needed.

Modifying the heap bitmaps also no longer requires a cas.

runtime.free gets more expensive.  But we don't use it
much any more.

It's not much faster on 1 processor, but it's a lot
faster on multiple processors.

benchmark                 old ns/op    new ns/op    delta
BenchmarkSetTypeNoPtr1           24           23   -0.42%
BenchmarkSetTypeNoPtr2           33           34   +0.89%
BenchmarkSetTypePtr1             51           49   -3.72%
BenchmarkSetTypePtr2             55           54   -1.98%

benchmark                old ns/op    new ns/op    delta
BenchmarkAllocation          52739        50770   -3.73%
BenchmarkAllocation-2        33957        34141   +0.54%
BenchmarkAllocation-3        33326        29015  -12.94%
BenchmarkAllocation-4        38105        25795  -32.31%
BenchmarkAllocation-5        68055        24409  -64.13%
BenchmarkAllocation-6        71544        23488  -67.17%
BenchmarkAllocation-7        68374        23041  -66.30%
BenchmarkAllocation-8        70117        20758  -70.40%

LGTM=rsc, dvyukov
R=dvyukov, bradfitz, khr, rsc
CC=golang-codereviews
https://golang.org/cl/46810043

											
										
										
											2014-02-26 16:52:58 -07:00
-												runtime: make MemStats.LastGC Unix time again
The monotonic clock patch changed all runtime times
to abstract monotonic time. As the result user-visible
MemStats.LastGC become monotonic time as well.
Restore Unix time for LastGC.

This is the simplest way to expose time.now to runtime that I found.
Another option would be to change time.now to C called
int64 runtime.unixnanotime() and then express time.now in terms of it.
But this would require to introduce 2 64-bit divisions into time.now.
Another option would be to change time.now to C called
void runtime.unixnanotime1(struct {int64 sec, int32 nsec} *now)
and then express both time.now and runtime.unixnanotime in terms of it.

Fixes #7852.

LGTM=minux.ma, iant
R=minux.ma, rsc, iant
CC=golang-codereviews
https://golang.org/cl/93720045

											
										
										
											2014-05-02 10:32:42 -06:00
+								func TestGcLastTime(t *testing.T) {
 									ms := new(runtime.MemStats)
 									t0 := time.Now().UnixNano()
 									runtime.GC()
 									t1 := time.Now().UnixNano()
 									runtime.ReadMemStats(ms)
 									last := int64(ms.LastGC)
 									if t0 > last || last > t1 {
 										t.Fatalf("bad last GC time: got %v, want [%v, %v]", last, t0, t1)
 									}
-												runtime: fix MemStats on 32-bits
Int64's do not fit into uintptr's.

LGTM=khr
R=golang-codereviews, khr, rsc
CC=golang-codereviews, rlh
https://golang.org/cl/128380043

											
										
										
											2014-08-19 01:53:20 -06:00
+									pause := ms.PauseNs[(ms.NumGC+255)%256]
-												runtime: relax flaky GC pause test

We often saw GC pauses of 0 ns, not just on Windows.
Google Compute Engine timer granularity might suck
too.

LGTM=rsc
R=rsc, dvyukov
CC=golang-codereviews
https://golang.org/cl/140910043

											
										
										
											2014-09-03 10:54:53 -06:00
+									// Due to timer granularity, pause can actually be 0 on windows
 									// or on virtualized environments.
 									if pause == 0 {
 										t.Logf("last GC pause was 0")
 									} else if pause > 10e9 {
 										t.Logf("bad last GC pause: got %v, want [0, 10e9]", pause)
-												runtime: fix MemStats on 32-bits
Int64's do not fit into uintptr's.

LGTM=khr
R=golang-codereviews, khr, rsc
CC=golang-codereviews, rlh
https://golang.org/cl/128380043

											
										
										
											2014-08-19 01:53:20 -06:00
+									}
-												runtime: make MemStats.LastGC Unix time again
The monotonic clock patch changed all runtime times
to abstract monotonic time. As a result, the user-visible
MemStats.LastGC became monotonic time as well.
Restore Unix time for LastGC.

This is the simplest way to expose time.now to runtime that I found.
Another option would be to change time.now to C called
int64 runtime.unixnanotime() and then express time.now in terms of it.
But this would require introducing two 64-bit divisions into time.now.
Another option would be to change time.now to C called
void runtime.unixnanotime1(struct {int64 sec, int32 nsec} *now)
and then express both time.now and runtime.unixnanotime in terms of it.

Fixes #7852.

LGTM=minux.ma, iant
R=minux.ma, rsc, iant
CC=golang-codereviews
https://golang.org/cl/93720045

											
										
										
											2014-05-02 10:32:42 -06:00
+								}
-												runtime: simpler and faster GC

Implement the design described in:
https://docs.google.com/document/d/1v4Oqa0WwHunqlb8C3ObL_uNQw3DfSY-ztoA-4wWbKcg/pub

Summary of the changes:
GC uses "2-bits per word" pointer type info embedded directly into the bitmap.
Scanning of stacks/data/heap is unified.
The old spans types go away.
Compiler generates "sparse" 4-bits type info for GC (directly for GC bitmap).
Linker generates "dense" 2-bits type info for data/bss (the same as stacks use).

Summary of results:
-1680 lines of code total (-1000+ in mgc0.c only)
-25% memory consumption
-3-7% binary size
-15% GC pause reduction
-7% run time reduction

LGTM=khr
R=golang-codereviews, rsc, christoph, khr
CC=golang-codereviews, rlh
https://golang.org/cl/106260045

											
										
										
											2014-07-29 01:01:02 -06:00
 								// hugeSink receives the values assigned in TestHugeGCInfo. It is declared
 								// without an initializer, so it starts out nil.
+								var hugeSink interface{}
 								// TestHugeGCInfo makes the compiler process four enormous types: an array
 								// of pointers, an array of uintptrs, and a struct wrapping each of those
 								// between a float64 and a []string.
 								func TestHugeGCInfo(t *testing.T) {
 									// The test ensures that the compiler can chew these huge types even on the weakest machines.
 									// The types are not allocated at runtime.
 									// (hugeSink has no initializer, so this branch is only entered if
 									// something else has stored a value in it first.)
 									if hugeSink != nil {
 										// 400MB on 32-bits, 4TB on 64-bits.
 										// n is the array length: 400<<20 elements when uintptr is 4 bytes,
 										// plus a further 4<<40 elements when uintptr is 8 bytes.
 										const n = (400 << 20) + (unsafe.Sizeof(uintptr(0))-4)<<40
 										hugeSink = new([n]*byte)
 										hugeSink = new([n]uintptr)
 										hugeSink = new(struct {
 											x float64
 											y [n]*byte
 											z []string
 										})
 										hugeSink = new(struct {
 											x float64
 											y [n]uintptr
 											z []string
 										})
 									}
 								}
-												runtime: test that periodic GC works

We've broken periodic GC a few times without noticing because there's
no test for it, partly because you have to wait two minutes to see if
it happens. This exposes control of the periodic GC timeout to runtime
tests and adds a test that cranks it down to zero and sleeps for a bit
to make sure periodic GCs happen.

Change-Id: I3ec44e967e99f4eda752f85c329eebd18b87709e
Reviewed-on: https://go-review.googlesource.com/13169
Reviewed-by: Rick Hudson <rlh@golang.org>
Run-TryBot: Austin Clements <austin@google.com>

											
										
										
											2015-08-05 09:35:28 -06:00
+								func TestPeriodicGC(t *testing.T) {
-												all: skip unsupported tests for js/wasm

The general policy for the current state of js/wasm is that it only
has to support tests that are also supported by nacl.

The test nilptr3.go makes assumptions about which nil checks can be
removed. Since WebAssembly does not signal on reading a null pointer,
all nil checks have to be explicit.

Updates #18892

Change-Id: I06a687860b8d22ae26b1c391499c0f5183e4c485
Reviewed-on: https://go-review.googlesource.com/110096
Reviewed-by: Brad Fitzpatrick <bradfitz@golang.org>
Run-TryBot: Brad Fitzpatrick <bradfitz@golang.org>
TryBot-Result: Gobot Gobot <gobot@golang.org>

											
										
										
											2018-03-04 04:15:37 -07:00
+									if runtime.GOARCH == "wasm" {
 										t.Skip("no sysmon on wasm yet")
 									}
-												runtime: test that periodic GC works

We've broken periodic GC a few times without noticing because there's
no test for it, partly because you have to wait two minutes to see if
it happens. This exposes control of the periodic GC timeout to runtime
tests and adds a test that cranks it down to zero and sleeps for a bit
to make sure periodic GCs happen.

Change-Id: I3ec44e967e99f4eda752f85c329eebd18b87709e
Reviewed-on: https://go-review.googlesource.com/13169
Reviewed-by: Rick Hudson <rlh@golang.org>
Run-TryBot: Austin Clements <austin@google.com>

											
										
										
											2015-08-05 09:35:28 -06:00
+									// Make sure we're not in the middle of a GC.
 									runtime.GC()
 									var ms1, ms2 runtime.MemStats
 									runtime.ReadMemStats(&ms1)
 									// Make periodic GC run continuously.
 									orig := *runtime.ForceGCPeriod
 									*runtime.ForceGCPeriod = 0
 									// Let some periodic GCs happen. In a heavily loaded system,
 									// it's possible these will be delayed, so this is designed to
 									// succeed quickly if things are working, but to give it some
 									// slack if things are slow.
 									var numGCs uint32
 									const want = 2
-												runtime: deflake TestPeriodicGC

It was only waiting 0.1 seconds for the two GCs it wanted.
Let it wait 1 second.

Change-Id: Ib3cdc8127cbf95694a9f173643c02529a85063af
Reviewed-on: https://go-review.googlesource.com/68151
Run-TryBot: Russ Cox <rsc@golang.org>
Reviewed-by: Austin Clements <austin@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>

											
										
										
											2017-10-04 10:28:20 -06:00
+									for i := 0; i < 200 && numGCs < want; i++ {
-												runtime: test that periodic GC works

We've broken periodic GC a few times without noticing because there's
no test for it, partly because you have to wait two minutes to see if
it happens. This exposes control of the periodic GC timeout to runtime
tests and adds a test that cranks it down to zero and sleeps for a bit
to make sure periodic GCs happen.

Change-Id: I3ec44e967e99f4eda752f85c329eebd18b87709e
Reviewed-on: https://go-review.googlesource.com/13169
Reviewed-by: Rick Hudson <rlh@golang.org>
Run-TryBot: Austin Clements <austin@google.com>

											
										
										
											2015-08-05 09:35:28 -06:00
+										time.Sleep(5 * time.Millisecond)
 										// Test that periodic GC actually happened.
 										runtime.ReadMemStats(&ms2)
 										numGCs = ms2.NumGC - ms1.NumGC
 									}
 									*runtime.ForceGCPeriod = orig
 									if numGCs < want {
 										t.Fatalf("no periodic GC: got %v GCs, want >= 2", numGCs)
 									}
 								}
-												runtime: add benchmark of heapBitsSetType

There was an old benchmark that measured this indirectly
via allocation, but I don't understand how to factor out the
allocation cost when interpreting the numbers.

Replace with a benchmark that only calls heapBitsSetType,
that does not allocate. This was not possible when the
benchmark was first written, because heapBitsSetType had
not been factored out of mallocgc.

Change-Id: I30f0f02362efab3465a50769398be859832e6640
Reviewed-on: https://go-review.googlesource.com/9701
Reviewed-by: Austin Clements <austin@google.com>

											
										
										
											2015-05-02 20:59:35 -06:00
+								func BenchmarkSetTypePtr(b *testing.B) {
 									benchSetType(b, new(*byte))
-												runtime: get rid of the settype buffer and lock.

MCaches now hold an MSpan for each sizeclass which they have
exclusive access to allocate from, so no lock is needed.

Modifying the heap bitmaps also no longer requires a cas.

runtime.free gets more expensive.  But we don't use it
much any more.

It's not much faster on 1 processor, but it's a lot
faster on multiple processors.

benchmark                 old ns/op    new ns/op    delta
BenchmarkSetTypeNoPtr1           24           23   -0.42%
BenchmarkSetTypeNoPtr2           33           34   +0.89%
BenchmarkSetTypePtr1             51           49   -3.72%
BenchmarkSetTypePtr2             55           54   -1.98%

benchmark                old ns/op    new ns/op    delta
BenchmarkAllocation          52739        50770   -3.73%
BenchmarkAllocation-2        33957        34141   +0.54%
BenchmarkAllocation-3        33326        29015  -12.94%
BenchmarkAllocation-4        38105        25795  -32.31%
BenchmarkAllocation-5        68055        24409  -64.13%
BenchmarkAllocation-6        71544        23488  -67.17%
BenchmarkAllocation-7        68374        23041  -66.30%
BenchmarkAllocation-8        70117        20758  -70.40%

LGTM=rsc, dvyukov
R=dvyukov, bradfitz, khr, rsc
CC=golang-codereviews
https://golang.org/cl/46810043

											
										
										
											2014-02-26 16:52:58 -07:00
+								}
-												runtime: add benchmark of heapBitsSetType

There was an old benchmark that measured this indirectly
via allocation, but I don't understand how to factor out the
allocation cost when interpreting the numbers.

Replace with a benchmark that only calls heapBitsSetType,
that does not allocate. This was not possible when the
benchmark was first written, because heapBitsSetType had
not been factored out of mallocgc.

Change-Id: I30f0f02362efab3465a50769398be859832e6640
Reviewed-on: https://go-review.googlesource.com/9701
Reviewed-by: Austin Clements <austin@google.com>

											
										
										
											2015-05-02 20:59:35 -06:00
 								func BenchmarkSetTypePtr8(b *testing.B) {
 									benchSetType(b, new([8]*byte))
-												runtime: get rid of the settype buffer and lock.

MCaches now hold an MSpan for each sizeclass which they have
exclusive access to allocate from, so no lock is needed.

Modifying the heap bitmaps also no longer requires a cas.

runtime.free gets more expensive.  But we don't use it
much any more.

It's not much faster on 1 processor, but it's a lot
faster on multiple processors.

benchmark                 old ns/op    new ns/op    delta
BenchmarkSetTypeNoPtr1           24           23   -0.42%
BenchmarkSetTypeNoPtr2           33           34   +0.89%
BenchmarkSetTypePtr1             51           49   -3.72%
BenchmarkSetTypePtr2             55           54   -1.98%

benchmark                old ns/op    new ns/op    delta
BenchmarkAllocation          52739        50770   -3.73%
BenchmarkAllocation-2        33957        34141   +0.54%
BenchmarkAllocation-3        33326        29015  -12.94%
BenchmarkAllocation-4        38105        25795  -32.31%
BenchmarkAllocation-5        68055        24409  -64.13%
BenchmarkAllocation-6        71544        23488  -67.17%
BenchmarkAllocation-7        68374        23041  -66.30%
BenchmarkAllocation-8        70117        20758  -70.40%

LGTM=rsc, dvyukov
R=dvyukov, bradfitz, khr, rsc
CC=golang-codereviews
https://golang.org/cl/46810043

											
										
										
											2014-02-26 16:52:58 -07:00
+								}
-												runtime: add benchmark of heapBitsSetType

There was an old benchmark that measured this indirectly
via allocation, but I don't understand how to factor out the
allocation cost when interpreting the numbers.

Replace with a benchmark that only calls heapBitsSetType,
that does not allocate. This was not possible when the
benchmark was first written, because heapBitsSetType had
not been factored out of mallocgc.

Change-Id: I30f0f02362efab3465a50769398be859832e6640
Reviewed-on: https://go-review.googlesource.com/9701
Reviewed-by: Austin Clements <austin@google.com>

											
										
										
											2015-05-02 20:59:35 -06:00
 								func BenchmarkSetTypePtr16(b *testing.B) {
 									benchSetType(b, new([16]*byte))
-												runtime: get rid of the settype buffer and lock.

MCaches now hold an MSpan for each sizeclass which they have
exclusive access to allocate from, so no lock is needed.

Modifying the heap bitmaps also no longer requires a cas.

runtime.free gets more expensive.  But we don't use it
much any more.

It's not much faster on 1 processor, but it's a lot
faster on multiple processors.

benchmark                 old ns/op    new ns/op    delta
BenchmarkSetTypeNoPtr1           24           23   -0.42%
BenchmarkSetTypeNoPtr2           33           34   +0.89%
BenchmarkSetTypePtr1             51           49   -3.72%
BenchmarkSetTypePtr2             55           54   -1.98%

benchmark                old ns/op    new ns/op    delta
BenchmarkAllocation          52739        50770   -3.73%
BenchmarkAllocation-2        33957        34141   +0.54%
BenchmarkAllocation-3        33326        29015  -12.94%
BenchmarkAllocation-4        38105        25795  -32.31%
BenchmarkAllocation-5        68055        24409  -64.13%
BenchmarkAllocation-6        71544        23488  -67.17%
BenchmarkAllocation-7        68374        23041  -66.30%
BenchmarkAllocation-8        70117        20758  -70.40%

LGTM=rsc, dvyukov
R=dvyukov, bradfitz, khr, rsc
CC=golang-codereviews
https://golang.org/cl/46810043

											
										
										
											2014-02-26 16:52:58 -07:00
+								}
-												runtime: add benchmark of heapBitsSetType

There was an old benchmark that measured this indirectly
via allocation, but I don't understand how to factor out the
allocation cost when interpreting the numbers.

Replace with a benchmark that only calls heapBitsSetType,
that does not allocate. This was not possible when the
benchmark was first written, because heapBitsSetType had
not been factored out of mallocgc.

Change-Id: I30f0f02362efab3465a50769398be859832e6640
Reviewed-on: https://go-review.googlesource.com/9701
Reviewed-by: Austin Clements <austin@google.com>

											
										
										
											2015-05-02 20:59:35 -06:00
 								// BenchmarkSetTypePtr32 runs the benchSetType harness on a pointer to a
 								// zero-valued array of 32 byte pointers.
 								func BenchmarkSetTypePtr32(b *testing.B) {
 									ptrs := &[32]*byte{}
 									benchSetType(b, ptrs)
 								}
 								// BenchmarkSetTypePtr64 runs the benchSetType harness on a pointer to a
 								// zero-valued array of 64 byte pointers.
 								func BenchmarkSetTypePtr64(b *testing.B) {
 									ptrs := &[64]*byte{}
 									benchSetType(b, ptrs)
 								}
 								// BenchmarkSetTypePtr126 runs the benchSetType harness on a pointer to a
 								// zero-valued array of 126 byte pointers.
 								func BenchmarkSetTypePtr126(b *testing.B) {
 									ptrs := &[126]*byte{}
 									benchSetType(b, ptrs)
 								}
 								// BenchmarkSetTypePtr128 runs the benchSetType harness on a pointer to a
 								// zero-valued array of 128 byte pointers.
 								func BenchmarkSetTypePtr128(b *testing.B) {
 									ptrs := &[128]*byte{}
 									benchSetType(b, ptrs)
 								}
 								// BenchmarkSetTypePtrSlice runs the benchSetType harness on a slice of
 								// 1<<10 nil byte pointers.
 								func BenchmarkSetTypePtrSlice(b *testing.B) {
 									const elems = 1 << 10
 									ptrs := make([]*byte, elems)
 									benchSetType(b, ptrs)
 								}
 								// Node1 is a benchmark payload: one uintptr word followed by two byte
 								// pointers.
 								type Node1 struct {
 									Value [1]uintptr
 									Left  *byte
 									Right *byte
 								}
 								func BenchmarkSetTypeNode1(b *testing.B) {
 									benchSetType(b, new(Node1))
 								}
 								func BenchmarkSetTypeNode1Slice(b *testing.B) {
 									benchSetType(b, make([]Node1, 32))
 								}
 								// Node8 is a benchmark payload: eight uintptr words followed by two byte
 								// pointers.
 								type Node8 struct {
 									Value [8]uintptr
 									Left  *byte
 									Right *byte
 								}
 								func BenchmarkSetTypeNode8(b *testing.B) {
 									benchSetType(b, new(Node8))
 								}
 								func BenchmarkSetTypeNode8Slice(b *testing.B) {
 									benchSetType(b, make([]Node8, 32))
 								}
 								// Node64 is a benchmark payload: 64 uintptr words followed by two byte
 								// pointers.
 								type Node64 struct {
 									Value [64]uintptr
 									Left  *byte
 									Right *byte
 								}
 								func BenchmarkSetTypeNode64(b *testing.B) {
 									benchSetType(b, new(Node64))
 								}
 								func BenchmarkSetTypeNode64Slice(b *testing.B) {
 									benchSetType(b, make([]Node64, 32))
 								}
 								// Node64Dead is a benchmark payload with the two byte pointers placed
 								// first and the 64 uintptr words after them.
 								type Node64Dead struct {
 									Left  *byte
 									Right *byte
 									Value [64]uintptr
 								}
 								func BenchmarkSetTypeNode64Dead(b *testing.B) {
 									benchSetType(b, new(Node64Dead))
 								}
 								func BenchmarkSetTypeNode64DeadSlice(b *testing.B) {
 									benchSetType(b, make([]Node64Dead, 32))
 								}
 								// Node124 is a benchmark payload: 124 uintptr words followed by two byte
 								// pointers.
 								type Node124 struct {
 									Value [124]uintptr
 									Left  *byte
 									Right *byte
 								}
 								func BenchmarkSetTypeNode124(b *testing.B) {
 									benchSetType(b, new(Node124))
 								}
 								func BenchmarkSetTypeNode124Slice(b *testing.B) {
 									benchSetType(b, make([]Node124, 32))
 								}
 								// Node126 is a benchmark payload: 126 uintptr words followed by two byte
 								// pointers.
 								type Node126 struct {
 									Value [126]uintptr
 									Left  *byte
 									Right *byte
 								}
 								func BenchmarkSetTypeNode126(b *testing.B) {
 									benchSetType(b, new(Node126))
 								}
 								func BenchmarkSetTypeNode126Slice(b *testing.B) {
 									benchSetType(b, make([]Node126, 32))
 								}
-												runtime: add Node128, Node130 benchmarks

Change-Id: I815a7ceeea48cc652b3c8568967665af39b02834
Reviewed-on: https://go-review.googlesource.com/10045
Reviewed-by: Brad Fitzpatrick <bradfitz@golang.org>

											
										
										
											2015-05-14 12:23:12 -06:00
 								// Node128 is a benchmark payload: 128 uintptr words followed by two byte
 								// pointers.
+								type Node128 struct {
 									Value       [128]uintptr
 									Left, Right *byte
 								}
 								func BenchmarkSetTypeNode128(b *testing.B) {
 									benchSetType(b, new(Node128))
 								}
 								func BenchmarkSetTypeNode128Slice(b *testing.B) {
 									benchSetType(b, make([]Node128, 32))
 								}
 								// Node130 is a benchmark payload: 130 uintptr words followed by two byte
 								// pointers.
 								type Node130 struct {
 									Value [130]uintptr
 									Left  *byte
 									Right *byte
 								}
 								func BenchmarkSetTypeNode130(b *testing.B) {
 									benchSetType(b, new(Node130))
 								}
 								func BenchmarkSetTypeNode130Slice(b *testing.B) {
 									benchSetType(b, make([]Node130, 32))
 								}
-												runtime: add benchmark of heapBitsSetType

There was an old benchmark that measured this indirectly
via allocation, but I don't understand how to factor out the
allocation cost when interpreting the numbers.

Replace with a benchmark that only calls heapBitsSetType,
that does not allocate. This was not possible when the
benchmark was first written, because heapBitsSetType had
not been factored out of mallocgc.

Change-Id: I30f0f02362efab3465a50769398be859832e6640
Reviewed-on: https://go-review.googlesource.com/9701
Reviewed-by: Austin Clements <austin@google.com>

											
										
										
											2015-05-02 20:59:35 -06:00
 								// Node1024 is a benchmark payload: 1024 uintptr words followed by two
 								// byte pointers.
+								type Node1024 struct {
 									Value       [1024]uintptr
 									Left, Right *byte
 								}
 								func BenchmarkSetTypeNode1024(b *testing.B) {
 									benchSetType(b, new(Node1024))
 								}
 								func BenchmarkSetTypeNode1024Slice(b *testing.B) {
 									benchSetType(b, make([]Node1024, 32))
 								}
 								func benchSetType(b *testing.B, x interface{}) {
 									v := reflect.ValueOf(x)
 									t := v.Type()
 									switch t.Kind() {
 									case reflect.Ptr:
 										b.SetBytes(int64(t.Elem().Size()))
 									case reflect.Slice:
 										b.SetBytes(int64(t.Elem().Size()) * int64(v.Len()))
 									}
 									b.ResetTimer()
 									runtime.BenchSetType(b.N, x)
-												runtime: get rid of the settype buffer and lock.

MCaches now hold an MSpan for each sizeclass which they have
exclusive access to allocate from, so no lock is needed.

Modifying the heap bitmaps also no longer requires a cas.

runtime.free gets more expensive.  But we don't use it
much any more.

It's not much faster on 1 processor, but it's a lot
faster on multiple processors.

benchmark                 old ns/op    new ns/op    delta
BenchmarkSetTypeNoPtr1           24           23   -0.42%
BenchmarkSetTypeNoPtr2           33           34   +0.89%
BenchmarkSetTypePtr1             51           49   -3.72%
BenchmarkSetTypePtr2             55           54   -1.98%

benchmark                old ns/op    new ns/op    delta
BenchmarkAllocation          52739        50770   -3.73%
BenchmarkAllocation-2        33957        34141   +0.54%
BenchmarkAllocation-3        33326        29015  -12.94%
BenchmarkAllocation-4        38105        25795  -32.31%
BenchmarkAllocation-5        68055        24409  -64.13%
BenchmarkAllocation-6        71544        23488  -67.17%
BenchmarkAllocation-7        68374        23041  -66.30%
BenchmarkAllocation-8        70117        20758  -70.40%

LGTM=rsc, dvyukov
R=dvyukov, bradfitz, khr, rsc
CC=golang-codereviews
https://golang.org/cl/46810043

											
										
										
											2014-02-26 16:52:58 -07:00
+								}
 								// BenchmarkAllocation spreads b.N work tokens across GOMAXPROCS goroutines.
 								// For every token a goroutine receives, it allocates 1000 small
 								// two-pointer structs. The benchmark returns once every goroutine has
 								// reported back.
 								func BenchmarkAllocation(b *testing.B) {
 									type pair struct {
 										x, y *byte
 									}
 									workers := runtime.GOMAXPROCS(0)
 									// Everything is queued up front: b.N "work" tokens followed by one
 									// "stop" token per worker, so the sends below never block.
 									tokens := make(chan bool, b.N+workers)
 									finished := make(chan *pair)
 									for queued := 0; queued < b.N; queued++ {
 										tokens <- true
 									}
 									for w := 0; w < workers; w++ {
 										tokens <- false
 									}
 									allocate := func() {
 										var last *pair
 										for {
 											if more := <-tokens; !more {
 												break
 											}
 											for k := 0; k < 1000; k++ {
 												last = &pair{}
 											}
 										}
 										// Sending the most recent allocation signals that this worker is done.
 										finished <- last
 									}
 									for w := 0; w < workers; w++ {
 										go allocate()
 									}
 									for w := 0; w < workers; w++ {
 										<-finished
 									}
 								}
-												runtime: move built-in print routines to go.

Fixes #8297

LGTM=bradfitz
R=golang-codereviews, bradfitz, khr, dave, dvyukov
CC=golang-codereviews
https://golang.org/cl/119240043

											
										
										
											2014-07-31 14:48:48 -06:00
 								func TestPrintGC(t *testing.T) {
 									if testing.Short() {
 										t.Skip("Skipping in short mode")
 									}
 									defer runtime.GOMAXPROCS(runtime.GOMAXPROCS(2))
 									done := make(chan bool)
 									go func() {
 										for {
 											select {
 											case <-done:
 												return
 											default:
 												runtime.GC()
 											}
 										}
 									}()
 									for i := 0; i < 1e4; i++ {
 										func() {
 											defer print("")
 										}()
 									}
 									close(done)
 								}
-												cmd/compile: fix uninitialized memory during type switch assertE2I2

Fixes arm64 builder crash.

The bug is possible on all architectures; you just have to get lucky
and hit a preemption or a stack growth on entry to assertE2I2.
The test stacks the deck.

Change-Id: I8419da909b06249b1ad15830cbb64e386b6aa5f6
Reviewed-on: https://go-review.googlesource.com/12890
Reviewed-by: Ian Lance Taylor <iant@golang.org>
Reviewed-by: Rob Pike <r@golang.org>

											
										
										
											2015-07-29 22:46:42 -06:00
 								// testTypeSwitch returns x as an error when its dynamic type implements
 								// error, and nil otherwise (including when x itself is nil). The
 								// conversion is deliberately written as a type switch.
 								func testTypeSwitch(x interface{}) error {
 									switch y := x.(type) {
 									case nil:
 										// ok
 									case error:
 										return y
 									}
 									return nil
 								}
 								// testAssert returns x as an error when its dynamic type implements
 								// error, and nil otherwise. The conversion is written as a two-result
 								// type assertion in the if statement's initializer.
 								func testAssert(x interface{}) error {
 									if y, ok := x.(error); ok {
 										return y
 									}
 									return nil
 								}
 								// testAssertVar returns x as an error when its dynamic type implements
 								// error, and nil otherwise. The conversion is written as a two-result
 								// type assertion in a var declaration.
 								func testAssertVar(x interface{}) error {
 									var y, ok = x.(error)
 									if ok {
 										return y
 									}
 									return nil
 								}
-												cmd/compile: fix uninitialized memory in compare of interface value

A comparison of the form l == r where l is an interface and r is
concrete performs a type assertion on l to convert it to r's type.
However, the compiler fails to zero the temporary where the result of
the type assertion is written, so if the type is a pointer type and a
stack scan occurs while in the type assertion, it may see an invalid
pointer on the stack.

Fix this by zeroing the temporary. This is equivalent to the fix for
type switches from c4092ac.

Fixes #12253.

Change-Id: Iaf205d456b856c056b317b4e888ce892f0c555b9
Reviewed-on: https://go-review.googlesource.com/13872
Reviewed-by: Russ Cox <rsc@golang.org>

											
										
										
											2015-08-24 11:35:49 -06:00
-												test: use go:noinline consistently

Replace various implementations of inlining prevention with
"go:noinline"

Change-Id: Iac90895c3a62d6f4b7a6c72e11e165d15a0abfa4
Reviewed-on: https://go-review.googlesource.com/16510
Reviewed-by: Keith Randall <khr@golang.org>
Run-TryBot: Todd Neal <todd@tneal.org>
TryBot-Result: Gobot Gobot <gobot@golang.org>

											
										
										
											2015-10-29 20:45:19 -06:00
 								// a is set to true by testIfaceEqual when its argument compares equal to
 								// the string "abc".
+								var a bool
 								//go:noinline
-												cmd/compile: fix uninitialized memory in compare of interface value

A comparison of the form l == r where l is an interface and r is
concrete performs a type assertion on l to convert it to r's type.
However, the compiler fails to zero the temporary where the result of
the type assertion is written, so if the type is a pointer type and a
stack scan occurs while in the type assertion, it may see an invalid
pointer on the stack.

Fix this by zeroing the temporary. This is equivalent to the fix for
type switches from c4092ac.

Fixes #12253.

Change-Id: Iaf205d456b856c056b317b4e888ce892f0c555b9
Reviewed-on: https://go-review.googlesource.com/13872
Reviewed-by: Russ Cox <rsc@golang.org>

											
										
										
											2015-08-24 11:35:49 -06:00
+								func testIfaceEqual(x interface{}) {
 									if x == "abc" {
-												test: use go:noinline consistently

Replace various implementations of inlining prevention with
"go:noinline"

Change-Id: Iac90895c3a62d6f4b7a6c72e11e165d15a0abfa4
Reviewed-on: https://go-review.googlesource.com/16510
Reviewed-by: Keith Randall <khr@golang.org>
Run-TryBot: Todd Neal <todd@tneal.org>
TryBot-Result: Gobot Gobot <gobot@golang.org>

											
										
										
											2015-10-29 20:45:19 -06:00
+										a = true
-												cmd/compile: fix uninitialized memory in compare of interface value

A comparison of the form l == r where l is an interface and r is
concrete performs a type assertion on l to convert it to r's type.
However, the compiler fails to zero the temporary where the result of
the type assertion is written, so if the type is a pointer type and a
stack scan occurs while in the type assertion, it may see an invalid
pointer on the stack.

Fix this by zeroing the temporary. This is equivalent to the fix for
type switches from c4092ac.

Fixes #12253.

Change-Id: Iaf205d456b856c056b317b4e888ce892f0c555b9
Reviewed-on: https://go-review.googlesource.com/13872
Reviewed-by: Russ Cox <rsc@golang.org>

											
										
										
											2015-08-24 11:35:49 -06:00
+									}
 								}
-												runtime: fix pagesInUse accounting

When we grow the heap, we create a temporary "in use" span for the
memory acquired from the OS and then free that span to link it into
the heap. Hence, we (1) increase pagesInUse when we make the temporary
span so that (2) freeing the span will correctly decrease it.

However, currently step (1) increases pagesInUse by the number of
pages requested from the heap, while step (2) decreases it by the
number of pages requested from the OS (the size of the temporary
span). These aren't necessarily the same, since we round up the number
of pages we request from the OS, so steps 1 and 2 don't necessarily
cancel out like they're supposed to. Over time, this can add up and
cause pagesInUse to underflow and wrap around to 2^64. The garbage
collector computes the sweep ratio from this, so if this happens, the
sweep ratio becomes effectively infinite, causing the first allocation
on each P in a sweep cycle to sweep the entire heap. This makes
sweeping effectively STW.

Fix this by increasing pagesInUse in step 1 by the number of pages
requested from the OS, so that the two steps correctly cancel out. We
add a test that checks that the running total matches the actual state
of the heap.

Fixes #15022. For 1.6.x.

Change-Id: Iefd9d6abe37d0d447cbdbdf9941662e4f18eeffc
Reviewed-on: https://go-review.googlesource.com/21280
Run-TryBot: Austin Clements <austin@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Russ Cox <rsc@golang.org>

											
										
										
											2016-03-29 10:28:24 -06:00
 								// TestPageAccounting grows the heap in many small steps and then
 								// verifies that the runtime's running pages-in-use total agrees with
 								// a direct count (regression test for golang.org/issue/15022).
 								func TestPageAccounting(t *testing.T) {
 									const (
 										blockSize = 64 << 10 // bytes per allocation
 										heapBytes = 64 << 20 // total bytes allocated
 									)
 									// Allocating block by block grows the heap in small
 									// increments, which used to push the pages-in-use count
 									// below zero because of a rounding mismatch.
 									blocks := make([]*[blockSize]byte, heapBytes/blockSize)
 									for i := 0; i < len(blocks); i++ {
 										blocks[i] = new([blockSize]byte)
 									}
 									// The running total must match what a direct count reports.
 									if pagesInUse, counted := runtime.CountPagesInUse(); pagesInUse != counted {
 										t.Fatalf("mheap_.pagesInUse is %d, but direct count is %d", pagesInUse, counted)
 									}
 								}
-												runtime: make ReadMemStats STW for < 25µs

Currently ReadMemStats stops the world for ~1.7 ms/GB of heap because
it collects statistics from every single span. For large heaps, this
can be quite costly. This is particularly unfortunate because many
production infrastructures call this function regularly to collect and
report statistics.

Fix this by tracking the necessary cumulative statistics in the
mcaches. ReadMemStats still has to stop the world to stabilize these
statistics, but there are only O(GOMAXPROCS) mcaches to collect
statistics from, so this pause is only 25µs even at GOMAXPROCS=100.

Fixes #13613.

Change-Id: I3c0a4e14833f4760dab675efc1916e73b4c0032a
Reviewed-on: https://go-review.googlesource.com/34937
Run-TryBot: Austin Clements <austin@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Rick Hudson <rlh@golang.org>

											
										
										
											2017-01-03 10:15:55 -07:00
 								// TestReadMemStats compares the two values returned by
 								// runtime.ReadMemStatsSlow and fails, after logging every differing
 								// field, if they are not identical.
 								func TestReadMemStats(t *testing.T) {
 									base, slow := runtime.ReadMemStatsSlow()
 									if base == slow {
 										return
 									}
 									// Log a field-by-field diff before failing so the mismatch
 									// is easy to locate.
 									logDiff(t, "MemStats", reflect.ValueOf(base), reflect.ValueOf(slow))
 									t.Fatal("memstats mismatch")
 								}
 								// logDiff logs every leaf at which got and want differ, walking
 								// arrays, slices and structs recursively. prefix names the value being
 								// compared and is extended with "[i]" or ".Field" on the way down.
 								// It only logs; deciding whether to fail the test is left to the
 								// caller. Maps are not supported and abort the test via t.Fatal.
 								func logDiff(t *testing.T, prefix string, got, want reflect.Value) {
 									// Attribute log lines to the calling test rather than to
 									// this (recursive) helper.
 									t.Helper()
 									typ := got.Type()
 									switch typ.Kind() {
 									case reflect.Array, reflect.Slice:
 										if got.Len() != want.Len() {
 											// Report the lengths themselves; elements cannot be
 											// paired up when the lengths disagree.
 											t.Logf("len(%s): got %v, want %v", prefix, got.Len(), want.Len())
 											return
 										}
 										for i := 0; i < got.Len(); i++ {
 											logDiff(t, fmt.Sprintf("%s[%d]", prefix, i), got.Index(i), want.Index(i))
 										}
 									case reflect.Struct:
 										for i := 0; i < typ.NumField(); i++ {
 											gf, wf := got.Field(i), want.Field(i)
 											logDiff(t, prefix+"."+typ.Field(i).Name, gf, wf)
 										}
 									case reflect.Map:
 										t.Fatal("not implemented: logDiff for map")
 									default:
 										// Leaf value: compare through interface equality.
 										if got.Interface() != want.Interface() {
 											t.Logf("%s: got %v, want %v", prefix, got, want)
 										}
 									}
 								}
 								// BenchmarkReadMemStats times runtime.ReadMemStats while 100 MB worth
 								// of 1 KB objects is kept reachable through hugeSink.
 								func BenchmarkReadMemStats(b *testing.B) {
 									const (
 										objSize  = 1024
 										heapSize = 100 << 20
 									)
 									// Populate the heap before the timer starts.
 									live := make([]*[objSize]byte, heapSize/objSize)
 									for i := 0; i < len(live); i++ {
 										live[i] = new([objSize]byte)
 									}
 									hugeSink = live
 									var stats runtime.MemStats
 									b.ResetTimer()
 									for n := b.N; n > 0; n-- {
 										runtime.ReadMemStats(&stats)
 									}
 									// Drop the reference so the objects can be collected.
 									hugeSink = nil
 								}
-												runtime: make runtime.GC() trigger GC even if GOGC=off

Currently, the priority of checks in (gcTrigger).test() puts the
gcpercent<0 test above gcTriggerCycle, which is used for runtime.GC().
This is an unintentional change from 1.8 and before, where
runtime.GC() triggered a GC even if GOGC=off.

Fix this by rearranging the priority so the gcTriggerCycle test
executes even if gcpercent < 0.

Fixes #22023.

Change-Id: I109328d7b643b6824eb9d79061a9e775f0149575
Reviewed-on: https://go-review.googlesource.com/65994
Run-TryBot: Austin Clements <austin@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Rick Hudson <rlh@golang.org>

											
										
										
											2017-09-25 12:58:13 -06:00
-												runtime: add ReadMemStats latency benchmark

This change adds a benchmark to the runtime which measures ReadMemStats
latencies. It generates allocations with lots of pointers to keep the GC
busy while hitting ReadMemStats and measuring the time it takes to
complete.

Updates #19812.

Change-Id: I7a76aaf497ba5324d3c7a7b3df32461b3e6c3ac8
Reviewed-on: https://go-review.googlesource.com/c/go/+/220177
Run-TryBot: Michael Knyszek <mknyszek@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Austin Clements <austin@google.com>
Reviewed-by: Emmanuel Odeke <emm.odeke@gmail.com>

											
										
										
											2020-02-19 13:54:25 -07:00
+								func BenchmarkReadMemStatsLatency(b *testing.B) {
 									// Measures the latency of individual runtime.ReadMemStats
 									// calls while background goroutines keep allocating
 									// pointer-heavy trees, and reports the p50/p90/p99 latencies
 									// as custom metrics.
 									//
 									// We'll apply load to the runtime with maxProcs-1 goroutines
 									// and use one more to actually benchmark. It doesn't make sense
 									// to try to run this test with only 1 P (that's what
 									// BenchmarkReadMemStats is for).
 									maxProcs := runtime.GOMAXPROCS(-1)
 									if maxProcs == 1 {
 										b.Skip("This benchmark can only be run with GOMAXPROCS > 1")
 									}
 									// Code to build a big tree with lots of pointers.
 									type node struct {
 										children [16]*node
 									}
 									// buildTree returns a complete 16-ary tree with the given
 									// number of levels below the root.
 									var buildTree func(depth int) *node
 									buildTree = func(depth int) *node {
 										tree := new(node)
 										if depth != 0 {
 											for i := range tree.children {
 												tree.children[i] = buildTree(depth - 1)
 											}
 										}
 										return tree
 									}
 									// Keep the GC busy by continuously generating large trees.
 									// Closing done asks the load goroutines to exit; wg lets us
 									// wait until they actually have.
 									done := make(chan struct{})
 									var wg sync.WaitGroup
 									for i := 0; i < maxProcs-1; i++ {
 										wg.Add(1)
 										go func() {
 											defer wg.Done()
 											var hold *node
 										loop:
 											for {
 												hold = buildTree(5)
 												// Non-blocking check for the stop signal after
 												// each tree is built.
 												select {
 												case <-done:
 													break loop
 												default:
 												}
 											}
 											runtime.KeepAlive(hold)
 										}()
 									}
 									// One latency sample is recorded per benchmark iteration.
 									latencies := make([]time.Duration, 0, 1024)
 									// Run b.N iterations, hitting ReadMemStats each time
 									// and measuring the latency.
 									b.ResetTimer()
 									var ms runtime.MemStats
 									for i := 0; i < b.N; i++ {
 										// Sleep for a bit, otherwise we're just going to keep
 										// stopping the world and no one will get to do anything.
 										time.Sleep(100 * time.Millisecond)
 										start := time.Now()
 										runtime.ReadMemStats(&ms)
 										latencies = append(latencies, time.Now().Sub(start))
 									}
 									close(done)
 									// Make sure to stop the timer before we wait! The goroutines above
 									// are very heavy-weight and not easy to stop, so we could end up
 									// confusing the benchmarking framework for small b.N.
 									b.StopTimer()
 									wg.Wait()
 									// Disable the default */op metrics.
 									// ns/op doesn't mean anything because it's an average, but we
 									// have a sleep in our b.N loop above which skews this significantly.
 									b.ReportMetric(0, "ns/op")
 									b.ReportMetric(0, "B/op")
 									b.ReportMetric(0, "allocs/op")
 									// Sort latencies then report percentiles.
 									sort.Slice(latencies, func(i, j int) bool {
 										return latencies[i] < latencies[j]
 									})
 									// Each percentile is the sample at index len*P/100 of the
 									// sorted slice; the values are durations in nanoseconds.
 									b.ReportMetric(float64(latencies[len(latencies)*50/100]), "p50-ns")
 									b.ReportMetric(float64(latencies[len(latencies)*90/100]), "p90-ns")
 									b.ReportMetric(float64(latencies[len(latencies)*99/100]), "p99-ns")
 								}
-												runtime: make runtime.GC() trigger GC even if GOGC=off

Currently, the priority of checks in (gcTrigger).test() puts the
gcpercent<0 test above gcTriggerCycle, which is used for runtime.GC().
This is an unintentional change from 1.8 and before, where
runtime.GC() triggered a GC even if GOGC=off.

Fix this by rearranging the priority so the gcTriggerCycle test
executes even if gcpercent < 0.

Fixes #22023.

Change-Id: I109328d7b643b6824eb9d79061a9e775f0149575
Reviewed-on: https://go-review.googlesource.com/65994
Run-TryBot: Austin Clements <austin@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Rick Hudson <rlh@golang.org>

											
										
										
											2017-09-25 12:58:13 -06:00
+								func TestUserForcedGC(t *testing.T) {
 									// Test that runtime.GC() triggers a GC even if GOGC=off.
 									//
 									// The inner SetGCPercent(-1) call runs immediately and
 									// returns the previous setting; the deferred outer call
 									// restores that setting when the test returns.
 									defer debug.SetGCPercent(debug.SetGCPercent(-1))
 									// Snapshot the GC counters on either side of an explicit
 									// collection.
 									var ms1, ms2 runtime.MemStats
 									runtime.ReadMemStats(&ms1)
 									runtime.GC()
 									runtime.ReadMemStats(&ms2)
 									// The total cycle count must have changed...
 									if ms1.NumGC == ms2.NumGC {
 										t.Fatalf("runtime.GC() did not trigger GC")
 									}
 									// ...and so must the count of forced cycles.
 									if ms1.NumForcedGC == ms2.NumForcedGC {
 										t.Fatalf("runtime.GC() was not accounted in NumForcedGC")
 									}
 								}
-												runtime: add benchmark for write barriers

For #22460.

Change-Id: I798f26d45bbe1efd16b632e201413cb26cb3e6c7
Reviewed-on: https://go-review.googlesource.com/73811
Run-TryBot: Austin Clements <austin@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Rick Hudson <rlh@golang.org>

											
										
										
											2017-10-24 09:56:00 -06:00
-												runtime: benchmark for bulk write barriers

This adds a benchmark of typedslicecopy and its bulk write barriers.

For #22460.

Change-Id: I439ca3b130bb22944468095f8f18b464e5bb43ca
Reviewed-on: https://go-review.googlesource.com/74051
Run-TryBot: Austin Clements <austin@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Rick Hudson <rlh@golang.org>

											
										
										
											2017-10-27 13:29:05 -06:00
+								func writeBarrierBenchmark(b *testing.B, f func()) {
 									// Runs f as the timed body of benchmark b while a background
 									// goroutine calls runtime.GC() in a loop. f is expected to
 									// perform the b.N iterations itself.
 									runtime.GC()
 									// ms is only consumed by the commented-out log line below.
 									var ms runtime.MemStats
 									runtime.ReadMemStats(&ms)
 									//b.Logf("heap size: %d MB", ms.HeapAlloc>>20)
 									// Keep GC running continuously during the benchmark, which in
 									// turn keeps the write barrier on continuously.
 									var stop uint32
 									done := make(chan bool)
 									go func() {
 										for atomic.LoadUint32(&stop) == 0 {
 											runtime.GC()
 										}
 										close(done)
 									}()
 									// On return, signal the GC goroutine to stop and wait for
 									// it to exit. This runs after b.StopTimer below, so the
 									// wait is not part of the measured time.
 									defer func() {
 										atomic.StoreUint32(&stop, 1)
 										<-done
 									}()
 									b.ResetTimer()
 									f()
 									b.StopTimer()
 								}
-												runtime: add benchmark for write barriers

For #22460.

Change-Id: I798f26d45bbe1efd16b632e201413cb26cb3e6c7
Reviewed-on: https://go-review.googlesource.com/73811
Run-TryBot: Austin Clements <austin@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Rick Hudson <rlh@golang.org>

											
										
										
											2017-10-24 09:56:00 -06:00
+								func BenchmarkWriteBarrier(b *testing.B) {
 									if runtime.GOMAXPROCS(-1) < 2 {
 										// We don't want GC to take our time.
 										b.Skip("need GOMAXPROCS >= 2")
 									}
 									// Construct a large tree both so the GC runs for a while and
 									// so we have a data structure to manipulate the pointers of.
 									type node struct {
 										l, r *node
 									}
 									var wbRoots []*node
 									var mkTree func(level int) *node
 									mkTree = func(level int) *node {
 										if level == 0 {
 											return nil
 										}
 										n := &node{mkTree(level - 1), mkTree(level - 1)}
 										if level == 10 {
 											// Seed GC with enough early pointers so it
-												runtime: eliminate mark 2 and fix mark termination race

The mark 2 phase was originally introduced as a way to reduce the
chance of entering STW mark termination while there was still marking
work to do. It works by flushing and disabling all local work caches
so that all enqueued work becomes immediately globally visible.
However, mark 2 is not only slow—disabling caches makes marking and
the write barrier both much more expensive—but also imperfect. There
is still a rare but possible race (~once per all.bash) that can cause
GC to enter mark termination while there is still marking work. This
race is detailed at
https://github.com/golang/proposal/blob/master/design/17503-eliminate-rescan.md#appendix-mark-completion-race
The effect of this is that mark termination must still cope with the
possibility that there may be work remaining after a concurrent mark
phase. Dealing with this increases STW pause time and increases the
complexity of mark termination.

Furthermore, a similar but far more likely race can cause early
transition from mark 1 to mark 2. This is unfortunate because it
causes performance instability because of the cost of mark 2.

This CL fixes this by replacing mark 2 with a distributed termination
detection algorithm. This algorithm is correct, so it eliminates the
mark termination race, and doesn't require disabling local caches. It
ensures that there are no grey objects upon entering mark termination.
With this change, we're one step closer to eliminating marking from
mark termination entirely (it's still used by STW GC and checkmarks
mode).

This CL does not eliminate the gcBlackenPromptly global flag, though
it is always set to false now. It will be removed in a cleanup CL.

This led to only minor variations in the go1 benchmarks
(https://perf.golang.org/search?q=upload:20180909.1) and compilebench
benchmarks (https://perf.golang.org/search?q=upload:20180910.2).

This significantly improves performance of the garbage benchmark, with
no impact on STW times:

name                        old time/op    new time/op   delta
Garbage/benchmem-MB=64-12    2.21ms ± 1%   2.05ms ± 1%   -7.38% (p=0.000 n=18+19)
Garbage/benchmem-MB=1024-12  2.30ms ±16%   2.20ms ± 7%   -4.51% (p=0.001 n=20+20)

name                        old STW-ns/GC  new STW-ns/GC  delta
Garbage/benchmem-MB=64-12      138k ±44%     141k ±23%     ~    (p=0.309 n=19+20)
Garbage/benchmem-MB=1024-12    159k ±25%     178k ±98%     ~    (p=0.798 n=16+18)

name                        old STW-ns/op  new STW-ns/op                delta
Garbage/benchmem-MB=64-12     4.42k ±44%    4.24k ±23%     ~    (p=0.531 n=19+20)
Garbage/benchmem-MB=1024-12     591 ±24%      636 ±111%    ~    (p=0.309 n=16+18)

(https://perf.golang.org/search?q=upload:20180910.1)

Updates #26903.
Updates #17503.

Change-Id: Icbd1e12b7a12a76f423c9bf033b13cb363e4cd19
Reviewed-on: https://go-review.googlesource.com/c/134318
Run-TryBot: Austin Clements <austin@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Rick Hudson <rlh@golang.org>

											
										
										
											2018-08-03 15:13:09 -06:00
+											// doesn't start termination barriers when it
 											// only has the top of the tree.
-												runtime: add benchmark for write barriers

For #22460.

Change-Id: I798f26d45bbe1efd16b632e201413cb26cb3e6c7
Reviewed-on: https://go-review.googlesource.com/73811
Run-TryBot: Austin Clements <austin@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Rick Hudson <rlh@golang.org>

											
										
										
											2017-10-24 09:56:00 -06:00
+											wbRoots = append(wbRoots, n)
 										}
 										return n
 									}
 									const depth = 22 // 64 MB
 									root := mkTree(22)
-												runtime: benchmark for bulk write barriers

This adds a benchmark of typedslicecopy and its bulk write barriers.

For #22460.

Change-Id: I439ca3b130bb22944468095f8f18b464e5bb43ca
Reviewed-on: https://go-review.googlesource.com/74051
Run-TryBot: Austin Clements <austin@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Rick Hudson <rlh@golang.org>

											
										
										
											2017-10-27 13:29:05 -06:00
+									writeBarrierBenchmark(b, func() {
 										var stack [depth]*node
 										tos := -1
-												runtime: add benchmark for write barriers

For #22460.

Change-Id: I798f26d45bbe1efd16b632e201413cb26cb3e6c7
Reviewed-on: https://go-review.googlesource.com/73811
Run-TryBot: Austin Clements <austin@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Rick Hudson <rlh@golang.org>

											
										
										
											2017-10-24 09:56:00 -06:00
-												runtime: benchmark for bulk write barriers

This adds a benchmark of typedslicecopy and its bulk write barriers.

For #22460.

Change-Id: I439ca3b130bb22944468095f8f18b464e5bb43ca
Reviewed-on: https://go-review.googlesource.com/74051
Run-TryBot: Austin Clements <austin@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Rick Hudson <rlh@golang.org>

											
										
										
											2017-10-27 13:29:05 -06:00
+										// There are two write barriers per iteration, so i+=2.
 										for i := 0; i < b.N; i += 2 {
 											if tos == -1 {
 												stack[0] = root
 												tos = 0
 											}
 											// Perform one step of reversing the tree.
 											n := stack[tos]
 											if n.l == nil {
 												tos--
 											} else {
 												n.l, n.r = n.r, n.l
 												stack[tos] = n.l
 												stack[tos+1] = n.r
 												tos++
 											}
 											if i%(1<<12) == 0 {
 												// Avoid non-preemptible loops (see issue #10958).
 												runtime.Gosched()
 											}
-												runtime: add benchmark for write barriers

For #22460.

Change-Id: I798f26d45bbe1efd16b632e201413cb26cb3e6c7
Reviewed-on: https://go-review.googlesource.com/73811
Run-TryBot: Austin Clements <austin@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Rick Hudson <rlh@golang.org>

											
										
										
											2017-10-24 09:56:00 -06:00
+										}
-												runtime: benchmark for bulk write barriers

This adds a benchmark of typedslicecopy and its bulk write barriers.

For #22460.

Change-Id: I439ca3b130bb22944468095f8f18b464e5bb43ca
Reviewed-on: https://go-review.googlesource.com/74051
Run-TryBot: Austin Clements <austin@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Rick Hudson <rlh@golang.org>

											
										
										
											2017-10-27 13:29:05 -06:00
+									})
-												runtime: add benchmark for write barriers

For #22460.

Change-Id: I798f26d45bbe1efd16b632e201413cb26cb3e6c7
Reviewed-on: https://go-review.googlesource.com/73811
Run-TryBot: Austin Clements <austin@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Rick Hudson <rlh@golang.org>

											
										
										
											2017-10-24 09:56:00 -06:00
-												runtime: benchmark for bulk write barriers

This adds a benchmark of typedslicecopy and its bulk write barriers.

For #22460.

Change-Id: I439ca3b130bb22944468095f8f18b464e5bb43ca
Reviewed-on: https://go-review.googlesource.com/74051
Run-TryBot: Austin Clements <austin@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Rick Hudson <rlh@golang.org>

											
										
										
											2017-10-27 13:29:05 -06:00
+									runtime.KeepAlive(wbRoots)
 								}
-												runtime: add benchmark for write barriers

For #22460.

Change-Id: I798f26d45bbe1efd16b632e201413cb26cb3e6c7
Reviewed-on: https://go-review.googlesource.com/73811
Run-TryBot: Austin Clements <austin@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Rick Hudson <rlh@golang.org>

											
										
										
											2017-10-24 09:56:00 -06:00
-												runtime: benchmark for bulk write barriers

This adds a benchmark of typedslicecopy and its bulk write barriers.

For #22460.

Change-Id: I439ca3b130bb22944468095f8f18b464e5bb43ca
Reviewed-on: https://go-review.googlesource.com/74051
Run-TryBot: Austin Clements <austin@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Rick Hudson <rlh@golang.org>

											
										
										
											2017-10-27 13:29:05 -06:00
+								func BenchmarkBulkWriteBarrier(b *testing.B) {
 									if runtime.GOMAXPROCS(-1) < 2 {
 										// We don't want GC to take our time.
 										b.Skip("need GOMAXPROCS >= 2")
 									}
-												runtime: add benchmark for write barriers

For #22460.

Change-Id: I798f26d45bbe1efd16b632e201413cb26cb3e6c7
Reviewed-on: https://go-review.googlesource.com/73811
Run-TryBot: Austin Clements <austin@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Rick Hudson <rlh@golang.org>

											
										
										
											2017-10-24 09:56:00 -06:00
-												runtime: benchmark for bulk write barriers

This adds a benchmark of typedslicecopy and its bulk write barriers.

For #22460.

Change-Id: I439ca3b130bb22944468095f8f18b464e5bb43ca
Reviewed-on: https://go-review.googlesource.com/74051
Run-TryBot: Austin Clements <austin@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Rick Hudson <rlh@golang.org>

											
										
										
											2017-10-27 13:29:05 -06:00
+									// Construct a large set of objects we can copy around.
 									const heapSize = 64 << 20
 									type obj [16]*byte
 									ptrs := make([]*obj, heapSize/unsafe.Sizeof(obj{}))
 									for i := range ptrs {
 										ptrs[i] = new(obj)
 									}
-												runtime: add benchmark for write barriers

For #22460.

Change-Id: I798f26d45bbe1efd16b632e201413cb26cb3e6c7
Reviewed-on: https://go-review.googlesource.com/73811
Run-TryBot: Austin Clements <austin@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Rick Hudson <rlh@golang.org>

											
										
										
											2017-10-24 09:56:00 -06:00
-												runtime: benchmark for bulk write barriers

This adds a benchmark of typedslicecopy and its bulk write barriers.

For #22460.

Change-Id: I439ca3b130bb22944468095f8f18b464e5bb43ca
Reviewed-on: https://go-review.googlesource.com/74051
Run-TryBot: Austin Clements <austin@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Rick Hudson <rlh@golang.org>

											
										
										
											2017-10-27 13:29:05 -06:00
+									writeBarrierBenchmark(b, func() {
 										const blockSize = 1024
 										var pos int
 										for i := 0; i < b.N; i += blockSize {
 											// Rotate block.
 											block := ptrs[pos : pos+blockSize]
 											first := block[0]
 											copy(block, block[1:])
 											block[blockSize-1] = first
 											pos += blockSize
 											if pos+blockSize > len(ptrs) {
 												pos = 0
 											}
-												runtime: add benchmark for write barriers

For #22460.

Change-Id: I798f26d45bbe1efd16b632e201413cb26cb3e6c7
Reviewed-on: https://go-review.googlesource.com/73811
Run-TryBot: Austin Clements <austin@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Rick Hudson <rlh@golang.org>

											
										
										
											2017-10-24 09:56:00 -06:00
 											runtime.Gosched()
 										}
-												runtime: benchmark for bulk write barriers

This adds a benchmark of typedslicecopy and its bulk write barriers.

For #22460.

Change-Id: I439ca3b130bb22944468095f8f18b464e5bb43ca
Reviewed-on: https://go-review.googlesource.com/74051
Run-TryBot: Austin Clements <austin@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Rick Hudson <rlh@golang.org>

											
										
										
											2017-10-27 13:29:05 -06:00
+									})
-												runtime: add benchmark for write barriers

For #22460.

Change-Id: I798f26d45bbe1efd16b632e201413cb26cb3e6c7
Reviewed-on: https://go-review.googlesource.com/73811
Run-TryBot: Austin Clements <austin@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Rick Hudson <rlh@golang.org>

											
										
										
											2017-10-24 09:56:00 -06:00
-												runtime: benchmark for bulk write barriers

This adds a benchmark of typedslicecopy and its bulk write barriers.

For #22460.

Change-Id: I439ca3b130bb22944468095f8f18b464e5bb43ca
Reviewed-on: https://go-review.googlesource.com/74051
Run-TryBot: Austin Clements <austin@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Rick Hudson <rlh@golang.org>

											
										
										
											2017-10-27 13:29:05 -06:00
+									runtime.KeepAlive(ptrs)
-												runtime: add benchmark for write barriers

For #22460.

Change-Id: I798f26d45bbe1efd16b632e201413cb26cb3e6c7
Reviewed-on: https://go-review.googlesource.com/73811
Run-TryBot: Austin Clements <austin@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Rick Hudson <rlh@golang.org>

											
										
										
											2017-10-24 09:56:00 -06:00
+								}
-												runtime: add BenchmarkScanStack

There are many possible stack scanning benchmarks,
but this one is at least a start.

cpuprofiling shows about 75% of CPU in func scanstack.

Change-Id: I906b0493966f2165c1920636c4e057d16d6447e0
Reviewed-on: https://go-review.googlesource.com/105535
Run-TryBot: Josh Bleecher Snyder <josharian@gmail.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Austin Clements <austin@google.com>

											
										
										
											2018-04-06 18:44:26 -06:00
 								// BenchmarkScanStackNoLocals times pairs of runtime.GC() calls while
 								// ten goroutines sit blocked 100000 countpwg frames deep.
 								func BenchmarkScanStackNoLocals(b *testing.B) {
 									const (
 										numGoroutines = 10
 										stackDepth    = 100000
 									)
 									teardown := make(chan bool)
 									var ready sync.WaitGroup
 									ready.Add(numGoroutines)
 									for g := 0; g < numGoroutines; g++ {
 										go func() {
 											depth := stackDepth
 											countpwg(&depth, &ready, teardown)
 										}()
 									}
 									// Wait until every goroutine has reached full depth.
 									ready.Wait()
 									b.ResetTimer()
 									for n := b.N; n > 0; n-- {
 										b.StartTimer()
 										runtime.GC()
 										runtime.GC()
 										b.StopTimer()
 									}
 									// Release the blocked goroutines.
 									close(teardown)
 								}
 								// countpwg recurses, decrementing *n once per call, until *n reaches
 								// zero. The deepest call then signals ready.Done() and blocks until a
 								// receive on teardown succeeds, after which every frame returns.
 								func countpwg(n *int, ready *sync.WaitGroup, teardown chan bool) {
 									if *n != 0 {
 										// Not at the bottom yet: descend one more frame.
 										*n--
 										countpwg(n, ready, teardown)
 										return
 									}
 									// Bottom of the recursion: announce readiness, then park.
 									ready.Done()
 									<-teardown
 								}