mirror of
https://github.com/golang/go
synced 2024-11-19 16:04:48 -07:00
a6ae01a64a
This computes the maximum possible waste in a size class due to both internal and external fragmentation as a percent of the span size. This parallels the reasoning about overhead in the comment at the top of mksizeclasses.go and confirms that comment's assertion that (except for the few smallest size classes), none of the size classes have worst-case internal and external fragmentation simultaneously. Change-Id: Idb66fe6c241d56f33d391831d4cd5a626955562b Reviewed-on: https://go-review.googlesource.com/49370 Run-TryBot: Austin Clements <austin@google.com> TryBot-Result: Gobot Gobot <gobot@golang.org> Reviewed-by: Keith Randall <khr@golang.org>
329 lines
8.6 KiB
Go
329 lines
8.6 KiB
Go
// Copyright 2016 The Go Authors. All rights reserved.
|
|
// Use of this source code is governed by a BSD-style
|
|
// license that can be found in the LICENSE file.
|
|
|
|
// +build ignore
|
|
|
|
// Generate tables for small malloc size classes.
|
|
//
|
|
// See malloc.go for overview.
|
|
//
|
|
// The size classes are chosen so that rounding an allocation
|
|
// request up to the next size class wastes at most 12.5% (1.125x).
|
|
//
|
|
// Each size class has its own page count that gets allocated
|
|
// and chopped up when new objects of the size class are needed.
|
|
// That page count is chosen so that chopping up the run of
|
|
// pages into objects of the given size wastes at most 12.5% (1.125x)
|
|
// of the memory. It is not necessary that the cutoff here be
|
|
// the same as above.
|
|
//
|
|
// The two sources of waste multiply, so the worst possible case
|
|
// for the above constraints would be that allocations of some
|
|
// size might have a 26.6% (1.266x) overhead.
|
|
// In practice, only one of the wastes comes into play for a
|
|
// given size (sizes < 512 waste mainly on the round-up,
|
|
// sizes > 512 waste mainly on the page chopping).
|
|
// For really small sizes, alignment constraints force the
|
|
// overhead higher.
|
|
|
|
package main
|
|
|
|
import (
|
|
"bytes"
|
|
"flag"
|
|
"fmt"
|
|
"go/format"
|
|
"io"
|
|
"io/ioutil"
|
|
"log"
|
|
"os"
|
|
)
|
|
|
|
// Generate msize.go
|
|
|
|
var stdout = flag.Bool("stdout", false, "write to stdout instead of sizeclasses.go")
|
|
|
|
func main() {
|
|
flag.Parse()
|
|
|
|
var b bytes.Buffer
|
|
fmt.Fprintln(&b, "// Code generated by mksizeclasses.go; DO NOT EDIT.")
|
|
fmt.Fprintln(&b, "//go:generate go run mksizeclasses.go")
|
|
fmt.Fprintln(&b)
|
|
fmt.Fprintln(&b, "package runtime")
|
|
classes := makeClasses()
|
|
|
|
printComment(&b, classes)
|
|
|
|
printClasses(&b, classes)
|
|
|
|
out, err := format.Source(b.Bytes())
|
|
if err != nil {
|
|
log.Fatal(err)
|
|
}
|
|
if *stdout {
|
|
_, err = os.Stdout.Write(out)
|
|
} else {
|
|
err = ioutil.WriteFile("sizeclasses.go", out, 0666)
|
|
}
|
|
if err != nil {
|
|
log.Fatal(err)
|
|
}
|
|
}
|
|
|
|
const (
|
|
// Constants that we use and will transfer to the runtime.
|
|
maxSmallSize = 32 << 10
|
|
smallSizeDiv = 8
|
|
smallSizeMax = 1024
|
|
largeSizeDiv = 128
|
|
pageShift = 13
|
|
|
|
// Derived constants.
|
|
pageSize = 1 << pageShift
|
|
)
|
|
|
|
type class struct {
|
|
size int // max size
|
|
npages int // number of pages
|
|
|
|
mul int
|
|
shift uint
|
|
shift2 uint
|
|
mask int
|
|
}
|
|
|
|
func powerOfTwo(x int) bool {
|
|
return x != 0 && x&(x-1) == 0
|
|
}
|
|
|
|
func makeClasses() []class {
|
|
var classes []class
|
|
|
|
classes = append(classes, class{}) // class #0 is a dummy entry
|
|
|
|
align := 8
|
|
for size := align; size <= maxSmallSize; size += align {
|
|
if powerOfTwo(size) { // bump alignment once in a while
|
|
if size >= 2048 {
|
|
align = 256
|
|
} else if size >= 128 {
|
|
align = size / 8
|
|
} else if size >= 16 {
|
|
align = 16 // required for x86 SSE instructions, if we want to use them
|
|
}
|
|
}
|
|
if !powerOfTwo(align) {
|
|
panic("incorrect alignment")
|
|
}
|
|
|
|
// Make the allocnpages big enough that
|
|
// the leftover is less than 1/8 of the total,
|
|
// so wasted space is at most 12.5%.
|
|
allocsize := pageSize
|
|
for allocsize%size > allocsize/8 {
|
|
allocsize += pageSize
|
|
}
|
|
npages := allocsize / pageSize
|
|
|
|
// If the previous sizeclass chose the same
|
|
// allocation size and fit the same number of
|
|
// objects into the page, we might as well
|
|
// use just this size instead of having two
|
|
// different sizes.
|
|
if len(classes) > 1 && npages == classes[len(classes)-1].npages && allocsize/size == allocsize/classes[len(classes)-1].size {
|
|
classes[len(classes)-1].size = size
|
|
continue
|
|
}
|
|
classes = append(classes, class{size: size, npages: npages})
|
|
}
|
|
|
|
// Increase object sizes if we can fit the same number of larger objects
|
|
// into the same number of pages. For example, we choose size 8448 above
|
|
// with 6 objects in 7 pages. But we can well use object size 9472,
|
|
// which is also 6 objects in 7 pages but +1024 bytes (+12.12%).
|
|
// We need to preserve at least largeSizeDiv alignment otherwise
|
|
// sizeToClass won't work.
|
|
for i := range classes {
|
|
if i == 0 {
|
|
continue
|
|
}
|
|
c := &classes[i]
|
|
psize := c.npages * pageSize
|
|
new_size := (psize / (psize / c.size)) &^ (largeSizeDiv - 1)
|
|
if new_size > c.size {
|
|
c.size = new_size
|
|
}
|
|
}
|
|
|
|
if len(classes) != 67 {
|
|
panic("number of size classes has changed")
|
|
}
|
|
|
|
for i := range classes {
|
|
computeDivMagic(&classes[i])
|
|
}
|
|
|
|
return classes
|
|
}
|
|
|
|
// computeDivMagic computes some magic constants to implement
|
|
// the division required to compute object number from span offset.
|
|
// n / c.size is implemented as n >> c.shift * c.mul >> c.shift2
|
|
// for all 0 <= n < c.npages * pageSize
|
|
func computeDivMagic(c *class) {
|
|
// divisor
|
|
d := c.size
|
|
if d == 0 {
|
|
return
|
|
}
|
|
|
|
// maximum input value for which the formula needs to work.
|
|
max := c.npages*pageSize - 1
|
|
|
|
if powerOfTwo(d) {
|
|
// If the size is a power of two, heapBitsForObject can divide even faster by masking.
|
|
// Compute this mask.
|
|
if max >= 1<<16 {
|
|
panic("max too big for power of two size")
|
|
}
|
|
c.mask = 1<<16 - d
|
|
}
|
|
|
|
// Compute pre-shift by factoring power of 2 out of d.
|
|
for d%2 == 0 {
|
|
c.shift++
|
|
d >>= 1
|
|
max >>= 1
|
|
}
|
|
|
|
// Find the smallest k that works.
|
|
// A small k allows us to fit the math required into 32 bits
|
|
// so we can use 32-bit multiplies and shifts on 32-bit platforms.
|
|
nextk:
|
|
for k := uint(0); ; k++ {
|
|
mul := (int(1)<<k + d - 1) / d // ⌈2^k / d⌉
|
|
|
|
// Test to see if mul works.
|
|
for n := 0; n <= max; n++ {
|
|
if n*mul>>k != n/d {
|
|
continue nextk
|
|
}
|
|
}
|
|
if mul >= 1<<16 {
|
|
panic("mul too big")
|
|
}
|
|
if uint64(mul)*uint64(max) >= 1<<32 {
|
|
panic("mul*max too big")
|
|
}
|
|
c.mul = mul
|
|
c.shift2 = k
|
|
break
|
|
}
|
|
|
|
// double-check.
|
|
for n := 0; n <= max; n++ {
|
|
if n*c.mul>>c.shift2 != n/d {
|
|
fmt.Printf("d=%d max=%d mul=%d shift2=%d n=%d\n", d, max, c.mul, c.shift2, n)
|
|
panic("bad multiply magic")
|
|
}
|
|
// Also check the exact computations that will be done by the runtime,
|
|
// for both 32 and 64 bit operations.
|
|
if uint32(n)*uint32(c.mul)>>uint8(c.shift2) != uint32(n/d) {
|
|
fmt.Printf("d=%d max=%d mul=%d shift2=%d n=%d\n", d, max, c.mul, c.shift2, n)
|
|
panic("bad 32-bit multiply magic")
|
|
}
|
|
if uint64(n)*uint64(c.mul)>>uint8(c.shift2) != uint64(n/d) {
|
|
fmt.Printf("d=%d max=%d mul=%d shift2=%d n=%d\n", d, max, c.mul, c.shift2, n)
|
|
panic("bad 64-bit multiply magic")
|
|
}
|
|
}
|
|
}
|
|
|
|
func printComment(w io.Writer, classes []class) {
|
|
fmt.Fprintf(w, "// %-5s %-9s %-10s %-7s %-10s %-9s\n", "class", "bytes/obj", "bytes/span", "objects", "tail waste", "max waste")
|
|
prevSize := 0
|
|
for i, c := range classes {
|
|
if i == 0 {
|
|
continue
|
|
}
|
|
spanSize := c.npages * pageSize
|
|
objects := spanSize / c.size
|
|
tailWaste := spanSize - c.size*(spanSize/c.size)
|
|
maxWaste := float64((c.size-prevSize-1)*objects+tailWaste) / float64(spanSize)
|
|
prevSize = c.size
|
|
fmt.Fprintf(w, "// %5d %9d %10d %7d %10d %8.2f%%\n", i, c.size, spanSize, objects, tailWaste, 100*maxWaste)
|
|
}
|
|
fmt.Fprintf(w, "\n")
|
|
}
|
|
|
|
func printClasses(w io.Writer, classes []class) {
|
|
fmt.Fprintln(w, "const (")
|
|
fmt.Fprintf(w, "_MaxSmallSize = %d\n", maxSmallSize)
|
|
fmt.Fprintf(w, "smallSizeDiv = %d\n", smallSizeDiv)
|
|
fmt.Fprintf(w, "smallSizeMax = %d\n", smallSizeMax)
|
|
fmt.Fprintf(w, "largeSizeDiv = %d\n", largeSizeDiv)
|
|
fmt.Fprintf(w, "_NumSizeClasses = %d\n", len(classes))
|
|
fmt.Fprintf(w, "_PageShift = %d\n", pageShift)
|
|
fmt.Fprintln(w, ")")
|
|
|
|
fmt.Fprint(w, "var class_to_size = [_NumSizeClasses]uint16 {")
|
|
for _, c := range classes {
|
|
fmt.Fprintf(w, "%d,", c.size)
|
|
}
|
|
fmt.Fprintln(w, "}")
|
|
|
|
fmt.Fprint(w, "var class_to_allocnpages = [_NumSizeClasses]uint8 {")
|
|
for _, c := range classes {
|
|
fmt.Fprintf(w, "%d,", c.npages)
|
|
}
|
|
fmt.Fprintln(w, "}")
|
|
|
|
fmt.Fprintln(w, "type divMagic struct {")
|
|
fmt.Fprintln(w, " shift uint8")
|
|
fmt.Fprintln(w, " shift2 uint8")
|
|
fmt.Fprintln(w, " mul uint16")
|
|
fmt.Fprintln(w, " baseMask uint16")
|
|
fmt.Fprintln(w, "}")
|
|
fmt.Fprint(w, "var class_to_divmagic = [_NumSizeClasses]divMagic {")
|
|
for _, c := range classes {
|
|
fmt.Fprintf(w, "{%d,%d,%d,%d},", c.shift, c.shift2, c.mul, c.mask)
|
|
}
|
|
fmt.Fprintln(w, "}")
|
|
|
|
// map from size to size class, for small sizes.
|
|
sc := make([]int, smallSizeMax/smallSizeDiv+1)
|
|
for i := range sc {
|
|
size := i * smallSizeDiv
|
|
for j, c := range classes {
|
|
if c.size >= size {
|
|
sc[i] = j
|
|
break
|
|
}
|
|
}
|
|
}
|
|
fmt.Fprint(w, "var size_to_class8 = [smallSizeMax/smallSizeDiv+1]uint8 {")
|
|
for _, v := range sc {
|
|
fmt.Fprintf(w, "%d,", v)
|
|
}
|
|
fmt.Fprintln(w, "}")
|
|
|
|
// map from size to size class, for large sizes.
|
|
sc = make([]int, (maxSmallSize-smallSizeMax)/largeSizeDiv+1)
|
|
for i := range sc {
|
|
size := smallSizeMax + i*largeSizeDiv
|
|
for j, c := range classes {
|
|
if c.size >= size {
|
|
sc[i] = j
|
|
break
|
|
}
|
|
}
|
|
}
|
|
fmt.Fprint(w, "var size_to_class128 = [(_MaxSmallSize-smallSizeMax)/largeSizeDiv+1]uint8 {")
|
|
for _, v := range sc {
|
|
fmt.Fprintf(w, "%d,", v)
|
|
}
|
|
fmt.Fprintln(w, "}")
|
|
}
|