mirror of
https://github.com/golang/go
synced 2024-11-15 03:50:33 -07:00
ef3e1dae2f
goos: linux
goarch: loong64
pkg: test/bench/go1
cpu: Loongson-3A6000 @ 2500.00MHz
                      |  bench.old   |             bench.new              |
                      |    sec/op    |   sec/op     vs base               |
BinaryTree17             7.766 ± 1%    7.640 ± 2%    -1.62% (p=0.000 n=20)
Fannkuch11               2.649 ± 0%    2.358 ± 0%   -10.96% (p=0.000 n=20)
FmtFprintfEmpty         35.89n ± 0%   35.87n ± 0%    -0.06% (p=0.000 n=20)
FmtFprintfString        59.44n ± 0%   57.25n ± 2%    -3.68% (p=0.000 n=20)
FmtFprintfInt           62.07n ± 0%   60.04n ± 0%    -3.27% (p=0.000 n=20)
FmtFprintfIntInt        97.90n ± 0%   97.26n ± 0%    -0.65% (p=0.000 n=20)
FmtFprintfPrefixedInt   116.7n ± 0%   119.2n ± 0%    +2.14% (p=0.000 n=20)
FmtFprintfFloat         204.5n ± 0%   201.9n ± 0%    -1.30% (p=0.000 n=20)
FmtManyArgs             455.9n ± 0%   466.8n ± 0%    +2.39% (p=0.000 n=20)
GobDecode               7.458m ± 1%   7.138m ± 1%    -4.28% (p=0.000 n=20)
GobEncode               8.573m ± 1%   8.473m ± 1%         ~ (p=0.091 n=20)
Gzip                    280.2m ± 0%   284.9m ± 0%    +1.67% (p=0.000 n=20)
Gunzip                  32.68m ± 0%   32.67m ± 0%         ~ (p=0.211 n=20)
HTTPClientServer        54.22µ ± 0%   53.24µ ± 0%    -1.80% (p=0.000 n=20)
JSONEncode              9.427m ± 1%   9.152m ± 0%    -2.92% (p=0.000 n=20)
JSONDecode              47.08m ± 1%   46.85m ± 1%    -0.49% (p=0.007 n=20)
Mandelbrot200           4.601m ± 0%   4.605m ± 0%    +0.08% (p=0.000 n=20)
GoParse                 4.776m ± 0%   4.655m ± 1%    -2.52% (p=0.000 n=20)
RegexpMatchEasy0_32     59.77n ± 0%   57.59n ± 0%    -3.66% (p=0.000 n=20)
RegexpMatchEasy0_1K     458.1n ± 0%   458.8n ± 0%    +0.15% (p=0.000 n=20)
RegexpMatchEasy1_32     59.36n ± 0%   59.24n ± 0%    -0.20% (p=0.000 n=20)
RegexpMatchEasy1_1K     557.7n ± 0%   560.2n ± 0%    +0.46% (p=0.000 n=20)
RegexpMatchMedium_32    803.1n ± 0%   772.8n ± 0%    -3.77% (p=0.000 n=20)
RegexpMatchMedium_1K    27.29µ ± 0%   25.88µ ± 0%    -5.18% (p=0.000 n=20)
RegexpMatchHard_32      1.385µ ± 0%   1.304µ ± 0%    -5.85% (p=0.000 n=20)
RegexpMatchHard_1K      40.92µ ± 0%   39.58µ ± 0%    -3.27% (p=0.000 n=20)
Revcomp                 474.3m ± 0%   410.0m ± 0%   -13.56% (p=0.000 n=20)
Template                78.16m ± 0%   76.32m ± 1%    -2.36% (p=0.000 n=20)
TimeParse               271.8n ± 0%   272.1n ± 0%    +0.11% (p=0.000 n=20)
TimeFormat              292.3n ± 0%   294.8n ± 0%    +0.86% (p=0.000 n=20)
geomean                 51.98µ        50.82µ         -2.22%

Change-Id: Ia78f1ddee8f1d9ec7192a4b8d2a4ec6058679956
Reviewed-on: https://go-review.googlesource.com/c/go/+/615918
Reviewed-by: Qiqi Huang <huangqiqi@loongson.cn>
Reviewed-by: Dmitri Shuralyov <dmitshur@google.com>
Reviewed-by: Michael Knyszek <mknyszek@google.com>
LUCI-TryBot-Result: Go LUCI <golang-scoped@luci-project-accounts.iam.gserviceaccount.com>
Reviewed-by: abner chenc <chenguoqi@loongson.cn>
245 lines
5.3 KiB
Go
245 lines
5.3 KiB
Go
// asmcheck

// Copyright 2018 The Go Authors. All rights reserved.
// Use of this source code is governed by a BSD-style
// license that can be found in the LICENSE file.
|
|
|
|
package codegen
|
|
|
|
// This file contains codegen tests related to arithmetic
// simplifications and optimizations on float types.
// For codegen tests on integer types, see arithmetic.go.
|
|
|
|
// --------------------- //
//    Strength-reduce    //
// --------------------- //
|
|
|
|
// Mul2 returns f multiplied by the constant 2.0.
//
// The asmcheck annotations on the return statement expect each listed
// architecture to emit a floating-point add and no floating-point multiply.
func Mul2(f float64) float64 {
	// 386/sse2:"ADDSD",-"MULSD"
	// amd64:"ADDSD",-"MULSD"
	// arm/7:"ADDD",-"MULD"
	// arm64:"FADDD",-"FMULD"
	// ppc64x:"FADD",-"FMUL"
	// riscv64:"FADDD",-"FMULD"
	return f * 2.0
}
|
|
|
|
// DivPow2 divides its three arguments by constant powers of two and
// returns f1/16.0, f2/0.125 and f3/0.5, in that order.
//
// The asmcheck annotations expect that none of the divisions is emitted
// as a divide instruction. The first two are expected to become a
// multiply, and the division by 0.5 is expected to become an add with no
// multiply.
func DivPow2(f1, f2, f3 float64) (float64, float64, float64) {
	// 386/sse2:"MULSD",-"DIVSD"
	// amd64:"MULSD",-"DIVSD"
	// arm/7:"MULD",-"DIVD"
	// arm64:"FMULD",-"FDIVD"
	// ppc64x:"FMUL",-"FDIV"
	// riscv64:"FMULD",-"FDIVD"
	x := f1 / 16.0

	// The ppc64x negative pattern is FDIV, matching the other two checks
	// in this function.
	// 386/sse2:"MULSD",-"DIVSD"
	// amd64:"MULSD",-"DIVSD"
	// arm/7:"MULD",-"DIVD"
	// arm64:"FMULD",-"FDIVD"
	// ppc64x:"FMUL",-"FDIV"
	// riscv64:"FMULD",-"FDIVD"
	y := f2 / 0.125

	// 386/sse2:"ADDSD",-"DIVSD",-"MULSD"
	// amd64:"ADDSD",-"DIVSD",-"MULSD"
	// arm/7:"ADDD",-"MULD",-"DIVD"
	// arm64:"FADDD",-"FMULD",-"FDIVD"
	// ppc64x:"FADD",-"FMUL",-"FDIV"
	// riscv64:"FADDD",-"FMULD",-"FDIVD"
	z := f3 / 0.5

	return x, y, z
}
|
|
|
|
// indexLoad returns the element b0[idx] multiplied by b1. Like any slice
// index expression it panics when idx is out of range for b0.
//
// The asmcheck annotations expect the float32 load to use a
// register-indexed addressing mode on arm64 (index register shifted left
// by 2) and on loong64.
func indexLoad(b0 []float32, b1 float32, idx int) float32 {
	// arm64:`FMOVS\s\(R[0-9]+\)\(R[0-9]+<<2\),\sF[0-9]+`
	// loong64:`MOVF\s\(R[0-9]+\)\(R[0-9]+\),\sF[0-9]+`
	return b0[idx] * b1
}
|
|
|
|
// indexStore writes b1 into b0[idx]. Like any slice index expression it
// panics when idx is out of range for b0.
//
// The asmcheck annotations expect the float64 store to use a
// register-indexed addressing mode on arm64 (index register shifted left
// by 3) and on loong64.
func indexStore(b0 []float64, b1 float64, idx int) {
	// arm64:`FMOVD\sF[0-9]+,\s\(R[0-9]+\)\(R[0-9]+<<3\)`
	// loong64:`MOVD\sF[0-9]+,\s\(R[0-9]+\)\(R[0-9]+\)`
	b0[idx] = b1
}
|
|
|
|
// ----------- //
//    Fused    //
// ----------- //
|
|
|
|
// FusedAdd32 returns x*y + z for float32 operands.
//
// The asmcheck annotations expect the expression to compile to a single
// FMADDS instruction on s390x, ppc64x, arm64 and riscv64.
func FusedAdd32(x, y, z float32) float32 {
	// s390x:"FMADDS\t"
	// ppc64x:"FMADDS\t"
	// arm64:"FMADDS"
	// riscv64:"FMADDS\t"
	return x*y + z
}
|
|
|
|
// FusedSub32_a returns x*y - z for float32 operands.
//
// The asmcheck annotations expect an FMSUBS instruction on s390x, ppc64x
// and riscv64.
func FusedSub32_a(x, y, z float32) float32 {
	// s390x:"FMSUBS\t"
	// ppc64x:"FMSUBS\t"
	// riscv64:"FMSUBS\t"
	return x*y - z
}
|
|
|
|
// FusedSub32_b returns z - x*y for float32 operands.
//
// The asmcheck annotations expect FMSUBS on arm64 and FNMSUBS on riscv64.
func FusedSub32_b(x, y, z float32) float32 {
	// arm64:"FMSUBS"
	// riscv64:"FNMSUBS\t"
	return z - x*y
}
|
|
|
|
// FusedAdd64 returns x*y + z for float64 operands.
//
// The asmcheck annotations expect a single fused multiply-add, spelled
// FMADD on s390x and ppc64x and FMADDD on arm64 and riscv64.
func FusedAdd64(x, y, z float64) float64 {
	// s390x:"FMADD\t"
	// ppc64x:"FMADD\t"
	// arm64:"FMADDD"
	// riscv64:"FMADDD\t"
	return x*y + z
}
|
|
|
|
// FusedSub64_a returns x*y - z for float64 operands.
//
// The asmcheck annotations expect a fused multiply-subtract, spelled
// FMSUB on s390x and ppc64x and FMSUBD on riscv64.
func FusedSub64_a(x, y, z float64) float64 {
	// s390x:"FMSUB\t"
	// ppc64x:"FMSUB\t"
	// riscv64:"FMSUBD\t"
	return x*y - z
}
|
|
|
|
// FusedSub64_b returns z - x*y for float64 operands.
//
// The asmcheck annotations expect FMSUBD on arm64 and FNMSUBD on riscv64.
func FusedSub64_b(x, y, z float64) float64 {
	// arm64:"FMSUBD"
	// riscv64:"FNMSUBD\t"
	return z - x*y
}
|
|
|
|
// Cmp reports whether f lies strictly outside the closed interval [-4, 4].
//
// The asmcheck annotations expect arm64 to emit FCMPD followed by one of
// the conditional branches BGT, BLE, BMI or BPL, and to emit neither a
// CSET of the GT condition nor a CBZ.
func Cmp(f float64) bool {
	// arm64:"FCMPD","(BGT|BLE|BMI|BPL)",-"CSET\tGT",-"CBZ"
	return f > 4 || f < -4
}
|
|
|
|
// CmpZero64 reports whether the float64 f is less than or equal to zero.
//
// The asmcheck annotations expect s390x to emit LTDBR and no FCMPU.
func CmpZero64(f float64) bool {
	// s390x:"LTDBR",-"FCMPU"
	return f <= 0
}
|
|
|
|
// CmpZero32 reports whether the float32 f is less than or equal to zero.
//
// The asmcheck annotations expect s390x to emit LTEBR and no CEBR.
func CmpZero32(f float32) bool {
	// s390x:"LTEBR",-"CEBR"
	return f <= 0
}
|
|
|
|
// CmpWithSub reports whether the difference a - b is less than or equal
// to zero.
//
// The asmcheck annotation expects s390x to emit no LTDBR for the
// comparison that follows the subtraction.
func CmpWithSub(a float64, b float64) bool {
	f := a - b
	// s390x:-"LTDBR"
	return f <= 0
}
|
|
|
|
// CmpWithAdd reports whether the sum a + b is less than or equal to zero.
//
// The asmcheck annotation expects s390x to emit no LTDBR for the
// comparison that follows the addition.
func CmpWithAdd(a float64, b float64) bool {
	f := a + b
	// s390x:-"LTDBR"
	return f <= 0
}
|
|
|
|
// ---------------- //
//    Non-floats    //
// ---------------- //

// We should make sure that the compiler doesn't generate floating point
// instructions for non-float operations on Plan 9, because floating point
// operations are not allowed in the note handler.
|
|
|
|
// ArrayZero returns a zero-valued 16-byte array.
//
// The asmcheck annotations expect amd64 to zero the array with MOVUPS,
// while forbidding MOVUPS when the target is plan9/amd64.
func ArrayZero() [16]byte {
	// amd64:"MOVUPS"
	// plan9/amd64/:-"MOVUPS"
	var a [16]byte
	return a
}
|
|
|
|
// ArrayCopy returns a copy of the 16-byte array a through the named
// result b.
//
// The asmcheck annotations expect amd64 to perform the copy with MOVUPS,
// while forbidding MOVUPS when the target is plan9/amd64.
func ArrayCopy(a [16]byte) (b [16]byte) {
	// amd64:"MOVUPS"
	// plan9/amd64/:-"MOVUPS"
	b = a
	return
}
|
|
|
|
// ---------------- //
//  Float Min/Max   //
// ---------------- //
|
|
|
|
// Float64Min returns the smaller of a and b using the built-in min.
//
// The asmcheck annotations expect a native minimum instruction on amd64,
// arm64, loong64, riscv64 and on ppc64 at the power9 and power10 levels.
func Float64Min(a, b float64) float64 {
	// amd64:"MINSD"
	// arm64:"FMIND"
	// loong64:"FMIND"
	// riscv64:"FMIN"
	// ppc64/power9:"XSMINJDP"
	// ppc64/power10:"XSMINJDP"
	return min(a, b)
}
|
|
|
|
// Float64Max returns the larger of a and b using the built-in max.
//
// The asmcheck annotations expect a native maximum instruction on arm64,
// loong64, riscv64 and on ppc64 at the power9 and power10 levels.
//
// NOTE(review): the amd64 annotation expects MINSD rather than a max
// instruction. Presumably amd64 lowers max through a negated min, so this
// is kept unchanged; confirm against the amd64 lowering rules before
// editing it.
func Float64Max(a, b float64) float64 {
	// amd64:"MINSD"
	// arm64:"FMAXD"
	// loong64:"FMAXD"
	// riscv64:"FMAX"
	// ppc64/power9:"XSMAXJDP"
	// ppc64/power10:"XSMAXJDP"
	return max(a, b)
}
|
|
|
|
// Float32Min returns the smaller of a and b using the built-in min.
//
// The asmcheck annotations expect a native minimum instruction on amd64,
// arm64, loong64, riscv64 and on ppc64 at the power9 and power10 levels.
func Float32Min(a, b float32) float32 {
	// amd64:"MINSS"
	// arm64:"FMINS"
	// loong64:"FMINF"
	// riscv64:"FMINS"
	// ppc64/power9:"XSMINJDP"
	// ppc64/power10:"XSMINJDP"
	return min(a, b)
}
|
|
|
|
// Float32Max returns the larger of a and b using the built-in max.
//
// The asmcheck annotations expect a native maximum instruction on arm64,
// loong64, riscv64 and on ppc64 at the power9 and power10 levels.
//
// NOTE(review): the amd64 annotation expects MINSS rather than a max
// instruction. Presumably amd64 lowers max through a negated min, so this
// is kept unchanged; confirm against the amd64 lowering rules before
// editing it.
func Float32Max(a, b float32) float32 {
	// amd64:"MINSS"
	// arm64:"FMAXS"
	// loong64:"FMAXF"
	// riscv64:"FMAXS"
	// ppc64/power9:"XSMAXJDP"
	// ppc64/power10:"XSMAXJDP"
	return max(a, b)
}
|
|
|
|
// ------------------------ //
//  Constant Optimizations  //
// ------------------------ //
|
|
|
|
// Float32Constant returns the float32 constant 49.0.
//
// The asmcheck annotations expect ppc64x at the power8 and power9 levels
// to load the value with FMOVS from the symbol $f32.42440000(SB), and at
// the power10 level to materialize it with XXSPLTIDP and the immediate
// 1111752704.
func Float32Constant() float32 {
	// ppc64x/power8:"FMOVS\t[$]f32\\.42440000\\(SB\\)"
	// ppc64x/power9:"FMOVS\t[$]f32\\.42440000\\(SB\\)"
	// ppc64x/power10:"XXSPLTIDP\t[$]1111752704,"
	return 49.0
}
|
|
|
|
// Float64Constant returns the float64 constant 49.0.
//
// The asmcheck annotations expect ppc64x at the power8 and power9 levels
// to load the value with FMOVD from the symbol
// $f64.4048800000000000(SB), and at the power10 level to materialize it
// with XXSPLTIDP and the immediate 1111752704.
func Float64Constant() float64 {
	// ppc64x/power8:"FMOVD\t[$]f64\\.4048800000000000\\(SB\\)"
	// ppc64x/power9:"FMOVD\t[$]f64\\.4048800000000000\\(SB\\)"
	// ppc64x/power10:"XXSPLTIDP\t[$]1111752704,"
	return 49.0
}
|
|
|
|
// Float32DenormalConstant returns the float32 constant 0x1p-127.
//
// The asmcheck annotation expects ppc64x to load the value with FMOVS
// from the symbol $f32.00400000(SB).
func Float32DenormalConstant() float32 {
	// ppc64x:"FMOVS\t[$]f32\\.00400000\\(SB\\)"
	return 0x1p-127
}
|
|
|
|
// Float64DenormalFloat32Constant returns the float64 constant 0x1p-127.
//
// A float64 constant which can be exactly represented as a
// denormal float32 value. On ppc64x, denormal values cannot
// be used with XXSPLTIDP.
//
// The asmcheck annotation therefore expects ppc64x to load the value
// with FMOVD from the symbol $f64.3800000000000000(SB).
func Float64DenormalFloat32Constant() float64 {
	// ppc64x:"FMOVD\t[$]f64\\.3800000000000000\\(SB\\)"
	return 0x1p-127
}
|
|
|
|
// Float64ConstantStore stores the float64 constant 5.432 through p.
// p must be non-nil.
//
// The asmcheck annotation expects amd64 to emit a MOVQ whose immediate
// operand is the integer 4617801906721357038.
func Float64ConstantStore(p *float64) {
	// amd64: "MOVQ\t[$]4617801906721357038"
	*p = 5.432
}
|
|
// Float32ConstantStore stores the float32 constant 5.432 through p.
// p must be non-nil.
//
// The asmcheck annotation expects amd64 to emit a MOVL whose immediate
// operand is the integer 1085133554.
func Float32ConstantStore(p *float32) {
	// amd64: "MOVL\t[$]1085133554"
	*p = 5.432
}
|