// asmcheck // Copyright 2018 The Go Authors. All rights reserved. // Use of this source code is governed by a BSD-style // license that can be found in the LICENSE file. package codegen // This file contains codegen tests related to arithmetic // simplifications and optimizations on float types. // For codegen tests on integer types, see arithmetic.go. // --------------------- // // Strength-reduce // // --------------------- // func Mul2(f float64) float64 { // 386/sse2:"ADDSD",-"MULSD" // amd64:"ADDSD",-"MULSD" // arm/7:"ADDD",-"MULD" // arm64:"FADDD",-"FMULD" // ppc64x:"FADD",-"FMUL" // riscv64:"FADDD",-"FMULD" return f * 2.0 } func DivPow2(f1, f2, f3 float64) (float64, float64, float64) { // 386/sse2:"MULSD",-"DIVSD" // amd64:"MULSD",-"DIVSD" // arm/7:"MULD",-"DIVD" // arm64:"FMULD",-"FDIVD" // ppc64x:"FMUL",-"FDIV" // riscv64:"FMULD",-"FDIVD" x := f1 / 16.0 // 386/sse2:"MULSD",-"DIVSD" // amd64:"MULSD",-"DIVSD" // arm/7:"MULD",-"DIVD" // arm64:"FMULD",-"FDIVD" // ppc64x:"FMUL",-"FDIVD" // riscv64:"FMULD",-"FDIVD" y := f2 / 0.125 // 386/sse2:"ADDSD",-"DIVSD",-"MULSD" // amd64:"ADDSD",-"DIVSD",-"MULSD" // arm/7:"ADDD",-"MULD",-"DIVD" // arm64:"FADDD",-"FMULD",-"FDIVD" // ppc64x:"FADD",-"FMUL",-"FDIV" // riscv64:"FADDD",-"FMULD",-"FDIVD" z := f3 / 0.5 return x, y, z } func indexLoad(b0 []float32, b1 float32, idx int) float32 { // arm64:`FMOVS\s\(R[0-9]+\)\(R[0-9]+<<2\),\sF[0-9]+` // loong64:`MOVF\s\(R[0-9]+\)\(R[0-9]+\),\sF[0-9]+` return b0[idx] * b1 } func indexStore(b0 []float64, b1 float64, idx int) { // arm64:`FMOVD\sF[0-9]+,\s\(R[0-9]+\)\(R[0-9]+<<3\)` // loong64:`MOVD\sF[0-9]+,\s\(R[0-9]+\)\(R[0-9]+\)` b0[idx] = b1 } // ----------- // // Fused // // ----------- // func FusedAdd32(x, y, z float32) float32 { // s390x:"FMADDS\t" // ppc64x:"FMADDS\t" // arm64:"FMADDS" // loong64:"FMADDF\t" // riscv64:"FMADDS\t" return x*y + z } func FusedSub32_a(x, y, z float32) float32 { // s390x:"FMSUBS\t" // ppc64x:"FMSUBS\t" // riscv64:"FMSUBS\t" // loong64:"FMSUBF\t" return x*y - z } func FusedSub32_b(x, y, z float32) float32 { // arm64:"FMSUBS" // loong64:"FNMSUBF\t" // riscv64:"FNMSUBS\t" return z - x*y } func FusedAdd64(x, y, z float64) float64 { // s390x:"FMADD\t" // ppc64x:"FMADD\t" // arm64:"FMADDD" // loong64:"FMADDD\t" // riscv64:"FMADDD\t" return x*y + z } func FusedSub64_a(x, y, z float64) float64 { // s390x:"FMSUB\t" // ppc64x:"FMSUB\t" // riscv64:"FMSUBD\t" // loong64:"FMSUBD\t" return x*y - z } func FusedSub64_b(x, y, z float64) float64 { // arm64:"FMSUBD" // loong64:"FNMSUBD\t" // riscv64:"FNMSUBD\t" return z - x*y } func Cmp(f float64) bool { // arm64:"FCMPD","(BGT|BLE|BMI|BPL)",-"CSET\tGT",-"CBZ" return f > 4 || f < -4 } func CmpZero64(f float64) bool { // s390x:"LTDBR",-"FCMPU" return f <= 0 } func CmpZero32(f float32) bool { // s390x:"LTEBR",-"CEBR" return f <= 0 } func CmpWithSub(a float64, b float64) bool { f := a - b // s390x:-"LTDBR" return f <= 0 } func CmpWithAdd(a float64, b float64) bool { f := a + b // s390x:-"LTDBR" return f <= 0 } // ---------------- // // Non-floats // // ---------------- // // We should make sure that the compiler doesn't generate floating point // instructions for non-float operations on Plan 9, because floating point // operations are not allowed in the note handler. func ArrayZero() [16]byte { // amd64:"MOVUPS" // plan9/amd64/:-"MOVUPS" var a [16]byte return a } func ArrayCopy(a [16]byte) (b [16]byte) { // amd64:"MOVUPS" // plan9/amd64/:-"MOVUPS" b = a return } // ---------------- // // Float Min/Max // // ---------------- // func Float64Min(a, b float64) float64 { // amd64:"MINSD" // arm64:"FMIND" // loong64:"FMIND" // riscv64:"FMIN" // ppc64/power9:"XSMINJDP" // ppc64/power10:"XSMINJDP" return min(a, b) } func Float64Max(a, b float64) float64 { // amd64:"MINSD" // arm64:"FMAXD" // loong64:"FMAXD" // riscv64:"FMAX" // ppc64/power9:"XSMAXJDP" // ppc64/power10:"XSMAXJDP" return max(a, b) } func Float32Min(a, b float32) float32 { // amd64:"MINSS" // arm64:"FMINS" // loong64:"FMINF" // riscv64:"FMINS" // ppc64/power9:"XSMINJDP" // ppc64/power10:"XSMINJDP" return min(a, b) } func Float32Max(a, b float32) float32 { // amd64:"MINSS" // arm64:"FMAXS" // loong64:"FMAXF" // riscv64:"FMAXS" // ppc64/power9:"XSMAXJDP" // ppc64/power10:"XSMAXJDP" return max(a, b) } // ------------------------ // // Constant Optimizations // // ------------------------ // func Float32Constant() float32 { // ppc64x/power8:"FMOVS\t[$]f32\\.42440000\\(SB\\)" // ppc64x/power9:"FMOVS\t[$]f32\\.42440000\\(SB\\)" // ppc64x/power10:"XXSPLTIDP\t[$]1111752704," return 49.0 } func Float64Constant() float64 { // ppc64x/power8:"FMOVD\t[$]f64\\.4048800000000000\\(SB\\)" // ppc64x/power9:"FMOVD\t[$]f64\\.4048800000000000\\(SB\\)" // ppc64x/power10:"XXSPLTIDP\t[$]1111752704," return 49.0 } func Float32DenormalConstant() float32 { // ppc64x:"FMOVS\t[$]f32\\.00400000\\(SB\\)" return 0x1p-127 } // A float64 constant which can be exactly represented as a // denormal float32 value. On ppc64x, denormal values cannot // be used with XXSPLTIDP. func Float64DenormalFloat32Constant() float64 { // ppc64x:"FMOVD\t[$]f64\\.3800000000000000\\(SB\\)" return 0x1p-127 } func Float64ConstantStore(p *float64) { // amd64: "MOVQ\t[$]4617801906721357038" *p = 5.432 } func Float32ConstantStore(p *float32) { // amd64: "MOVL\t[$]1085133554" *p = 5.432 }