2021-07-02 22:02:30 -06:00
|
|
|
// asmcheck
|
|
|
|
|
|
|
|
// Copyright 2021 The Go Authors. All rights reserved.
|
|
|
|
// Use of this source code is governed by a BSD-style
|
|
|
|
// license that can be found in the LICENSE file.
|
|
|
|
|
|
|
|
package codegen
|
|
|
|
|
|
|
|
func andn64(x, y int64) int64 {
|
|
|
|
// amd64/v3:"ANDNQ"
|
|
|
|
return x &^ y
|
|
|
|
}
|
|
|
|
|
|
|
|
func andn32(x, y int32) int32 {
|
|
|
|
// amd64/v3:"ANDNL"
|
|
|
|
return x &^ y
|
|
|
|
}
|
|
|
|
|
|
|
|
func blsi64(x int64) int64 {
|
|
|
|
// amd64/v3:"BLSIQ"
|
|
|
|
return x & -x
|
|
|
|
}
|
|
|
|
|
|
|
|
func blsi32(x int32) int32 {
|
|
|
|
// amd64/v3:"BLSIL"
|
|
|
|
return x & -x
|
|
|
|
}
|
|
|
|
|
|
|
|
func blsmsk64(x int64) int64 {
|
|
|
|
// amd64/v3:"BLSMSKQ"
|
|
|
|
return x ^ (x - 1)
|
|
|
|
}
|
|
|
|
|
|
|
|
func blsmsk32(x int32) int32 {
|
|
|
|
// amd64/v3:"BLSMSKL"
|
|
|
|
return x ^ (x - 1)
|
|
|
|
}
|
|
|
|
|
|
|
|
func blsr64(x int64) int64 {
|
|
|
|
// amd64/v3:"BLSRQ"
|
|
|
|
return x & (x - 1)
|
|
|
|
}
|
|
|
|
|
|
|
|
func blsr32(x int32) int32 {
|
|
|
|
// amd64/v3:"BLSRL"
|
|
|
|
return x & (x - 1)
|
|
|
|
}
|
2022-03-02 01:32:16 -07:00
|
|
|
|
2022-11-05 23:37:13 -06:00
|
|
|
func isPowerOfTwo64(x int64) bool {
|
|
|
|
// amd64/v3:"BLSRQ",-"TESTQ",-"CALL"
|
|
|
|
return blsr64(x) == 0
|
|
|
|
}
|
|
|
|
|
|
|
|
func isPowerOfTwo32(x int32) bool {
|
|
|
|
// amd64/v3:"BLSRL",-"TESTL",-"CALL"
|
|
|
|
return blsr32(x) == 0
|
|
|
|
}
|
|
|
|
|
|
|
|
func isPowerOfTwoSelect64(x, a, b int64) int64 {
|
|
|
|
var r int64
|
|
|
|
// amd64/v3:"BLSRQ",-"TESTQ",-"CALL"
|
|
|
|
if isPowerOfTwo64(x) {
|
|
|
|
r = a
|
|
|
|
} else {
|
|
|
|
r = b
|
|
|
|
}
|
|
|
|
// amd64/v3:"CMOVQEQ",-"TESTQ",-"CALL"
|
|
|
|
return r * 2 // force return blocks joining
|
|
|
|
}
|
|
|
|
|
|
|
|
func isPowerOfTwoSelect32(x, a, b int32) int32 {
|
|
|
|
var r int32
|
|
|
|
// amd64/v3:"BLSRL",-"TESTL",-"CALL"
|
|
|
|
if isPowerOfTwo32(x) {
|
|
|
|
r = a
|
|
|
|
} else {
|
|
|
|
r = b
|
|
|
|
}
|
|
|
|
// amd64/v3:"CMOVLEQ",-"TESTL",-"CALL"
|
|
|
|
return r * 2 // force return blocks joining
|
|
|
|
}
|
|
|
|
|
|
|
|
func isPowerOfTwoBranch64(x int64, a func(bool), b func(string)) {
|
|
|
|
// amd64/v3:"BLSRQ",-"TESTQ",-"CALL"
|
|
|
|
if isPowerOfTwo64(x) {
|
|
|
|
a(true)
|
|
|
|
} else {
|
|
|
|
b("false")
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func isPowerOfTwoBranch32(x int32, a func(bool), b func(string)) {
|
|
|
|
// amd64/v3:"BLSRL",-"TESTL",-"CALL"
|
|
|
|
if isPowerOfTwo32(x) {
|
|
|
|
a(true)
|
|
|
|
} else {
|
|
|
|
b("false")
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func isNotPowerOfTwo64(x int64) bool {
|
|
|
|
// amd64/v3:"BLSRQ",-"TESTQ",-"CALL"
|
|
|
|
return blsr64(x) != 0
|
|
|
|
}
|
|
|
|
|
|
|
|
func isNotPowerOfTwo32(x int32) bool {
|
|
|
|
// amd64/v3:"BLSRL",-"TESTL",-"CALL"
|
|
|
|
return blsr32(x) != 0
|
|
|
|
}
|
|
|
|
|
|
|
|
func isNotPowerOfTwoSelect64(x, a, b int64) int64 {
|
|
|
|
var r int64
|
|
|
|
// amd64/v3:"BLSRQ",-"TESTQ",-"CALL"
|
|
|
|
if isNotPowerOfTwo64(x) {
|
|
|
|
r = a
|
|
|
|
} else {
|
|
|
|
r = b
|
|
|
|
}
|
|
|
|
// amd64/v3:"CMOVQNE",-"TESTQ",-"CALL"
|
|
|
|
return r * 2 // force return blocks joining
|
|
|
|
}
|
|
|
|
|
|
|
|
func isNotPowerOfTwoSelect32(x, a, b int32) int32 {
|
|
|
|
var r int32
|
|
|
|
// amd64/v3:"BLSRL",-"TESTL",-"CALL"
|
|
|
|
if isNotPowerOfTwo32(x) {
|
|
|
|
r = a
|
|
|
|
} else {
|
|
|
|
r = b
|
|
|
|
}
|
|
|
|
// amd64/v3:"CMOVLNE",-"TESTL",-"CALL"
|
|
|
|
return r * 2 // force return blocks joining
|
|
|
|
}
|
|
|
|
|
|
|
|
func isNotPowerOfTwoBranch64(x int64, a func(bool), b func(string)) {
|
|
|
|
// amd64/v3:"BLSRQ",-"TESTQ",-"CALL"
|
|
|
|
if isNotPowerOfTwo64(x) {
|
|
|
|
a(true)
|
|
|
|
} else {
|
|
|
|
b("false")
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func isNotPowerOfTwoBranch32(x int32, a func(bool), b func(string)) {
|
|
|
|
// amd64/v3:"BLSRL",-"TESTL",-"CALL"
|
|
|
|
if isNotPowerOfTwo32(x) {
|
|
|
|
a(true)
|
|
|
|
} else {
|
|
|
|
b("false")
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2022-04-08 02:44:13 -06:00
|
|
|
func sarx64(x, y int64) int64 {
|
|
|
|
// amd64/v3:"SARXQ"
|
|
|
|
return x >> y
|
|
|
|
}
|
|
|
|
|
|
|
|
func sarx32(x, y int32) int32 {
|
|
|
|
// amd64/v3:"SARXL"
|
|
|
|
return x >> y
|
|
|
|
}
|
|
|
|
|
2022-04-08 03:33:50 -06:00
|
|
|
func sarx64_load(x []int64, i int) int64 {
|
|
|
|
// amd64/v3: `SARXQ\t[A-Z]+[0-9]*, \([A-Z]+[0-9]*\)\([A-Z]+[0-9]*\*8\), [A-Z]+[0-9]*`
|
|
|
|
s := x[i] >> (i & 63)
|
|
|
|
// amd64/v3: `SARXQ\t[A-Z]+[0-9]*, 8\([A-Z]+[0-9]*\)\([A-Z]+[0-9]*\*8\), [A-Z]+[0-9]*`
|
|
|
|
s = x[i+1] >> (s & 63)
|
|
|
|
return s
|
|
|
|
}
|
|
|
|
|
|
|
|
func sarx32_load(x []int32, i int) int32 {
|
|
|
|
// amd64/v3: `SARXL\t[A-Z]+[0-9]*, \([A-Z]+[0-9]*\)\([A-Z]+[0-9]*\*4\), [A-Z]+[0-9]*`
|
|
|
|
s := x[i] >> (i & 63)
|
|
|
|
// amd64/v3: `SARXL\t[A-Z]+[0-9]*, 4\([A-Z]+[0-9]*\)\([A-Z]+[0-9]*\*4\), [A-Z]+[0-9]*`
|
|
|
|
s = x[i+1] >> (s & 63)
|
|
|
|
return s
|
|
|
|
}
|
|
|
|
|
2022-04-09 00:40:40 -06:00
|
|
|
func shlrx64(x, y uint64) uint64 {
|
|
|
|
// amd64/v3:"SHRXQ"
|
|
|
|
s := x >> y
|
|
|
|
// amd64/v3:"SHLXQ"
|
|
|
|
s = s << y
|
|
|
|
return s
|
|
|
|
}
|
|
|
|
|
|
|
|
func shlrx32(x, y uint32) uint32 {
|
|
|
|
// amd64/v3:"SHRXL"
|
|
|
|
s := x >> y
|
|
|
|
// amd64/v3:"SHLXL"
|
|
|
|
s = s << y
|
|
|
|
return s
|
|
|
|
}
|
|
|
|
|
|
|
|
func shlrx64_load(x []uint64, i int, s uint64) uint64 {
|
2022-03-02 01:32:16 -07:00
|
|
|
// amd64/v3: `SHRXQ\t[A-Z]+[0-9]*, \([A-Z]+[0-9]*\)\([A-Z]+[0-9]*\*8\), [A-Z]+[0-9]*`
|
|
|
|
s = x[i] >> i
|
|
|
|
// amd64/v3: `SHLXQ\t[A-Z]+[0-9]*, 8\([A-Z]+[0-9]*\)\([A-Z]+[0-9]*\*8\), [A-Z]+[0-9]*`
|
|
|
|
s = x[i+1] << s
|
|
|
|
return s
|
|
|
|
}
|
|
|
|
|
2022-04-09 00:40:40 -06:00
|
|
|
func shlrx32_load(x []uint32, i int, s uint32) uint32 {
|
2022-03-02 01:32:16 -07:00
|
|
|
// amd64/v3: `SHRXL\t[A-Z]+[0-9]*, \([A-Z]+[0-9]*\)\([A-Z]+[0-9]*\*4\), [A-Z]+[0-9]*`
|
|
|
|
s = x[i] >> i
|
|
|
|
// amd64/v3: `SHLXL\t[A-Z]+[0-9]*, 4\([A-Z]+[0-9]*\)\([A-Z]+[0-9]*\*4\), [A-Z]+[0-9]*`
|
|
|
|
s = x[i+1] << s
|
|
|
|
return s
|
|
|
|
}
|