2018-02-26 17:59:58 -07:00
|
|
|
// asmcheck
|
|
|
|
|
2018-03-02 13:06:09 -07:00
|
|
|
// Copyright 2018 The Go Authors. All rights reserved.
|
|
|
|
// Use of this source code is governed by a BSD-style
|
|
|
|
// license that can be found in the LICENSE file.
|
|
|
|
|
2018-02-26 17:59:58 -07:00
|
|
|
package codegen
|
|
|
|
|
2020-10-23 11:12:34 -06:00
|
|
|
import "math/bits"
|
|
|
|
|
2018-03-10 15:51:05 -07:00
|
|
|
// ------------------- //
|
|
|
|
// const rotates //
|
|
|
|
// ------------------- //
|
|
|
|
|
|
|
|
func rot64(x uint64) uint64 {
|
|
|
|
var a uint64
|
|
|
|
|
|
|
|
// amd64:"ROLQ\t[$]7"
|
|
|
|
// arm64:"ROR\t[$]57"
|
2020-05-11 10:44:48 -06:00
|
|
|
// s390x:"RISBGZ\t[$]0, [$]63, [$]7, "
|
2018-10-15 10:53:07 -06:00
|
|
|
// ppc64:"ROTL\t[$]7"
|
2018-03-10 15:51:05 -07:00
|
|
|
// ppc64le:"ROTL\t[$]7"
|
|
|
|
a += x<<7 | x>>57
|
|
|
|
|
|
|
|
// amd64:"ROLQ\t[$]8"
|
|
|
|
// arm64:"ROR\t[$]56"
|
2020-05-11 10:44:48 -06:00
|
|
|
// s390x:"RISBGZ\t[$]0, [$]63, [$]8, "
|
2018-10-15 10:53:07 -06:00
|
|
|
// ppc64:"ROTL\t[$]8"
|
2018-03-10 15:51:05 -07:00
|
|
|
// ppc64le:"ROTL\t[$]8"
|
|
|
|
a += x<<8 + x>>56
|
|
|
|
|
|
|
|
// amd64:"ROLQ\t[$]9"
|
|
|
|
// arm64:"ROR\t[$]55"
|
2020-05-11 10:44:48 -06:00
|
|
|
// s390x:"RISBGZ\t[$]0, [$]63, [$]9, "
|
2018-10-15 10:53:07 -06:00
|
|
|
// ppc64:"ROTL\t[$]9"
|
2018-03-10 15:51:05 -07:00
|
|
|
// ppc64le:"ROTL\t[$]9"
|
|
|
|
a += x<<9 ^ x>>55
|
|
|
|
|
|
|
|
return a
|
|
|
|
}
|
|
|
|
|
2018-02-26 17:59:58 -07:00
|
|
|
func rot32(x uint32) uint32 {
|
|
|
|
var a uint32
|
2018-03-10 15:51:05 -07:00
|
|
|
|
|
|
|
// amd64:"ROLL\t[$]7"
|
|
|
|
// arm:"MOVW\tR\\d+@>25"
|
|
|
|
// arm64:"RORW\t[$]25"
|
|
|
|
// s390x:"RLL\t[$]7"
|
2018-10-15 10:53:07 -06:00
|
|
|
// ppc64:"ROTLW\t[$]7"
|
2018-03-10 15:51:05 -07:00
|
|
|
// ppc64le:"ROTLW\t[$]7"
|
|
|
|
a += x<<7 | x>>25
|
|
|
|
|
|
|
|
// amd64:`ROLL\t[$]8`
|
|
|
|
// arm:"MOVW\tR\\d+@>24"
|
|
|
|
// arm64:"RORW\t[$]24"
|
|
|
|
// s390x:"RLL\t[$]8"
|
2018-10-15 10:53:07 -06:00
|
|
|
// ppc64:"ROTLW\t[$]8"
|
2018-03-10 15:51:05 -07:00
|
|
|
// ppc64le:"ROTLW\t[$]8"
|
|
|
|
a += x<<8 + x>>24
|
|
|
|
|
|
|
|
// amd64:"ROLL\t[$]9"
|
|
|
|
// arm:"MOVW\tR\\d+@>23"
|
|
|
|
// arm64:"RORW\t[$]23"
|
|
|
|
// s390x:"RLL\t[$]9"
|
2018-10-15 10:53:07 -06:00
|
|
|
// ppc64:"ROTLW\t[$]9"
|
2018-03-10 15:51:05 -07:00
|
|
|
// ppc64le:"ROTLW\t[$]9"
|
|
|
|
a += x<<9 ^ x>>23
|
|
|
|
|
2018-02-26 17:59:58 -07:00
|
|
|
return a
|
|
|
|
}
|
|
|
|
|
2018-03-10 15:51:05 -07:00
|
|
|
func rot16(x uint16) uint16 {
|
|
|
|
var a uint16
|
|
|
|
|
|
|
|
// amd64:"ROLW\t[$]7"
|
|
|
|
a += x<<7 | x>>9
|
|
|
|
|
|
|
|
// amd64:`ROLW\t[$]8`
|
|
|
|
a += x<<8 + x>>8
|
|
|
|
|
|
|
|
// amd64:"ROLW\t[$]9"
|
|
|
|
a += x<<9 ^ x>>7
|
|
|
|
|
|
|
|
return a
|
|
|
|
}
|
|
|
|
|
|
|
|
func rot8(x uint8) uint8 {
|
|
|
|
var a uint8
|
|
|
|
|
|
|
|
// amd64:"ROLB\t[$]5"
|
|
|
|
a += x<<5 | x>>3
|
|
|
|
|
|
|
|
// amd64:`ROLB\t[$]6`
|
|
|
|
a += x<<6 + x>>2
|
|
|
|
|
|
|
|
// amd64:"ROLB\t[$]7"
|
|
|
|
a += x<<7 ^ x>>1
|
|
|
|
|
|
|
|
return a
|
|
|
|
}
|
|
|
|
|
|
|
|
// ----------------------- //
|
|
|
|
// non-const rotates //
|
|
|
|
// ----------------------- //
|
|
|
|
|
|
|
|
func rot64nc(x uint64, z uint) uint64 {
|
2018-02-26 17:59:58 -07:00
|
|
|
var a uint64
|
2018-03-10 15:51:05 -07:00
|
|
|
|
|
|
|
z &= 63
|
|
|
|
|
|
|
|
// amd64:"ROLQ"
|
2018-10-15 10:53:07 -06:00
|
|
|
// ppc64:"ROTL"
|
2018-05-09 15:35:10 -06:00
|
|
|
// ppc64le:"ROTL"
|
2018-03-10 15:51:05 -07:00
|
|
|
a += x<<z | x>>(64-z)
|
|
|
|
|
|
|
|
// amd64:"RORQ"
|
|
|
|
a += x>>z | x<<(64-z)
|
|
|
|
|
2018-02-26 17:59:58 -07:00
|
|
|
return a
|
|
|
|
}
|
2018-03-10 15:51:05 -07:00
|
|
|
|
|
|
|
func rot32nc(x uint32, z uint) uint32 {
|
|
|
|
var a uint32
|
|
|
|
|
|
|
|
z &= 31
|
|
|
|
|
|
|
|
// amd64:"ROLL"
|
2018-10-15 10:53:07 -06:00
|
|
|
// ppc64:"ROTLW"
|
2018-05-09 15:35:10 -06:00
|
|
|
// ppc64le:"ROTLW"
|
2018-03-10 15:51:05 -07:00
|
|
|
a += x<<z | x>>(32-z)
|
|
|
|
|
|
|
|
// amd64:"RORL"
|
|
|
|
a += x>>z | x<<(32-z)
|
|
|
|
|
|
|
|
return a
|
|
|
|
}
|
|
|
|
|
|
|
|
func rot16nc(x uint16, z uint) uint16 {
|
|
|
|
var a uint16
|
|
|
|
|
|
|
|
z &= 15
|
|
|
|
|
|
|
|
// amd64:"ROLW"
|
|
|
|
a += x<<z | x>>(16-z)
|
|
|
|
|
|
|
|
// amd64:"RORW"
|
|
|
|
a += x>>z | x<<(16-z)
|
|
|
|
|
|
|
|
return a
|
|
|
|
}
|
|
|
|
|
|
|
|
func rot8nc(x uint8, z uint) uint8 {
|
|
|
|
var a uint8
|
|
|
|
|
|
|
|
z &= 7
|
|
|
|
|
|
|
|
// amd64:"ROLB"
|
|
|
|
a += x<<z | x>>(8-z)
|
|
|
|
|
|
|
|
// amd64:"RORB"
|
|
|
|
a += x>>z | x<<(8-z)
|
|
|
|
|
|
|
|
return a
|
|
|
|
}
|
|
|
|
|
|
|
|
// Issue 18254: rotate after inlining
|
|
|
|
func f32(x uint32) uint32 {
|
|
|
|
// amd64:"ROLL\t[$]7"
|
|
|
|
return rot32nc(x, 7)
|
|
|
|
}
|
2020-10-23 11:12:34 -06:00
|
|
|
|
|
|
|
// --------------------------------------- //
|
|
|
|
// Combined Rotate + Masking operations //
|
|
|
|
// --------------------------------------- //
|
|
|
|
|
|
|
|
func checkMaskedRotate32(a []uint32, r int) {
|
|
|
|
i := 0
|
|
|
|
|
2021-01-05 15:44:43 -07:00
|
|
|
// ppc64le: "RLWNM\t[$]16, R[0-9]+, [$]8, [$]15, R[0-9]+"
|
|
|
|
// ppc64: "RLWNM\t[$]16, R[0-9]+, [$]8, [$]15, R[0-9]+"
|
2020-10-23 11:12:34 -06:00
|
|
|
a[i] = bits.RotateLeft32(a[i], 16) & 0xFF0000
|
|
|
|
i++
|
2021-01-05 15:44:43 -07:00
|
|
|
// ppc64le: "RLWNM\t[$]16, R[0-9]+, [$]8, [$]15, R[0-9]+"
|
|
|
|
// ppc64: "RLWNM\t[$]16, R[0-9]+, [$]8, [$]15, R[0-9]+"
|
2020-10-23 11:12:34 -06:00
|
|
|
a[i] = bits.RotateLeft32(a[i]&0xFF, 16)
|
|
|
|
i++
|
2021-01-05 15:44:43 -07:00
|
|
|
// ppc64le: "RLWNM\t[$]4, R[0-9]+, [$]20, [$]27, R[0-9]+"
|
|
|
|
// ppc64: "RLWNM\t[$]4, R[0-9]+, [$]20, [$]27, R[0-9]+"
|
2020-10-23 11:12:34 -06:00
|
|
|
a[i] = bits.RotateLeft32(a[i], 4) & 0xFF0
|
|
|
|
i++
|
2021-01-05 15:44:43 -07:00
|
|
|
// ppc64le: "RLWNM\t[$]16, R[0-9]+, [$]24, [$]31, R[0-9]+"
|
|
|
|
// ppc64: "RLWNM\t[$]16, R[0-9]+, [$]24, [$]31, R[0-9]+"
|
2020-10-23 11:12:34 -06:00
|
|
|
a[i] = bits.RotateLeft32(a[i]&0xFF0000, 16)
|
|
|
|
i++
|
|
|
|
|
2021-01-05 15:44:43 -07:00
|
|
|
// ppc64le: "RLWNM\tR[0-9]+, R[0-9]+, [$]8, [$]15, R[0-9]+"
|
|
|
|
// ppc64: "RLWNM\tR[0-9]+, R[0-9]+, [$]8, [$]15, R[0-9]+"
|
2020-10-23 11:12:34 -06:00
|
|
|
a[i] = bits.RotateLeft32(a[i], r) & 0xFF0000
|
|
|
|
i++
|
2021-01-05 15:44:43 -07:00
|
|
|
// ppc64le: "RLWNM\tR[0-9]+, R[0-9]+, [$]16, [$]23, R[0-9]+"
|
|
|
|
// ppc64: "RLWNM\tR[0-9]+, R[0-9]+, [$]16, [$]23, R[0-9]+"
|
2020-10-23 11:12:34 -06:00
|
|
|
a[i] = bits.RotateLeft32(a[3], r) & 0xFF00
|
|
|
|
i++
|
|
|
|
|
2021-01-05 15:44:43 -07:00
|
|
|
// ppc64le: "RLWNM\tR[0-9]+, R[0-9]+, [$]20, [$]11, R[0-9]+"
|
|
|
|
// ppc64: "RLWNM\tR[0-9]+, R[0-9]+, [$]20, [$]11, R[0-9]+"
|
2020-10-23 11:12:34 -06:00
|
|
|
a[i] = bits.RotateLeft32(a[3], r) & 0xFFF00FFF
|
|
|
|
i++
|
2021-01-05 15:44:43 -07:00
|
|
|
// ppc64le: "RLWNM\t[$]4, R[0-9]+, [$]20, [$]11, R[0-9]+"
|
|
|
|
// ppc64: "RLWNM\t[$]4, R[0-9]+, [$]20, [$]11, R[0-9]+"
|
2020-10-23 11:12:34 -06:00
|
|
|
a[i] = bits.RotateLeft32(a[3], 4) & 0xFFF00FFF
|
|
|
|
i++
|
|
|
|
}
|