mirror of
https://github.com/golang/go.git
synced 2025-12-08 06:10:04 +00:00
This CL also updates the internal uses of these APIs. This CL also fixed a instable output issue left by previous CLs. Change-Id: Ibc38361d35e2af0c4943a48578f3c610b74ed14d Reviewed-on: https://go-review.googlesource.com/c/go/+/720020 Reviewed-by: Cherry Mui <cherryyz@google.com> LUCI-TryBot-Result: Go LUCI <golang-scoped@luci-project-accounts.iam.gserviceaccount.com>
79 lines
1.8 KiB
Go
79 lines
1.8 KiB
Go
// asmcheck
|
|
|
|
// Copyright 2025 The Go Authors. All rights reserved.
|
|
// Use of this source code is governed by a BSD-style
|
|
// license that can be found in the LICENSE file.
|
|
|
|
// These tests check code generation of simd peephole optimizations.
|
|
|
|
//go:build goexperiment.simd
|
|
|
|
package codegen
|
|
|
|
import "simd"
|
|
|
|
func vptest1() bool {
|
|
v1 := simd.LoadUint64x2Slice([]uint64{0, 1})
|
|
v2 := simd.LoadUint64x2Slice([]uint64{0, 0})
|
|
// amd64:`VPTEST\s(.*)(.*)$`
|
|
// amd64:`SETCS\s(.*)$`
|
|
return v1.AndNot(v2).IsZero()
|
|
}
|
|
|
|
func vptest2() bool {
|
|
v1 := simd.LoadUint64x2Slice([]uint64{0, 1})
|
|
v2 := simd.LoadUint64x2Slice([]uint64{0, 0})
|
|
// amd64:`VPTEST\s(.*)(.*)$`
|
|
// amd64:`SETEQ\s(.*)$`
|
|
return v1.And(v2).IsZero()
|
|
}
|
|
|
|
type Args2 struct {
|
|
V0 simd.Uint8x32
|
|
V1 simd.Uint8x32
|
|
x string
|
|
}
|
|
|
|
//go:noinline
|
|
func simdStructNoSpill(a Args2) simd.Uint8x32 {
|
|
// amd64:-`VMOVDQU\s.*$`
|
|
return a.V0.Xor(a.V1)
|
|
}
|
|
|
|
func simdStructWrapperNoSpill(a Args2) simd.Uint8x32 {
|
|
// amd64:-`VMOVDQU\s.*$`
|
|
a.x = "test"
|
|
return simdStructNoSpill(a)
|
|
}
|
|
|
|
//go:noinline
|
|
func simdArrayNoSpill(a [1]Args2) simd.Uint8x32 {
|
|
// amd64:-`VMOVDQU\s.*$`
|
|
return a[0].V0.Xor(a[0].V1)
|
|
}
|
|
|
|
func simdArrayWrapperNoSpill(a [1]Args2) simd.Uint8x32 {
|
|
// amd64:-`VMOVDQU\s.*$`
|
|
a[0].x = "test"
|
|
return simdArrayNoSpill(a)
|
|
}
|
|
|
|
func simdFeatureGuardedMaskOpt() simd.Int16x16 {
|
|
var x, y simd.Int16x16
|
|
if simd.X86.AVX512() {
|
|
mask := simd.Mask16x16FromBits(5)
|
|
return x.Add(y).Masked(mask) // amd64:`VPADDW.Z\s.*$`
|
|
}
|
|
mask := simd.Mask16x16FromBits(5)
|
|
return x.Add(y).Masked(mask) // amd64:`VPAND\s.*$`
|
|
}
|
|
|
|
func simdMaskedMerge() simd.Int16x16 {
|
|
var x, y simd.Int16x16
|
|
if simd.X86.AVX512() {
|
|
mask := simd.Mask16x16FromBits(5)
|
|
return x.Add(y).Merge(x, mask) // amd64:-`VPBLENDVB\s.*$`
|
|
}
|
|
mask := simd.Mask16x16FromBits(5)
|
|
return x.Add(y).Merge(x, mask) // amd64:`VPBLENDVB\s.*$`
|
|
}
|