| // Copyright 2026 The Go Authors. All rights reserved. |
| // Use of this source code is governed by a BSD-style |
| // license that can be found in the LICENSE file. |
| |
| //go:build goexperiment.simd && arm64 |
| |
| package simd_test |
| |
| import ( |
| "simd/archsimd" |
| "testing" |
| ) |
| |
| // --- Equal (hardware: CMEQ / FCMEQ) --- |
| |
| func TestEqual(t *testing.T) { |
| testInt8x16Compare(t, archsimd.Int8x16.Equal, equalSlice[int8]) |
| testInt16x8Compare(t, archsimd.Int16x8.Equal, equalSlice[int16]) |
| testInt32x4Compare(t, archsimd.Int32x4.Equal, equalSlice[int32]) |
| testInt64x2Compare(t, archsimd.Int64x2.Equal, equalSlice[int64]) |
| |
| testUint8x16Compare(t, archsimd.Uint8x16.Equal, equalSlice[uint8]) |
| testUint16x8Compare(t, archsimd.Uint16x8.Equal, equalSlice[uint16]) |
| testUint32x4Compare(t, archsimd.Uint32x4.Equal, equalSlice[uint32]) |
| testUint64x2Compare(t, archsimd.Uint64x2.Equal, equalSlice[uint64]) |
| |
| testFloat32x4Compare(t, archsimd.Float32x4.Equal, equalSlice[float32]) |
| testFloat64x2Compare(t, archsimd.Float64x2.Equal, equalSlice[float64]) |
| } |
| |
| // --- Greater (hardware: CMGT/CMHI for signed/unsigned, FCMGT for float) --- |
| |
| func TestGreater(t *testing.T) { |
| testInt8x16Compare(t, archsimd.Int8x16.Greater, greaterSlice[int8]) |
| testInt16x8Compare(t, archsimd.Int16x8.Greater, greaterSlice[int16]) |
| testInt32x4Compare(t, archsimd.Int32x4.Greater, greaterSlice[int32]) |
| testInt64x2Compare(t, archsimd.Int64x2.Greater, greaterSlice[int64]) |
| |
| testUint8x16Compare(t, archsimd.Uint8x16.Greater, greaterSlice[uint8]) |
| testUint16x8Compare(t, archsimd.Uint16x8.Greater, greaterSlice[uint16]) |
| testUint32x4Compare(t, archsimd.Uint32x4.Greater, greaterSlice[uint32]) |
| testUint64x2Compare(t, archsimd.Uint64x2.Greater, greaterSlice[uint64]) |
| |
| testFloat32x4Compare(t, archsimd.Float32x4.Greater, greaterSlice[float32]) |
| testFloat64x2Compare(t, archsimd.Float64x2.Greater, greaterSlice[float64]) |
| } |
| |
| // --- GreaterEqual (hardware: CMGE/CMHS for signed/unsigned, FCMGE for float) --- |
| |
| func TestGreaterEqual(t *testing.T) { |
| testInt8x16Compare(t, archsimd.Int8x16.GreaterEqual, greaterEqualSlice[int8]) |
| testInt16x8Compare(t, archsimd.Int16x8.GreaterEqual, greaterEqualSlice[int16]) |
| testInt32x4Compare(t, archsimd.Int32x4.GreaterEqual, greaterEqualSlice[int32]) |
| testInt64x2Compare(t, archsimd.Int64x2.GreaterEqual, greaterEqualSlice[int64]) |
| |
| testUint8x16Compare(t, archsimd.Uint8x16.GreaterEqual, greaterEqualSlice[uint8]) |
| testUint16x8Compare(t, archsimd.Uint16x8.GreaterEqual, greaterEqualSlice[uint16]) |
| testUint32x4Compare(t, archsimd.Uint32x4.GreaterEqual, greaterEqualSlice[uint32]) |
| testUint64x2Compare(t, archsimd.Uint64x2.GreaterEqual, greaterEqualSlice[uint64]) |
| |
| testFloat32x4Compare(t, archsimd.Float32x4.GreaterEqual, greaterEqualSlice[float32]) |
| testFloat64x2Compare(t, archsimd.Float64x2.GreaterEqual, greaterEqualSlice[float64]) |
| } |
| |
| // --- Less (derived: y.Greater(x)) --- |
| |
| func TestLess(t *testing.T) { |
| testInt8x16Compare(t, archsimd.Int8x16.Less, lessSlice[int8]) |
| testInt16x8Compare(t, archsimd.Int16x8.Less, lessSlice[int16]) |
| testInt32x4Compare(t, archsimd.Int32x4.Less, lessSlice[int32]) |
| testInt64x2Compare(t, archsimd.Int64x2.Less, lessSlice[int64]) |
| |
| testUint8x16Compare(t, archsimd.Uint8x16.Less, lessSlice[uint8]) |
| testUint16x8Compare(t, archsimd.Uint16x8.Less, lessSlice[uint16]) |
| testUint32x4Compare(t, archsimd.Uint32x4.Less, lessSlice[uint32]) |
| testUint64x2Compare(t, archsimd.Uint64x2.Less, lessSlice[uint64]) |
| |
| testFloat32x4Compare(t, archsimd.Float32x4.Less, lessSlice[float32]) |
| testFloat64x2Compare(t, archsimd.Float64x2.Less, lessSlice[float64]) |
| } |
| |
| // --- LessEqual (derived: y.GreaterEqual(x)) --- |
| |
| func TestLessEqual(t *testing.T) { |
| testInt8x16Compare(t, archsimd.Int8x16.LessEqual, lessEqualSlice[int8]) |
| testInt16x8Compare(t, archsimd.Int16x8.LessEqual, lessEqualSlice[int16]) |
| testInt32x4Compare(t, archsimd.Int32x4.LessEqual, lessEqualSlice[int32]) |
| testInt64x2Compare(t, archsimd.Int64x2.LessEqual, lessEqualSlice[int64]) |
| |
| testUint8x16Compare(t, archsimd.Uint8x16.LessEqual, lessEqualSlice[uint8]) |
| testUint16x8Compare(t, archsimd.Uint16x8.LessEqual, lessEqualSlice[uint16]) |
| testUint32x4Compare(t, archsimd.Uint32x4.LessEqual, lessEqualSlice[uint32]) |
| testUint64x2Compare(t, archsimd.Uint64x2.LessEqual, lessEqualSlice[uint64]) |
| |
| testFloat32x4Compare(t, archsimd.Float32x4.LessEqual, lessEqualSlice[float32]) |
| testFloat64x2Compare(t, archsimd.Float64x2.LessEqual, lessEqualSlice[float64]) |
| } |
| |
| // --- NotEqual (derived: Equal().Not()) --- |
| |
| func TestNotEqual(t *testing.T) { |
| testInt8x16Compare(t, archsimd.Int8x16.NotEqual, notEqualSlice[int8]) |
| testInt16x8Compare(t, archsimd.Int16x8.NotEqual, notEqualSlice[int16]) |
| testInt32x4Compare(t, archsimd.Int32x4.NotEqual, notEqualSlice[int32]) |
| testInt64x2Compare(t, archsimd.Int64x2.NotEqual, notEqualSlice[int64]) |
| |
| testUint8x16Compare(t, archsimd.Uint8x16.NotEqual, notEqualSlice[uint8]) |
| testUint16x8Compare(t, archsimd.Uint16x8.NotEqual, notEqualSlice[uint16]) |
| testUint32x4Compare(t, archsimd.Uint32x4.NotEqual, notEqualSlice[uint32]) |
| testUint64x2Compare(t, archsimd.Uint64x2.NotEqual, notEqualSlice[uint64]) |
| |
| testFloat32x4Compare(t, archsimd.Float32x4.NotEqual, notEqualSlice[float32]) |
| testFloat64x2Compare(t, archsimd.Float64x2.NotEqual, notEqualSlice[float64]) |
| } |
| |
| // --- Masked: zero elements where mask is false --- |
| |
| func TestMasked(t *testing.T) { |
| // Test Masked for Int8x16 |
| forSlicePair(t, int8s, 16, func(x, y []int8) bool { |
| t.Helper() |
| a := archsimd.LoadInt8x16(x) |
| mask := archsimd.LoadInt8x16(y).Greater(archsimd.Int8x16{}) // mask: y > 0 |
| g := make([]int8, 16) |
| a.Masked(mask).Store(g) |
| w := make([]int8, 16) |
| for i := range w { |
| if y[i] > 0 { |
| w[i] = x[i] |
| } |
| } |
| return checkSlicesLogInput(t, g, w, 0.0, func() { t.Helper(); t.Logf("x=%v, y=%v", x, y) }) |
| }) |
| |
| // Test Masked for Float64x2 |
| forSlicePair(t, float64s, 2, func(x, y []float64) bool { |
| t.Helper() |
| a := archsimd.LoadFloat64x2(x) |
| mask := archsimd.LoadFloat64x2(y).Greater(archsimd.Float64x2{}) // mask: y > 0 |
| g := make([]float64, 2) |
| a.Masked(mask).Store(g) |
| w := make([]float64, 2) |
| for i := range w { |
| if y[i] > 0 { |
| w[i] = x[i] |
| } |
| } |
| return checkSlicesLogInput(t, g, w, 0.0, func() { t.Helper(); t.Logf("x=%v, y=%v", x, y) }) |
| }) |
| } |
| |
| // --- IfElse: set elements to y where mask is true, keep x where true --- |
| |
| func TestIfElse(t *testing.T) { |
| // Test Merge for Int8x16 |
| forSliceTriple(t, int8s, 16, func(x, y, m []int8) bool { |
| t.Helper() |
| a := archsimd.LoadInt8x16(x) |
| b := archsimd.LoadInt8x16(y) |
| mask := archsimd.LoadInt8x16(m).Greater(archsimd.Int8x16{}) // mask: m > 0 |
| g := make([]int8, 16) |
| a.IfElse(mask, b).Store(g) |
| w := make([]int8, 16) |
| for i := range w { |
| if m[i] > 0 { |
| w[i] = y[i] |
| } else { |
| w[i] = x[i] |
| } |
| } |
| return checkSlicesLogInput(t, g, w, 0.0, func() { t.Helper(); t.Logf("x=%v, y=%v, m=%v", x, y, m) }) |
| }) |
| |
| // Test Merge for Float32x4 |
| forSliceTriple(t, float32s, 4, func(x, y, m []float32) bool { |
| t.Helper() |
| a := archsimd.LoadFloat32x4(x) |
| b := archsimd.LoadFloat32x4(y) |
| mask := archsimd.LoadFloat32x4(m).Greater(archsimd.Float32x4{}) // mask: m > 0 |
| g := make([]float32, 4) |
| a.IfElse(mask, b).Store(g) |
| w := make([]float32, 4) |
| for i := range w { |
| if m[i] > 0 { |
| w[i] = y[i] |
| } else { |
| w[i] = x[i] |
| } |
| } |
| return checkSlicesLogInput(t, g, w, 0.0, func() { t.Helper(); t.Logf("x=%v, y=%v, m=%v", x, y, m) }) |
| }) |
| } |