| // Copyright 2025 The Go Authors. All rights reserved. |
| // Use of this source code is governed by a BSD-style |
| // license that can be found in the LICENSE file. |
| |
| //go:build goexperiment.simd && amd64 |
| |
| package simd_test |
| |
| import ( |
| "simd/archsimd" |
| "testing" |
| ) |
| |
| func TestPartInt8x32(t *testing.T) { |
| a := []int8{1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, |
| 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32} |
| b := []int8{1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, |
| 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32} |
| for i := 32; i >= 0; i-- { |
| u, _ := archsimd.LoadInt8x32Part(a[:i]) |
| c := make([]int8, 32, 32) |
| u.Store(c) |
| checkSlices(t, c, b) |
| if i > 0 { |
| b[i-1] = 0 |
| } |
| } |
| } |
| |
| func xTestPartUint8x16(t *testing.T) { |
| a := []uint8{1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16} |
| b := []uint8{1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16} |
| for i := 16; i >= 0; i-- { |
| u, _ := archsimd.LoadUint8x16Part(a[:i]) |
| c := make([]uint8, 32, 32) |
| u.Store(c) |
| checkSlices(t, c, b) |
| if i > 0 { |
| b[i-1] = 0 |
| } |
| } |
| } |
| |
| func TestPartUint8x32(t *testing.T) { |
| a := []uint8{1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, |
| 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32} |
| b := []uint8{1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, |
| 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32} |
| for i := 32; i >= 0; i-- { |
| u, _ := archsimd.LoadUint8x32Part(a[:i]) |
| c := make([]uint8, 32, 32) |
| u.Store(c) |
| checkSlices(t, c, b) |
| if i > 0 { |
| b[i-1] = 0 |
| } |
| } |
| } |
| |
| func xTestPartInt16x8(t *testing.T) { |
| a := []int16{1, 2, 3, 4, 5, 6, 7, 8} |
| b := []int16{1, 2, 3, 4, 5, 6, 7, 8} |
| for i := 8; i >= 0; i-- { |
| u, _ := archsimd.LoadInt16x8Part(a[:i]) |
| c := make([]int16, 16, 16) |
| u.Store(c) |
| checkSlices(t, c, b) |
| if i > 0 { |
| b[i-1] = 0 |
| } |
| } |
| } |
| |
| func TestPartInt16x16(t *testing.T) { |
| a := []int16{1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16} |
| b := []int16{1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16} |
| for i := 16; i >= 0; i-- { |
| u, _ := archsimd.LoadInt16x16Part(a[:i]) |
| c := make([]int16, 16, 16) |
| u.Store(c) |
| checkSlices(t, c, b) |
| if i > 0 { |
| b[i-1] = 0 |
| } |
| } |
| } |
| |
| func xTestSlicesPartStoreInt8x16(t *testing.T) { |
| a := []int8{1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16} |
| b := []int8{1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16} |
| for i := 16; i >= 0; i-- { |
| v := archsimd.LoadInt8x16(a) |
| c := make([]int8, 32, 32) |
| v.StorePart(c[:i]) |
| checkSlices(t, c, b) |
| if i > 0 { |
| b[i-1] = 0 |
| } |
| } |
| } |
| |
| func xTestSlicesPartStoreInt16x8(t *testing.T) { |
| a := []int16{1, 2, 3, 4, 5, 6, 7, 8} |
| b := []int16{1, 2, 3, 4, 5, 6, 7, 8} |
| for i := 8; i >= 0; i-- { |
| v := archsimd.LoadInt16x8(a) |
| c := make([]int16, 32, 32) |
| v.StorePart(c[:i]) |
| checkSlices(t, c, b) |
| if i > 0 { |
| b[i-1] = 0 |
| } |
| } |
| } |
| |
| func TestSlicesPartStoreInt16x16(t *testing.T) { |
| a := []int16{1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16} |
| b := []int16{1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16} |
| for i := 16; i >= 0; i-- { |
| v := archsimd.LoadInt16x16(a) |
| c := make([]int16, 32, 32) |
| v.StorePart(c[:i]) |
| checkSlices(t, c, b) |
| if i > 0 { |
| b[i-1] = 0 |
| } |
| } |
| } |
| |
| func xTestSlicesPartStoreUint8x16(t *testing.T) { |
| a := []uint8{1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16} |
| b := []uint8{1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16} |
| for i := 16; i >= 0; i-- { |
| v := archsimd.LoadUint8x16(a) |
| c := make([]uint8, 32, 32) |
| v.StorePart(c[:i]) |
| checkSlices(t, c, b) |
| if i > 0 { |
| b[i-1] = 0 |
| } |
| } |
| } |
| |
| func TestSlicesPartStoreUint16x16(t *testing.T) { |
| a := []uint16{1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16} |
| b := []uint16{1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16} |
| for i := 16; i >= 0; i-- { |
| v := archsimd.LoadUint16x16(a) |
| c := make([]uint16, 32, 32) |
| v.StorePart(c[:i]) |
| checkSlices(t, c, b) |
| if i > 0 { |
| b[i-1] = 0 |
| } |
| } |
| } |
| |
| func TestSlicesPartStoreUint8x32(t *testing.T) { |
| a := []uint8{1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, |
| 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32} |
| b := []uint8{1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, |
| 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32} |
| for i := 32; i >= 0; i-- { |
| v := archsimd.LoadUint8x32(a) |
| c := make([]uint8, 32, 32) |
| v.StorePart(c[:i]) |
| checkSlices(t, c, b) |
| if i > 0 { |
| b[i-1] = 0 |
| } |
| } |
| } |
| |
| func TestPartUint64(t *testing.T) { |
| // 64x4 |
| L := 4 |
| c := []uint64{1, 2, 3, 4, 5, 86, 86, 86, 86} |
| a := c[:L+1] |
| for i := range a { |
| // Test the load first |
| // e is a partial slice. |
| e := a[i:] |
| v, _ := archsimd.LoadUint64x4Part(e) |
| // d contains what a ought to contain |
| d := make([]uint64, L) |
| for j := 0; j < len(e) && j < len(d); j++ { |
| d[j] = e[j] |
| } |
| |
| b := make([]uint64, L) |
| v.Store(b) |
| // test the load |
| checkSlices(t, d, b) |
| |
| // Test the store |
| f := make([]uint64, L+1) |
| for i := range f { |
| f[i] = 99 |
| } |
| |
| v.StorePart(f[:len(e)]) |
| if len(e) < len(b) { |
| checkSlices(t, f, b[:len(e)]) |
| } else { |
| checkSlices(t, f, b) |
| } |
| for i := len(e); i < len(f); i++ { |
| if f[i] != 99 { |
| t.Errorf("StorePart altered f[%d], expected 99, saw %d", i, f[i]) |
| } |
| } |
| } |
| } |
| |
| func TestPartFloat32(t *testing.T) { |
| // 32x8 |
| L := 8 |
| c := []float32{1, 2, 3, 4, 5, 6, 7, 8, 86, 86, 86, 86} |
| a := c[:L+1] |
| for i := range a { |
| // Test the load first |
| // e is a partial slice. |
| e := a[i:] |
| v, _ := archsimd.LoadFloat32x8Part(e) |
| // d contains what a ought to contain |
| d := make([]float32, L) |
| for j := 0; j < len(e) && j < len(d); j++ { |
| d[j] = e[j] |
| } |
| |
| b := make([]float32, L) |
| v.Store(b) |
| // test the load |
| checkSlices(t, d, b) |
| |
| // Test the store |
| f := make([]float32, L+1) |
| for i := range f { |
| f[i] = 99 |
| } |
| |
| v.StorePart(f[:len(e)]) |
| if len(e) < len(b) { |
| checkSlices(t, f, b[:len(e)]) |
| } else { |
| checkSlices(t, f, b) |
| } |
| for i := len(e); i < len(f); i++ { |
| if f[i] != 99 { |
| t.Errorf("StorePart altered f[%d], expected 99, saw %v", i, f[i]) |
| } |
| } |
| } |
| } |
| |
| // 512-bit load |
| |
| func TestPartInt64(t *testing.T) { |
| if !archsimd.X86.AVX512() { |
| t.Skip("Test requires X86.AVX512, not available on this hardware") |
| return |
| } |
| |
| L := 8 |
| c := []int64{1, 2, 3, 4, 5, 6, 7, 8, 86, 86, 86, 86} |
| a := c[:L+1] |
| for i := range a { |
| // Test the load first |
| // e is a partial slice. |
| e := a[i:] |
| v, _ := archsimd.LoadInt64x8Part(e) |
| // d contains what a ought to contain |
| d := make([]int64, L) |
| for j := 0; j < len(e) && j < len(d); j++ { |
| d[j] = e[j] |
| } |
| |
| b := make([]int64, L) |
| v.Store(b) |
| // test the load |
| checkSlicesLogInput(t, b, d, 0.0, func() { t.Helper(); t.Logf("Len(e)=%d", len(e)) }) |
| |
| // Test the store |
| f := make([]int64, L+1) |
| for i := range f { |
| f[i] = 99 |
| } |
| |
| v.StorePart(f[:len(e)]) |
| if len(e) < len(b) { |
| checkSlices(t, f, b[:len(e)]) |
| } else { |
| checkSlices(t, f, b) |
| } |
| for i := len(e); i < len(f); i++ { |
| if f[i] != 99 { |
| t.Errorf("StorePart altered f[%d], expected 99, saw %v", i, f[i]) |
| } |
| } |
| } |
| } |