src/math/big/arith_test.go - go.git - Git at Google

 // Copyright 2009 The Go Authors. All rights reserved.
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.

 // This file defines tests of consistent behavior between assembly and Go versions of basic operators,
 // as well as tests of pure Go implementations.

 package big

 import (
 	"fmt"
 	"internal/testenv"
 	"iter"
 	"math/bits"
 	"math/rand/v2"
 	"slices"
 	"strings"
 	"testing"
 )

 var isRaceBuilder = strings.HasSuffix(testenv.Builder(), "-race")

 var words4 = []Word{0, 1, _M - 1, _M}
 var words2 = []Word{0, _M}
 var muls = []Word{0, 1, 2, 3, 4, 5, _M / 4, _M / 2, _M - 3, _M - 2, _M - 1, _M}
 var adds = []Word{0, 1, _M - 1, _M}
 var shifts = []uint{1, 2, 3, _W/4 - 1, _W / 4, _W/4 + 1, _W/2 - 1, _W / 2, _W/2 + 1, _W - 3, _W - 2, _W - 1}

 func TestAddVV(t *testing.T)      { testVV(t, "addVV", addVV, addVV_g) }
 func TestSubVV(t *testing.T)      { testVV(t, "subVV", subVV, subVV_g) }
 func TestAddVW(t *testing.T)      { testVW(t, "addVW", addVW, addVW_ref, words4) }
 func TestSubVW(t *testing.T)      { testVW(t, "subVW", subVW, subVW_ref, words4) }
 func TestLshVU(t *testing.T)      { testVU(t, "lshVU", lshVU, lshVU_g, shifts) }
 func TestRshVU(t *testing.T)      { testVU(t, "rshVU", rshVU, rshVU_g, shifts) }
 func TestMulAddVWW(t *testing.T)  { testVWW(t, "mulAddVWW", mulAddVWW, mulAddVWW_g, muls) }
 func TestAddMulVVWW(t *testing.T) { testVVWW(t, "addMulVVWW", addMulVVWW, addMulVVWW_g, muls, adds) }

 // Note: It would be nice to avoid all the duplication of these test variants,
 // but the only obvious way is to use reflection. These tests are already
 // pretty expensive, and hitting them with reflect call overhead would
 // reduce the amount of exhaustive testing it's reasonable to do, so instead
 // we put up with the duplication.

 func testVV(t *testing.T, name string, fn, ref func(z, x, y []Word) (c Word)) {
 	for size := range 100 {
 		xx := make([]Word, 1+size+1)
 		yy := make([]Word, 1+size+1)
 		zz := make([]Word, 1+size+1)
 		words := words4
 		if size > 5 {
 			words = words2
 		}
 		if size > 10 {
 			words = nil // random
 		}
 		for x := range nats(words, size) {
 			for y := range nats(words, size) {
 				wantZ := make([]Word, size)
 				wantC := ref(wantZ, x, y)

 				for _, inplace := range []bool{false, true} {
 					name := name
 					if inplace {
 						name = "in-place " + name
 					}
 					setSlice(xx, 1, x)
 					setSlice(yy, 2, y)
 					zz := zz
 					if inplace {
 						zz = xx
 					} else {
 						for i := range zz {
 							zz[i] = 0x9876
 						}
 					}
 					setSlice(zz, 3, nil)
 					c := fn(zz[1:1+size], xx[1:1+size], yy[1:1+size])
 					if !slices.Equal(zz[1:1+size], wantZ) || c != wantC {
 						t.Errorf("%s(%#x, %#x) = %#x, %#x, want %#x, %#x", name, x, y, zz[1:1+size], c, wantZ, wantC)
 					}
 					if !inplace {
 						checkSlice(t, name, "x", xx, 1, x)
 					}
 					checkSlice(t, name, "y", yy, 2, y)
 					checkSlice(t, name, "z", zz, 3, nil)
 					if t.Failed() {
 						t.FailNow()
 					}
 				}
 			}
 		}
 	}
 }

 func testVV2(t *testing.T, name string, fn, ref func(z1, z2, x, y []Word) (c1, c2 Word)) {
 	for size := range 100 {
 		xx := make([]Word, 1+size+1)
 		yy := make([]Word, 1+size+1)
 		zz1 := make([]Word, 1+size+1)
 		zz2 := make([]Word, 1+size+1)
 		words := words4
 		if size > 5 {
 			words = words2
 		}
 		if size > 10 {
 			words = nil // random
 		}
 		for x := range nats(words, size) {
 			for y := range nats(words, size) {
 				wantZ1 := make([]Word, size)
 				wantZ2 := make([]Word, size)
 				wantC1, wantC2 := ref(wantZ1, wantZ2, x, y)

 				for _, inplace := range []bool{false, true} {
 					name := name
 					if inplace {
 						name = "in-place " + name
 					}
 					setSlice(xx, 1, x)
 					setSlice(yy, 2, y)
 					zz1 := zz1
 					zz2 := zz2
 					if inplace {
 						zz1 = xx
 						zz2 = yy
 					} else {
 						for i := range zz1 {
 							zz1[i] = 0x9876
 						}
 						for i := range zz2 {
 							zz2[i] = 0x8765
 						}
 					}
 					setSlice(zz1, 3, nil)
 					setSlice(zz2, 4, nil)
 					c1, c2 := fn(zz1[1:1+size], zz2[1:1+size], xx[1:1+size], yy[1:1+size])
 					if !slices.Equal(zz1[1:1+size], wantZ1) || !slices.Equal(zz2[1:1+size], wantZ2) || c1 != wantC1 || c2 != wantC2 {
 						t.Errorf("%s(%#x, %#x) = %#x, %#x, %#x, %#x, want %#x, %#x, %#x, %#x", name, x, y, zz1[1:1+size], zz2[1:1+size], c1, c2, wantZ1, wantZ2, wantC1, wantC2)
 					}
 					if !inplace {
 						checkSlice(t, name, "x", xx, 1, x)
 						checkSlice(t, name, "y", yy, 2, y)
 					}
 					checkSlice(t, name, "z1", zz1, 3, nil)
 					checkSlice(t, name, "z2", zz2, 4, nil)
 					if t.Failed() {
 						t.FailNow()
 					}
 				}
 			}
 		}
 	}
 }

 func testVW(t *testing.T, name string, fn, ref func(z, x []Word, w Word) (c Word), ws []Word) {
 	const (
 		magic0 = 0x123450
 		magic1 = 0x543210
 	)

 	for size := range 100 {
 		xx := make([]Word, 1+size+1)
 		zz := make([]Word, 1+size+1)
 		words := words4
 		if size > 5 {
 			words = words2
 		}
 		if size > 10 {
 			words = nil // random
 		}
 		for x := range nats(words, size) {
 			for _, w := range ws {
 				wantZ := make([]Word, size)
 				wantC := ref(wantZ, x, w)

 				copy(xx[1:], x)
 				for _, inplace := range []bool{false, true} {
 					name := name
 					if inplace {
 						name = "in-place " + name
 					}
 					setSlice(xx, 1, x)
 					zz := zz
 					if inplace {
 						zz = xx
 					} else {
 						for i := range zz {
 							zz[i] = 0x9876
 						}
 					}
 					setSlice(zz, 2, nil)
 					c := fn(zz[1:1+size], xx[1:1+size], w)
 					if !slices.Equal(zz[1:1+size], wantZ) || c != wantC {
 						t.Errorf("%s(%#x, %#x) = %#x, %#x, want %#x, %#x", name, x, w, zz[1:1+size], c, wantZ, wantC)
 					}
 					if !inplace {
 						checkSlice(t, name, "x", xx, 1, x)
 					}
 					checkSlice(t, name, "z", zz, 2, nil)
 					if t.Failed() {
 						t.FailNow()
 					}
 				}
 			}
 		}
 	}
 }

 func testVU(t *testing.T, name string, fn, ref func(z, x []Word, y uint) (c Word), ys []uint) {
 	wys := make([]Word, len(ys))
 	for i, y := range ys {
 		wys[i] = Word(y)
 	}
 	testVW(t, name,
 		func(z, x []Word, y Word) Word { return fn(z, x, uint(y)) },
 		func(z, x []Word, y Word) Word { return ref(z, x, uint(y)) },
 		wys)
 }

 func testVWW(t *testing.T, name string, fn, ref func(z, x []Word, y, r Word) (c Word), ys []Word) {
 	const (
 		magic0 = 0x123450
 		magic1 = 0x543210
 	)

 	for size := range 100 {
 		xx := make([]Word, 1+size+1)
 		zz := make([]Word, 1+size+1)
 		words := words4
 		if size > 5 {
 			words = words2
 		}
 		if size > 10 {
 			words = nil // random
 		}
 		for x := range nats(words, size) {
 			for _, y := range ys {
 				for _, r := range ys {
 					wantZ := make([]Word, size)
 					wantC := ref(wantZ, x, y, r)

 					copy(xx[1:], x)
 					for _, inplace := range []bool{false, true} {
 						name := name
 						if inplace {
 							name = "in-place " + name
 						}
 						setSlice(xx, 1, x)
 						zz := zz
 						if inplace {
 							zz = xx
 						} else {
 							for i := range zz {
 								zz[i] = 0x9876
 							}
 						}
 						setSlice(zz, 2, nil)
 						c := fn(zz[1:1+size], xx[1:1+size], y, r)
 						if !slices.Equal(zz[1:1+size], wantZ) || c != wantC {
 							t.Errorf("%s(%#x, %#x, %#x) = %#x, %#x, want %#x, %#x", name, x, y, r, zz[1:1+size], c, wantZ, wantC)
 						}
 						if !inplace {
 							checkSlice(t, name, "x", xx, 1, x)
 						}
 						checkSlice(t, name, "z", zz, 2, nil)
 						if t.Failed() {
 							t.FailNow()
 						}
 					}
 				}
 			}
 		}
 	}
 }

 func testVVU(t *testing.T, name string, fn, ref func(z, x, y []Word, s uint) (c Word), shifts []uint) {
 	for size := range 100 {
 		xx := make([]Word, 1+size+1)
 		yy := make([]Word, 1+size+1)
 		zz := make([]Word, 1+size+1)
 		words := words4
 		if size > 5 {
 			words = words2
 		}
 		if size > 10 {
 			words = nil // random
 		}
 		for x := range nats(words, size) {
 			for y := range nats(words, size) {
 				for _, s := range shifts {
 					wantZ := make([]Word, size)
 					wantC := ref(wantZ, x, y, s)

 					for _, inplace := range []bool{false, true} {
 						name := name
 						if inplace {
 							name = "in-place " + name
 						}
 						setSlice(xx, 1, x)
 						setSlice(yy, 2, y)
 						zz := zz
 						if inplace {
 							zz = xx
 						} else {
 							for i := range zz {
 								zz[i] = 0x9876
 							}
 						}
 						setSlice(zz, 3, nil)
 						c := fn(zz[1:1+size], xx[1:1+size], yy[1:1+size], s)
 						if !slices.Equal(zz[1:1+size], wantZ) || c != wantC {
 							t.Errorf("%s(%#x, %#x, %#x) = %#x, %#x, want %#x, %#x", name, x, y, s, zz[1:1+size], c, wantZ, wantC)
 						}
 						if !inplace {
 							checkSlice(t, name, "x", xx, 1, x)
 						}
 						checkSlice(t, name, "y", yy, 2, y)
 						checkSlice(t, name, "z", zz, 3, nil)
 						if t.Failed() {
 							t.FailNow()
 						}
 					}
 				}
 			}
 		}
 	}
 }

 func testVVWW(t *testing.T, name string, fn, ref func(z, x, y []Word, m, a Word) (c Word), ms, as []Word) {
 	for size := range 100 {
 		zz := make([]Word, 1+size+1)
 		xx := make([]Word, 1+size+1)
 		yy := make([]Word, 1+size+1)
 		words := words4
 		if size > 3 {
 			words = words2
 		}
 		if size > 7 {
 			words = nil // random
 		}
 		for x := range nats(words, size) {
 			for y := range nats(words, size) {
 				for _, m := range ms {
 					for _, a := range as {
 						wantZ := make([]Word, size)
 						wantC := ref(wantZ, x, y, m, a)

 						for _, inplace := range []bool{false, true} {
 							name := name
 							if inplace {
 								name = "in-place " + name
 							}
 							setSlice(xx, 1, x)
 							setSlice(yy, 2, y)
 							zz := zz
 							if inplace {
 								zz = xx
 							} else {
 								for i := range zz {
 									zz[i] = 0x9876
 								}
 							}
 							setSlice(zz, 3, nil)
 							c := fn(zz[1:1+size], xx[1:1+size], yy[1:1+size], m, a)
 							if !slices.Equal(zz[1:1+size], wantZ) || c != wantC {
 								t.Errorf("%s(%#x, %#x, %#x, %#x) = %#x, %#x, want %#x, %#x", name, x, y, m, a, zz[1:1+size], c, wantZ, wantC)
 							}
 							if !inplace {
 								checkSlice(t, name, "x", xx, 1, x)
 							}
 							checkSlice(t, name, "y", yy, 2, y)
 							checkSlice(t, name, "z", zz, 3, nil)
 							if t.Failed() {
 								t.FailNow()
 							}
 						}
 					}
 				}
 			}
 		}
 	}
 }

 const (
 	magic0 = 0x123450
 	magic1 = 0x543210
 )

 // setSlice sets x[1:len(x)-1] to orig, leaving magic values in x[0] and x[len(x)-1]
 // so that we can tell if routines accidentally write before or after the data.
 func setSlice(x []Word, id Word, orig []Word) {
 	x[0] = magic0 + id
 	copy(x[1:len(x)-1], orig)
 	x[len(x)-1] = magic1 + id
 }

 // checkSlice checks that the magic values left by setSlices are still there.
 // If orig != nil, it also checks that the actual data in x is unmodified since setSlice.
 func checkSlice(t *testing.T, name, val string, x []Word, id Word, orig []Word) {
 	if x[0] != magic0+id {
 		t.Errorf("%s smashed %s[-1]", name, val)
 	}
 	if x[len(x)-1] != magic1+id {
 		t.Errorf("%s smashed %s[len(%s)]", name, val, val)
 	}
 	if orig != nil && !slices.Equal(x[1:len(x)-1], orig) {
 		t.Errorf("%s smashed %s: have %d, want %d", name, val, x[1:len(x)-1], orig)
 	}
 }

 // nats returns a sequence of interesting nats of the given size:
 //
 //   - all 0
 //   - all ^0
 //   - all possible combinations of words
 //   - ten random values
 func nats(words []Word, size int) iter.Seq[[]Word] {
 	return func(yield func([]Word) bool) {
 		if size == 0 {
 			yield(nil)
 			return
 		}
 		w := make([]Word, size)

 		// all 0
 		for i := range w {
 			w[i] = 0
 		}
 		if !yield(w) {
 			return
 		}

 		// all ^0
 		for i := range w {
 			w[i] = _M
 		}
 		if !yield(w) {
 			return
 		}

 		// all possible combinations of words
 		var generate func(int) bool
 		generate = func(i int) bool {
 			if i >= len(w) {
 				return yield(w)
 			}
 			for _, w[i] = range words {
 				if !generate(i + 1) {
 					return false
 				}
 			}
 			return true
 		}
 		if !generate(0) {
 			return
 		}

 		// ten random values
 		for range 10 {
 			for i := range w {
 				w[i] = Word(rnd.Uint())
 			}
 			if !yield(w) {
 				return
 			}
 		}
 	}
 }

 // Always the same seed for reproducible results.
 var rnd = rand.New(rand.NewPCG(1, 2))

 func rndW() Word {
 	return Word(rnd.Uint())
 }

 func rndV(n int) []Word {
 	v := make([]Word, n)
 	for i := range v {
 		v[i] = rndW()
 	}
 	return v
 }

 // Construct a vector comprising the same word, usually '0' or 'maximum uint'
 func makeWordVec(e Word, n int) []Word {
 	v := make([]Word, n)
 	for i := range v {
 		v[i] = e
 	}
 	return v
 }

 type argVU struct {
 	d  []Word // d is a Word slice, the input parameters x and z come from this array.
 	l  uint   // l is the length of the input parameters x and z.
 	xp uint   // xp is the starting position of the input parameter x, x := d[xp:xp+l].
 	zp uint   // zp is the starting position of the input parameter z, z := d[zp:zp+l].
 	s  uint   // s is the shift number.
 	r  []Word // r is the expected output result z.
 	c  Word   // c is the expected return value.
 	m  string // message.
 }

 var arglshVUIn = []Word{1, 2, 4, 8, 16, 32, 64, 0, 0, 0}
 var arglshVUr0 = []Word{1, 2, 4, 8, 16, 32, 64}
 var arglshVUr1 = []Word{2, 4, 8, 16, 32, 64, 128}
 var arglshVUrWm1 = []Word{1 << (_W - 1), 0, 1, 2, 4, 8, 16}

 var arglshVU = []argVU{
 	// test cases for lshVU
 	{[]Word{1, _M, _M, _M, _M, _M, 3 << (_W - 2), 0}, 7, 0, 0, 1, []Word{2, _M - 1, _M, _M, _M, _M, 1<<(_W-1) + 1}, 1, "complete overlap of lshVU"},
 	{[]Word{1, _M, _M, _M, _M, _M, 3 << (_W - 2), 0, 0, 0, 0}, 7, 0, 3, 1, []Word{2, _M - 1, _M, _M, _M, _M, 1<<(_W-1) + 1}, 1, "partial overlap by half of lshVU"},
 	{[]Word{1, _M, _M, _M, _M, _M, 3 << (_W - 2), 0, 0, 0, 0, 0, 0, 0}, 7, 0, 6, 1, []Word{2, _M - 1, _M, _M, _M, _M, 1<<(_W-1) + 1}, 1, "partial overlap by 1 Word of lshVU"},
 	{[]Word{1, _M, _M, _M, _M, _M, 3 << (_W - 2), 0, 0, 0, 0, 0, 0, 0, 0}, 7, 0, 7, 1, []Word{2, _M - 1, _M, _M, _M, _M, 1<<(_W-1) + 1}, 1, "no overlap of lshVU"},
 	// additional test cases with shift values of 1 and (_W-1)
 	{arglshVUIn, 7, 0, 0, 1, arglshVUr1, 0, "complete overlap of lshVU and shift of 1"},
 	{arglshVUIn, 7, 0, 0, _W - 1, arglshVUrWm1, 32, "complete overlap of lshVU and shift of _W - 1"},
 	{arglshVUIn, 7, 0, 1, 1, arglshVUr1, 0, "partial overlap by 6 Words of lshVU and shift of 1"},
 	{arglshVUIn, 7, 0, 1, _W - 1, arglshVUrWm1, 32, "partial overlap by 6 Words of lshVU and shift of _W - 1"},
 	{arglshVUIn, 7, 0, 2, 1, arglshVUr1, 0, "partial overlap by 5 Words of lshVU and shift of 1"},
 	{arglshVUIn, 7, 0, 2, _W - 1, arglshVUrWm1, 32, "partial overlap by 5 Words of lshVU abd shift of _W - 1"},
 	{arglshVUIn, 7, 0, 3, 1, arglshVUr1, 0, "partial overlap by 4 Words of lshVU and shift of 1"},
 	{arglshVUIn, 7, 0, 3, _W - 1, arglshVUrWm1, 32, "partial overlap by 4 Words of lshVU and shift of _W - 1"},
 }

 var argrshVUIn = []Word{0, 0, 0, 1, 2, 4, 8, 16, 32, 64}
 var argrshVUr0 = []Word{1, 2, 4, 8, 16, 32, 64}
 var argrshVUr1 = []Word{0, 1, 2, 4, 8, 16, 32}
 var argrshVUrWm1 = []Word{4, 8, 16, 32, 64, 128, 0}

 var argrshVU = []argVU{
 	// test cases for rshVU
 	{[]Word{0, 3, _M, _M, _M, _M, _M, 1 << (_W - 1)}, 7, 1, 1, 1, []Word{1<<(_W-1) + 1, _M, _M, _M, _M, _M >> 1, 1 << (_W - 2)}, 1 << (_W - 1), "complete overlap of rshVU"},
 	{[]Word{0, 0, 0, 0, 3, _M, _M, _M, _M, _M, 1 << (_W - 1)}, 7, 4, 1, 1, []Word{1<<(_W-1) + 1, _M, _M, _M, _M, _M >> 1, 1 << (_W - 2)}, 1 << (_W - 1), "partial overlap by half of rshVU"},
 	{[]Word{0, 0, 0, 0, 0, 0, 0, 3, _M, _M, _M, _M, _M, 1 << (_W - 1)}, 7, 7, 1, 1, []Word{1<<(_W-1) + 1, _M, _M, _M, _M, _M >> 1, 1 << (_W - 2)}, 1 << (_W - 1), "partial overlap by 1 Word of rshVU"},
 	{[]Word{0, 0, 0, 0, 0, 0, 0, 0, 3, _M, _M, _M, _M, _M, 1 << (_W - 1)}, 7, 8, 1, 1, []Word{1<<(_W-1) + 1, _M, _M, _M, _M, _M >> 1, 1 << (_W - 2)}, 1 << (_W - 1), "no overlap of rshVU"},
 	// additional test cases with shift values of 0, 1 and (_W-1)
 	{argrshVUIn, 7, 3, 3, 1, argrshVUr1, 1 << (_W - 1), "complete overlap of rshVU and shift of 1"},
 	{argrshVUIn, 7, 3, 3, _W - 1, argrshVUrWm1, 2, "complete overlap of rshVU and shift of _W - 1"},
 	{argrshVUIn, 7, 3, 2, 1, argrshVUr1, 1 << (_W - 1), "partial overlap by 6 Words of rshVU and shift of 1"},
 	{argrshVUIn, 7, 3, 2, _W - 1, argrshVUrWm1, 2, "partial overlap by 6 Words of rshVU and shift of _W - 1"},
 	{argrshVUIn, 7, 3, 1, 1, argrshVUr1, 1 << (_W - 1), "partial overlap by 5 Words of rshVU and shift of 1"},
 	{argrshVUIn, 7, 3, 1, _W - 1, argrshVUrWm1, 2, "partial overlap by 5 Words of rshVU and shift of _W - 1"},
 	{argrshVUIn, 7, 3, 0, 1, argrshVUr1, 1 << (_W - 1), "partial overlap by 4 Words of rshVU and shift of 1"},
 	{argrshVUIn, 7, 3, 0, _W - 1, argrshVUrWm1, 2, "partial overlap by 4 Words of rshVU and shift of _W - 1"},
 }

 func testShiftFunc(t *testing.T, f func(z, x []Word, s uint) Word, a argVU) {
 	// work on copy of a.d to preserve the original data.
 	b := make([]Word, len(a.d))
 	copy(b, a.d)
 	z := b[a.zp : a.zp+a.l]
 	x := b[a.xp : a.xp+a.l]
 	c := f(z, x, a.s)
 	for i, zi := range z {
 		if zi != a.r[i] {
 			t.Errorf("d := %v, %s (d[%d:%d], d[%d:%d], %d)\n\tgot z[%d] = %#x; want %#x", a.d, a.m, a.zp, a.zp+a.l, a.xp, a.xp+a.l, a.s, i, zi, a.r[i])
 			break
 		}
 	}
 	if c != a.c {
 		t.Errorf("d := %v, %s (d[%d:%d], d[%d:%d], %d)\n\tgot c = %#x; want %#x", a.d, a.m, a.zp, a.zp+a.l, a.xp, a.xp+a.l, a.s, c, a.c)
 	}
 }

 func TestShiftOverlap(t *testing.T) {
 	for _, a := range arglshVU {
 		arg := a
 		testShiftFunc(t, lshVU, arg)
 	}

 	for _, a := range argrshVU {
 		arg := a
 		testShiftFunc(t, rshVU, arg)
 	}
 }

 func TestIssue31084(t *testing.T) {
 	stk := getStack()
 	defer stk.free()

 	// compute 10^n via 5^n << n.
 	const n = 165
 	p := nat(nil).expNN(stk, nat{5}, nat{n}, nil, false)
 	p = p.lsh(p, n)
 	got := string(p.utoa(10))
 	want := "1" + strings.Repeat("0", n)
 	if got != want {
 		t.Errorf("lsh(%v, %v)\n\tgot  %s\n\twant %s", p, n, got, want)
 	}
 }

 const issue42838Value = "159309191113245227702888039776771180559110455519261878607388585338616290151305816094308987472018268594098344692611135542392730712890625"

 func TestIssue42838(t *testing.T) {
 	const s = 192
 	z, _, _, _ := nat(nil).scan(strings.NewReader(issue42838Value), 0, false)
 	z = z.lsh(z, s)
 	got := string(z.utoa(10))
 	want := "1" + strings.Repeat("0", s)
 	if got != want {
 		t.Errorf("lsh(%v, %v)\n\tgot  %s\n\twant %s", z, s, got, want)
 	}
 }

 type funVWW func(z, x []Word, y, r Word) (c Word)
 type argVWW struct {
 	z, x nat
 	y, r Word
 	c    Word
 }

 var prodVWW = []argVWW{
 	{},
 	{nat{0}, nat{0}, 0, 0, 0},
 	{nat{991}, nat{0}, 0, 991, 0},
 	{nat{0}, nat{_M}, 0, 0, 0},
 	{nat{991}, nat{_M}, 0, 991, 0},
 	{nat{0}, nat{0}, _M, 0, 0},
 	{nat{991}, nat{0}, _M, 991, 0},
 	{nat{1}, nat{1}, 1, 0, 0},
 	{nat{992}, nat{1}, 1, 991, 0},
 	{nat{22793}, nat{991}, 23, 0, 0},
 	{nat{22800}, nat{991}, 23, 7, 0},
 	{nat{0, 0, 0, 22793}, nat{0, 0, 0, 991}, 23, 0, 0},
 	{nat{7, 0, 0, 22793}, nat{0, 0, 0, 991}, 23, 7, 0},
 	{nat{0, 0, 0, 0}, nat{7893475, 7395495, 798547395, 68943}, 0, 0, 0},
 	{nat{991, 0, 0, 0}, nat{7893475, 7395495, 798547395, 68943}, 0, 991, 0},
 	{nat{0, 0, 0, 0}, nat{0, 0, 0, 0}, 894375984, 0, 0},
 	{nat{991, 0, 0, 0}, nat{0, 0, 0, 0}, 894375984, 991, 0},
 	{nat{_M << 1 & _M}, nat{_M}, 1 << 1, 0, _M >> (_W - 1)},
 	{nat{_M<<1&_M + 1}, nat{_M}, 1 << 1, 1, _M >> (_W - 1)},
 	{nat{_M << 7 & _M}, nat{_M}, 1 << 7, 0, _M >> (_W - 7)},
 	{nat{_M<<7&_M + 1<<6}, nat{_M}, 1 << 7, 1 << 6, _M >> (_W - 7)},
 	{nat{_M << 7 & _M, _M, _M, _M}, nat{_M, _M, _M, _M}, 1 << 7, 0, _M >> (_W - 7)},
 	{nat{_M<<7&_M + 1<<6, _M, _M, _M}, nat{_M, _M, _M, _M}, 1 << 7, 1 << 6, _M >> (_W - 7)},
 }

 func testFunVWW(t *testing.T, msg string, f funVWW, a argVWW) {
 	z := make(nat, len(a.z))
 	c := f(z, a.x, a.y, a.r)
 	for i, zi := range z {
 		if zi != a.z[i] {
 			t.Errorf("%s%+v\n\tgot z[%d] = %#x; want %#x", msg, a, i, zi, a.z[i])
 			break
 		}
 	}
 	if c != a.c {
 		t.Errorf("%s%+v\n\tgot c = %#x; want %#x", msg, a, c, a.c)
 	}
 }

 // TODO(gri) mulAddVWW and divWVW are symmetric operations but
 // their signature is not symmetric. Try to unify.

 type funWVW func(z []Word, xn Word, x []Word, y Word) (r Word)
 type argWVW struct {
 	z  nat
 	xn Word
 	x  nat
 	y  Word
 	r  Word
 }

 func testFunWVW(t *testing.T, msg string, f funWVW, a argWVW) {
 	z := make(nat, len(a.z))
 	r := f(z, a.xn, a.x, a.y)
 	if !slices.Equal(z, a.z) || r != a.r {
 		t.Errorf("%s%+v\nhave %v, %v\nwant %v, %v", msg, a, z, r, a.z, a.r)
 	} else {
 		t.Logf("%s%+v\ngood %v, %v", msg, a, z, r)
 	}
 }

 func TestFunVWW(t *testing.T) {
 	for _, a := range prodVWW {
 		arg := a
 		testFunVWW(t, "mulAddVWW_g", mulAddVWW_g, arg)
 		testFunVWW(t, "mulAddVWW", mulAddVWW, arg)

 		if a.y != 0 && a.r < a.y {
 			arg := argWVW{a.x, a.c, a.z, a.y, a.r}
 			testFunWVW(t, "divWVW", divWVW, arg)
 		}
 	}
 }

 var mulWWTests = []struct {
 	x, y Word
 	q, r Word
 }{
 	{_M, _M, _M - 1, 1},
 	// 32 bit only: {0xc47dfa8c, 50911, 0x98a4, 0x998587f4},
 }

 func TestMulWW(t *testing.T) {
 	for i, test := range mulWWTests {
 		q, r := mulWW(test.x, test.y)
 		if q != test.q || r != test.r {
 			t.Errorf("#%d got (%x, %x) want (%x, %x)", i, q, r, test.q, test.r)
 		}
 	}
 }

 var mulAddWWWTests = []struct {
 	x, y, c Word
 	q, r    Word
 }{
 	// TODO(agl): These will only work on 64-bit platforms.
 	// {15064310297182388543, 0xe7df04d2d35d5d80, 13537600649892366549, 13644450054494335067, 10832252001440893781},
 	// {15064310297182388543, 0xdab2f18048baa68d, 13644450054494335067, 12869334219691522700, 14233854684711418382},
 	{_M, _M, 0, _M - 1, 1},
 	{_M, _M, _M, _M, 0},
 }

 func TestMulAddWWW(t *testing.T) {
 	for i, test := range mulAddWWWTests {
 		q, r := mulAddWWW_g(test.x, test.y, test.c)
 		if q != test.q || r != test.r {
 			t.Errorf("#%d got (%x, %x) want (%x, %x)", i, q, r, test.q, test.r)
 		}
 	}
 }

 var divWWTests = []struct {
 	x1, x0, y Word
 	q, r      Word
 }{
 	{_M >> 1, 0, _M, _M >> 1, _M >> 1},
 	{_M - (1 << (_W - 2)), _M, 3 << (_W - 2), _M, _M - (1 << (_W - 2))},
 }

 const testsNumber = 1 << 16

 func TestDivWW(t *testing.T) {
 	i := 0
 	for i, test := range divWWTests {
 		rec := reciprocalWord(test.y)
 		q, r := divWW(test.x1, test.x0, test.y, rec)
 		if q != test.q || r != test.r {
 			t.Errorf("#%d got (%x, %x) want (%x, %x)", i, q, r, test.q, test.r)
 		}
 	}
 	//random tests
 	for ; i < testsNumber; i++ {
 		x1 := rndW()
 		x0 := rndW()
 		y := rndW()
 		if x1 >= y {
 			continue
 		}
 		rec := reciprocalWord(y)
 		qGot, rGot := divWW(x1, x0, y, rec)
 		qWant, rWant := bits.Div(uint(x1), uint(x0), uint(y))
 		if uint(qGot) != qWant || uint(rGot) != rWant {
 			t.Errorf("#%d got (%x, %x) want (%x, %x)", i, qGot, rGot, qWant, rWant)
 		}
 	}
 }

 // benchSizes are the benchmark word sizes.
 var benchSizes = []int{1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 16, 32, 64, 100, 1000, 10_000, 100_000}

 // A benchFunc is a function to be benchmarked.
 // It takes one output buffer and two input buffers,
 // but it does not have to use any of them.
 type benchFunc func(z, x, y []Word)

 // bench runs benchmarks of fn for a variety of word sizes.
 // It adds the given suffix (for example "/impl=go") to the benchmark names it creates,
 // after a "/words=N" parameter. Putting words first makes it easier to run
 // all benchmarks with a specific word size
 // (go test -run=NONE '-bench=V/words=100$')
 // even if different benchmarks have different numbers of other parameters.
 func bench(b *testing.B, suffix string, fn benchFunc) {
 	for _, n := range benchSizes {
 		if isRaceBuilder && n > 1e3 {
 			continue
 		}
 		var z, x, y []Word
 		b.Run(fmt.Sprintf("words=%d%s", n, suffix), func(b *testing.B) {
 			if z == nil {
 				z = make([]Word, n)
 				x = rndV(n)
 				y = rndV(n)
 			}
 			b.SetBytes(int64(n * _S))
 			for b.Loop() {
 				fn(z, x, y)
 			}
 		})
 	}
 }

 // Benchmark basic I/O and arithmetic processing speed,
 // to help estimate the upper bounds on other operations.

 func BenchmarkCopyVV(b *testing.B) { bench(b, "", benchVV(copyVV)) }

 func copyVV(z, x, y []Word) Word {
 	copy(z, x)
 	return 0
 }

 // Note: This benchmark consistently runs faster (even up to 2X faster on MB/s)
 // with words=10 and words=100 than larger amounts like words=1000 or words=10000.
 // The reason appears to that if you run 100-word addition loops repeatedly,
 // they are independent calculations, and the processor speculates/pipelines/whatever
 // to such a deep level that it can overlap the repeated loops.
 // In contrast, if you run 1000-word or 10000-word loops repeatedly,
 // the dependency chains are so long that the processor cannot overlap them.
 // If we change arithVV to take the starting value of s and pass in the result
 // from the previous arithVV, then even the 10-word or 100-loops become
 // a single long dependency chain and the 2X disappears. But since we are
 // using BenchmarkArithVV for a given word size to estimate the upper bound
 // of, say, BenchmarkAddVV for that same word size, we actually want the
 // dependency chain-length variation in BenchmarkArithVV too.
 // It's just mysterious to see until you understand what is causing it.

 func BenchmarkArithVV(b *testing.B) { bench(b, "", benchVV(arithVV)) }

 func arithVV(z, x, y []Word) Word {
 	var a, b, c, d, e, f, g, h, i, j Word
 	if len(z) >= 8 {
 		a, b, c, d, e, f, g, h, i, j = 1, 2, 3, 4, 5, 6, 7, 8, 9, 10
 	}
 	if len(z) < 10 {
 		// We don't really care about the speed here, but
 		// do something so that the small word counts aren't all the same.
 		s := Word(0)
 		for _, zi := range z {
 			s += zi
 		}
 		return s
 	}
 	s := Word(0)
 	for range len(z) / 10 {
 		s += a
 		s += b
 		s += c
 		s += d
 		s += e
 		s += f
 		s += g
 		s += h
 		s += i
 		s += j
 	}
 	return s
 }

 func BenchmarkAddVV(b *testing.B) {
 	bench(b, "/impl=asm", benchVV(addVV))
 	bench(b, "/impl=go", benchVV(addVV_g))
 }

 func BenchmarkSubVV(b *testing.B) {
 	bench(b, "/impl=asm", benchVV(subVV))
 	bench(b, "/impl=go", benchVV(subVV_g))
 }

 func benchVV(fn func(z, x, y []Word) Word) benchFunc {
 	return func(z, x, y []Word) { fn(z, x, y) }
 }

 func BenchmarkAddVW(b *testing.B) {
 	bench(b, "/data=random", benchVW(addVW, 123))
 	bench(b, "/data=carry", benchCarryVW(addVW, ^Word(0), 1))
 	bench(b, "/data=shortcut", benchShortVW(addVW, 123))
 }

 func BenchmarkSubVW(b *testing.B) {
 	bench(b, "/data=random", benchVW(subVW, 123))
 	bench(b, "/data=carry", benchCarryVW(subVW, 0, 1))
 	bench(b, "/data=shortcut", benchShortVW(subVW, 123))
 }

 func benchVW(fn func(z, x []Word, w Word) Word, w Word) benchFunc {
 	return func(z, x, y []Word) { fn(z, x, w) }
 }

 func benchCarryVW(fn func(z, x []Word, w Word) Word, xi, w Word) benchFunc {
 	return func(z, x, y []Word) {
 		// Fill x with xi the first time we are called with a given x.
 		// Otherwise x is random, so checking the first two elements is good enough.
 		// Assume this is the warmup, so we don't need to worry about it taking longer.
 		if x[0] != w || len(x) >= 2 && x[1] != w {
 			for i := range x {
 				x[i] = xi
 			}
 		}
 		fn(z, x, w)
 	}
 }

 func benchShortVW(fn func(z, x []Word, w Word) Word, w Word) benchFunc {
 	// Note: calling fn with x not z, to benchmark in-place overwriting.
 	return func(z, x, y []Word) { fn(x, x, w) }
 }

 func BenchmarkLshVU(b *testing.B) {
 	bench(b, "/impl=asm", benchVU(lshVU, 3))
 	bench(b, "/impl=go", benchVU(lshVU_g, 3))
 }

 func BenchmarkRshVU(b *testing.B) {
 	bench(b, "/impl=asm", benchVU(rshVU, 3))
 	bench(b, "/impl=go", benchVU(rshVU_g, 3))
 }

 func benchVU(fn func(z, x []Word, s uint) Word, s uint) benchFunc {
 	return func(z, x, y []Word) { fn(z, x, s) }
 }

 func BenchmarkMulAddVWW(b *testing.B) {
 	bench(b, "/impl=asm", benchVWW(mulAddVWW, 42, 100))
 	bench(b, "/impl=go", benchVWW(mulAddVWW_g, 42, 100))
 }

 func benchVWW(fn func(z, x []Word, w1, w2 Word) Word, w1, w2 Word) benchFunc {
 	return func(z, x, y []Word) { fn(z, x, w1, w2) }
 }

 func BenchmarkAddMulVVWW(b *testing.B) {
 	bench(b, "/impl=asm", benchVVWW(addMulVVWW, 42, 100))
 	bench(b, "/impl=go", benchVVWW(addMulVVWW_g, 42, 100))
 }

 func benchVVWW(fn func(z, x, y []Word, w1, w2 Word) Word, w1, w2 Word) benchFunc {
 	return func(z, x, y []Word) { fn(z, x, y, w1, w2) }
 }

 func BenchmarkDivWVW(b *testing.B) {
 	bench(b, "", benchWVW(divWVW, 100, 200))
 }

 func benchWVW(fn func(z []Word, w1 Word, x []Word, w2 Word) Word, w1, w2 Word) benchFunc {
 	return func(z, x, y []Word) { fn(z, w1, x, w2) }
 }