| // asmcheck |
| |
| // Copyright 2018 The Go Authors. All rights reserved. |
| // Use of this source code is governed by a BSD-style |
| // license that can be found in the LICENSE file. |
| |
| package codegen |
| |
| // This file contains codegen tests related to arithmetic |
| // simplifications and optimizations on float types. |
| // For codegen tests on integer types, see arithmetic.go. |
| |
| // --------------------- // |
| // Strength-reduce // |
| // --------------------- // |
| |
| func Mul2(f float64) float64 { |
| // 386/sse2:"ADDSD",-"MULSD" |
| // amd64:"ADDSD",-"MULSD" |
| // arm/7:"ADDD",-"MULD" |
| // arm64:"FADDD",-"FMULD" |
| // ppc64x:"FADD",-"FMUL" |
| // riscv64:"FADDD",-"FMULD" |
| return f * 2.0 |
| } |
| |
| func DivPow2(f1, f2, f3 float64) (float64, float64, float64) { |
| // 386/sse2:"MULSD",-"DIVSD" |
| // amd64:"MULSD",-"DIVSD" |
| // arm/7:"MULD",-"DIVD" |
| // arm64:"FMULD",-"FDIVD" |
| // ppc64x:"FMUL",-"FDIV" |
| // riscv64:"FMULD",-"FDIVD" |
| x := f1 / 16.0 |
| |
| // 386/sse2:"MULSD",-"DIVSD" |
| // amd64:"MULSD",-"DIVSD" |
| // arm/7:"MULD",-"DIVD" |
| // arm64:"FMULD",-"FDIVD" |
| // ppc64x:"FMUL",-"FDIVD" |
| // riscv64:"FMULD",-"FDIVD" |
| y := f2 / 0.125 |
| |
| // 386/sse2:"ADDSD",-"DIVSD",-"MULSD" |
| // amd64:"ADDSD",-"DIVSD",-"MULSD" |
| // arm/7:"ADDD",-"MULD",-"DIVD" |
| // arm64:"FADDD",-"FMULD",-"FDIVD" |
| // ppc64x:"FADD",-"FMUL",-"FDIV" |
| // riscv64:"FADDD",-"FMULD",-"FDIVD" |
| z := f3 / 0.5 |
| |
| return x, y, z |
| } |
| |
| func indexLoad(b0 []float32, b1 float32, idx int) float32 { |
| // arm64:`FMOVS\s\(R[0-9]+\)\(R[0-9]+<<2\),\sF[0-9]+` |
| return b0[idx] * b1 |
| } |
| |
| func indexStore(b0 []float64, b1 float64, idx int) { |
| // arm64:`FMOVD\sF[0-9]+,\s\(R[0-9]+\)\(R[0-9]+<<3\)` |
| b0[idx] = b1 |
| } |
| |
| // ----------- // |
| // Fused // |
| // ----------- // |
| |
| func FusedAdd32(x, y, z float32) float32 { |
| // s390x:"FMADDS\t" |
| // ppc64x:"FMADDS\t" |
| // arm64:"FMADDS" |
| // riscv64:"FMADDS\t" |
| return x*y + z |
| } |
| |
| func FusedSub32_a(x, y, z float32) float32 { |
| // s390x:"FMSUBS\t" |
| // ppc64x:"FMSUBS\t" |
| // riscv64:"FMSUBS\t" |
| return x*y - z |
| } |
| |
| func FusedSub32_b(x, y, z float32) float32 { |
| // arm64:"FMSUBS" |
| // riscv64:"FNMSUBS\t" |
| return z - x*y |
| } |
| |
| func FusedAdd64(x, y, z float64) float64 { |
| // s390x:"FMADD\t" |
| // ppc64x:"FMADD\t" |
| // arm64:"FMADDD" |
| // riscv64:"FMADDD\t" |
| return x*y + z |
| } |
| |
| func FusedSub64_a(x, y, z float64) float64 { |
| // s390x:"FMSUB\t" |
| // ppc64x:"FMSUB\t" |
| // riscv64:"FMSUBD\t" |
| return x*y - z |
| } |
| |
| func FusedSub64_b(x, y, z float64) float64 { |
| // arm64:"FMSUBD" |
| // riscv64:"FNMSUBD\t" |
| return z - x*y |
| } |
| |
| func Cmp(f float64) bool { |
| // arm64:"FCMPD","(BGT|BLE|BMI|BPL)",-"CSET\tGT",-"CBZ" |
| return f > 4 || f < -4 |
| } |
| |
| func CmpZero64(f float64) bool { |
| // s390x:"LTDBR",-"FCMPU" |
| return f <= 0 |
| } |
| |
| func CmpZero32(f float32) bool { |
| // s390x:"LTEBR",-"CEBR" |
| return f <= 0 |
| } |
| |
| func CmpWithSub(a float64, b float64) bool { |
| f := a - b |
| // s390x:-"LTDBR" |
| return f <= 0 |
| } |
| |
| func CmpWithAdd(a float64, b float64) bool { |
| f := a + b |
| // s390x:-"LTDBR" |
| return f <= 0 |
| } |
| |
| // ---------------- // |
| // Non-floats // |
| // ---------------- // |
| |
| // We should make sure that the compiler doesn't generate floating point |
| // instructions for non-float operations on Plan 9, because floating point |
| // operations are not allowed in the note handler. |
| |
| func ArrayZero() [16]byte { |
| // amd64:"MOVUPS" |
| // plan9/amd64/:-"MOVUPS" |
| var a [16]byte |
| return a |
| } |
| |
| func ArrayCopy(a [16]byte) (b [16]byte) { |
| // amd64:"MOVUPS" |
| // plan9/amd64/:-"MOVUPS" |
| b = a |
| return |
| } |
| |
| // ---------------- // |
| // Float Min/Max // |
| // ---------------- // |
| |
| func Float64Min(a, b float64) float64 { |
| // amd64:"MINSD" |
| // arm64:"FMIND" |
| // riscv64:"FMIN" |
| // ppc64/power9:"XSMINJDP" |
| // ppc64/power10:"XSMINJDP" |
| return min(a, b) |
| } |
| |
| func Float64Max(a, b float64) float64 { |
| // amd64:"MINSD" |
| // arm64:"FMAXD" |
| // riscv64:"FMAX" |
| // ppc64/power9:"XSMAXJDP" |
| // ppc64/power10:"XSMAXJDP" |
| return max(a, b) |
| } |
| |
| func Float32Min(a, b float32) float32 { |
| // amd64:"MINSS" |
| // arm64:"FMINS" |
| // riscv64:"FMINS" |
| // ppc64/power9:"XSMINJDP" |
| // ppc64/power10:"XSMINJDP" |
| return min(a, b) |
| } |
| |
| func Float32Max(a, b float32) float32 { |
| // amd64:"MINSS" |
| // arm64:"FMAXS" |
| // riscv64:"FMAXS" |
| // ppc64/power9:"XSMAXJDP" |
| // ppc64/power10:"XSMAXJDP" |
| return max(a, b) |
| } |
| |
| // ------------------------ // |
| // Constant Optimizations // |
| // ------------------------ // |
| |
| func Float32Constant() float32 { |
| // ppc64x/power8:"FMOVS\t[$]f32\\.42440000\\(SB\\)" |
| // ppc64x/power9:"FMOVS\t[$]f32\\.42440000\\(SB\\)" |
| // ppc64x/power10:"XXSPLTIDP\t[$]1111752704," |
| return 49.0 |
| } |
| |
| func Float64Constant() float64 { |
| // ppc64x/power8:"FMOVD\t[$]f64\\.4048800000000000\\(SB\\)" |
| // ppc64x/power9:"FMOVD\t[$]f64\\.4048800000000000\\(SB\\)" |
| // ppc64x/power10:"XXSPLTIDP\t[$]1111752704," |
| return 49.0 |
| } |
| |
| func Float32DenormalConstant() float32 { |
| // ppc64x:"FMOVS\t[$]f32\\.00400000\\(SB\\)" |
| return 0x1p-127 |
| } |
| |
| // A float64 constant which can be exactly represented as a |
| // denormal float32 value. On ppc64x, denormal values cannot |
| // be used with XXSPLTIDP. |
| func Float64DenormalFloat32Constant() float64 { |
| // ppc64x:"FMOVD\t[$]f64\\.3800000000000000\\(SB\\)" |
| return 0x1p-127 |
| } |