| // Copyright 2016 The Go Authors. All rights reserved. |
| // Use of this source code is governed by a BSD-style |
| // license that can be found in the LICENSE file. |
| |
| #include "textflag.h" |
| |
| // Constants |
| // coshrodataL23 is addressed through R9 in coshAsm. The hand-encoded cdb |
| // there hard-codes byte offset 24, so the layout below must not change. |
| // +0: about 2.319e-17, used together with +8 in the range reduction |
| // (numerically the part of ln 2 that does not fit in the +8 double; |
| // TODO confirm) |
| // +8: numerically ln 2 |
| // +16: numerically 1/ln 2 |
| // +24: 704.0, the threshold compared against abs(x) |
| DATA coshrodataL23<>+0(SB)/8, $0.231904681384629956E-16 |
| DATA coshrodataL23<>+8(SB)/8, $0.693147180559945286E+00 |
| DATA coshrodataL23<>+16(SB)/8, $0.144269504088896339E+01 |
| DATA coshrodataL23<>+24(SB)/8, $704.E0 |
| GLOBL coshrodataL23<>+0(SB), RODATA, $32 |
| // coshxinf: IEEE-754 bit pattern of +Inf, returned at label L21. |
| DATA coshxinf<>+0(SB)/8, $0x7FF0000000000000 |
| GLOBL coshxinf<>+0(SB), RODATA, $8 |
| // coshxlim1: 800.0; abs(x) at or above this value returns +Inf. |
| DATA coshxlim1<>+0(SB)/8, $800.E0 |
| GLOBL coshxlim1<>+0(SB), RODATA, $8 |
| // coshxaddhy: raw bit pattern combined with x*(1/ln 2) at the start of |
| // both evaluation paths. |
| // NOTE(review): looks like a round-to-integer magic constant; its low |
| // halfword 0x3fdf is half of the 32702 loaded by lhi in coshAsm. Confirm. |
| DATA coshxaddhy<>+0(SB)/8, $0xc2f0000100003fdf |
| GLOBL coshxaddhy<>+0(SB), RODATA, $8 |
| // coshx4ff: bit pattern of 2^256 (exponent field 0x4ff, zero fraction); |
| // the final multiplier on the L17 path. |
| DATA coshx4ff<>+0(SB)/8, $0x4ff0000000000000 |
| GLOBL coshx4ff<>+0(SB), RODATA, $8 |
| // coshe1: bit pattern of 1.0 plus 10 units in the last place; the last |
| // of the coshe* coefficients loaded by the polynomial evaluation. |
| DATA coshe1<>+0(SB)/8, $0x3ff000000000000a |
| GLOBL coshe1<>+0(SB), RODATA, $8 |
| |
| // Log multiplier table |
| // 16 float64 entries (128 bytes). coshAsm selects an entry with a 4-bit |
| // field: RISBGZ $57, $60, $3 turns the low 4 bits of an integer word into |
| // a byte offset (index*8), and the hand-encoded ld instructions add that |
| // offset to the table base. Entry order and size are therefore fixed. |
| // NOTE(review): the "Log multiplier" label is kept as found; in the code |
| // shown here the table is only read by coshAsm. Confirm the intended name. |
| DATA coshtab<>+0(SB)/8, $0.442737824274138381E-01 |
| DATA coshtab<>+8(SB)/8, $0.263602189790660309E-01 |
| DATA coshtab<>+16(SB)/8, $0.122565642281703586E-01 |
| DATA coshtab<>+24(SB)/8, $0.143757052860721398E-02 |
| DATA coshtab<>+32(SB)/8, $-.651375034121276075E-02 |
| DATA coshtab<>+40(SB)/8, $-.119317678849450159E-01 |
| DATA coshtab<>+48(SB)/8, $-.150868749549871069E-01 |
| DATA coshtab<>+56(SB)/8, $-.161992609578469234E-01 |
| DATA coshtab<>+64(SB)/8, $-.154492360403337917E-01 |
| DATA coshtab<>+72(SB)/8, $-.129850717389178721E-01 |
| DATA coshtab<>+80(SB)/8, $-.892902649276657891E-02 |
| DATA coshtab<>+88(SB)/8, $-.338202636596794887E-02 |
| DATA coshtab<>+96(SB)/8, $0.357266307045684762E-02 |
| DATA coshtab<>+104(SB)/8, $0.118665304327406698E-01 |
| DATA coshtab<>+112(SB)/8, $0.214434994118118914E-01 |
| DATA coshtab<>+120(SB)/8, $0.322580645161290314E-01 |
| GLOBL coshtab<>+0(SB), RODATA, $128 |
| |
| // Minimax polynomial approximations |
| // Coefficients coshe2..coshe6, one 8-byte read-only symbol each (coshe1 |
| // is defined with the constants near the top of the file). Numerically |
| // they are close to 1/2, 1/6, 1/24, 1/120 and 1/720. coshAsm loads them |
| // one at a time and folds them in with fused multiply-add instructions. |
| DATA coshe2<>+0(SB)/8, $0.500000000000004237e+00 |
| GLOBL coshe2<>+0(SB), RODATA, $8 |
| DATA coshe3<>+0(SB)/8, $0.166666666630345592e+00 |
| GLOBL coshe3<>+0(SB), RODATA, $8 |
| DATA coshe4<>+0(SB)/8, $0.416666664838056960e-01 |
| GLOBL coshe4<>+0(SB), RODATA, $8 |
| DATA coshe5<>+0(SB)/8, $0.833349307718286047e-02 |
| GLOBL coshe5<>+0(SB), RODATA, $8 |
| DATA coshe6<>+0(SB)/8, $0.138926439368309441e-02 |
| GLOBL coshe6<>+0(SB), RODATA, $8 |
| |
| // Cosh returns the hyperbolic cosine of x. |
| // |
| // Special cases are: |
| // Cosh(±0) = 1 |
| // Cosh(±Inf) = +Inf |
| // Cosh(NaN) = NaN |
| // The algorithm used is minimax polynomial approximation |
| // with coefficients determined with a Remez exchange algorithm. |
| // |
| // Frame: $0-16, no locals. The argument is read from x+0(FP) and the |
| // result is written to ret+8(FP), 8 bytes each. |
| // |
| // Control flow by label: |
| // entry, L19, L2: F4 = abs(x); compare F4 with 704.0. |
| // L20: abs(x) < 704, main evaluation; two scaled terms are added. |
| // L14: abs(x) >= 704 or unordered. NaN goes to L1, abs(x) >= 800 goes |
| // to L21, otherwise a single scaled term is evaluated. |
| // L22: negative-x variant of the L14 evaluation; rejoins at L17. |
| // L17: rebuild the scale factor, multiply by 2^256, return. |
| // L1: return x unchanged. |
| // L21: return +Inf. |
| // |
| // Integer registers written: R1, R2, R3, R4, R5, R9, R12. |
| // Floating-point/vector registers written: 0 through 7. |
| |
| TEXT ·coshAsm(SB),NOSPLIT,$0-16 |
| // F0 = x; R9 = base address of the coshrodataL23 constant block. |
| FMOVD x+0(FP), F0 |
| MOVD $coshrodataL23<>+0(SB), R9 |
| // Load-and-test sets the condition code from x for BLTU below. |
| LTDBR F0, F0 |
| // R2 (and R3 on the L20 path) are RISBGN insertion targets: only their |
| // top 16 bits get replaced later, so the zero low 48 bits of this |
| // constant become the rest of the assembled float64 bit pattern. |
| MOVD $0x4086000000000000, R2 |
| MOVD $0x4086000000000000, R3 |
| // Negative or unordered x: negate into F4 at L19. Otherwise F4 = x. |
| BLTU L19 |
| FMOVD F0, F4 |
| L2: |
| // Hand-encoded cdb: compare F4 with the double at offset 24 from R9, |
| // which is coshrodataL23+24 = 704.0. |
| WORD $0xED409018 //cdb %f4,.L24-.L23(%r9) |
| BYTE $0x00 |
| BYTE $0x19 |
| // abs(x) >= 704, or unordered: handled at L14. |
| BGE L14 //jnl .L14 |
| BVS L14 |
| // Self-compare of F4: equal means F4 is not NaN, take the main path. |
| WFCEDBS V4, V4, V2 |
| BEQ L20 |
| L1: |
| // Return x unchanged (the NaN exit). |
| FMOVD F0, ret+8(FP) |
| RET |
| |
| L14: |
| // abs(x) >= 704, or the compare was unordered. |
| // A failed self-compare (NaN) returns x through L1. |
| WFCEDBS V4, V4, V2 |
| BVS L1 |
| // abs(x) >= coshxlim1 (800.0): the result is +Inf, produced at L21. |
| MOVD $coshxlim1<>+0(SB), R1 |
| FMOVD 0(R1), F2 |
| WFCHEDBS V4, V2, V2 |
| BEQ L21 |
| // 704 <= abs(x) < 800. Range reduction: x is scaled by |
| // coshrodataL23+16 (1/ln 2) and combined with coshxaddhy; the reduced |
| // argument is then formed with coshrodataL23+8 and +0. |
| // NOTE(review): the exact operand roles of the fused multiply ops are |
| // not restated here; check them against the assembler reference. |
| MOVD $coshxaddhy<>+0(SB), R1 |
| FMOVD coshrodataL23<>+16(SB), F5 |
| FMOVD 0(R1), F2 |
| WFMSDB V0, V5, V2, V5 |
| FMOVD coshrodataL23<>+8(SB), F3 |
| FADD F5, F2 |
| // Polynomial evaluation: coshe6..coshe1 are loaded through R1/R3 and |
| // folded in with fused multiply-adds. WFMDB below squares V3 into V1. |
| MOVD $coshe6<>+0(SB), R1 |
| WFMSDB V2, V3, V0, V3 |
| FMOVD 0(R1), F6 |
| WFMDB V3, V3, V1 |
| MOVD $coshe4<>+0(SB), R1 |
| FMOVD coshrodataL23<>+0(SB), F7 |
| WFMADB V2, V7, V3, V2 |
| FMOVD 0(R1), F3 |
| MOVD $coshe5<>+0(SB), R1 |
| WFMADB V1, V6, V3, V6 |
| FMOVD 0(R1), F7 |
| MOVD $coshe3<>+0(SB), R1 |
| FMOVD 0(R1), F3 |
| WFMADB V1, V7, V3, V7 |
| // F3 = -F2. |
| FNEG F2, F3 |
| // R1 = raw bits of F5, the value produced by the first WFMSDB above. |
| LGDR F5, R1 |
| MOVD $coshe2<>+0(SB), R3 |
| // Compare abs(x) (F4) with x (F0). Not-equal means x was negative; |
| // BVS L22 below acts on this condition code. The instructions in |
| // between are expected to leave it alone (RISBGN is the form of the |
| // rotate-and-insert instruction that does not set it). V0 is |
| // overwritten by the compare result and reloaded from coshtab later. |
| WFCEDBS V4, V0, V0 |
| FMOVD 0(R3), F5 |
| MOVD $coshe1<>+0(SB), R3 |
| WFMADB V1, V6, V5, V6 |
| FMOVD 0(R3), F5 |
| // Top 16 bits of R2 = low 16 bits of R1. |
| RISBGN $0, $15, $48, R1, R2 |
| WFMADB V1, V7, V5, V1 |
| BVS L22 |
| // Non-negative x. R4 = (R1 & 0xF) * 8, the byte offset into coshtab. |
| RISBGZ $57, $60, $3, R1, R4 |
| MOVD $coshtab<>+0(SB), R3 |
| WFMADB V3, V6, V1, V6 |
| // F0 = coshtab entry selected by R4. |
| WORD $0x68043000 //ld %f0,0(%r4,%r3) |
| FMSUB F0, F3, F2 |
| // R1 -= 4096. In the 16-bit field that RISBGN places at the top of a |
| // float64 this lowers the exponent by 256; the multiply by 2^256 at |
| // L17 compensates (presumably to keep intermediates in range). |
| WORD $0xA71AF000 //ahi %r1,-4096 |
| WFMADB V2, V6, V0, V6 |
| L17: |
| // F2 = float64 whose top 16 bits are the low 16 bits of R1 (the rest |
| // of R2 is zero). Combine it with F6, multiply by coshx4ff (2^256) and |
| // return the product. |
| RISBGN $0, $15, $48, R1, R2 |
| LDGR R2, F2 |
| FMADD F2, F6, F2 |
| MOVD $coshx4ff<>+0(SB), R1 |
| FMOVD 0(R1), F0 |
| FMUL F2, F0 |
| FMOVD F0, ret+8(FP) |
| RET |
| |
| L19: |
| // F4 = -x, which is abs(x) for negative x. |
| FNEG F0, F4 |
| BR L2 |
| L20: |
| // Main path, abs(x) < 704. The reduction and polynomial follow the |
| // same pattern as the L14 path, but two scaled terms are built (one |
| // from R1, one from its mirror 32702 - R1) and added at the end. |
| // NOTE(review): presumably the exp(x) and exp(-x) halves; confirm. |
| MOVD $coshxaddhy<>+0(SB), R1 |
| FMOVD coshrodataL23<>+16(SB), F3 |
| FMOVD 0(R1), F2 |
| WFMSDB V0, V3, V2, V3 |
| FMOVD coshrodataL23<>+8(SB), F4 |
| FADD F3, F2 |
| MOVD $coshe6<>+0(SB), R1 |
| FMSUB F4, F2, F0 |
| FMOVD 0(R1), F6 |
| WFMDB V0, V0, V1 |
| MOVD $coshe4<>+0(SB), R1 |
| FMOVD 0(R1), F4 |
| MOVD $coshe5<>+0(SB), R1 |
| FMOVD coshrodataL23<>+0(SB), F5 |
| WFMADB V1, V6, V4, V6 |
| FMADD F5, F2, F0 |
| FMOVD 0(R1), F2 |
| MOVD $coshe3<>+0(SB), R1 |
| FMOVD 0(R1), F4 |
| WFMADB V1, V2, V4, V2 |
| MOVD $coshe2<>+0(SB), R1 |
| FMOVD 0(R1), F5 |
| FNEG F0, F4 |
| WFMADB V1, V6, V5, V6 |
| MOVD $coshe1<>+0(SB), R1 |
| FMOVD 0(R1), F5 |
| WFMADB V1, V2, V5, V1 |
| // R1 = raw bits of F3, the value produced by the first WFMSDB above. |
| LGDR F3, R1 |
| MOVD $coshtab<>+0(SB), R5 |
| WFMADB V4, V6, V1, V3 |
| // R4 = (R1 & 0xF) * 8; the ld below loads that coshtab entry into F1. |
| RISBGZ $57, $60, $3, R1, R4 |
| WFMSDB V4, V6, V1, V6 |
| WORD $0x68145000 //ld %f1,0(%r4,%r5) |
| WFMSDB V4, V1, V0, V2 |
| // R4 = 32702 - R1 (32-bit subtract): the mirrored word. R12 is its |
| // coshtab byte offset and the second ld loads that entry into F2. |
| WORD $0xA7487FBE //lhi %r4,32702 |
| FMADD F3, F2, F1 |
| SUBW R1, R4 |
| RISBGZ $57, $60, $3, R4, R12 |
| WORD $0x682C5000 //ld %f2,0(%r12,%r5) |
| FMSUB F2, F4, F0 |
| // Insert the low 16 bits of R1 and of R4 into the top 16 bits of R2 |
| // and R3, then move both words to F2 and F0 as float64 bit patterns. |
| RISBGN $0, $15, $48, R1, R2 |
| WFMADB V0, V6, V2, V6 |
| RISBGN $0, $15, $48, R4, R3 |
| LDGR R2, F2 |
| LDGR R3, F0 |
| FMADD F2, F1, F2 |
| FMADD F0, F6, F0 |
| // Sum the two terms and return. |
| FADD F2, F0 |
| FMOVD F0, ret+8(FP) |
| RET |
| |
| L22: |
| // Negative x on the 704 <= abs(x) < 800 path. |
| // R3 = 32702 - R1 selects the mirrored coshtab entry. The second |
| // lhi/SUBW pair sets R1 = 28606 - R1, where 28606 = 32702 - 4096, so |
| // it applies the same -4096 bias as the ahi on the non-negative branch. |
| WORD $0xA7387FBE //lhi %r3,32702 |
| MOVD $coshtab<>+0(SB), R4 |
| SUBW R1, R3 |
| WFMSDB V3, V6, V1, V6 |
| RISBGZ $57, $60, $3, R3, R3 |
| WORD $0x68034000 //ld %f0,0(%r3,%r4) |
| FMSUB F0, F3, F2 |
| WORD $0xA7386FBE //lhi %r3,28606 |
| WFMADB V2, V6, V0, V6 |
| SUBW R1, R3, R1 |
| BR L17 |
| L21: |
| // Return +Inf (bit pattern stored in coshxinf). |
| MOVD $coshxinf<>+0(SB), R1 |
| FMOVD 0(R1), F0 |
| FMOVD F0, ret+8(FP) |
| RET |
| |