| // Copyright 2017 The Go Authors. All rights reserved. |
| // Use of this source code is governed by a BSD-style |
| // license that can be found in the LICENSE file. |
| |
| #include "textflag.h" |
| |
| // Minimax polynomial coefficients and other constants |
| DATA ·asinhrodataL18<> + 0(SB)/8, $0.749999999977387502E-01 |
| DATA ·asinhrodataL18<> + 8(SB)/8, $-.166666666666657082E+00 |
| DATA ·asinhrodataL18<> + 16(SB)/8, $0.303819368237360639E-01 |
| DATA ·asinhrodataL18<> + 24(SB)/8, $-.446428569571752982E-01 |
| DATA ·asinhrodataL18<> + 32(SB)/8, $0.173500047922695924E-01 |
| DATA ·asinhrodataL18<> + 40(SB)/8, $-.223719767210027185E-01 |
| DATA ·asinhrodataL18<> + 48(SB)/8, $0.113655037946822130E-01 |
| DATA ·asinhrodataL18<> + 56(SB)/8, $0.579747490622448943E-02 |
| DATA ·asinhrodataL18<> + 64(SB)/8, $-.139372433914359122E-01 |
| DATA ·asinhrodataL18<> + 72(SB)/8, $-.218674325255800840E-02 |
| DATA ·asinhrodataL18<> + 80(SB)/8, $-.891074277756961157E-02 |
| DATA ·asinhrodataL18<> + 88(SB)/8, $.41375273347623353626 |
| DATA ·asinhrodataL18<> + 96(SB)/8, $.51487302528619766235E+04 |
| DATA ·asinhrodataL18<> + 104(SB)/8, $-1.67526912689208984375 |
| DATA ·asinhrodataL18<> + 112(SB)/8, $0.181818181818181826E+00 |
| DATA ·asinhrodataL18<> + 120(SB)/8, $-.165289256198351540E-01 |
| DATA ·asinhrodataL18<> + 128(SB)/8, $0.200350613573012186E-02 |
| DATA ·asinhrodataL18<> + 136(SB)/8, $-.273205381970859341E-03 |
| DATA ·asinhrodataL18<> + 144(SB)/8, $0.397389654305194527E-04 |
| DATA ·asinhrodataL18<> + 152(SB)/8, $0.938370938292558173E-06 |
| DATA ·asinhrodataL18<> + 160(SB)/8, $0.212881813645679599E-07 |
| DATA ·asinhrodataL18<> + 168(SB)/8, $-.602107458843052029E-05 |
| DATA ·asinhrodataL18<> + 176(SB)/8, $-.148682720127920854E-06 |
| DATA ·asinhrodataL18<> + 184(SB)/8, $-5.5 |
| DATA ·asinhrodataL18<> + 192(SB)/8, $1.0 |
| DATA ·asinhrodataL18<> + 200(SB)/8, $1.0E-20 |
| GLOBL ·asinhrodataL18<> + 0(SB), RODATA, $208 |
| |
| // Table of log correction terms |
| DATA ·asinhtab2080<> + 0(SB)/8, $0.585235384085551248E-01 |
| DATA ·asinhtab2080<> + 8(SB)/8, $0.412206153771168640E-01 |
| DATA ·asinhtab2080<> + 16(SB)/8, $0.273839003221648339E-01 |
| DATA ·asinhtab2080<> + 24(SB)/8, $0.166383778368856480E-01 |
| DATA ·asinhtab2080<> + 32(SB)/8, $0.866678223433169637E-02 |
| DATA ·asinhtab2080<> + 40(SB)/8, $0.319831684989627514E-02 |
| DATA ·asinhtab2080<> + 48(SB)/8, $0.0 |
| DATA ·asinhtab2080<> + 56(SB)/8, $-.113006378583725549E-02 |
| DATA ·asinhtab2080<> + 64(SB)/8, $-.367979419636602491E-03 |
| DATA ·asinhtab2080<> + 72(SB)/8, $0.213172484510484979E-02 |
| DATA ·asinhtab2080<> + 80(SB)/8, $0.623271047682013536E-02 |
| DATA ·asinhtab2080<> + 88(SB)/8, $0.118140812789696885E-01 |
| DATA ·asinhtab2080<> + 96(SB)/8, $0.187681358930914206E-01 |
| DATA ·asinhtab2080<> + 104(SB)/8, $0.269985148668178992E-01 |
| DATA ·asinhtab2080<> + 112(SB)/8, $0.364186619761331328E-01 |
| DATA ·asinhtab2080<> + 120(SB)/8, $0.469505379381388441E-01 |
| GLOBL ·asinhtab2080<> + 0(SB), RODATA, $128 |
| |
| // Asinh returns the inverse hyperbolic sine of the argument. |
| // |
| // Special cases are: |
| // Asinh(±0) = ±0 |
| // Asinh(±Inf) = ±Inf |
| // Asinh(NaN) = NaN |
| // The algorithm used is minimax polynomial approximation |
| // with coefficients determined with a Remez exchange algorithm. |
| |
| TEXT ·asinhAsm(SB), NOSPLIT, $0-16 |
| FMOVD x+0(FP), F0 |
| MOVD $·asinhrodataL18<>+0(SB), R9 |
| LGDR F0, R12 |
| WORD $0xC0293FDF //iilf %r2,1071644671 |
| BYTE $0xFF |
| BYTE $0xFF |
| SRAD $32, R12 |
| WORD $0xB917001C //llgtr %r1,%r12 |
| MOVW R1, R6 |
| MOVW R2, R7 |
| CMPBLE R6, R7, L2 |
| WORD $0xC0295FEF //iilf %r2,1609564159 |
| BYTE $0xFF |
| BYTE $0xFF |
| MOVW R2, R7 |
| CMPBLE R6, R7, L14 |
| L3: |
| WORD $0xC0297FEF //iilf %r2,2146435071 |
| BYTE $0xFF |
| BYTE $0xFF |
| CMPW R1, R2 |
| BGT L1 |
| LTDBR F0, F0 |
| FMOVD F0, F10 |
| BLTU L15 |
| L9: |
| FMOVD $0, F0 |
| WFADB V0, V10, V0 |
| WORD $0xC0398006 //iilf %r3,2147909631 |
| BYTE $0x7F |
| BYTE $0xFF |
| LGDR F0, R5 |
| SRAD $32, R5 |
| MOVH $0x0, R2 |
| SUBW R5, R3 |
| FMOVD $0, F8 |
| WORD $0xEC4320AF //risbg %r4,%r3,32,128+47,0 |
| BYTE $0x00 |
| BYTE $0x55 |
| BYTE $0x18 //lr %r1,%r4 |
| BYTE $0x14 |
| WORD $0xEC24001F //risbgn %r2,%r4,64-64+0,64-64+0+32-1,64-0-32 |
| BYTE $0x20 |
| BYTE $0x59 |
| SUBW $0x100000, R1 |
| SRAW $8, R1, R1 |
| ORW $0x45000000, R1 |
| BR L6 |
| L2: |
| MOVD $0x30000000, R2 |
| CMPW R1, R2 |
| BGT L16 |
| FMOVD 200(R9), F2 |
| FMADD F2, F0, F0 |
| L1: |
| FMOVD F0, ret+8(FP) |
| RET |
| L14: |
| LTDBR F0, F0 |
| BLTU L17 |
| FMOVD F0, F10 |
| L4: |
| FMOVD 192(R9), F2 |
| WFMADB V0, V0, V2, V0 |
| LTDBR F0, F0 |
| FSQRT F0, F8 |
| L5: |
| WFADB V8, V10, V0 |
| WORD $0xC0398006 //iilf %r3,2147909631 |
| BYTE $0x7F |
| BYTE $0xFF |
| LGDR F0, R5 |
| SRAD $32, R5 |
| MOVH $0x0, R2 |
| SUBW R5, R3 |
| WORD $0xEC4320AF //risbg %r4,%r3,32,128+47,0 |
| BYTE $0x00 |
| BYTE $0x55 |
| SRAW $8, R4, R1 |
| WORD $0xEC24001F //risbgn %r2,%r4,64-64+0,64-64+0+32-1,64-0-32 |
| BYTE $0x20 |
| BYTE $0x59 |
| ORW $0x45000000, R1 |
| L6: |
| LDGR R2, F2 |
| FMOVD 184(R9), F0 |
| WFMADB V8, V2, V0, V8 |
| FMOVD 176(R9), F4 |
| WFMADB V10, V2, V8, V2 |
| FMOVD 168(R9), F0 |
| FMOVD 160(R9), F6 |
| FMOVD 152(R9), F1 |
| WFMADB V2, V6, V4, V6 |
| WFMADB V2, V1, V0, V1 |
| WFMDB V2, V2, V4 |
| FMOVD 144(R9), F0 |
| WFMADB V6, V4, V1, V6 |
| FMOVD 136(R9), F1 |
| WORD $0xEC3339BC //risbg %r3,%r3,57,128+60,64-13 |
| BYTE $0x33 |
| BYTE $0x55 |
| WFMADB V2, V0, V1, V0 |
| FMOVD 128(R9), F1 |
| WFMADB V4, V6, V0, V6 |
| FMOVD 120(R9), F0 |
| WFMADB V2, V1, V0, V1 |
| VLVGF $0, R1, V0 |
| WFMADB V4, V6, V1, V4 |
| LDEBR F0, F0 |
| FMOVD 112(R9), F6 |
| WFMADB V2, V4, V6, V4 |
| MOVD $·asinhtab2080<>+0(SB), R1 |
| FMOVD 104(R9), F1 |
| WORD $0x68331000 //ld %f3,0(%r3,%r1) |
| FMOVD 96(R9), F6 |
| WFMADB V2, V4, V3, V2 |
| WFMADB V0, V1, V6, V0 |
| FMOVD 88(R9), F4 |
| WFMADB V0, V4, V2, V0 |
| MOVD R12, R6 |
| CMPBGT R6, $0, L1 |
| |
| WORD $0xB3130000 //lcdbr %f0,%f0 |
| FMOVD F0, ret+8(FP) |
| RET |
| L16: |
| WFMDB V0, V0, V1 |
| FMOVD 80(R9), F6 |
| WFMDB V1, V1, V4 |
| FMOVD 72(R9), F2 |
| WFMADB V4, V2, V6, V2 |
| FMOVD 64(R9), F3 |
| FMOVD 56(R9), F6 |
| WFMADB V4, V2, V3, V2 |
| FMOVD 48(R9), F3 |
| WFMADB V4, V6, V3, V6 |
| FMOVD 40(R9), F5 |
| FMOVD 32(R9), F3 |
| WFMADB V4, V2, V5, V2 |
| WFMADB V4, V6, V3, V6 |
| FMOVD 24(R9), F5 |
| FMOVD 16(R9), F3 |
| WFMADB V4, V2, V5, V2 |
| WFMADB V4, V6, V3, V6 |
| FMOVD 8(R9), F5 |
| FMOVD 0(R9), F3 |
| WFMADB V4, V2, V5, V2 |
| WFMADB V4, V6, V3, V4 |
| WFMDB V0, V1, V6 |
| WFMADB V1, V4, V2, V4 |
| FMADD F4, F6, F0 |
| FMOVD F0, ret+8(FP) |
| RET |
| L17: |
| WORD $0xB31300A0 //lcdbr %f10,%f0 |
| BR L4 |
| L15: |
| WORD $0xB31300A0 //lcdbr %f10,%f0 |
| BR L9 |