// Copyright 2017 The Go Authors. All rights reserved.
// Use of this source code is governed by a BSD-style
// license that can be found in the LICENSE file.

#include "textflag.h"

// Minimax polynomial coefficients and other constants
DATA ·atanhrodataL10<> + 0(SB)/8, $.41375273347623353626
DATA ·atanhrodataL10<> + 8(SB)/8, $.51487302528619766235E+04
DATA ·atanhrodataL10<> + 16(SB)/8, $-1.67526912689208984375
DATA ·atanhrodataL10<> + 24(SB)/8, $0.181818181818181826E+00
DATA ·atanhrodataL10<> + 32(SB)/8, $-.165289256198351540E-01
DATA ·atanhrodataL10<> + 40(SB)/8, $0.200350613573012186E-02
DATA ·atanhrodataL10<> + 48(SB)/8, $0.397389654305194527E-04
DATA ·atanhrodataL10<> + 56(SB)/8, $-.273205381970859341E-03
DATA ·atanhrodataL10<> + 64(SB)/8, $0.938370938292558173E-06
DATA ·atanhrodataL10<> + 72(SB)/8, $-.148682720127920854E-06
DATA ·atanhrodataL10<> + 80(SB)/8, $ 0.212881813645679599E-07
DATA ·atanhrodataL10<> + 88(SB)/8, $-.602107458843052029E-05
DATA ·atanhrodataL10<> + 96(SB)/8, $-5.5
DATA ·atanhrodataL10<> + 104(SB)/8, $-0.5
DATA ·atanhrodataL10<> + 112(SB)/8, $0.0
DATA ·atanhrodataL10<> + 120(SB)/8, $0x7ff8000000000000      //Nan
DATA ·atanhrodataL10<> + 128(SB)/8, $-1.0
DATA ·atanhrodataL10<> + 136(SB)/8, $1.0
DATA ·atanhrodataL10<> + 144(SB)/8, $1.0E-20
GLOBL ·atanhrodataL10<> + 0(SB), RODATA, $152

// Table of log correction terms
DATA ·atanhtab2076<> + 0(SB)/8, $0.585235384085551248E-01
DATA ·atanhtab2076<> + 8(SB)/8, $0.412206153771168640E-01
DATA ·atanhtab2076<> + 16(SB)/8, $0.273839003221648339E-01
DATA ·atanhtab2076<> + 24(SB)/8, $0.166383778368856480E-01
DATA ·atanhtab2076<> + 32(SB)/8, $0.866678223433169637E-02
DATA ·atanhtab2076<> + 40(SB)/8, $0.319831684989627514E-02
DATA ·atanhtab2076<> + 48(SB)/8, $0.000000000000000000E+00
DATA ·atanhtab2076<> + 56(SB)/8, $-.113006378583725549E-02
DATA ·atanhtab2076<> + 64(SB)/8, $-.367979419636602491E-03
DATA ·atanhtab2076<> + 72(SB)/8, $0.213172484510484979E-02
DATA ·atanhtab2076<> + 80(SB)/8, $0.623271047682013536E-02
DATA ·atanhtab2076<> + 88(SB)/8, $0.118140812789696885E-01
DATA ·atanhtab2076<> + 96(SB)/8, $0.187681358930914206E-01
DATA ·atanhtab2076<> + 104(SB)/8, $0.269985148668178992E-01
DATA ·atanhtab2076<> + 112(SB)/8, $0.364186619761331328E-01
DATA ·atanhtab2076<> + 120(SB)/8, $0.469505379381388441E-01
GLOBL ·atanhtab2076<> + 0(SB), RODATA, $128

// Table of +/- .5
DATA ·atanhtabh2075<> + 0(SB)/8, $0.5
DATA ·atanhtabh2075<> + 8(SB)/8, $-.5
GLOBL ·atanhtabh2075<> + 0(SB), RODATA, $16

// Atanh returns the inverse hyperbolic tangent of the argument.
//
// Special cases are:
//      Atanh(1) = +Inf
//      Atanh(±0) = ±0
//      Atanh(-1) = -Inf
//      Atanh(x) = NaN if x < -1 or x > 1
//      Atanh(NaN) = NaN
// The algorithm used is minimax polynomial approximation
// with coefficients determined with a Remez exchange algorithm.

TEXT    ·atanhAsm(SB), NOSPLIT, $0-16
    FMOVD   x+0(FP), F0
    MOVD    $·atanhrodataL10<>+0(SB), R5
    LGDR    F0, R1
    WORD    $0xC0393FEF //iilf  %r3,1072693247
    BYTE    $0xFF
    BYTE    $0xFF
    SRAD    $32, R1
    WORD    $0xB9170021 //llgtr %r2,%r1
    MOVW    R2, R6
    MOVW    R3, R7
    CMPBGT  R6, R7, L2
    WORD    $0xC0392FFF //iilf  %r3,805306367
    BYTE    $0xFF
    BYTE    $0xFF
    MOVW    R2, R6
    MOVW    R3, R7
    CMPBGT  R6, R7, L9
L3:
    FMOVD   144(R5), F2
    FMADD   F2, F0, F0
L1:
    FMOVD   F0, ret+8(FP)
    RET

L2:
    WORD    $0xED005088 //cdb   %f0,.L12-.L10(%r5)
    BYTE    $0x00
    BYTE    $0x19
    BEQ L5
    WORD    $0xED005080 //cdb   %f0,.L13-.L10(%r5)
    BYTE    $0x00
    BYTE    $0x19
    BEQ L5
    WFCEDBS V0, V0, V2
    BVS L1
    FMOVD   120(R5), F0
    BR  L1
L5:
    WORD    $0xED005070 //ddb   %f0,.L15-.L10(%r5)
    BYTE    $0x00
    BYTE    $0x1D
    FMOVD   F0, ret+8(FP)
    RET

L9:
    FMOVD   F0, F2
    MOVD    $·atanhtabh2075<>+0(SB), R2
    SRW $31, R1, R1
    FMOVD   104(R5), F4
    MOVW    R1, R1
    SLD $3, R1, R1
    WORD    $0x68012000 //ld    %f0,0(%r1,%r2)
    WFMADB  V2, V4, V0, V4
    VLEG    $0, 96(R5), V16
    FDIV    F4, F2
    WORD    $0xC0298006 //iilf  %r2,2147909631
    BYTE    $0x7F
    BYTE    $0xFF
    FMOVD   88(R5), F6
    FMOVD   80(R5), F1
    FMOVD   72(R5), F7
    FMOVD   64(R5), F5
    FMOVD   F2, F4
    WORD    $0xED405088 //adb   %f4,.L12-.L10(%r5)
    BYTE    $0x00
    BYTE    $0x1A
    LGDR    F4, R4
    SRAD    $32, R4
    FMOVD   F4, F3
    WORD    $0xED305088 //sdb   %f3,.L12-.L10(%r5)
    BYTE    $0x00
    BYTE    $0x1B
    SUBW    R4, R2
    WFSDB   V3, V2, V3
    WORD    $0xEC1220AF //risbg %r1,%r2,32,128+47,0
    BYTE    $0x00
    BYTE    $0x55
    SLD $32, R1, R1
    LDGR    R1, F2
    WFMADB  V4, V2, V16, V4
    SRAW    $8, R2, R1
    WFMADB  V4, V5, V6, V5
    WFMDB   V4, V4, V6
    WFMADB  V4, V1, V7, V1
    WFMADB  V2, V3, V4, V2
    WFMADB  V1, V6, V5, V1
    FMOVD   56(R5), F3
    FMOVD   48(R5), F5
    WFMADB  V4, V5, V3, V4
    FMOVD   40(R5), F3
    FMADD   F1, F6, F4
    FMOVD   32(R5), F1
    FMADD   F3, F2, F1
    ANDW    $0xFFFFFF00, R1
    WFMADB  V6, V4, V1, V6
    FMOVD   24(R5), F3
    ORW $0x45000000, R1
    WFMADB  V2, V6, V3, V6
    VLVGF   $0, R1, V4
    LDEBR   F4, F4
    WORD    $0xEC2239BC //risbg %r2,%r2,57,128+60,64-13
    BYTE    $0x33
    BYTE    $0x55
    MOVD    $·atanhtab2076<>+0(SB), R1
    FMOVD   16(R5), F3
    WORD    $0x68521000 //ld    %f5,0(%r2,%r1)
    FMOVD   8(R5), F1
    WFMADB  V2, V6, V5, V2
    WFMADB  V4, V3, V1, V4
    FMOVD   0(R5), F6
    FMADD   F6, F4, F2
    FMUL    F2, F0
    FMOVD   F0, ret+8(FP)
    RET