Lines Matching refs:fma
1261 fma.s1 FR_p_2 = f1, f1, f1 // 2.0
1328 fma.s1 FR_l_Q0 = f1,FR_l_Y0,f0 // Q0 = Y0
1366 (p15) fma.s1 FR_n_XS = FR_l_AbsX , f1, FR_n_XNS // xs = x - int(x)
1378 fma.s1 FR_l_E2 = FR_l_E0,FR_l_E0,FR_l_E0 // e2 = e+e^2
1383 fma.s1 FR_l_E1 = FR_l_E0,FR_l_E0,f0 // e1 = e^2
1400 fma.s1 FR_l_CXL = FR_l_AbsX, f1, FR_l_CXH // CXL = |X|+CXH
1412 (p15) fma.s1 FR_n_XS2 = FR_n_XS, FR_n_XS, f0 // xs^2 = xs*xs
1424 fma.s1 FR_l_Y1 = FR_l_Y0,FR_l_E2,FR_l_Y0 // y1 = y+y*e2
1429 fma.s1 FR_l_E3 = FR_l_E1,FR_l_E1,FR_l_E0 // e3 = e+e1^2
1454 (p15) fma.s1 FR_n_TT = FR_n_A2L, FR_n_XS2, f0 // T=A2L*x^2
1465 (p15) fma.s1 FR_n_A7 = FR_n_A8, FR_n_XS2, FR_n_A7 // poly tail
1470 (p15) fma.s1 FR_n_XS4 = FR_n_XS2, FR_n_XS2, f0 // xs^4 = xs^2*xs^2
1476 fma.s1 FR_l_Y2 = FR_l_Y1, FR_l_E3, FR_l_Y0 // y2 = y+y1*e3
1509 fma.s1 FR_l_CXL = FR_l_CXL, f1, FR_l_CL
1514 (p15) fma.s1 FR_n_TT = FR_n_A2H, FR_n_XS2L, FR_n_TT // T=A2H*x2L+T
1520 (p15) fma.s1 FR_n_A3 = FR_n_A4, FR_n_XS2, FR_n_A3 // poly tail
1525 (p15) fma.s1 FR_n_A5 = FR_n_A6, FR_n_XS2, FR_n_A5 // poly tail
1536 fma.s1 FR_l_Z = FR_l_Z,FR_l_Y2,FR_l_Q0 // x_hi = q+r*y2
1542 (p15) fma.s1 FR_n_A7 = FR_n_A9, FR_n_XS4, FR_n_A7 // poly tail
1547 (p15) fma.s1 FR_n_XS7 = FR_n_XS4, FR_n_XS2, f0 // = x^4*x^2
1558 (p15) fma.s1 FR_n_XS8 = FR_n_XS4, FR_n_XS4, f0 // xs^8 = xs^4*xs^4
1569 (p15) fma.s1 FR_n_TH = FR_n_A2H, FR_n_XS2, FR_n_TT // A2H*xs2+T
1586 fma.s1 FR_l_Z2 = FR_l_Z, FR_l_Z, f0 // Z^2
1591 (p15) fma.s1 FR_n_A3 = FR_n_A5, FR_n_XS4, FR_n_A3 // poly tail
1603 (p15) fma.s1 FR_n_XS7 = FR_n_XS7, FR_n_XS, f0 // x^7 construction
1614 (p15) fma.s1 FR_n_PolyH = FR_n_TH, f1, FR_n_A1H // PolyH=TH+A1H
1631 fma.s1 FR_l_B14 = FR_l_B16, FR_l_Z2, FR_l_B14// Bernoulli tail
1636 fma.s1 FR_l_Z4 = FR_l_Z2, FR_l_Z2, f0 // Z^4 = Z^2*Z^2
1642 fma.s1 FR_l_B2 = FR_l_B4, FR_l_Z2, FR_l_B2 // Bernoulli tail
1647 fma.s1 FR_l_B6 = FR_l_B8, FR_l_Z2, FR_l_B6 // Bernoulli tail
1653 fma.s1 FR_l_B10 = FR_l_B12, FR_l_Z2, FR_l_B10// Bernoulli tail
1658 (p15) fma.s1 FR_n_Tail = FR_n_A7, FR_n_XS8, FR_n_A3 // poly tail
1664 (p15) fma.s1 FR_n_TL = FR_n_TL, f1, FR_n_TT // TL = TL+T
1675 fma.s1 FR_l_poly_lo = FR_l_r, FR_l_Q_6, FR_l_Q_5 // Q_5+r*Q_6
1691 fma.s1 FR_l_poly = FR_l_r, FR_l_Q_2, FR_l_Q_1 //poly=r*Q2+Q1
1702 fma.s1 FR_l_G = FR_l_float_N, FR_l_log2_hi, FR_l_H // Tbl =
1709 fma.s1 FR_l_Y_lo = FR_l_float_N, FR_l_log2_lo, FR_l_h // Y_lo=
1715 fma.s1 FR_l_B14 = FR_l_B18, FR_l_Z4, FR_l_B14 // Bernoulli tail
1721 fma.s1 FR_l_B2 = FR_l_B6, FR_l_Z4, FR_l_B2 // Bernoulli tail
1726 fma.s1 FR_l_Z8 = FR_l_Z4, FR_l_Z4, f0 // Z^8 = Z^4*Z^4
1732 fma.s1 FR_l_poly_lo = FR_l_r, FR_l_poly_lo, FR_l_Q_4 // poly_lo =
1744 (p15) fma.s1 FR_n_PolyL = FR_n_PolyL, f1, FR_n_TH // polyL+TH
1749 (p15) fma.s1 FR_n_TT = FR_n_TL, f1, FR_n_A1L // TL+A1L
1761 fma.s1 FR_l_B10 = FR_l_B14, FR_l_Z4, FR_l_B10 // Bernoulli tail
1767 fma.s1 FR_l_poly_lo = FR_l_r, FR_l_poly_lo, FR_l_Q_3 // poly_lo =
1779 (p15) fma.s1 FR_n_PolyL = FR_n_PolyL, f1, FR_n_TT // polyL+TT
1790 fma.s1 FR_l_XYH = FR_l_logl_YHi, FR_l_AbsX_m_Half, f0 // XYH=
1797 fma.s1 FR_l_SS = FR_l_B10, FR_l_Z8, FR_l_B2 // Bernoulli tail
1808 fma.s1 FR_l_poly = FR_l_rsq, FR_l_poly_lo, FR_l_poly //poly=
1815 (p15) fma.s1 FR_n_TT = FR_n_PolyL, FR_n_XS2, f0 // T=polyL*xs^2
1833 fma.s1 FR_l_SSCXH = FR_l_SS, FR_l_Z, FR_l_CXH // SS*Z+CXH
1838 (p15) fma.s1 FR_l_SignedXYH = FR_l_XYH, FR_n_NegOne, f0 // XYH = -XYH
1854 fma.s1 FR_l_poly = FR_l_rsq, FR_l_poly, FR_l_r_cor // poly =
1861 (p15) fma.s1 FR_n_TT = FR_n_PolyH, FR_n_XS2L, FR_n_TT
1883 fma.s1 FR_e_expl_Input_AbsX = FR_l_XYH, f1, FR_l_SSCXH // HI EXP
1890 (p14) fma.s1 FR_e_expl_Input_X = FR_l_XYH, f1, FR_l_SSCXH // HI EXP
1907 (p15) fma.s1 FR_n_TH = FR_n_PolyH, FR_n_XS2, FR_n_TT // TH=
1930 fma.s1 FR_l_SSCXL = FR_l_SS, FR_l_Z, FR_l_SSCXL
1947 fma.s1 FR_l_XYL = FR_l_logl_YLo, FR_l_AbsX_m_Half, FR_l_XYL
1960 (p15) fma.s1 FR_n_Poly1H = FR_n_TH, f1, f1 // poly1H = TH+1
1972 fma.s1 FR_l_SSCXL = FR_l_SSCXL, f1, FR_l_CXL
1977 fma.s1 FR_e_expl_Input_Y = FR_e_expl_Input_Y, f1, FR_l_SSCXH
1983 fma.s1 FR_e_N_signif=FR_e_expl_Input_X,FR_e_INV_LN2_2TO63,FR_e_RSHF_2TO51
1995 (p15) fma.s1 FR_n_PolyH = FR_n_Poly1H, FR_n_XS, f0//sin(Pi*x) poly
2006 (p15) fma.s1 FR_n_TL = FR_n_TL, f1, FR_n_TT//sin(Pi*x) poly
2012 fma.s1 FR_l_Temp = FR_l_XYL, f1, FR_l_SSCXL // XYL+SS*CXL
2017 (p15) fma.s1 FR_e_expl_Input_Y = FR_e_expl_Input_Y, FR_n_NegOne, f0
2036 (p15) fma.s1 FR_n_Poly1L = FR_n_Poly1L, f1, FR_n_TH //sin(Pi*x) poly
2054 (p14) fma.s1 FR_e_expl_Input_Y = FR_e_expl_Input_Y, f1, FR_l_Temp
2073 (p15) fma.s1 FR_n_Poly1L = FR_n_Poly1L, f1, FR_n_TL //sin(Pi*x) poly
2081 fma.s1 FR_e_r = FR_e_r, f1, FR_e_expl_Input_Y
2099 (p15) fma.s1 FR_n_PolyL = FR_n_Poly1L, FR_n_XS, FR_n_PolyL
2130 (p15) fma.s1 FR_n_PolyL = FR_n_Tail, FR_n_XS7, FR_n_PolyL
2137 fma.s1 FR_e_poly = FR_e_r, FR_e_A3, FR_e_A2 // poly=r*A3+A2
2159 (p15) fma.s1 FR_n_TT = FR_n_PolyL, FR_l_AbsX, f0 //sin(Pi*x) poly
2165 fma.s1 FR_e_poly = FR_e_r, FR_e_poly, FR_e_A1
2172 fma.s1 FR_e_T_scale = FR_e_T, FR_e_scale, f0 // T_scale=T*scale
2177 fma.s1 FR_e_W = FR_e_W2, FR_e_W1_p1, FR_e_W1
2184 (p15) fma.s1 FR_n_SinxH = FR_n_PolyH, FR_l_AbsX, FR_n_TT
2197 fma.s1 FR_e_poly = FR_e_rsq, FR_e_poly, FR_e_r
2204 fma.s1 FR_e_Wp1_T_scale = FR_e_W, FR_e_T_scale, FR_e_T_scale
2210 fma.s1 FR_e_W_T_scale = FR_e_W, FR_e_T_scale, f0 // W*T*scale
2229 fma.s1 FR_e_result_lo = FR_e_Wp1_T_scale, FR_e_poly, FR_e_W_T_scale
2236 (p15) fma.s1 FR_n_SinxL = FR_n_SinxL, f1, FR_n_TT // sin low result
2242 (p15) fma.s1 FR_n_Q0 = f1,FR_n_Y0,f0 // q = y
2254 (p14) fma.s0 f8 = FR_e_Y_hi, FR_e_scale, FR_e_result_lo
2260 fma.s1 FR_e_expl_Output_X = FR_e_Y_hi, FR_e_scale, f0 // exp result
2265 fma.s1 FR_e_expl_Output_Y = FR_e_result_lo, f1, f0// exp lo result
2271 fma.s1 FR_n_E2 = FR_n_E0,FR_n_E0,FR_n_E0 // e2 = e+e^2
2276 fma.s1 FR_n_E1 = FR_n_E0,FR_n_E0,f0 // e1 = e^2
2282 fma.s1 FR_n_Y1 = FR_n_Y0,FR_n_E2,FR_n_Y0 // y1 = y+y*e2
2287 fma.s1 FR_n_E3 = FR_n_E1,FR_n_E1,FR_n_E0 // e3 = e+e1^2
2293 fma.s1 FR_n_Y2 = FR_n_Y1,FR_n_E3,FR_n_Y0 // y2 = y+y1*e3
2309 fma.s1 FR_n_RcpResH = FR_n_R0,FR_n_Y2,FR_n_Q0 // x = q+r*y2
2315 fma.s1 FR_n_Y3 = FR_n_Y2,FR_n_E4,FR_n_Y2 // y3 = y2+y2*e4
2333 fma.s1 FR_n_RcpResL = FR_n_R1,FR_n_Y3,f0 // x_lo = r1*y3
2338 fma.s1 FR_n_Temp = FR_n_RcpResH, FR_e_expl_Output_Y, f0
2345 fma.s1 FR_n_Temp = FR_n_RcpResL, FR_e_expl_Output_X, FR_n_Temp
2352 fma.s1 FR_n_ResH = FR_n_RcpResH, FR_e_expl_Output_X, FR_n_Temp
2365 (p12) fma.s1 FR_n_ResH = FR_n_ResH, FR_n_NegOne, f0 // Negate
2371 fma.s1 FR_n_ResL = FR_n_ResL, f1, FR_n_Temp
2379 (p13) fma.s0 f8 = FR_n_ResH, f1, FR_n_ResL // For odd
2489 fma.s1 FR_r_XS = FR_r_AbsX , f1, FR_r_XNS // xs = x - [x]
2501 fma.s1 FR_p_XN = FR_p_XN, f1, FR_p_0p5 // xn = xn+0.5
2525 fma.s1 FR_r_XS2 = FR_r_XS, FR_r_XS, f0 // xs2 = xs*xs
2560 fma.s1 FR_r_TH = FR_r_A2H, FR_r_XS2, f0 // sin for neg
2565 fma.s1 FR_r_TL = FR_r_A2L, FR_r_XS2, f0 // sin for neg
2577 fma.s1 FR_p_Temp5H = FR_p_A5H, FR_p_XR, f0 // A5H*r
2583 fma.s1 FR_p_XR2 = FR_p_XR, FR_p_XR, f0 // r^2 = r*r
2594 fma.s1 FR_p_Temp2H = FR_p_A2H, FR_p_XR, f0 // A2H*r
2606 fma.s1 FR_r_ResH = FR_r_TH, f1, FR_r_A1H // sin for neg
2612 fma.s1 FR_r_TL = FR_r_A2H, FR_r_XS2L, FR_r_TL // sin for neg
2624 fma.s1 FR_p_Poly5H = FR_p_Temp5H, f1, FR_p_A4H // A5H*r+A4H
2637 fma.s1 FR_p_Poly2H = FR_p_Temp2H, f1, FR_p_A1H // A2H*r+A1H
2644 fma.s1 FR_p_XR3 = FR_p_XR2, FR_p_XR, f0 // r^3 = r^2*r
2655 fma.s1 FR_p_A18 = FR_p_A19, FR_p_XR, FR_p_A18 // Poly tail
2660 fma.s1 FR_p_A14 = FR_p_A15, FR_p_XR, FR_p_A14 // Poly tail
2666 fma.s1 FR_p_XR4 = FR_p_XR2, FR_p_XR2, f0 // r^4 = r^2*r^2
2672 fma.s1 FR_p_Temp5L = FR_p_A5L, FR_p_XR, FR_p_Temp5L// Low part
2685 fma.s1 FR_p_Temp4H = FR_p_Poly5H, FR_p_XR, f0 // (A5H*r+A4H)*r
2690 fma.s1 FR_p_Temp2L = FR_p_A2L, FR_p_XR, FR_p_Temp2L // A2*r low
2701 fma.s1 FR_p_Temp1H = FR_p_Poly2H, FR_p_XR, f0 // High poly
2712 fma.s1 FR_p_A16 = FR_p_A17, FR_p_XR, FR_p_A16 // Poly tail
2723 fma.s1 FR_r_TL = FR_r_TL, f1, FR_r_TT // sin for neg
2729 fma.s1 FR_p_Temp5L = FR_p_Temp5L, f1, FR_p_A4L // Low poly
2734 fma.s1 FR_p_Poly5L = FR_p_Poly5L, f1, FR_p_Temp5H // Low poly
2745 fma.s1 FR_p_Poly4H = FR_p_Temp4H, f1, FR_p_A3H // Low poly
2751 fma.s1 FR_p_Temp2L = FR_p_Temp2L, f1, FR_p_A1L // High poly
2756 fma.s1 FR_p_Poly2L = FR_p_Poly2L, f1, FR_p_Temp2H // High poly
2767 fma.s1 FR_p_Poly1H = FR_p_Temp1H, f1, FR_p_A0H // High poly
2773 fma.s1 FR_p_A12 = FR_p_A13, FR_p_XR, FR_p_A12 // Poly tail
2778 fma.s1 FR_p_XR3L = FR_p_XR2L, FR_p_XR, FR_p_XR3L // x^3 low
2784 fma.s1 FR_p_Poly5L = FR_p_Poly5L, f1, FR_p_Temp5L // Low poly
2789 fma.s1 FR_p_A10 = FR_p_A11, FR_p_XR, FR_p_A10 // Poly tail
2800 fma.s1 FR_p_A6 = FR_p_A7, FR_p_XR, FR_p_A6 // Poly tail
2806 fma.s1 FR_p_A8 = FR_p_A9, FR_p_XR, FR_p_A8 // Poly tail
2811 fma.s1 FR_p_XR6 = FR_p_XR4, FR_p_XR2, f0 // Poly tail
2817 fma.s1 FR_p_Poly2L = FR_p_Poly2L, f1, FR_p_Temp2L // High poly
2828 fma.s1 FR_r_ResL = FR_r_ResL, f1, FR_r_TH // sin for neg
2833 fma.s1 FR_r_TT = FR_r_TL, f1, FR_r_A1L // sin for neg
2839 fma.s1 FR_p_Temp4L = FR_p_Poly5L,FR_p_XR,FR_p_Temp4L // Low poly
2844 fma.s1 FR_p_A18 = FR_p_A20, FR_p_XR2, FR_p_A18 // Poly tail
2850 fma.s1 FR_p_Poly4L = FR_p_Poly4L, f1, FR_p_Temp4H // Low poly
2855 fma.s1 FR_p_A14 = FR_p_A16, FR_p_XR2, FR_p_A14 // Poly tail
2861 fma.s1 FR_p_A6 = FR_p_A8, FR_p_XR2, FR_p_A6 // Poly tail
2866 fma.s1 FR_p_A10 = FR_p_A12, FR_p_XR2, FR_p_A10 // Poly tail
2872 fma.s1 FR_p_Temp1L = FR_p_Poly2L,FR_p_XR,FR_p_Temp1L //High poly
2877 fma.s1 FR_p_Poly1L = FR_p_Poly1L, f1, FR_p_Temp1H // High poly
2883 fma.s1 FR_r_ResL = FR_r_ResL, f1, FR_r_TT // sin for neg
2888 fma.s1 FR_r_TH = FR_r_ResH, FR_r_XS2, f0 // sin for neg
2894 fma.s1 FR_p_Temp4L = FR_p_Temp4L, f1, FR_p_A3L // Low poly
2899 fma.s1 FR_p_Poly3H = FR_p_Poly4H, FR_p_XR3, f0 // Low poly
2905 fma.s1 FR_p_A14 = FR_p_A18, FR_p_XR4, FR_p_A14 // Poly tail
2910 fma.s1 FR_p_XR8 = FR_p_XR4, FR_p_XR4, f0 // Poly tail
2916 fma.s1 FR_r_TL = FR_r_ResH, FR_r_XS2L, f0 // sin for neg
2922 fma.s1 FR_p_Temp1L = FR_p_Temp1L, f1, FR_p_A0L // High poly
2927 fma.s1 FR_p_A6 = FR_p_A10, FR_p_XR4, FR_p_A6 // Poly tail
2938 fma.s1 FR_r_Res3H = FR_r_TH, f1, f1 // sin for neg
2944 fma.s1 FR_p_Poly4L = FR_p_Poly4L, f1, FR_p_Temp4L // Low poly
2949 fma.s1 FR_p_Poly3L = FR_p_Poly4H, FR_p_XR3L, f0 // Low poly
2955 fma.s1 FR_p_Poly0H = FR_p_Poly3H,f1,FR_p_Poly1H //Low & High add
2960 fma.s1 FR_r_A7 = FR_r_A8, FR_r_XS2, FR_r_A7 // sin for neg
2966 fma.s1 FR_r_TL = FR_r_ResL, FR_r_XS2, FR_r_TL // sin for neg
2971 fma.s1 FR_r_XS4 = FR_r_XS2, FR_r_XS2, f0 // sin for neg
2977 fma.s1 FR_p_Poly1L = FR_p_Poly1L, f1, FR_p_Temp1L // High poly
2982 fma.s1 FR_p_PolyTail = FR_p_A14, FR_p_XR8, FR_p_A6 // Poly tail
2993 fma.s1 FR_r_ResH = FR_r_Res3H, FR_r_XS, f0 // sin for neg
3004 fma.s1 FR_p_Poly3L = FR_p_Poly4L,FR_p_XR3,FR_p_Poly3L //Low poly
3015 (p13) fma.s1 FR_p_OddPoly0H = FR_p_Poly0H, FR_p_AbsXM1, f0
3022 fma.s1 FR_r_TL = FR_r_TL, f1, FR_r_TT // sin for neg
3027 fma.s1 FR_r_A3 = FR_r_A4, FR_r_XS2, FR_r_A3 // sin for neg
3033 fma.s1 FR_p_Poly1L = FR_p_PolyTail,FR_p_XR6,FR_p_Poly1L//High
3038 fma.s1 FR_r_A5 = FR_r_A6, FR_r_XS2, FR_r_A5 // sin for neg
3044 fma.s1 FR_r_Res3L = FR_r_Res3L, f1, FR_r_TH // sin for neg
3055 fma.s1 FR_p_Poly3L = FR_p_Poly3L, f1, FR_p_Temp0L // Low poly
3060 fma.s1 FR_r_A7 = FR_r_A9, FR_r_XS4, FR_r_A7 // sin for neg
3066 fma.s1 FR_p_Poly0L = FR_p_Poly0L,f1,FR_p_Poly3H //Low & High add
3078 fma.s1 FR_r_A3 = FR_r_A5, FR_r_XS4, FR_r_A3 // sin for neg
3083 fma.s1 FR_r_XS7 = FR_r_XS4, FR_r_XS2, f0 // xs^6
3089 fma.s1 FR_r_Res3L = FR_r_Res3L, f1, FR_r_TL // sin for neg
3094 fma.s1 FR_r_XS8 = FR_r_XS4, FR_r_XS4, f0 // sin for neg
3100 fma.s1 FR_p_Temp0H = FR_p_Poly3L,f1,FR_p_Poly1L //Low & High add
3106 fma.s1 FR_r_XS7 = FR_r_XS7, FR_r_XS, f0 // xs^7
3112 fma.s1 FR_r_ResL = FR_r_Res3L, FR_r_XS, FR_r_ResL//sin for neg
3117 fma.s1 FR_r_Tail = FR_r_A7, FR_r_XS8, FR_r_A3 // sin tail res
3123 fma.s1 FR_p_Poly0L = FR_p_Poly0L,f1,FR_p_Temp0H //Low & High add
3130 fma.s1 FR_r_ResL = FR_r_Tail,FR_r_XS7,FR_r_ResL //sin for neg
3136 (p13) fma.s1 FR_p_OddPoly0L = FR_p_Poly0L, FR_p_AbsXM1, FR_p_OddPoly0L
3143 fma.s1 FR_r_TT = FR_r_ResL, FR_r_AbsX, f0 // X*sin
3150 (p12) fma.s0 f8 = FR_p_Poly0H, f1, FR_p_Poly0L // Even
3155 (p13) fma.s0 f8 = FR_p_OddPoly0H, f1, FR_p_OddPoly0L // Odd
3161 (p13) fma.s1 FR_p_Poly0H = FR_p_OddPoly0H, f1, f0
3167 (p13) fma.s1 FR_p_Poly0L = FR_p_OddPoly0L, f1, f0
3174 fma.s1 FR_r_Res1H = FR_r_ResH, FR_r_AbsX, FR_r_TT // X*sin
3186 fma.s1 FR_r_Res1L = FR_r_Res1L, f1, FR_r_TT // sin for neg
3191 fma.s1 FR_r_TL = FR_p_Poly0L, FR_r_Res1H, f0 // mult by sin
3197 fma.s1 FR_r_TL = FR_p_Poly0H,FR_r_Res1L,FR_r_TL//mult by sin
3203 fma.s1 FR_r_ResH = FR_p_Poly0H,FR_r_Res1H,FR_r_TL//mult by sin
3226 fma.s1 FR_r_ResL = FR_r_ResL, f1, FR_r_TL //Low result of mult
3232 fma.s1 FR_r_Q0 = f1,FR_r_Y0,f0 // q = a*y
3243 fma.s1 FR_r_E2 = FR_r_E0,FR_r_E0,FR_r_E0 // e2 = e+e^2
3248 fma.s1 FR_r_E1 = FR_r_E0,FR_r_E0,f0 // e1 = e^2
3254 fma.s1 FR_r_Y1 = FR_r_Y0,FR_r_E2,FR_r_Y0 // y1 = y+y*e2
3259 fma.s1 FR_r_E3 = FR_r_E1,FR_r_E1,FR_r_E0 // e3 = e+e1^2
3265 fma.s1 FR_r_Y2 = FR_r_Y1,FR_r_E3,FR_r_Y0 // y2 = y+y1*e3
3281 fma.s1 FR_r_ZH = FR_r_R0,FR_r_Y2,FR_r_Q0 // x = q+r*y2
3287 fma.s1 FR_r_Y3 = FR_r_Y2,FR_r_E4,FR_r_Y2 // y3 = y2+y2*e4
3303 (p12) fma.s1 FR_r_ZHN = FR_r_ZH,FR_r_NegOne, f0 // Negate for evens
3310 (p13) fma.s0 f8 = FR_r_R1,FR_r_Y3,FR_r_ZH // Final result
3326 fma.s1 FR_z_Q0 = f1,FR_z_Y0,f0 // q = a*y
3378 fma.s1 FR_z_E2 = FR_z_E0,FR_z_E0,FR_z_E0 // e2 = e+e^2
3383 fma.s1 FR_z_E1 = FR_z_E0,FR_z_E0,f0 // e1 = e^2
3403 fma.s1 FR_r_XS = FR_r_AbsX , f1, FR_r_XNS // xs = |x|-[x]
3422 fma.s1 FR_z_Y1 = FR_z_Y0,FR_z_E2,FR_z_Y0 // y1 = y+y*e2
3427 fma.s1 FR_z_E3 = FR_z_E1,FR_z_E1,FR_z_E0 // e3 = e+e1^2
3453 fma.s1 FR_r_XS2 = FR_r_XS, FR_r_XS, f0 // xs^2
3471 fma.s1 FR_z_Y2 = FR_z_Y1,FR_z_E3,FR_z_Y0 // y2 = y+y1*e3
3494 fma.s1 FR_r_TH = FR_r_A2H, FR_r_XS2, f0 // neg sin
3499 fma.s1 FR_r_TL = FR_r_A2L, FR_r_XS2, f0 // neg sin
3511 fma.s1 FR_p_Temp5H = FR_p_A5H, FR_p_XR, f0 // Low poly
3516 fma.s1 FR_p_XR2 = FR_p_XR, FR_p_XR, f0 // poly tail
3527 fma.s1 FR_p_Temp2H = FR_p_A2H, FR_p_XR, f0 // High poly
3538 fma.s1 FR_z_ZH = FR_z_R0,FR_z_Y2,FR_z_Q0 // 1/x = q+r*y2
3549 fma.s1 FR_r_ResH = FR_r_TH, f1, FR_r_A1H // neg sin
3555 fma.s1 FR_r_TL = FR_r_A2H, FR_r_XS2L, FR_r_TL // neg sin
3566 fma.s1 FR_p_Poly5H = FR_p_Temp5H, f1, FR_p_A4H // Low poly
3577 fma.s1 FR_p_Poly2H = FR_p_Temp2H, f1, FR_p_A1H // High poly
3583 fma.s1 FR_p_XR3 = FR_p_XR2, FR_p_XR, f0 // r^3
3594 fma.s1 FR_p_A18 = FR_p_A19, FR_p_XR, FR_p_A18 // poly tail
3599 fma.s1 FR_p_A14 = FR_p_A15, FR_p_XR, FR_p_A14 // poly tail
3605 fma.s1 FR_p_XR4 = FR_p_XR2, FR_p_XR2, f0 // poly tail
3610 fma.s1 FR_z_Y3 = FR_z_Y2,FR_z_E4,FR_z_Y2 // y3 = y2+y2*e4
3616 fma.s1 FR_p_Temp5L = FR_p_A5L, FR_p_XR, FR_p_Temp5L // Low poly
3627 fma.s1 FR_p_Temp4H = FR_p_Poly5H, FR_p_XR, f0 // Low poly
3632 fma.s1 FR_p_Temp2L = FR_p_A2L, FR_p_XR, FR_p_Temp2L // High poly
3643 fma.s1 FR_p_Temp1H = FR_p_Poly2H, FR_p_XR, f0 // High poly
3654 fma.s1 FR_p_A16 = FR_p_A17, FR_p_XR, FR_p_A16 //poly tail
3665 fma.s1 FR_r_TL = FR_r_TL, f1, FR_r_TT // neg sin
3671 fma.s1 FR_p_Temp5L = FR_p_Temp5L, f1, FR_p_A4L // Low poly
3676 fma.s1 FR_p_Poly5L = FR_p_Poly5L, f1, FR_p_Temp5H //Low poly
3687 fma.s1 FR_p_Poly4H = FR_p_Temp4H, f1, FR_p_A3H // Low poly
3693 fma.s1 FR_p_Temp2L = FR_p_Temp2L, f1, FR_p_A1L // High poly
3698 fma.s1 FR_p_Poly2L = FR_p_Poly2L, f1, FR_p_Temp2H // High poly
3709 fma.s1 FR_p_Poly1H = FR_p_Temp1H, f1, FR_p_A0H // High poly
3715 fma.s1 FR_p_A12 = FR_p_A13, FR_p_XR, FR_p_A12 // poly tail
3720 fma.s1 FR_p_XR3L = FR_p_XR2L, FR_p_XR, FR_p_XR3L // x^3 low
3726 fma.s1 FR_p_Poly5L = FR_p_Poly5L, f1, FR_p_Temp5L //Low poly
3731 fma.s1 FR_p_A10 = FR_p_A11, FR_p_XR, FR_p_A10 //poly tail
3742 fma.s1 FR_p_A6 = FR_p_A7, FR_p_XR, FR_p_A6 // poly tail
3748 fma.s1 FR_p_A8 = FR_p_A9, FR_p_XR, FR_p_A8 // poly tail
3753 fma.s1 FR_p_XR6 = FR_p_XR4, FR_p_XR2, f0 // r^6
3759 fma.s1 FR_p_Poly2L = FR_p_Poly2L, f1, FR_p_Temp2L // High poly
3770 fma.s1 FR_r_ResL = FR_r_ResL, f1, FR_r_TH // neg sin
3775 fma.s1 FR_r_TT = FR_r_TL, f1, FR_r_A1L // neg sin
3781 fma.s1 FR_p_Temp4L = FR_p_Poly5L,FR_p_XR,FR_p_Temp4L //Low poly
3786 fma.s1 FR_p_A18 = FR_p_A20, FR_p_XR2, FR_p_A18 // poly tail
3792 fma.s1 FR_p_Poly4L = FR_p_Poly4L, f1, FR_p_Temp4H // Low poly
3797 fma.s1 FR_p_A14 = FR_p_A16, FR_p_XR2, FR_p_A14 // poly tail
3803 fma.s1 FR_p_A6 = FR_p_A8, FR_p_XR2, FR_p_A6 // poly tail
3808 fma.s1 FR_p_A10 = FR_p_A12, FR_p_XR2, FR_p_A10 // poly tail
3814 fma.s1 FR_p_Temp1L = FR_p_Poly2L,FR_p_XR,FR_p_Temp1L //High poly
3819 fma.s1 FR_p_Poly1L = FR_p_Poly1L, f1, FR_p_Temp1H // High poly
3825 fma.s1 FR_r_ResL = FR_r_ResL, f1, FR_r_TT // neg sin
3830 fma.s1 FR_r_TH = FR_r_ResH, FR_r_XS2, f0 // neg sin
3836 fma.s1 FR_p_Temp4L = FR_p_Temp4L, f1, FR_p_A3L // Low poly
3841 fma.s1 FR_p_Poly3H = FR_p_Poly4H, FR_p_XR3, f0 // Low poly
3847 fma.s1 FR_p_A14 = FR_p_A18, FR_p_XR4, FR_p_A14 // poly tail
3852 fma.s1 FR_p_XR8 = FR_p_XR4, FR_p_XR4, f0 // r^8
3858 fma.s1 FR_r_TL = FR_r_ResH, FR_r_XS2L, f0 // neg sin
3869 fma.s1 FR_p_Temp1L = FR_p_Temp1L, f1, FR_p_A0L // High poly
3874 fma.s1 FR_p_A6 = FR_p_A10, FR_p_XR4, FR_p_A6 // poly tail
3885 fma.s1 FR_r_Res3H = FR_r_TH, f1, f1 // neg sin
3891 fma.s1 FR_p_Poly4L = FR_p_Poly4L, f1, FR_p_Temp4L // Low poly
3896 fma.s1 FR_p_Poly3L = FR_p_Poly4H, FR_p_XR3L, f0 // Low poly
3902 fma.s1 FR_p_Poly0H = FR_p_Poly3H, f1, FR_p_Poly1H // Result
3907 fma.s1 FR_r_A7 = FR_r_A8, FR_r_XS2, FR_r_A7 // neg sin
3913 fma.s1 FR_r_TL = FR_r_ResL, FR_r_XS2, FR_r_TL // neg sin
3918 fma.s1 FR_r_XS4 = FR_r_XS2, FR_r_XS2, f0 // xs^4
3924 fma.s1 FR_p_Poly1L = FR_p_Poly1L, f1, FR_p_Temp1L // High poly
3929 fma.s1 FR_p_PolyTail = FR_p_A14, FR_p_XR8, FR_p_A6 // poly tail
3940 fma.s1 FR_r_ResH = FR_r_Res3H, FR_r_XS, f0 // neg sin
3951 fma.s1 FR_p_Poly3L = FR_p_Poly4L,FR_p_XR3,FR_p_Poly3L //Low poly
3962 fma.s1 FR_z_ZL = FR_z_R1,FR_z_Y3, f0 // x_lo = r1*y3
3968 fma.s1 FR_r_TL = FR_r_TL, f1, FR_r_TT // neg sin
3973 fma.s1 FR_r_A3 = FR_r_A4, FR_r_XS2, FR_r_A3 // neg sin
3979 fma.s1 FR_p_Poly1L = FR_p_PolyTail,FR_p_XR6,FR_p_Poly1L // High
3984 fma.s1 FR_r_A5 = FR_r_A6, FR_r_XS2, FR_r_A5 // neg sin
3990 fma.s1 FR_r_Res3L = FR_r_Res3L, f1, FR_r_TH // neg sin
4001 fma.s1 FR_p_Poly3L = FR_p_Poly3L, f1, FR_p_Temp0L // Low poly
4006 fma.s1 FR_r_A7 = FR_r_A9, FR_r_XS4, FR_r_A7 // neg sin
4012 fma.s1 FR_p_Poly0L = FR_p_Poly0L, f1, FR_p_Poly3H // result
4018 (p14) fma.s1 f8 = FR_p_Poly0H, FR_z_ZH, f0 // z*poly
4023 fma.s1 FR_p_Temp1L = FR_p_Poly0H, FR_z_ZL, f0 // z*poly low
4029 fma.s1 FR_r_A3 = FR_r_A5, FR_r_XS4, FR_r_A3 // sin tail
4034 fma.s1 FR_r_XS7 = FR_r_XS4, FR_r_XS2, f0 // xs^6
4040 fma.s1 FR_r_Res3L = FR_r_Res3L, f1, FR_r_TL // sin low
4045 fma.s1 FR_r_XS8 = FR_r_XS4, FR_r_XS4, f0 // xs^8
4051 fma.s1 FR_p_Temp0H = FR_p_Poly3L, f1, FR_p_Poly1L // result
4063 fma.s1 FR_r_XS7 = FR_r_XS7, FR_r_XS, f0 // xs^7
4069 fma.s1 FR_r_ResL = FR_r_Res3L, FR_r_XS, FR_r_ResL // lo result
4074 fma.s1 FR_r_Tail = FR_r_A7, FR_r_XS8, FR_r_A3 // tail result
4080 fma.s1 FR_p_Poly0L = FR_p_Poly0L, f1, FR_p_Temp0H // lo result
4086 fma.s1 FR_r_ResL = FR_r_Tail, FR_r_XS7, FR_r_ResL // lo result
4092 (p14) fma.s1 FR_p_Temp1L = FR_p_Poly0L,FR_z_ZH,FR_p_Temp1L //hi result
4098 fma.s1 FR_r_TT = FR_r_ResL, f1, f0 // for low result
4105 (p14) fma.s1 FR_p_Temp1L = FR_p_Temp1L, f1, FR_p_Temp1H // for lo res
4111 fma.s1 FR_r_Res1H = FR_r_ResH, f1, FR_r_TT // hi res
4117 (p14) fma.s0 f8 = f8, f1, FR_p_Temp1L // Final result
4129 fma.s1 FR_r_Res1L = FR_r_Res1L, f1, FR_r_TT // Low sin result
4134 fma.s1 FR_r_TL = FR_p_Poly0L,FR_r_Res1H,f0 //Low sin result
4140 fma.s1 FR_r_TL = FR_p_Poly0H, FR_r_Res1L, FR_r_TL //Low sin
4146 fma.s1 FR_r_ResH = FR_p_Poly0H, FR_r_Res1H, FR_r_TL //High sin
4169 fma.s1 FR_r_ResL = FR_r_ResL, f1, FR_r_TL // low sin
4175 fma.s1 FR_r_Q0 = f1,FR_r_Y0,f0 // q = a*y
4186 fma.s1 FR_r_E2 = FR_r_E0,FR_r_E0,FR_r_E0 // e2 = e+e^2
4191 fma.s1 FR_r_E1 = FR_r_E0,FR_r_E0,f0 // e1 = e^2
4197 fma.s1 FR_r_Y1 = FR_r_Y0,FR_r_E2,FR_r_Y0 // y1 = y+y*e2
4202 fma.s1 FR_r_E3 = FR_r_E1,FR_r_E1,FR_r_E0 // e3 = e+e1^2
4208 fma.s1 FR_r_Y2 = FR_r_Y1,FR_r_E3,FR_r_Y0 // y2 = y+y1*e3
4224 fma.s1 FR_r_ZH = FR_r_R0,FR_r_Y2,FR_r_Q0 // x = q+r*y2
4230 fma.s1 FR_r_Y3 = FR_r_Y2,FR_r_E4,FR_r_Y2 // y3 = y2+y2*e4
4246 fma.s1 FR_r_ZHN = FR_r_ZH,FR_r_NegOne, f0 // Negate
4309 (p6) fma.s0 f8 = f8,f1,f8 // res = x + x
4372 (p14) fma.s0 f8 = f9,f9,f0 // Set I,O and +INF result
4422 (p7) fma.s0 f8 = f9,f9,f9 // for positives