Lines Matching refs:s1
833 fnorm.s1 FR_norm_x = FR_Input_X // Normalize x
856 fnorm.s1 FR_norm_x = FR_Input_X // Normalize x
957 fma.s1 FR_N_float_signif = FR_Input_X, FR_inv_pi_2to63, FR_rshf_2to64
974 fma.s1 FR_rsq = FR_norm_x, FR_norm_x, f0 // rsq = x*x, in case |x| < pi/4
994 fcmp.lt.s1 p6, p7 = FR_abs_x, FR_Pi_by_4 // Test |x| < pi/4
999 fms.s1 FR_N_float = FR_N_float_signif, FR_2tom64, FR_rshf
1022 (p6) fma.s1 FR_r_cubed = FR_r, FR_rsq, f0 // r^3 if |x| < pi/4
1052 fnma.s1 FR_s = FR_N_float, FR_P_1, FR_Input_X // s = -N * P_1 + Arg
1057 fma.s1 FR_w = FR_N_float, FR_P_2, f0 // w = N * P_2
1063 fms.s1 FR_r = FR_s, f1, FR_w // r = s - w, assume |s| >= 2^-33
1069 fcmp.lt.s1 p7, p6 = FR_s, FR_Two_to_M33
1075 (p7) fcmp.gt.s1 p7, p6 = FR_s, FR_Neg_Two_to_M33 // p6 if |s| >= 2^-33, else p7
1081 fms.s1 FR_c = FR_s, f1, FR_r // c = s - r, for |s| >= 2^-33
1086 fma.s1 FR_rsq = FR_r, FR_r, f0 // rsq = r * r, for |s| >= 2^-33
1092 (p7) fma.s1 FR_w = FR_N_float, FR_P_3, f0
1099 frcpa.s1 FR_r_hi, p15 = f1, FR_r // r_hi = frcpa(r)
1104 (p6) fcmp.lt.unc.s1 p8, p13 = FR_r, FR_Two_to_M3 // If big s, test r with 2^-3
1110 (p7) fma.s1 FR_U_1 = FR_N_float, FR_P_2, FR_w
1120 (p8) fcmp.gt.s1 p8, p13 = FR_r, FR_Neg_Two_to_M3 // If big s, p8 if |r| < 2^-3
1126 fma.s1 FR_polyS = FR_rsq, FR_PP_8, FR_PP_7 // poly = rsq*PP_8+PP_7
1131 fma.s1 FR_polyC = FR_rsq, FR_QQ_8, FR_QQ_7 // poly = rsq*QQ_8+QQ_7
1137 (p7) fms.s1 FR_r = FR_s, f1, FR_U_1
1143 (p6) fma.s1 FR_r_cubed = FR_r, FR_rsq, f0 // rcubed = r * rsq
1162 (p6) fms.s1 FR_c = FR_c, f1, FR_w
1179 fms.s1 FR_U_2 = FR_N_float, FR_P_2, FR_U_1
1191 fma.s1 FR_polyC = f0, f1, FR_Neg_Two_to_M67
1202 fms.s1 FR_s = FR_s, f1, FR_r
1207 fma.s1 FR_rsq = FR_r, FR_r, f0
1213 fma.s1 FR_U_2 = FR_U_2, f1, FR_w
1224 fma.s1 FR_FirstC = f0, f1, f1
1230 fms.s1 FR_c = FR_s, f1, FR_U_1
1236 fma.s1 FR_r = FR_S_1, FR_r, f0
1248 fms.s1 FR_c = FR_c, f1, FR_U_2
1278 fma.s1 FR_polyS = FR_r, FR_rsq, FR_c
1350 fma.s1 FR_N_0 = FR_Input_X, FR_Inv_P_0, f0 // N_0 = Arg * Inv_P_0
1368 fcvt.fx.s1 FR_N_0_fix = FR_N_0 // N_0_fix = integer part of N_0
1380 fnma.s1 FR_ArgPrime = FR_N_0, FR_P_0, FR_Input_X // Arg'=-N_0*P_0+Arg
1385 fma.s1 FR_w = FR_N_0, FR_d_1, f0 // w = N_0 * d_1
1392 fma.s1 FR_N_float = FR_ArgPrime, FR_Inv_pi_by_2, f0 // N = A' * 2/pi
1398 fcvt.fx.s1 FR_N_fix = FR_N_float // N_fix is the integer part
1417 fnma.s1 FR_s = FR_N_float, FR_P_1, FR_ArgPrime // s = -N*P_1 + Arg'
1422 fnma.s1 FR_w = FR_N_float, FR_P_2, FR_w // w = -N*P_2 + w
1432 fcmp.lt.unc.s1 p9, p8 = FR_s, FR_Two_to_M14
1438 (p9) fcmp.gt.s1 p9, p8 = FR_s, FR_Neg_Two_to_M14 // p9 if |s| < 2^-14
1448 (p9) fma.s1 FR_V_hi = FR_N_float, FR_P_2, f0
1453 (p9) fma.s1 FR_U_hi = FR_N_0, FR_d_1, f0
1459 (p8) fma.s1 FR_r = FR_s, f1, FR_w
1464 (p9) fma.s1 FR_w = FR_N_float, FR_P_3, f0
1478 (p9) fms.s1 FR_A = FR_U_hi, f1, FR_V_hi
1483 (p9) fnma.s1 FR_V_lo = FR_N_float, FR_P_2, FR_V_hi
1494 (p9) fms.s1 FR_U_lo = FR_N_0, FR_d_1, FR_U_hi // For small s: U_lo=N_0*d_1-U_hi
1510 (p8) fms.s1 FR_c = FR_s, f1, FR_r // For big s: c = S - r
1522 (p8) fcmp.lt.unc.s1 p12, p13 = FR_r, FR_Two_to_M3
1528 (p12) fcmp.gt.s1 p12, p13 = FR_r, FR_Neg_Two_to_M3
1534 (p8) fma.s1 FR_c = FR_c, f1, FR_w
1539 (p9) fms.s1 FR_w = FR_N_0, FR_d_2, FR_w
1563 fcmp.ge.unc.s1 p6, p7 = FR_U_hiabs, FR_V_hiabs
1568 fma.s1 FR_t = FR_U_lo, f1, FR_V_lo // t = U_lo + V_lo
1574 (p6) fms.s1 FR_a = FR_U_hi, f1, FR_A
1579 (p7) fma.s1 FR_a = FR_V_hi, f1, FR_A
1586 fma.s1 FR_C_hi = FR_s, f1, FR_A // C_hi = s + A
1606 fma.s1 FR_t = FR_t, f1, FR_w // t = t + w
1611 (p6) fms.s1 FR_a = FR_a, f1, FR_V_hi
1622 fms.s1 FR_C_lo = FR_s, f1, FR_C_hi
1627 (p7) fms.s1 FR_a = FR_U_hi, f1, FR_a
1633 fma.s1 FR_C_lo = FR_C_lo, f1, FR_A // C_lo = (S - C_hi) + A
1638 fma.s1 FR_t = FR_t, f1, FR_a // t = t + a
1644 fma.s1 FR_r = FR_C_hi, f1, FR_C_lo
1650 fma.s1 FR_C_lo = FR_C_lo, f1, FR_t // C_lo = C_lo + t
1657 fma.s1 FR_rsq = FR_r, FR_r, f0
1662 fms.s1 FR_c = FR_C_hi, f1, FR_r
1668 fma.s1 FR_FirstS = f0, f1, FR_r
1673 fma.s1 FR_FirstC = f0, f1, f1
1679 fma.s1 FR_polyS = FR_rsq, FR_S_2, FR_S_1
1684 fma.s1 FR_polyC = FR_rsq, FR_C_2, FR_C_1
1690 fma.s1 FR_r_cubed = FR_rsq, FR_r, f0
1695 fma.s1 FR_c = FR_c, f1, FR_C_lo
1726 fma.s1 FR_polyS = FR_r_cubed, FR_polyS, FR_c
1731 fma.s1 FR_polyC = FR_rsq, FR_polyC, f0
1804 fma.s1 FR_rsq = FR_r, FR_r, f0 // rsq = r * r
1826 fma.s1 FR_r6 = FR_rsq, FR_rsq, f0 // r6 = rsq * rsq
1837 fnma.s1 FR_cC = FR_c, FR_r, f0 // c = -c * r
1854 fma.s1 FR_r7 = FR_r6, FR_r, f0 // r7 = r6 * r
1860 fma.s1 FR_poly_loS = FR_rsq, FR_S_5, FR_S_4 // poly_lo=rsq*S_5+S_4
1865 fma.s1 FR_poly_loC = FR_rsq, FR_C_5, FR_C_4 // poly_lo=rsq*C_5+C_4
1871 fma.s1 FR_poly_hiS = FR_rsq, FR_S_2, FR_S_1 // poly_hi=rsq*S_2+S_1
1876 fma.s1 FR_poly_hiC = FR_rsq, FR_C_2, FR_C_1 // poly_hi=rsq*C_2+C_1
1894 fma.s1 FR_r6 = FR_r6, FR_rsq, f0
1899 fma.s1 FR_r7 = FR_r7, FR_rsq, f0
1905 fma.s1 FR_poly_loS = FR_rsq, FR_poly_loS, FR_S_3 // p_lo=p_lo*rsq+S_3
1910 fma.s1 FR_poly_loC = FR_rsq, FR_poly_loC, FR_C_3 // p_lo=p_lo*rsq+C_3
1922 fma.s1 FR_poly_hiS = FR_poly_hiS, FR_rsq, f0 // p_hi=p_hi*rsq
1927 fma.s1 FR_poly_hiC = FR_poly_hiC, FR_rsq, f0 // p_hi=p_hi*rsq
1957 fma.s1 FR_polyS = FR_r7, FR_poly_loS, FR_cS // poly=Z*poly_lo+c
1962 fma.s1 FR_polyC = FR_r6, FR_poly_loC, FR_cC // poly=Z*poly_lo+c
1968 fma.s1 FR_poly_hiS = FR_r, FR_poly_hiS, f0 // p_hi=r*p_hi
1975 fma.s1 FR_polyS = FR_polyS, f1, FR_poly_hiS
1980 fma.s1 FR_polyC = FR_polyC, f1, FR_poly_hiC
2053 fma.s1 FR_rsq = FR_r, FR_r, f0 // rsq = r * r
2076 frcpa.s1 FR_r_hi, p6 = f1, FR_r // r_hi = frcpa(r)
2081 fma.s1 FR_polyS = FR_rsq, FR_PP_8, FR_PP_7 // poly = rsq*PP_8+PP_7
2086 fma.s1 FR_polyC = FR_rsq, FR_QQ_8, FR_QQ_7 // poly = rsq*QQ_8+QQ_7
2092 fma.s1 FR_r_cubed = FR_r, FR_rsq, f0 // rcubed = r * rsq
2103 frcpa.s1 FR_r_hi, p6 = f1, FR_r_hi // r_hi = frcpa(frcpa(r))
2108 fma.s1 FR_polyS = FR_rsq, FR_polyS, FR_PP_6 // poly = rsq*poly+PP_6
2113 fma.s1 FR_polyC = FR_rsq, FR_polyC, FR_QQ_6 // poly = rsq*poly+QQ_6
2119 fma.s1 FR_corrS = FR_C_1, FR_rsq, f0 // corr = C_1 * rsq
2124 fma.s1 FR_corrC = FR_S_1, FR_r_cubed, FR_r // corr = S_1 * r^3 + r
2130 fma.s1 FR_r_hi_sq = FR_r_hi, FR_r_hi, f0 // r_hi_sq = r_hi * r_hi
2135 fms.s1 FR_r_lo = FR_r, f1, FR_r_hi // r_lo = r - r_hi
2141 fma.s1 FR_polyS = FR_rsq, FR_polyS, FR_PP_5 // poly = rsq*poly+PP_5
2146 fma.s1 FR_polyC = FR_rsq, FR_polyC, FR_QQ_5 // poly = rsq*poly+QQ_5
2152 fma.s1 FR_corrS = FR_corrS, FR_c, FR_c // corr = corr * c + c
2157 fnma.s1 FR_corrC = FR_corrC, FR_c, f0 // corr = -corr * c
2163 fma.s1 FR_U_loS = FR_r, FR_r_hi, FR_r_hi_sq // U_lo = r*r_hi+r_hi_sq
2168 fma.s1 FR_U_loC = FR_r_hi, f1, FR_r // U_lo = r_hi + r
2174 fma.s1 FR_U_hiS = FR_r_hi, FR_r_hi_sq, f0 // U_hi = r_hi*r_hi_sq
2179 fma.s1 FR_U_hiC = FR_QQ_1, FR_r_hi_sq, f1 // U_hi = QQ_1*r_hi_sq+1
2185 fma.s1 FR_polyS = FR_rsq, FR_polyS, FR_PP_4 // poly = poly*rsq+PP_4
2190 fma.s1 FR_polyC = FR_rsq, FR_polyC, FR_QQ_4 // poly = poly*rsq+QQ_4
2196 fma.s1 FR_U_loS = FR_r, FR_r, FR_U_loS // U_lo = r * r + U_lo
2201 fma.s1 FR_U_loC = FR_r_lo, FR_U_loC, f0 // U_lo = r_lo * U_lo
2207 fma.s1 FR_U_hiS = FR_PP_1, FR_U_hiS, f0 // U_hi = PP_1 * U_hi
2213 fma.s1 FR_polyS = FR_rsq, FR_polyS, FR_PP_3 // poly = poly*rsq+PP_3
2218 fma.s1 FR_polyC = FR_rsq, FR_polyC, FR_QQ_3 // poly = poly*rsq+QQ_3
2224 fma.s1 FR_U_loS = FR_r_lo, FR_U_loS, f0 // U_lo = r_lo * U_lo
2229 fma.s1 FR_U_loC = FR_QQ_1,FR_U_loC, f0 // U_lo = QQ_1 * U_lo
2235 fma.s1 FR_U_hiS = FR_r, f1, FR_U_hiS // U_hi = r + U_hi
2241 fma.s1 FR_polyS = FR_rsq, FR_polyS, FR_PP_2 // poly = poly*rsq+PP_2
2246 fma.s1 FR_polyC = FR_rsq, FR_polyC, FR_QQ_2 // poly = poly*rsq+QQ_2
2252 fma.s1 FR_U_loS = FR_PP_1, FR_U_loS, f0 // U_lo = PP_1 * U_lo
2258 fma.s1 FR_polyS = FR_rsq, FR_polyS, FR_PP_1_lo // poly = poly*rsq+PP_1_lo
2263 fma.s1 FR_polyC = FR_rsq, FR_polyC, f0 // poly = poly*rsq
2295 fma.s1 FR_VS = FR_U_loS, f1, FR_corrS // V = U_lo + corr
2300 fma.s1 FR_VC = FR_U_loC, f1, FR_corrC // V = U_lo + corr
2313 fma.s1 FR_polyS = FR_r_cubed, FR_polyS, f0 // poly = poly*r^3
2318 fma.s1 FR_polyC = FR_rsq, FR_polyC, f0 // poly = poly*rsq
2325 fma.s1 FR_VS = FR_polyS, f1, FR_VS // V = poly + V
2330 fma.s1 FR_VC = FR_polyC, f1, FR_VC // V = poly + V
2506 fcmp.lt.unc.s1 p6, p0 = FR_r, FR_Two_to_M3
2512 (p6) fcmp.gt.unc.s1 p6, p0 = FR_r, FR_Neg_Two_to_M3