mirror of
				https://sourceware.org/git/glibc.git
				synced 2025-10-24 13:33:08 +03:00 
			
		
		
		
	Various floating-point functions have code to force underflow exceptions if a tiny result was computed in a way that might not have resulted in such exceptions even though the result is inexact. This typically uses math_force_eval to ensure that the underflowing expression is evaluated, but sometimes uses volatile. This patch refactors such code to use three new macros math_check_force_underflow, math_check_force_underflow_nonneg and math_check_force_underflow_complex (which in turn use math_force_eval). In the limited number of cases not suited to a simple conversion to these macros, existing uses of volatile are changed to use math_force_eval instead. The converted code does not always execute exactly the same sequence of operations as the original code, but the overall effects should be the same. Tested for x86_64, x86, mips64 and powerpc. * sysdeps/generic/math_private.h (fabs_tg): New macro. (min_of_type): Likewise. (math_check_force_underflow): Likewise. (math_check_force_underflow_nonneg): Likewise. (math_check_force_underflow_complex): Likewise. * math/e_exp2l.c (__ieee754_exp2l): Use math_check_force_underflow_nonneg. * math/k_casinh.c (__kernel_casinh): Likewise. * math/k_casinhf.c (__kernel_casinhf): Likewise. * math/k_casinhl.c (__kernel_casinhl): Likewise. * math/s_catan.c (__catan): Use math_check_force_underflow_complex. * math/s_catanf.c (__catanf): Likewise. * math/s_catanh.c (__catanh): Likewise. * math/s_catanhf.c (__catanhf): Likewise. * math/s_catanhl.c (__catanhl): Likewise. * math/s_catanl.c (__catanl): Likewise. * math/s_ccosh.c (__ccosh): Likewise. * math/s_ccoshf.c (__ccoshf): Likewise. * math/s_ccoshl.c (__ccoshl): Likewise. * math/s_cexp.c (__cexp): Likewise. * math/s_cexpf.c (__cexpf): Likewise. * math/s_cexpl.c (__cexpl): Likewise. * math/s_clog.c (__clog): Use math_check_force_underflow_nonneg. * math/s_clog10.c (__clog10): Likewise. * math/s_clog10f.c (__clog10f): Likewise. * math/s_clog10l.c (__clog10l): Likewise. * math/s_clogf.c (__clogf): Likewise. * math/s_clogl.c (__clogl): Likewise. * math/s_csin.c (__csin): Use math_check_force_underflow_complex. * math/s_csinf.c (__csinf): Likewise. * math/s_csinh.c (__csinh): Likewise. * math/s_csinhf.c (__csinhf): Likewise. * math/s_csinhl.c (__csinhl): Likewise. * math/s_csinl.c (__csinl): Likewise. * math/s_csqrt.c (__csqrt): Use math_check_force_underflow. * math/s_csqrtf.c (__csqrtf): Likewise. * math/s_csqrtl.c (__csqrtl): Likewise. * math/s_ctan.c (__ctan): Use math_check_force_underflow_complex. * math/s_ctanf.c (__ctanf): Likewise. * math/s_ctanh.c (__ctanh): Likewise. * math/s_ctanhf.c (__ctanhf): Likewise. * math/s_ctanhl.c (__ctanhl): Likewise. * math/s_ctanl.c (__ctanl): Likewise. * stdlib/strtod_l.c (round_and_return): Use math_force_eval instead of volatile. * sysdeps/ieee754/dbl-64/e_asin.c (__ieee754_asin): Use math_check_force_underflow. * sysdeps/ieee754/dbl-64/e_atanh.c (__ieee754_atanh): Likewise. * sysdeps/ieee754/dbl-64/e_exp.c (__ieee754_exp): Do not use volatile when forcing underflow. * sysdeps/ieee754/dbl-64/e_exp2.c (__ieee754_exp2): Use math_check_force_underflow_nonneg. * sysdeps/ieee754/dbl-64/e_gamma_r.c (__ieee754_gamma_r): Likewise. * sysdeps/ieee754/dbl-64/e_j1.c (__ieee754_j1): Use math_check_force_underflow. * sysdeps/ieee754/dbl-64/e_jn.c (__ieee754_jn): Likewise. * sysdeps/ieee754/dbl-64/e_sinh.c (__ieee754_sinh): Likewise. * sysdeps/ieee754/dbl-64/s_asinh.c (__asinh): Likewise. * sysdeps/ieee754/dbl-64/s_atan.c (atan): Use math_check_force_underflow_nonneg. * sysdeps/ieee754/dbl-64/s_erf.c (__erf): Use math_check_force_underflow. * sysdeps/ieee754/dbl-64/s_expm1.c (__expm1): Likewise. * sysdeps/ieee754/dbl-64/s_fma.c (__fma): Use math_force_eval instead of volatile. * sysdeps/ieee754/dbl-64/s_log1p.c (__log1p): Use math_check_force_underflow. * sysdeps/ieee754/dbl-64/s_sin.c (__sin): Likewise. * sysdeps/ieee754/dbl-64/s_tan.c (tan): Use math_check_force_underflow_nonneg. * sysdeps/ieee754/dbl-64/s_tanh.c (__tanh): Use math_check_force_underflow. * sysdeps/ieee754/flt-32/e_asinf.c (__ieee754_asinf): Likewise. * sysdeps/ieee754/flt-32/e_atanhf.c (__ieee754_atanhf): Likewise. * sysdeps/ieee754/flt-32/e_exp2f.c (__ieee754_exp2f): Use math_check_force_underflow_nonneg. * sysdeps/ieee754/flt-32/e_gammaf_r.c (__ieee754_gammaf_r): Likewise. * sysdeps/ieee754/flt-32/e_j1f.c (__ieee754_j1f): Use math_check_force_underflow. * sysdeps/ieee754/flt-32/e_jnf.c (__ieee754_jnf): Likewise. * sysdeps/ieee754/flt-32/e_sinhf.c (__ieee754_sinhf): Likewise. * sysdeps/ieee754/flt-32/k_sinf.c (__kernel_sinf): Likewise. * sysdeps/ieee754/flt-32/k_tanf.c (__kernel_tanf): Likewise. * sysdeps/ieee754/flt-32/s_asinhf.c (__asinhf): Likewise. * sysdeps/ieee754/flt-32/s_atanf.c (__atanf): Likewise. * sysdeps/ieee754/flt-32/s_erff.c (__erff): Likewise. * sysdeps/ieee754/flt-32/s_expm1f.c (__expm1f): Likewise. * sysdeps/ieee754/flt-32/s_log1pf.c (__log1pf): Likewise. * sysdeps/ieee754/flt-32/s_tanhf.c (__tanhf): Likewise. * sysdeps/ieee754/ldbl-128/e_asinl.c (__ieee754_asinl): Likewise. * sysdeps/ieee754/ldbl-128/e_atanhl.c (__ieee754_atanhl): Likewise. * sysdeps/ieee754/ldbl-128/e_expl.c (__ieee754_expl): Use math_check_force_underflow_nonneg. * sysdeps/ieee754/ldbl-128/e_gammal_r.c (__ieee754_gammal_r): Likewise. * sysdeps/ieee754/ldbl-128/e_j1l.c (__ieee754_j1l): Use math_check_force_underflow. * sysdeps/ieee754/ldbl-128/e_jnl.c (__ieee754_jnl): Likewise. * sysdeps/ieee754/ldbl-128/e_sinhl.c (__ieee754_sinhl): Likewise. * sysdeps/ieee754/ldbl-128/k_sincosl.c (__kernel_sincosl): Likewise. * sysdeps/ieee754/ldbl-128/k_sinl.c (__kernel_sinl): Likewise. * sysdeps/ieee754/ldbl-128/k_tanl.c (__kernel_tanl): Likewise. * sysdeps/ieee754/ldbl-128/s_asinhl.c (__asinhl): Likewise. * sysdeps/ieee754/ldbl-128/s_atanl.c (__atanl): Likewise. * sysdeps/ieee754/ldbl-128/s_erfl.c (__erfl): Likewise. * sysdeps/ieee754/ldbl-128/s_expm1l.c (__expm1l): Likewise. * sysdeps/ieee754/ldbl-128/s_fmal.c (__fmal): Use math_force_eval instead of volatile. * sysdeps/ieee754/ldbl-128/s_log1pl.c (__log1pl): Use math_check_force_underflow. * sysdeps/ieee754/ldbl-128/s_tanhl.c (__tanhl): Likewise. * sysdeps/ieee754/ldbl-128ibm/e_asinl.c (__ieee754_asinl): Use math_check_force_underflow. * sysdeps/ieee754/ldbl-128ibm/e_atanhl.c (__ieee754_atanhl): Likewise. * sysdeps/ieee754/ldbl-128ibm/e_gammal_r.c (__ieee754_gammal_r): Use math_check_force_underflow_nonneg. * sysdeps/ieee754/ldbl-128ibm/e_jnl.c (__ieee754_jnl): Use math_check_force_underflow. * sysdeps/ieee754/ldbl-128ibm/e_sinhl.c (__ieee754_sinhl): Likewise. * sysdeps/ieee754/ldbl-128ibm/k_sincosl.c (__kernel_sincosl): Likewise. * sysdeps/ieee754/ldbl-128ibm/k_sinl.c (__kernel_sinl): Likewise. * sysdeps/ieee754/ldbl-128ibm/k_tanl.c (__kernel_tanl): Likewise. * sysdeps/ieee754/ldbl-128ibm/s_asinhl.c (__asinhl): Likewise. * sysdeps/ieee754/ldbl-128ibm/s_atanl.c (__atanl): Likewise. * sysdeps/ieee754/ldbl-128ibm/s_erfl.c (__erfl): Likewise. * sysdeps/ieee754/ldbl-128ibm/s_tanhl.c (__tanhl): Likewise. * sysdeps/ieee754/ldbl-96/e_asinl.c (__ieee754_asinl): Likewise. * sysdeps/ieee754/ldbl-96/e_atanhl.c (__ieee754_atanhl): Likewise. * sysdeps/ieee754/ldbl-96/e_gammal_r.c (__ieee754_gammal_r): Use math_check_force_underflow_nonneg. * sysdeps/ieee754/ldbl-96/e_j1l.c (__ieee754_j1l): Use math_check_force_underflow. * sysdeps/ieee754/ldbl-96/e_jnl.c (__ieee754_jnl): Likewise. * sysdeps/ieee754/ldbl-96/e_sinhl.c (__ieee754_sinhl): Likewise. * sysdeps/ieee754/ldbl-96/k_sinl.c (__kernel_sinl): Likewise. * sysdeps/ieee754/ldbl-96/k_tanl.c (__kernel_tanl): Use math_check_force_underflow_nonneg. * sysdeps/ieee754/ldbl-96/s_asinhl.c (__asinhl): Use math_check_force_underflow. * sysdeps/ieee754/ldbl-96/s_erfl.c (__erfl): Likewise. * sysdeps/ieee754/ldbl-96/s_fmal.c (__fmal): Use math_force_eval instead of volatile. * sysdeps/ieee754/ldbl-96/s_tanhl.c (__tanhl): Use math_check_force_underflow.
		
			
				
	
	
		
			251 lines
		
	
	
		
			8.1 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			251 lines
		
	
	
		
			8.1 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| /*							s_atanl.c
 | |
|  *
 | |
|  *	Inverse circular tangent for 128-bit long double precision
 | |
|  *      (arctangent)
 | |
|  *
 | |
|  *
 | |
|  *
 | |
|  * SYNOPSIS:
 | |
|  *
 | |
|  * long double x, y, atanl();
 | |
|  *
 | |
|  * y = atanl( x );
 | |
|  *
 | |
|  *
 | |
|  *
 | |
|  * DESCRIPTION:
 | |
|  *
 | |
|  * Returns radian angle between -pi/2 and +pi/2 whose tangent is x.
 | |
|  *
 | |
|  * The function uses a rational approximation of the form
 | |
|  * t + t^3 P(t^2)/Q(t^2), optimized for |t| < 0.09375.
 | |
|  *
 | |
|  * The argument is reduced using the identity
 | |
|  *    arctan x - arctan u  =  arctan ((x-u)/(1 + ux))
 | |
|  * and an 83-entry lookup table for arctan u, with u = 0, 1/8, ..., 10.25.
 | |
|  * Use of the table improves the execution speed of the routine.
 | |
|  *
 | |
|  *
 | |
|  *
 | |
|  * ACCURACY:
 | |
|  *
 | |
|  *                      Relative error:
 | |
|  * arithmetic   domain     # trials      peak         rms
 | |
|  *    IEEE      -19, 19       4e5       1.7e-34     5.4e-35
 | |
|  *
 | |
|  *
 | |
|  * WARNING:
 | |
|  *
 | |
|  * This program uses integer operations on bit fields of floating-point
 | |
|  * numbers.  It does not work with data structures other than the
 | |
|  * structure assumed.
 | |
|  *
 | |
|  */
 | |
| 
 | |
| /* Copyright 2001 by Stephen L. Moshier <moshier@na-net.ornl.gov>
 | |
| 
 | |
|     This library is free software; you can redistribute it and/or
 | |
|     modify it under the terms of the GNU Lesser General Public
 | |
|     License as published by the Free Software Foundation; either
 | |
|     version 2.1 of the License, or (at your option) any later version.
 | |
| 
 | |
|     This library is distributed in the hope that it will be useful,
 | |
|     but WITHOUT ANY WARRANTY; without even the implied warranty of
 | |
|     MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 | |
|     Lesser General Public License for more details.
 | |
| 
 | |
|     You should have received a copy of the GNU Lesser General Public
 | |
|     License along with this library; if not, see
 | |
|     <http://www.gnu.org/licenses/>.  */
 | |
| 
 | |
| 
 | |
| #include <float.h>
 | |
| #include <math.h>
 | |
| #include <math_private.h>
 | |
| #include <math_ldbl_opt.h>
 | |
| 
 | |
| /* arctan(k/8), k = 0, ..., 82 */
 | |
| static const long double atantbl[84] = {
 | |
|   0.0000000000000000000000000000000000000000E0L,
 | |
|   1.2435499454676143503135484916387102557317E-1L, /* arctan(0.125)  */
 | |
|   2.4497866312686415417208248121127581091414E-1L,
 | |
|   3.5877067027057222039592006392646049977698E-1L,
 | |
|   4.6364760900080611621425623146121440202854E-1L,
 | |
|   5.5859931534356243597150821640166127034645E-1L,
 | |
|   6.4350110879328438680280922871732263804151E-1L,
 | |
|   7.1882999962162450541701415152590465395142E-1L,
 | |
|   7.8539816339744830961566084581987572104929E-1L,
 | |
|   8.4415398611317100251784414827164750652594E-1L,
 | |
|   8.9605538457134395617480071802993782702458E-1L,
 | |
|   9.4200004037946366473793717053459358607166E-1L,
 | |
|   9.8279372324732906798571061101466601449688E-1L,
 | |
|   1.0191413442663497346383429170230636487744E0L,
 | |
|   1.0516502125483736674598673120862998296302E0L,
 | |
|   1.0808390005411683108871567292171998202703E0L,
 | |
|   1.1071487177940905030170654601785370400700E0L,
 | |
|   1.1309537439791604464709335155363278047493E0L,
 | |
|   1.1525719972156675180401498626127513797495E0L,
 | |
|   1.1722738811284763866005949441337046149712E0L,
 | |
|   1.1902899496825317329277337748293183376012E0L,
 | |
|   1.2068173702852525303955115800565576303133E0L,
 | |
|   1.2220253232109896370417417439225704908830E0L,
 | |
|   1.2360594894780819419094519711090786987027E0L,
 | |
|   1.2490457723982544258299170772810901230778E0L,
 | |
|   1.2610933822524404193139408812473357720101E0L,
 | |
|   1.2722973952087173412961937498224804940684E0L,
 | |
|   1.2827408797442707473628852511364955306249E0L,
 | |
|   1.2924966677897852679030914214070816845853E0L,
 | |
|   1.3016288340091961438047858503666855921414E0L,
 | |
|   1.3101939350475556342564376891719053122733E0L,
 | |
|   1.3182420510168370498593302023271362531155E0L,
 | |
|   1.3258176636680324650592392104284756311844E0L,
 | |
|   1.3329603993374458675538498697331558093700E0L,
 | |
|   1.3397056595989995393283037525895557411039E0L,
 | |
|   1.3460851583802539310489409282517796256512E0L,
 | |
|   1.3521273809209546571891479413898128509842E0L,
 | |
|   1.3578579772154994751124898859640585287459E0L,
 | |
|   1.3633001003596939542892985278250991189943E0L,
 | |
|   1.3684746984165928776366381936948529556191E0L,
 | |
|   1.3734007669450158608612719264449611486510E0L,
 | |
|   1.3780955681325110444536609641291551522494E0L,
 | |
|   1.3825748214901258580599674177685685125566E0L,
 | |
|   1.3868528702577214543289381097042486034883E0L,
 | |
|   1.3909428270024183486427686943836432060856E0L,
 | |
|   1.3948567013423687823948122092044222644895E0L,
 | |
|   1.3986055122719575950126700816114282335732E0L,
 | |
|   1.4021993871854670105330304794336492676944E0L,
 | |
|   1.4056476493802697809521934019958079881002E0L,
 | |
|   1.4089588955564736949699075250792569287156E0L,
 | |
|   1.4121410646084952153676136718584891599630E0L,
 | |
|   1.4152014988178669079462550975833894394929E0L,
 | |
|   1.4181469983996314594038603039700989523716E0L,
 | |
|   1.4209838702219992566633046424614466661176E0L,
 | |
|   1.4237179714064941189018190466107297503086E0L,
 | |
|   1.4263547484202526397918060597281265695725E0L,
 | |
|   1.4288992721907326964184700745371983590908E0L,
 | |
|   1.4313562697035588982240194668401779312122E0L,
 | |
|   1.4337301524847089866404719096698873648610E0L,
 | |
|   1.4360250423171655234964275337155008780675E0L,
 | |
|   1.4382447944982225979614042479354815855386E0L,
 | |
|   1.4403930189057632173997301031392126865694E0L,
 | |
|   1.4424730991091018200252920599377292525125E0L,
 | |
|   1.4444882097316563655148453598508037025938E0L,
 | |
|   1.4464413322481351841999668424758804165254E0L,
 | |
|   1.4483352693775551917970437843145232637695E0L,
 | |
|   1.4501726582147939000905940595923466567576E0L,
 | |
|   1.4519559822271314199339700039142990228105E0L,
 | |
|   1.4536875822280323362423034480994649820285E0L,
 | |
|   1.4553696664279718992423082296859928222270E0L,
 | |
|   1.4570043196511885530074841089245667532358E0L,
 | |
|   1.4585935117976422128825857356750737658039E0L,
 | |
|   1.4601391056210009726721818194296893361233E0L,
 | |
|   1.4616428638860188872060496086383008594310E0L,
 | |
|   1.4631064559620759326975975316301202111560E0L,
 | |
|   1.4645314639038178118428450961503371619177E0L,
 | |
|   1.4659193880646627234129855241049975398470E0L,
 | |
|   1.4672716522843522691530527207287398276197E0L,
 | |
|   1.4685896086876430842559640450619880951144E0L,
 | |
|   1.4698745421276027686510391411132998919794E0L,
 | |
|   1.4711276743037345918528755717617308518553E0L,
 | |
|   1.4723501675822635384916444186631899205983E0L,
 | |
|   1.4735431285433308455179928682541563973416E0L, /* arctan(10.25) */
 | |
|   1.5707963267948966192313216916397514420986E0L  /* pi/2 */
 | |
| };
 | |
| 
 | |
| 
 | |
| /* arctan t = t + t^3 p(t^2) / q(t^2)
 | |
|    |t| <= 0.09375
 | |
|    peak relative error 5.3e-37 */
 | |
| 
 | |
| static const long double
 | |
|   p0 = -4.283708356338736809269381409828726405572E1L,
 | |
|   p1 = -8.636132499244548540964557273544599863825E1L,
 | |
|   p2 = -5.713554848244551350855604111031839613216E1L,
 | |
|   p3 = -1.371405711877433266573835355036413750118E1L,
 | |
|   p4 = -8.638214309119210906997318946650189640184E-1L,
 | |
|   q0 = 1.285112506901621042780814422948906537959E2L,
 | |
|   q1 = 3.361907253914337187957855834229672347089E2L,
 | |
|   q2 = 3.180448303864130128268191635189365331680E2L,
 | |
|   q3 = 1.307244136980865800160844625025280344686E2L,
 | |
|   q4 = 2.173623741810414221251136181221172551416E1L;
 | |
|   /* q5 = 1.000000000000000000000000000000000000000E0 */
 | |
| 
 | |
| 
 | |
| long double
 | |
| __atanl (long double x)
 | |
| {
 | |
|   int32_t k, sign, lx;
 | |
|   long double t, u, p, q;
 | |
|   double xhi;
 | |
| 
 | |
|   xhi = ldbl_high (x);
 | |
|   EXTRACT_WORDS (k, lx, xhi);
 | |
|   sign = k & 0x80000000;
 | |
| 
 | |
|   /* Check for IEEE special cases.  */
 | |
|   k &= 0x7fffffff;
 | |
|   if (k >= 0x7ff00000)
 | |
|     {
 | |
|       /* NaN. */
 | |
|       if (((k - 0x7ff00000) | lx) != 0)
 | |
| 	return (x + x);
 | |
| 
 | |
|       /* Infinity. */
 | |
|       if (sign)
 | |
| 	return -atantbl[83];
 | |
|       else
 | |
| 	return atantbl[83];
 | |
|     }
 | |
| 
 | |
|   if (k <= 0x3c800000) /* |x| <= 2**-55.  */
 | |
|     {
 | |
|       math_check_force_underflow (x);
 | |
|       /* Raise inexact.  */
 | |
|       if (1e300L + x > 0.0)
 | |
| 	return x;
 | |
|     }
 | |
| 
 | |
|   if (k >= 0x46c00000) /* |x| >= 2**109.  */
 | |
|     {
 | |
|       /* Saturate result to {-,+}pi/2.  */
 | |
|       if (sign)
 | |
| 	return -atantbl[83];
 | |
|       else
 | |
| 	return atantbl[83];
 | |
|     }
 | |
| 
 | |
|   if (sign)
 | |
|       x = -x;
 | |
| 
 | |
|   if (k >= 0x40248000) /* 10.25 */
 | |
|     {
 | |
|       k = 83;
 | |
|       t = -1.0/x;
 | |
|     }
 | |
|   else
 | |
|     {
 | |
|       /* Index of nearest table element.
 | |
| 	 Roundoff to integer is asymmetrical to avoid cancellation when t < 0
 | |
|          (cf. fdlibm). */
 | |
|       k = 8.0 * x + 0.25;
 | |
|       u = 0.125 * k;
 | |
|       /* Small arctan argument.  */
 | |
|       t = (x - u) / (1.0 + x * u);
 | |
|     }
 | |
| 
 | |
|   /* Arctan of small argument t.  */
 | |
|   u = t * t;
 | |
|   p =     ((((p4 * u) + p3) * u + p2) * u + p1) * u + p0;
 | |
|   q = ((((u + q4) * u + q3) * u + q2) * u + q1) * u + q0;
 | |
|   u = t * u * p / q  +  t;
 | |
| 
 | |
|   /* arctan x = arctan u  +  arctan t */
 | |
|   u = atantbl[k] + u;
 | |
|   if (sign)
 | |
|     return (-u);
 | |
|   else
 | |
|     return u;
 | |
| }
 | |
| 
 | |
| long_double_symbol (libm, __atanl, atanl);
 |