blocks|key|1090349|text|下面的代码是基于一个先前的回答的，其中我演示了如何对三角函数执行相当精确的参数约简，方法是使用分裂常数的Cody方法，对于小的大小的参数，使用Payne-Hanek方法。有关佩恩-哈内克算法的详细信息，请参阅此处，有关Cody算法的详细信息，请参阅我的先前的回答。|type|unstyled|depth|inlineStyleRanges|entityRanges|offset|length|data|1090350|在这里，我进行了必要的调整，以适应asker平台的限制，因为不支持64位类型，不支持融合乘法添加，math.h中的辅助函数不可用。我假设float映射到IEEE-754+binary32格式，并且有一种方法可以将这种32位浮点数重新解释为32位无符号整数，反之亦然。我已经通过标准的便携成语(也就是使用memcpy()+)实现了这个重新解释，但是其他方法可能被选择适合于未指定的目标平台，例如内联装配、机器特定的本质或易失性的联合。|style|CODE|1090351|由于这段代码基本上是我前面代码的一个端口，所以它可能缺乏专门针对该环境的新设计的优雅性。我基本上用一些位旋转代替了frexp()助手函数，用32位整数对来模拟64位整数计算，用32位不动点计算代替了双精度计算(这比我预期的要好得多)，并用未融合等效的方法替换了所有的FMAs。|1090352|重新处理Cody部分的论点减少了相当多的工作。显然，如果没有FMA可用，我们需要确保常数π/2的组成部分中有足够数量的尾随零位(最不重要的部分除外)，以确保产品是精确的。我花了几个小时的实验，费解出一个特定的分裂，提供准确的结果，但也推动转换点的佩恩-哈内克方法尽可能高。|1090353|当指定USE_FMA+=+1时，当使用高质量的数学库进行编译时，测试应用程序的输出应该类似于以下内容：|1090354|Testing+sinf+...++PASSED.+max+ulp+err+=+1.493253++diffsum+=+337633490
Testing+cosf+...++PASSED.+max+ulp+err+=+1.495098++diffsum+=+342020968|code-block|syntax|javascript|1090355|对于USE_FMA+=+0，准确度略有变化，情况更糟：|1090356|Testing+sinf+...++PASSED.+max+ulp+err+=+1.498012++diffsum+=+359702532
Testing+cosf+...++PASSED.+max+ulp+err+=+1.504061++diffsum+=+364682650|1090357|diffsum输出是一个总体精度的粗略指标，这里显示了大约90%25的输入结果是一个正确的圆角单精度响应。|1090358|请注意，编译代码时必须使用编译器提供的最严格的浮点设置和最高程度的依从IEEE-754。对于我用来开发和测试这段代码的Intel编译器，可以通过使用/fp:strict进行编译来实现。此外，作为参考的数学库的质量是准确评估这一单精度代码的ulp误差的关键。Intel编译器附带了一个数学库，它提供了双精度的基本数学函数，在HA+(高精度)变体中的误差略高于0.5ULP。多精度参考库的使用可能更好，但在这里会拖慢我的脚步。|1090359|#include+<stdio.h>
#include+<stdlib.h>
#include+<stdint.h>
#include+<string.h>+++//+for+memcpy()
#include+<math.h>+++++//+for+test+purposes,+and+when+PORTABLE=1+or+USE_FMA=1

#define+USE_FMA+++(0)+//+use+fmaf()+calls+for+arithmetic
#define+PORTABLE++(0)+//+allow+helper+functions+from+math.h
#define+HAVE_U64++(0)+//+64-bit+integer+type+available
#define+CW_STAGES+(3)+//+number+of+stages+in+Cody-Waite+reduction+when+USE_FMA=0

#if+USE_FMA
#define+SIN_RED_SWITCHOVER++(117435.992f)
#define+COS_RED_SWITCHOVER++(71476.0625f)
#define+MAX_DIFF++++++++++++(1)
#else+//+USE_FMA
#if+CW_STAGES+==+2
#define+SIN_RED_SWITCHOVER++(3.921875f)
#define+COS_RED_SWITCHOVER++(3.921875f)
#elif+CW_STAGES+==+3
#define+SIN_RED_SWITCHOVER++(201.15625f)
#define+COS_RED_SWITCHOVER++(142.90625f)
#endif+//+CW_STAGES
#define+MAX_DIFF++++++++++++(2)
#endif+//+USE_FMA

/*+re-interpret+the+bit+pattern+of+an+IEEE-754+float+as+a+uint32+*/
uint32_t+float_as_uint32+(float+a)
{
++++uint32_t+r;
++++memcpy+(&r,+&a,+sizeof+r);
++++return+r;
}

/*+re-interpret+the+bit+pattern+of+a+uint32+as+an+IEEE-754+float+*/
float+uint32_as_float+(uint32_t+a)
{
++++float+r;
++++memcpy+(&r,+&a,+sizeof+r);
++++return+r;
}

/*+Compute+the+upper+32+bits+of+the+product+of+two+unsigned+32-bit+integers+*/
#if+HAVE_U64
uint32_t+umul32_hi+(uint32_t+a,+uint32_t+b)
{
++++return+(uint32_t)(((uint64_t)a+*+b)+>>+32);
}
#else+//+HAVE_U64
/*+Henry+S.+Warren,+"Hacker's+Delight,+2nd+ed.",+Addison-Wesley+2012.+Fig.+8-2+*/
uint32_t+umul32_hi+(uint32_t+a,+uint32_t+b)
{
++++uint16_t+a_lo+=+(uint16_t)a;
++++uint16_t+a_hi+=+a+>>+16;
++++uint16_t+b_lo+=+(uint16_t)b;
++++uint16_t+b_hi+=+b+>>+16;
++++uint32_t+p0+=+(uint32_t)a_lo+*+b_lo;
++++uint32_t+p1+=+(uint32_t)a_lo+*+b_hi;
++++uint32_t+p2+=+(uint32_t)a_hi+*+b_lo;
++++uint32_t+p3+=+(uint32_t)a_hi+*+b_hi;
++++uint32_t+t+=+(p0+>>+16)+%2B+p1;
++++return+(t+>>+16)+%2B+(((uint32_t)(uint16_t)t+%2B+p2)+>>+16)+%2B+p3;
}
#endif+//+HAVE_U64

/*+190+bits+of+2/PI+for+Payne-Hanek+style+argument+reduction.+*/
const+uint32_t+two_over_pi_f+[]+=+
{
++++0x28be60db,
++++0x9391054a,
++++0x7f09d5f4,
++++0x7d4d3770,
++++0x36d8a566,
++++0x4f10e410
};

/*+Reduce+a+trig+function+argument+using+the+slow+Payne-Hanek+method+*/
float+trig_red_slowpath_f+(float+a,+int+*quadrant)
{
++++uint32_t+ia,+hi,+mid,+lo,+tmp,+i,+l,+h,+plo,+phi;
++++int32_t+e,+q;
++++float+r;

#if+PORTABLE
++++ia+=+(uint32_t)(fabsf+(frexpf+(a,+&e))+*+4.29496730e%2B9f);+//+0x1.0p32
#else+//+PORTABLE
++++ia+=+((float_as_uint32+(a)+&+0x007fffff)+<<+8)+%7C+0x80000000;
++++e+=+((float_as_uint32+(a)+>>+23)+&+0xff)+-+126;
#endif+//+PORTABLE
++++
++++/*+compute+product+x+*+2/pi+in+2.62+fixed-point+format+*/
++++i+=+(uint32_t)e+>>+5;
++++e+=+(uint32_t)e+&+31;

++++hi++=+i+?+two_over_pi_f+[i-1]+:+0;
++++mid+=+two_over_pi_f+[i%2B0];
++++lo++=+two_over_pi_f+[i%2B1];
++++tmp+=+two_over_pi_f+[i%2B2];
+
++++if+(e)+{
++++++++hi++=+(hi++<<+e)+%7C+(mid+>>+(32+-+e));
++++++++mid+=+(mid+<<+e)+%7C+(lo++>>+(32+-+e));
++++++++lo++=+(lo++<<+e)+%7C+(tmp+>>+(32+-+e));
++++}

++++/*+compute+64-bit+product+phi:plo+*/
++++phi+=+0;
++++l+=+ia+*+lo;
++++h+=+umul32_hi+(ia,+lo);
++++plo+=+phi+%2B+l;
++++phi+=+h+%2B+(plo+<+l);
++++l+=+ia+*+mid;
++++h+=+umul32_hi+(ia,+mid);
++++plo+=+phi+%2B+l;
++++phi+=+h+%2B+(plo+<+l);
++++l+=+ia+*+hi;
++++phi+=+phi+%2B+l;

++++/*+split+fixed-point+result+into+integer+and+fraction+portions+*/
++++q+=+phi+>>+30;+++++++++++++++//+integral+portion+=+quadrant<1:0>
++++phi+=+phi+&+0x3fffffff;++++++//+fraction
++++if+(phi+&+0x20000000)+{++++++//+fraction+>=+0.5
++++++++phi+=+phi+-+0x40000000;++//+fraction+-+1.0
++++++++q+=+q+%2B+1;
++++}

++++/*+compute+remainder+of+x+/+(pi/2)+*/
#if+USE_FMA
++++float+phif,+plof,+chif,+clof,+thif,+tlof;
++++phif+=+1.34217728e%2B8f+*+(float)(int32_t)(phi+&+0xffffffe0);+//+0x1.0p27
++++plof+=+(float)((plo+>>+5)+%7C+(phi+<<+(32-5)));
++++thif+=+phif+%2B+plof;
++++plof+=+(phif+-+thif)+%2B+plof;
++++phif+=+thif;
++++chif+=++1.08995894e-17f;+//++0x1.921fb6p-57+//+(1.5707963267948966+*+0x1.0p-57)_hi+
++++clof+=+-3.03308686e-25f;+//+-0x1.777a5cp-82+//+(1.5707963267948966+*+0x1.0p-57)_lo
++++thif+=+phif+*+chif;
++++tlof+=+fmaf+(phif,+chif,+-thif);
++++tlof+=+fmaf+(phif,+clof,+tlof);
++++tlof+=+fmaf+(plof,+chif,+tlof);
++++r+=+thif+%2B+tlof;
#else+//+USE_FMA
++++/*+record+sign+of+fraction+*/
++++uint32_t+s+=+phi+&+0x80000000;
++++
++++/*+take+absolute+value+of+fraction+*/
++++if+((int32_t)phi+<+0)+{
++++++++phi+=+~phi;
++++++++plo+=+0+-+plo;
++++++++phi+%2B=+(plo+==+0);
++++}
++++
++++/*+normalize+fraction+*/
++++e+=+0;
++++while+((int32_t)phi+>+0)+{
++++++++phi+=+(phi+<<+1)+%7C+(plo+>>+31);
++++++++plo+=+plo+<<+1;
++++++++e--;
++++}
++++
++++/*+multiply+32+high-order+bits+of+fraction+with+pi/2+*/
++++phi+=+umul32_hi+(phi,+0xc90fdaa2);+//+(uint32_t)rint(PI/2+*+2**31)
++++
++++/*+normalize+product+*/
++++if+((int32_t)phi+>+0)+{
++++++++phi+=+phi+<<+1;
++++++++e--;
++++}

++++/*+round+and+convert+to+floating+point+*/
++++uint32_t+ri+=+s+%2B+((e+%2B+128)+<<+23)+%2B+(phi+>>+8)+%2B+((phi+&+0xff)+>+0x7e);
++++r+=+uint32_as_float+(ri);
#endif+//+USE_FMA
++++if+(a+<+0.0f)+{
++++++++r+=+-r;
++++++++q+=+-q;
++++}

++++*quadrant+=+q;
++++return+r;
}

/*+Argument+reduction+for+trigonometric+functions+that+reduces+the+argument
+++to+the+interval+[-PI/4,+%2BPI/4]+and+also+returns+the+quadrant.+It+returns+
+++-0.0f+for+an+input+of+-0.0f+
*/
float+trig_red_f+(float+a,+float+switch_over,+int+*q)
{++++
++++float+j,+r;

++++if+(fabsf+(a)+>+switch_over)+{
++++++++/*+Payne-Hanek+style+reduction.+M.+Payne+and+R.+Hanek,+"Radian+reduction
+++++++++++for+trigonometric+functions".+SIGNUM+Newsletter,+18:19-24,+1983
++++++++*/
++++++++r+=+trig_red_slowpath_f+(a,+q);
++++}+else+{
++++++++/*+Cody-Waite+style+reduction.+W.+J.+Cody+and+W.+Waite,+"Software+Manual
+++++++++++for+the+Elementary+Functions",+Prentice-Hall+1980
++++++++*/
#if+USE_FMA
++++++++j+=+fmaf+(a,+6.36619747e-1f,+1.2582912e%2B7f);+//+0x1.45f306p-1,+0x1.8p%2B23
++++++++j+=+j+-+1.25829120e%2B7f;+//+0x1.8p%2B23
++++++++r+=+fmaf+(j,+-1.57079601e%2B00f,+a);+//+-0x1.921fb0p%2B00+//+pio2_high
++++++++r+=+fmaf+(j,+-3.13916473e-07f,+r);+//+-0x1.5110b4p-22+//+pio2_mid
++++++++r+=+fmaf+(j,+-5.39030253e-15f,+r);+//+-0x1.846988p-48+//+pio2_low
#else+//+USE_FMA
++++++++j+=+(a+*+6.36619747e-1f+%2B+1.2582912e%2B7f);+//+0x1.45f306p-1,+0x1.8p%2B23
++++++++j+=+j+-+1.25829120e%2B7f;+//+0x1.8p%2B23
#if+CW_STAGES+==+2
++++++++r+=+a+-+j+*+1.57079625e%2B00f;+//+0x1.921fb4p%2B0++//+pio2_high+
++++++++r+=+r+-+j+*+7.54979013e-08f;+//+0x1.4442d2p-24+//+pio2_low
#elif+CW_STAGES+==+3
++++++++r+=+a+-+j+*+1.57078552e%2B00f;+//+0x1.921f00p%2B00+//+pio2_high
++++++++r+=+r+-+j+*+1.08043314e-05f;+//+0x1.6a8880p-17+//+pio2_mid
++++++++r+=+r+-+j+*+2.56334407e-12f;+//+0x1.68c234p-39+//+pio2_low
#endif+//+CW_STAGES
#endif+//+USE_FMA
++++++++*q+=+(int)j;
++++}
++++return+r;
}

/*+Approximate+sine+on+[-PI/4,%2BPI/4].+Maximum+ulp+error+with+USE_FMA+=+0.64196
+++Returns+-0.0f+for+an+argument+of+-0.0f
+++Polynomial+approximation+based+on+T.+Myklebust,+"Computing+accurate+
+++Horner+form+approximations+to+special+functions+in+finite+precision
+++arithmetic",+http://arxiv.org/abs/1508.03211,+retrieved+on+8/29/2016
*/
float+sinf_poly+(float+a,+float+s)
{
++++float+r,+t;
#if+USE_FMA
++++r+=++++++++++++++2.86567956e-6f;++//++0x1.80a000p-19+
++++r+=+fmaf+(r,+s,+-1.98559923e-4f);+//+-0x1.a0690cp-13
++++r+=+fmaf+(r,+s,++8.33338592e-3f);+//++0x1.111182p-07
++++r+=+fmaf+(r,+s,+-1.66666672e-1f);+//+-0x1.555556p-03
++++t+=+fmaf+(a,+s,+0.0f);+//+ensure+-0+is+passed+through
++++r+=+fmaf+(r,+t,+a);
#else+//+USE_FMA
++++r+=+++++++++2.86567956e-6f;+//++0x1.80a000p-19
++++r+=+r+*+s+-+1.98559923e-4f;+//+-0x1.a0690cp-13
++++r+=+r+*+s+%2B+8.33338592e-3f;+//++0x1.111182p-07
++++r+=+r+*+s+-+1.66666672e-1f;+//+-0x1.555556p-03
++++t+=+a+*+s+%2B+0.0f;+//+ensure+-0+is+passed+through
++++r+=+r+*+t+%2B+a;
#endif+//+USE_FMA
++++return+r;
}

/*+Approximate+cosine+on+[-PI/4,%2BPI/4].+Maximum+ulp+error+with+USE_FMA+=+0.87444+*/
float+cosf_poly+(float+s)
{
++++float+r;
#if+USE_FMA
++++r+=++++++++++++++2.44677067e-5f;++//++0x1.9a8000p-16
++++r+=+fmaf+(r,+s,+-1.38877297e-3f);+//+-0x1.6c0efap-10
++++r+=+fmaf+(r,+s,++4.16666567e-2f);+//++0x1.555550p-05
++++r+=+fmaf+(r,+s,+-5.00000000e-1f);+//+-0x1.000000p-01
++++r+=+fmaf+(r,+s,++1.00000000e%2B0f);+//++0x1.000000p%2B00
#else+//+USE_FMA
++++r+=+++++++++2.44677067e-5f;+//++0x1.9a8000p-16
++++r+=+r+*+s+-+1.38877297e-3f;+//+-0x1.6c0efap-10
++++r+=+r+*+s+%2B+4.16666567e-2f;+//++0x1.555550p-05
++++r+=+r+*+s+-+5.00000000e-1f;+//+-0x1.000000p-01
++++r+=+r+*+s+%2B+1.00000000e%2B0f;+//++0x1.000000p%2B00
#endif+//+USE_FMA
++++return+r;
}

/*+Map+sine+or+cosine+value+based+on+quadrant+*/
float+sinf_cosf_core+(float+a,+int+i)
{
++++float+r,+s;

++++s+=+a+*+a;
++++r+=+(i+&+1)+?+cosf_poly+(s)+:+sinf_poly+(a,+s);
++++if+(i+&+2)+{
++++++++r+=+0.0f+-+r;+//+don't+change+"sign"+of+NaNs
++++}
++++return+r;
}

/*+maximum+ulp+error+with+USE_FMA+=+1:+1.495098++*/
float+my_sinf+(float+a)
{
++++float+r;
++++int+i;

++++a+=+a+*+0.0f+%2B+a;+//+inf+->+NaN
++++r+=+trig_red_f+(a,+SIN_RED_SWITCHOVER,+&i);
++++r+=+sinf_cosf_core+(r,+i);
++++return+r;
}

/*+maximum+ulp+error+with+USE_FMA+=+1:+1.493253+*/
float+my_cosf+(float+a)
{
++++float+r;
++++int+i;

++++a+=+a+*+0.0f+%2B+a;+//+inf+->+NaN
++++r+=+trig_red_f+(a,+COS_RED_SWITCHOVER,+&i);
++++r+=+sinf_cosf_core+(r,+i+%2B+1);
++++return+r;
}

/*+re-interpret+bit+pattern+of+an+IEEE-754+double+as+a+uint64+*/
uint64_t+double_as_uint64+(double+a)
{
++++uint64_t+r;
++++memcpy+(&r,+&a,+sizeof+r);
++++return+r;
}

double+floatUlpErr+(float+res,+double+ref)
{
++++uint64_t+i,+j,+err,+refi;
++++int+expoRef;
++++
++++/*+ulp+error+cannot+be+computed+if+either+operand+is+NaN,+infinity,+zero+*/
++++if+(isnan+(res)+%7C%7C+isnan+(ref)+%7C%7C+isinf+(res)+%7C%7C+isinf+(ref)+%7C%7C
++++++++(res+==+0.0f)+%7C%7C+(ref+==+0.0f))+{
++++++++return+0.0;
++++}
++++/*+Convert+the+float+result+to+an+"extended+float".+This+is+like+a+float
+++++++with+56+instead+of+24+effective+mantissa+bits.
++++*/
++++i+=+((uint64_t)float_as_uint32(res))+<<+32;
++++/*+Convert+the+double+reference+to+an+"extended+float".+If+the+reference+is
+++++++>=+2%5E129,+we+need+to+clamp+to+the+maximum+"extended+float".+If+reference
+++++++is+<+2%5E-126,+we+need+to+denormalize+because+of+the+float+types's+limited
+++++++exponent+range.
++++*/
++++refi+=+double_as_uint64(ref);
++++expoRef+=+(int)(((refi+>>+52)+&+0x7ff)+-+1023);
++++if+(expoRef+>=+129)+{
++++++++j+=+0x7fffffffffffffffULL;
++++}+else+if+(expoRef+<+-126)+{
++++++++j+=+((refi+<<+11)+%7C+0x8000000000000000ULL)+>>+8;
++++++++j+=+j+>>+(-(expoRef+%2B+126));
++++}+else+{
++++++++j+=+((refi+<<+11)+&+0x7fffffffffffffffULL)+>>+8;
++++++++j+=+j+%7C+((uint64_t)(expoRef+%2B+127)+<<+55);
++++}
++++j+=+j+%7C+(refi+&+0x8000000000000000ULL);
++++err+=+(i+<+j)+?+(j+-+i)+:+(i+-+j);
++++return+err+/+4294967296.0;
}

int+main+(void)+
{
++++float+arg,+res,+reff;
++++uint32_t+argi,+resi,+refi;
++++int64_t+diff,+diffsum;
++++double+ref,+ulp,+maxulp;

++++printf+("Testing+sinf+...++");
++++diffsum+=+0;
++++maxulp+=+0;
++++argi+=+0;
++++do+{
++++++++arg+=+uint32_as_float+(argi);
++++++++res+=+my_sinf+(arg);
++++++++ref+=+sin+((double)arg);
++++++++reff+=+(float)ref;
++++++++resi+=+float_as_uint32+(res);
++++++++refi+=+float_as_uint32+(reff);
++++++++ulp+=+floatUlpErr+(res,+ref);
++++++++if+(ulp+>+maxulp)+{
++++++++++++maxulp+=+ulp;
++++++++}
++++++++diff+=+(resi+>+refi)+?+(resi+-+refi)+:+(refi+-+resi);
++++++++if+(diff+>+MAX_DIFF)+{
++++++++++++printf+("\nerror+@+%2508x+(%25+15.8e):+res=%2508x+(%25+15.8e)++ref=%2508x+(%2515.8e)\n",+argi,+arg,+resi,+res,+refi,+reff);
++++++++++++return+EXIT_FAILURE;
++++++++}
++++++++diffsum+=+diffsum+%2B+diff;
++++++++argi%2B%2B;
++++}+while+(argi);
++++printf+("PASSED.+max+ulp+err+=+%25.6f++diffsum+=+%25lld\n",+maxulp,+diffsum);

++++printf+("Testing+cosf+...++");
++++diffsum+=+0;
++++maxulp+=+0;
++++argi+=+0;
++++do+{
++++++++arg+=+uint32_as_float+(argi);
++++++++res+=+my_cosf+(arg);
++++++++ref+=+cos+((double)arg);
++++++++reff+=+(float)ref;
++++++++resi+=+float_as_uint32+(res);
++++++++refi+=+float_as_uint32+(reff);
++++++++ulp+=+floatUlpErr+(res,+ref);
++++++++if+(ulp+>+maxulp)+{
++++++++++++maxulp+=+ulp;
++++++++}
++++++++diff+=+(resi+>+refi)+?+(resi+-+refi)+:+(refi+-+resi);
++++++++if+(diff+>+MAX_DIFF)+{
++++++++++++printf+("\nerror+@+%2508x+(%25+15.8e):+res=%2508x+(%25+15.8e)++ref=%2508x+(%2515.8e)\n",+argi,+arg,+resi,+res,+refi,+reff);
++++++++++++return+EXIT_FAILURE;
++++++++}
++++++++diffsum+=+diffsum+%2B+diff;
++++++++argi%2B%2B;
++++}+while+(argi);
++++diffsum+=+diffsum+%2B+diff;
++++printf+("PASSED.+max+ulp+err+=+%25.6f++diffsum+=+%25lld\n",+maxulp,+diffsum);
++++return+EXIT_SUCCESS;
}|1090360|entityMap|0|LINK|mutability|MUTABLE|url|https://stackoverflow.com/questions/30463616/payne-hanek-algorithm-implementation-in-c|1|https://stackoverflow.com/a/42541486/780717^0|A|5|0|3I|5|1|0|1D|6|1W|5|2D|8|47|8|0|1L|7|0|0|3|B|0|0|2|B|0|0|0|7|0|22|A|0|0^^$0|@$1|2|3|4|5|6|7|1C|8|@]|9|@$A|1D|B|1E|1|1F]|$A|1G|B|1H|1|1I]]|C|$]]|$1|D|3|E|5|6|7|1J|8|@$A|1K|B|1L|F|G]|$A|1M|B|1N|F|G]|$A|1O|B|1P|F|G]|$A|1Q|B|1R|F|G]]|9|@]|C|$]]|$1|H|3|I|5|6|7|1S|8|@$A|1T|B|1U|F|G]]|9|@]|C|$]]|$1|J|3|K|5|6|7|1V|8|@]|9|@]|C|$]]|$1|L|3|M|5|6|7|1W|8|@$A|1X|B|1Y|F|G]]|9|@]|C|$]]|$1|N|3|O|5|P|7|1Z|8|@]|9|@]|C|$Q|R]]|$1|S|3|T|5|6|7|20|8|@$A|21|B|22|F|G]]|9|@]|C|$]]|$1|U|3|V|5|P|7|23|8|@]|9|@]|C|$Q|R]]|$1|W|3|X|5|6|7|24|8|@$A|25|B|26|F|G]]|9|@]|C|$]]|$1|Y|3|Z|5|6|7|27|8|@$A|28|B|29|F|G]]|9|@]|C|$]]|$1|10|3|11|5|P|7|2A|8|@]|9|@]|C|$Q|R]]|$1|12|3|-4|5|6|7|2B|8|@]|9|@]|C|$]]]|13|$14|$5|15|16|17|C|$18|19]]|1A|$5|15|16|17|C|$18|1B]]]]

The following code is based on a <a href="https://stackoverflow.com/questions/30463616/payne-hanek-algorithm-implementation-in-c">previous answer</a> in which I demonstrated how to perform a fairly accurate argument reduction for trigonometric functions by using the Cody-Waite method of split constants for arguments small in magnitude, and the Payne-Hanek method for arguments large in magnitude. For details on the Payne-Hanek algorithm see there, for details on the Cody-Waite algorithm see this <a href="https://stackoverflow.com/a/42541486/780717">previous answer</a> of mine.
Here I have made the adjustments necessary to accommodate the restrictions of the asker's platform: no 64-bit types are supported, fused multiply-add is not supported, and helper functions from <code>math.h</code> are not available. I am assuming that <code>float</code> maps to IEEE-754 <code>binary32</code> format, and that there is a way to re-interpret such a 32-bit float as a 32-bit unsigned integer and vice versa. I have implemented this re-interpretation via the standard portable idiom, that is, by using <code>memcpy()</code>, but other methods appropriate for the unspecified target platform may be chosen instead, such as inline assembly, machine-specific intrinsics, or volatile unions.
Since this code is basically a port of my previous code to a more restrictive environment, it lacks perhaps the elegance of a de novo design specifically targeted at that environment. I have basically replaced the <code>frexp()</code> helper function from <code>math.h</code> with some bit twiddling, emulated 64-bit integer computation with pairs of 32-bit integers, replaced the double-precision computation with 32-bit fixed-point computation (which worked much better than I had anticipated), and replaced all FMAs with the unfused equivalent.
Re-working the Cody-Waite portion of the argument reduction took quite a bit of work. Clearly, without FMA available, we need to ensure a sufficient number of trailing zero bits in the constituent parts of the constant π/2 (except the least significant one) to make sure the products are exact. I spent several hours experimentally puzzling out a particular split that delivers accurate results but also pushes the switchover point to the Payne-Hanek method as high as possible.
When <code>USE_FMA = 1</code> is specified, the output of the test app, when compiled with a high-quality math library, should look similar to this:
<pre><code>Testing sinf ... PASSED. max ulp err = 1.493253 diffsum = 337633490
Testing cosf ... PASSED. max ulp err = 1.495098 diffsum = 342020968
</code></pre>
With <code>USE_FMA = 0</code> the accuracy changes slightly for the worse:
<pre><code>Testing sinf ... PASSED. max ulp err = 1.498012 diffsum = 359702532
Testing cosf ... PASSED. max ulp err = 1.504061 diffsum = 364682650
</code></pre>
The <code>diffsum</code> output is a rough indicator of overall accuracy, here showing that about 90% of all inputs result in a correctly rounded single-precision response.
Note that it is important to compile the code with the strictest floating-point settings and highest degree of adherence to IEEE-754 the compiler offers. For the Intel compiler that I used to develop and test this code, that can be achieved by compiling with <code>/fp:strict</code>. Also, the quality of the math library used for reference is crucial for accurate assessment of the ulp error of this single-precision code. The Intel compiler comes with a math library that provides double-precision elementary math functions with just slightly over 0.5 ulp error in the HA (high accuracy) variant. Use of a multi-precision reference library may be preferable but would have slowed me down too much here.
<pre class="lang-c prettyprint-override"><code>#include &lt;stdio.h&gt;
#include &lt;stdlib.h&gt;
#include &lt;stdint.h&gt;
#include &lt;string.h&gt; // for memcpy()
#include &lt;math.h&gt; // for test purposes, and when PORTABLE=1 or USE_FMA=1

/* Build-time configuration switches */
#define USE_FMA (0) // use fmaf() calls for arithmetic
#define PORTABLE (0) // allow helper functions from math.h
#define HAVE_U64 (0) // 64-bit integer type available
#define CW_STAGES (3) // number of stages in Cody-Waite reduction when USE_FMA=0

/* Derived settings.
   SIN_RED_SWITCHOVER / COS_RED_SWITCHOVER: argument magnitude above which
   my_sinf() / my_cosf() use the Payne-Hanek reduction instead of the
   Cody-Waite reduction.
   MAX_DIFF: largest difference between the bit patterns of computed and
   reference result that the test in main() accepts.
*/
#if USE_FMA
#define SIN_RED_SWITCHOVER (117435.992f)
#define COS_RED_SWITCHOVER (71476.0625f)
#define MAX_DIFF (1)
#else // USE_FMA
#if CW_STAGES == 2
#define SIN_RED_SWITCHOVER (3.921875f)
#define COS_RED_SWITCHOVER (3.921875f)
#elif CW_STAGES == 3
#define SIN_RED_SWITCHOVER (201.15625f)
#define COS_RED_SWITCHOVER (142.90625f)
#else // CW_STAGES
/* fail early instead of leaving the switchover macros undefined */
#error CW_STAGES must be 2 or 3 when USE_FMA is 0
#endif // CW_STAGES
#define MAX_DIFF (2)
#endif // USE_FMA

/* Return the raw 32-bit encoding of float a as an unsigned integer. The
   object representation is copied with memcpy(), so no value conversion
   takes place.
*/
uint32_t float_as_uint32 (float a)
{
    uint32_t bits;

    memcpy (&amp;bits, &amp;a, sizeof bits);
    return bits;
}

/* Return the float whose 32-bit encoding equals a. The object
   representation is copied with memcpy(), so no value conversion takes
   place.
*/
float uint32_as_float (uint32_t a)
{
    float value;

    memcpy (&amp;value, &amp;a, sizeof value);
    return value;
}

/* Compute the upper 32 bits of the product of two unsigned 32-bit integers */
#if HAVE_U64
uint32_t umul32_hi (uint32_t a, uint32_t b)
{
 return (uint32_t)(((uint64_t)a * b) &gt;&gt; 32);
}
#else // HAVE_U64
/* Henry S. Warren, &quot;Hacker's Delight, 2nd ed.&quot;, Addison-Wesley 2012. Fig. 8-2 */
uint32_t umul32_hi (uint32_t a, uint32_t b)
{
 uint16_t a_lo = (uint16_t)a;
 uint16_t a_hi = a &gt;&gt; 16;
 uint16_t b_lo = (uint16_t)b;
 uint16_t b_hi = b &gt;&gt; 16;
 uint32_t p0 = (uint32_t)a_lo * b_lo;
 uint32_t p1 = (uint32_t)a_lo * b_hi;
 uint32_t p2 = (uint32_t)a_hi * b_lo;
 uint32_t p3 = (uint32_t)a_hi * b_hi;
 uint32_t t = (p0 &gt;&gt; 16) + p1;
 return (t &gt;&gt; 16) + (((uint32_t)(uint16_t)t + p2) &gt;&gt; 16) + p3;
}
#endif // HAVE_U64

/* Leading bits of 2/PI for Payne-Hanek style argument reduction, most
   significant word first. The first six words hold the 190 bits used by
   the reduction. The seventh word is a guard entry: for arguments with a
   magnitude of at least 2**127, trig_red_slowpath_f() computes a word
   index of 4 and loads element [4+2], so that element has to exist even
   though the loaded value does not enter the result in that case.
*/
const uint32_t two_over_pi_f [] = 
{
    0x28be60db,
    0x9391054a,
    0x7f09d5f4,
    0x7d4d3770,
    0x36d8a566,
    0x4f10e410,
    0x7f9458ea  // guard word: next 32 bits of the same bit string
};

/* Reduce a trig function argument using the slow Payne-Hanek method.

   a         argument to reduce; in this file the function is only reached
             from trig_red_f() when fabsf(a) exceeds the switchover value
   quadrant  receives the quadrant count (negated when a is negative)

   Returns the remainder: the signed fraction of a * 2/PI nearest to zero,
   scaled by PI/2.
*/
float trig_red_slowpath_f (float a, int *quadrant)
{
    uint32_t ia, hi, mid, lo, tmp, i, l, h, plo, phi;
    int32_t e, q;
    float r;

#if PORTABLE
    ia = (uint32_t)(fabsf (frexpf (a, &amp;e)) * 4.29496730e+9f); // 0x1.0p32
#else // PORTABLE
    /* significand with the implicit leading one, left-justified in 32 bits */
    ia = ((float_as_uint32 (a) &amp; 0x007fffff) &lt;&lt; 8) | 0x80000000;
    /* exponent in the frexp() convention: biased exponent field minus 126 */
    e = ((float_as_uint32 (a) &gt;&gt; 23) &amp; 0xff) - 126;
#endif // PORTABLE

    /* compute product x * 2/pi in 2.62 fixed-point format */
    i = (uint32_t)e &gt;&gt; 5;   // index of the first table word needed
    e = (uint32_t)e &amp; 31;   // bit offset inside that word

    hi = i ? two_over_pi_f [i-1] : 0;
    mid = two_over_pi_f [i+0];
    lo = two_over_pi_f [i+1];
    /* For a magnitude of at least 2**127 the exponent is 128, giving i == 4
       and a bit offset of 0. Index i+2 then lies past a six-word table, so
       the load is bounds-checked. The substituted 0 is never used: with a
       bit offset of 0 the shift below is skipped.
    */
    tmp = (i + 2 &lt; sizeof two_over_pi_f / sizeof two_over_pi_f [0]) ?
          two_over_pi_f [i+2] : 0;

    /* align the window hi:mid:lo by shifting left e bits, refilling from tmp */
    if (e) {
        hi = (hi &lt;&lt; e) | (mid &gt;&gt; (32 - e));
        mid = (mid &lt;&lt; e) | (lo &gt;&gt; (32 - e));
        lo = (lo &lt;&lt; e) | (tmp &gt;&gt; (32 - e));
    }

    /* compute 64-bit product phi:plo */
    phi = 0;
    l = ia * lo;
    h = umul32_hi (ia, lo);
    plo = phi + l;
    phi = h + (plo &lt; l);            // (plo &lt; l) is the carry out of the add
    l = ia * mid;
    h = umul32_hi (ia, mid);
    plo = phi + l;
    phi = h + (plo &lt; l);
    l = ia * hi;
    phi = phi + l;

    /* split fixed-point result into integer and fraction portions */
    q = phi &gt;&gt; 30;                  // integral portion = quadrant bits 1:0
    phi = phi &amp; 0x3fffffff;         // fraction
    if (phi &amp; 0x20000000) {         // fraction at least 0.5
        phi = phi - 0x40000000;     // fraction - 1.0
        q = q + 1;
    }

    /* compute remainder of x / (pi/2) */
#if USE_FMA
    float phif, plof, chif, clof, thif, tlof;
    phif = 1.34217728e+8f * (float)(int32_t)(phi &amp; 0xffffffe0); // 0x1.0p27
    plof = (float)((plo &gt;&gt; 5) | (phi &lt;&lt; (32-5)));
    /* renormalize the pair so that phif carries the leading bits */
    thif = phif + plof;
    plof = (phif - thif) + plof;
    phif = thif;
    chif = 1.08995894e-17f; // 0x1.921fb6p-57 // (1.5707963267948966 * 0x1.0p-57)_hi
    clof = -3.03308686e-25f; // -0x1.777a5cp-82 // (1.5707963267948966 * 0x1.0p-57)_lo
    thif = phif * chif;
    tlof = fmaf (phif, chif, -thif); // rounding error of the product above
    tlof = fmaf (phif, clof, tlof);
    tlof = fmaf (plof, chif, tlof);
    r = thif + tlof;
#else // USE_FMA
    /* record sign of fraction */
    uint32_t s = phi &amp; 0x80000000;

    /* take absolute value of fraction (negate the pair phi:plo) */
    if ((int32_t)phi &lt; 0) {
        phi = ~phi;
        plo = 0 - plo;
        phi += (plo == 0);
    }

    /* normalize fraction: shift left until bit 31 of phi is set; the loop
       also stops if phi becomes zero */
    e = 0;
    while ((int32_t)phi &gt; 0) {
        phi = (phi &lt;&lt; 1) | (plo &gt;&gt; 31);
        plo = plo &lt;&lt; 1;
        e--;
    }

    /* multiply 32 high-order bits of fraction with pi/2 */
    phi = umul32_hi (phi, 0xc90fdaa2); // (uint32_t)rint(PI/2 * 2**31)

    /* normalize product */
    if ((int32_t)phi &gt; 0) {
        phi = phi &lt;&lt; 1;
        e--;
    }

    /* round and convert to floating point: sign, exponent field, upper 24
       bits of phi, plus an increment derived from the discarded low 8 bits */
    uint32_t ri = s + ((e + 128) &lt;&lt; 23) + (phi &gt;&gt; 8) + ((phi &amp; 0xff) &gt; 0x7e);
    r = uint32_as_float (ri);
#endif // USE_FMA
    /* the computation used the magnitude of a; mirror the result for a &lt; 0 */
    if (a &lt; 0.0f) {
        r = -r;
        q = -q;
    }

    *quadrant = q;
    return r;
}

/* Argument reduction for trigonometric functions that reduces the argument
   to the interval [-PI/4, +PI/4] and also returns the quadrant. It returns
   -0.0f for an input of -0.0f.

   a            argument to reduce
   switch_over  magnitude above which the Payne-Hanek path is taken
   q            receives the quadrant count; 0 when a is NaN

   Returns the reduced argument (NaN when a is NaN).
*/
float trig_red_f (float a, float switch_over, int *q)
{
    float j, r;

    if (fabsf (a) &gt; switch_over) {
        /* Payne-Hanek style reduction. M. Payne and R. Hanek, &quot;Radian reduction
           for trigonometric functions&quot;. SIGNUM Newsletter, 18:19-24, 1983
        */
        r = trig_red_slowpath_f (a, q);
    } else {
        /* Cody-Waite style reduction. W. J. Cody and W. Waite, &quot;Software Manual
           for the Elementary Functions&quot;, Prentice-Hall 1980.
           Adding and then subtracting 0x1.8p+23 leaves j holding a * 2/PI
           rounded to an integer value; j times PI/2 is then subtracted from
           a using a constant split into several parts.
        */
#if USE_FMA
        j = fmaf (a, 6.36619747e-1f, 1.2582912e+7f); // 0x1.45f306p-1, 0x1.8p+23
        j = j - 1.25829120e+7f; // 0x1.8p+23
        r = fmaf (j, -1.57079601e+00f, a); // -0x1.921fb0p+00 // pio2_high
        r = fmaf (j, -3.13916473e-07f, r); // -0x1.5110b4p-22 // pio2_mid
        r = fmaf (j, -5.39030253e-15f, r); // -0x1.846988p-48 // pio2_low
#else // USE_FMA
        j = (a * 6.36619747e-1f + 1.2582912e+7f); // 0x1.45f306p-1, 0x1.8p+23
        j = j - 1.25829120e+7f; // 0x1.8p+23
#if CW_STAGES == 2
        r = a - j * 1.57079625e+00f; // 0x1.921fb4p+0 // pio2_high
        r = r - j * 7.54979013e-08f; // 0x1.4442d2p-24 // pio2_low
#elif CW_STAGES == 3
        r = a - j * 1.57078552e+00f; // 0x1.921f00p+00 // pio2_high
        r = r - j * 1.08043314e-05f; // 0x1.6a8880p-17 // pio2_mid
        r = r - j * 2.56334407e-12f; // 0x1.68c234p-39 // pio2_low
#endif // CW_STAGES
#endif // USE_FMA
        /* A NaN argument fails the comparison above and arrives here with
           j being NaN. Converting NaN to int has no defined result, so the
           quadrant is set to 0 instead; r is NaN in that case anyway.
        */
        *q = (j == j) ? (int)j : 0;
    }
    return r;
}

/* Sine approximation on [-PI/4,+PI/4], evaluated as a + (a*s) * P(s) with
   P a cubic in s evaluated by Horner's scheme. The caller passes s = a*a.
   Maximum ulp error with USE_FMA = 0.64196
   An argument of -0.0f yields -0.0f.
   Polynomial approximation based on T. Myklebust, &quot;Computing accurate
   Horner form approximations to special functions in finite precision
   arithmetic&quot;, http://arxiv.org/abs/1508.03211, retrieved on 8/29/2016
*/
float sinf_poly (float a, float s)
{
    float poly, cube;
#if USE_FMA
    poly = 2.86567956e-6f;                  //  0x1.80a000p-19
    poly = fmaf (poly, s, -1.98559923e-4f); // -0x1.a0690cp-13
    poly = fmaf (poly, s, 8.33338592e-3f);  //  0x1.111182p-07
    poly = fmaf (poly, s, -1.66666672e-1f); // -0x1.555556p-03
    cube = fmaf (a, s, 0.0f);               // ensure -0 is passed through
    poly = fmaf (poly, cube, a);
#else // USE_FMA
    poly = 2.86567956e-6f;                  //  0x1.80a000p-19
    poly = poly * s - 1.98559923e-4f;       // -0x1.a0690cp-13
    poly = poly * s + 8.33338592e-3f;       //  0x1.111182p-07
    poly = poly * s - 1.66666672e-1f;       // -0x1.555556p-03
    cube = a * s + 0.0f;                    // ensure -0 is passed through
    poly = poly * cube + a;
#endif // USE_FMA
    return poly;
}

/* Cosine approximation on [-PI/4,+PI/4]: a degree-4 polynomial in s,
   evaluated by Horner's scheme, where the caller passes s as the square of
   the reduced argument. Maximum ulp error with USE_FMA = 0.87444
*/
float cosf_poly (float s)
{
    float poly;
#if USE_FMA
    poly = 2.44677067e-5f;                  //  0x1.9a8000p-16
    poly = fmaf (poly, s, -1.38877297e-3f); // -0x1.6c0efap-10
    poly = fmaf (poly, s, 4.16666567e-2f);  //  0x1.555550p-05
    poly = fmaf (poly, s, -5.00000000e-1f); // -0x1.000000p-01
    poly = fmaf (poly, s, 1.00000000e+0f);  //  0x1.000000p+00
#else // USE_FMA
    poly = 2.44677067e-5f;                  //  0x1.9a8000p-16
    poly = poly * s - 1.38877297e-3f;       // -0x1.6c0efap-10
    poly = poly * s + 4.16666567e-2f;       //  0x1.555550p-05
    poly = poly * s - 5.00000000e-1f;       // -0x1.000000p-01
    poly = poly * s + 1.00000000e+0f;       //  0x1.000000p+00
#endif // USE_FMA
    return poly;
}

/* Evaluate sine or cosine of the reduced argument a according to the
   quadrant index i: bit 0 of i selects the cosine polynomial over the sine
   polynomial, bit 1 of i requests negation of the result.
*/
float sinf_cosf_core (float a, int i)
{
    float sq = a * a;
    float val;

    if (i &amp; 1) {
        val = cosf_poly (sq);
    } else {
        val = sinf_poly (a, sq);
    }
    if (i &amp; 2) {
        val = 0.0f - val; // don't change &quot;sign&quot; of NaNs
    }
    return val;
}

/* Single-precision sine: reduces the argument with trig_red_f() using
   SIN_RED_SWITCHOVER and evaluates the result with sinf_cosf_core().
   NOTE(review): the earlier comment here gave a maximum ulp error of
   1.495098 for USE_FMA = 1, while the test output quoted in the
   accompanying text lists 1.493253 for sinf and 1.495098 for cosf. The
   figures on my_sinf and my_cosf look swapped; confirm by re-running the
   test.
*/
float my_sinf (float a)
{
    float reduced;
    int quadrant;

    a = a * 0.0f + a; // turns an infinite argument into NaN
    reduced = trig_red_f (a, SIN_RED_SWITCHOVER, &amp;quadrant);
    return sinf_cosf_core (reduced, quadrant);
}

/* Single-precision cosine: reduces the argument with trig_red_f() using
   COS_RED_SWITCHOVER and evaluates the result with sinf_cosf_core() for
   the quadrant index advanced by one.
   NOTE(review): the earlier comment here gave a maximum ulp error of
   1.493253 for USE_FMA = 1, while the test output quoted in the
   accompanying text lists 1.495098 for cosf and 1.493253 for sinf. The
   figures on my_sinf and my_cosf look swapped; confirm by re-running the
   test.
*/
float my_cosf (float a)
{
    float reduced;
    int quadrant;

    a = a * 0.0f + a; // turns an infinite argument into NaN
    reduced = trig_red_f (a, COS_RED_SWITCHOVER, &amp;quadrant);
    return sinf_cosf_core (reduced, quadrant + 1);
}

/* Return the raw 64-bit encoding of double a as an unsigned integer. The
   object representation is copied with memcpy(), so no value conversion
   takes place.
*/
uint64_t double_as_uint64 (double a)
{
    uint64_t bits;

    memcpy (&amp;bits, &amp;a, sizeof bits);
    return bits;
}

/* Error of the float result res relative to the double reference ref,
   expressed in units of the last place of a float. Both values are mapped
   to a 64-bit &quot;extended float&quot; encoding whose integer difference is then
   divided by 2**32. Returns 0.0 when either value is NaN, infinite or zero.
*/
double floatUlpErr (float res, double ref)
{
 uint64_t i, j, err, refi;
 int expoRef;
 
 /* ulp error cannot be computed if either operand is NaN, infinity, zero */
 if (isnan (res) || isnan (ref) || isinf (res) || isinf (ref) ||
 (res == 0.0f) || (ref == 0.0f)) {
 return 0.0;
 }
 /* Convert the float result to an &quot;extended float&quot;. This is like a float
 with 56 instead of 24 effective mantissa bits.
 */
 i = ((uint64_t)float_as_uint32(res)) &lt;&lt; 32;
 /* Convert the double reference to an &quot;extended float&quot;. If the reference is
 &gt;= 2^129, we need to clamp to the maximum &quot;extended float&quot;. If reference
 is &lt; 2^-126, we need to denormalize because of the float type's limited
 exponent range.
 */
 refi = double_as_uint64(ref);
 /* unbiased exponent of the reference */
 expoRef = (int)(((refi &gt;&gt; 52) &amp; 0x7ff) - 1023);
 if (expoRef &gt;= 129) {
 j = 0x7fffffffffffffffULL;
 } else if (expoRef &lt; -126) {
 /* make the leading one explicit, then shift right by the exponent deficit */
 j = ((refi &lt;&lt; 11) | 0x8000000000000000ULL) &gt;&gt; 8;
 j = j &gt;&gt; (-(expoRef + 126));
 } else {
 /* drop the leading one, place the fraction below bit 55, and insert the
 exponent re-biased by 127 above it */
 j = ((refi &lt;&lt; 11) &amp; 0x7fffffffffffffffULL) &gt;&gt; 8;
 j = j | ((uint64_t)(expoRef + 127) &lt;&lt; 55);
 }
 /* copy the sign bit of the reference */
 j = j | (refi &amp; 0x8000000000000000ULL);
 err = (i &lt; j) ? (j - i) : (i - j);
 /* the float encoding was shifted left by 32 bits, so 2**32 units are one ulp */
 return err / 4294967296.0;
}

/* Exhaustive test driver. For every 32-bit pattern taken as a float
   argument, my_sinf() and then my_cosf() are compared against the
   double-precision sin() / cos() from math.h. The run stops with
   EXIT_FAILURE at the first argument whose result differs from the rounded
   reference by more than MAX_DIFF in its bit pattern. Otherwise the
   maximum ulp error and the sum of all bit-pattern differences are
   printed for each function.
*/
int main (void) 
{
    float arg, res, reff;
    uint32_t argi, resi, refi;
    int64_t diff, diffsum;
    double ref, ulp, maxulp;

    printf (&quot;Testing sinf ... &quot;);
    diffsum = 0;
    maxulp = 0;
    argi = 0;
    do {
        arg = uint32_as_float (argi);
        res = my_sinf (arg);
        ref = sin ((double)arg);
        reff = (float)ref;
        resi = float_as_uint32 (res);
        refi = float_as_uint32 (reff);
        ulp = floatUlpErr (res, ref);
        if (ulp &gt; maxulp) {
            maxulp = ulp;
        }
        diff = (resi &gt; refi) ? (resi - refi) : (refi - resi);
        if (diff &gt; MAX_DIFF) {
            printf (&quot;\nerror @ %08x (% 15.8e): res=%08x (% 15.8e) ref=%08x (%15.8e)\n&quot;, argi, arg, resi, res, refi, reff);
            return EXIT_FAILURE;
        }
        diffsum = diffsum + diff;
        argi++;
    } while (argi); // ends when argi wraps around to 0
    /* int64_t need not be long long, so cast to match the %lld conversion */
    printf (&quot;PASSED. max ulp err = %.6f diffsum = %lld\n&quot;, maxulp, (long long)diffsum);

    printf (&quot;Testing cosf ... &quot;);
    diffsum = 0;
    maxulp = 0;
    argi = 0;
    do {
        arg = uint32_as_float (argi);
        res = my_cosf (arg);
        ref = cos ((double)arg);
        reff = (float)ref;
        resi = float_as_uint32 (res);
        refi = float_as_uint32 (reff);
        ulp = floatUlpErr (res, ref);
        if (ulp &gt; maxulp) {
            maxulp = ulp;
        }
        diff = (resi &gt; refi) ? (resi - refi) : (refi - resi);
        if (diff &gt; MAX_DIFF) {
            printf (&quot;\nerror @ %08x (% 15.8e): res=%08x (% 15.8e) ref=%08x (%15.8e)\n&quot;, argi, arg, resi, res, refi, reff);
            return EXIT_FAILURE;
        }
        diffsum = diffsum + diff;
        argi++;
    } while (argi); // ends when argi wraps around to 0
    /* the final difference was already accumulated inside the loop, so it is
       not added a second time here; this matches the sine test */
    printf (&quot;PASSED. max ulp err = %.6f diffsum = %lld\n&quot;, maxulp, (long long)diffsum);
    return EXIT_SUCCESS;
}
</code></pre>

blocks|key|2476530|text|有一个数学论坛，用户J.M.不是数学家，它引入了改进的Taylor/Padé思想来逼近-pi，pi范围内的cos和sin函数。这里是正弦版翻译成C%2B%2B。这种近似不像库std::sin()函数那么快，但可能值得检查SSE/AVX/FMA实现是否足够快。|type|unstyled|depth|inlineStyleRanges|entityRanges|offset|length|data|2476531|我没有针对库sin()或cos()函数测试ULP错误，但是通过Julia函数精度检验工具，它看起来是一种很好的近似方法(将下面的代码添加到属于朱莉娅测试套件的runtest.jl模块中)：|2476532|function+test_sine(x::AbstractFloat)++
+f=0.5++
+z=x*0.5
+k=0
++++while+(abs(z)>f)
++++++++z*=0.5
++++++++k=k%2B1++
++++end+
++++z2=z%5E2;++
++++r=z*(1%2B(z2/105-1)*((z/3)%5E2))/++
++++++++++(1%2B(z2/7-4)*((z/3)%5E2));++
++++while(k+>+0)
++++++++r+=+(2*r)/(1-r*r);++
++++++++k=k-1
++++end
++++return+(2*r)/(1%2Br*r)
+end

function+test_cosine(x::AbstractFloat)++
f=0.5++
z=x*0.5
k=0
+++while+(abs(z)>f)
+++++++z*=0.5
+++++++k=k%2B1++
+++end+
+++z2=z%5E2;++
+++r=z*(1%2B(z2/105-1)*((z/3)%5E2))/++
++++++(1%2B(z2/7-4)*((z/3)%5E2));++
+++while+(k+>+0)
+++++++r+=+(2*r)/(1-r*r);++
+++++++k=k-1
+++end
+++return+(1-r*r)/(1%2Br*r)
end++

++
pii+=+3.141592653589793238462643383279502884

MAX_SIN(n::Val{pii},+::Type{Float16})+=+3.1415926535897932f0
MAX_SIN(n::Val{pii},+::Type{Float32})+=+3.1415926535897932f0
#MAX_SIN(n::Val{pii},+::Type{Float64})+=+3.141592653589793238462643383279502884
MIN_SIN(n::Val{pii},+::Type{Float16})+=+-3.1415926535897932f0
MIN_SIN(n::Val{pii},+::Type{Float32})+=+-3.1415926535897932f0
#MIN_SIN(n::Val{pii},+::Type{Float64})+=+-3.141592653589793238462643383279502884

for+(func,+base)+in+(sin=>Val(pii),+test_sine=>Val(pii),+cos=>Val(pii),+test_cosine=>Val(pii))++++
++++for+T+in+(Float16,+Float32)
++++++++xx+=+range(MIN_SIN(base,T),++MAX_SIN(base,T),+length+=+10%5E6);
++++++++test_acc(func,+xx)
++++end
end|code-block|syntax|javascript|2476533|在范围-pi，pi中逼近和sin()和cos()的结果|2476534|Tol+debug+failed+0.0%25+of+the+time.
sin
ULP+max+0.5008857846260071+at+x+=+2.203355
ULP+mean+0.24990503381476237
Test+Summary:+%7C+Pass++Total
Float32+sin+++%7C++++1++++++1
Tol+debug+failed+0.0%25+of+the+time.
sin
ULP+max+0.5008857846260071+at+x+=+2.203355
ULP+mean+0.24990503381476237
Test+Summary:+%7C+Pass++Total
Float32+sin+++%7C++++1++++++1
Tol+debug+failed+0.0%25+of+the+time.
test_sine
ULP+max+0.001272978144697845+at+x+=+2.899093
ULP+mean+1.179825295005716e-8
Test+Summary:+++++%7C+Pass++Total
Float32+test_sine+%7C++++1++++++1
Tol+debug+failed+0.0%25+of+the+time.
test_sine
ULP+max+0.001272978144697845+at+x+=+2.899093
ULP+mean+1.179825295005716e-8
Test+Summary:+++++%7C+Pass++Total
Float32+test_sine+%7C++++1++++++1
Tol+debug+failed+0.0%25+of+the+time.
cos
ULP+max+0.5008531212806702+at+x+=+0.45568538
ULP+mean+0.2499933592458589
Test+Summary:+%7C+Pass++Total
Float32+cos+++%7C++++1++++++1
Tol+debug+failed+0.0%25+of+the+time.
cos
ULP+max+0.5008531212806702+at+x+=+0.45568538
ULP+mean+0.2499933592458589
Test+Summary:+%7C+Pass++Total
Float32+cos+++%7C++++1++++++1
Tol+debug+failed+0.0%25+of+the+time.
test_cosine
ULP+max+0.0011584102176129818+at+x+=+1.4495481
ULP+mean+1.6793535615395134e-8
Test+Summary:+++++++%7C+Pass++Total
Float32+test_cosine+%7C++++1++++++1
Tol+debug+failed+0.0%25+of+the+time.
test_cosine
ULP+max+0.0011584102176129818+at+x+=+1.4495481
ULP+mean+1.6793535615395134e-8
Test+Summary:+++++++%7C+Pass++Total
Float32+test_cosine+%7C++++1++++++1|2476535|entityMap|0|LINK|mutability|MUTABLE|url|https://math.stackexchange.com/questions/97560/numerically-efficient-approximation-of-coss|1|https://godbolt.org/z/Yfe61a1Pa|2|https://github.com/JuliaMath/FunctionAccuracyTests.jl^0|3|4|0|1R|6|1|0|V|B|2|0|0|0|0^^$0|@$1|2|3|4|5|6|7|10|8|@]|9|@$A|11|B|12|1|13]|$A|14|B|15|1|16]]|C|$]]|$1|D|3|E|5|6|7|17|8|@]|9|@$A|18|B|19|1|1A]]|C|$]]|$1|F|3|G|5|H|7|1B|8|@]|9|@]|C|$I|J]]|$1|K|3|L|5|6|7|1C|8|@]|9|@]|C|$]]|$1|M|3|N|5|H|7|1D|8|@]|9|@]|C|$I|J]]|$1|O|3|-4|5|6|7|1E|8|@]|9|@]|C|$]]]|P|$Q|$5|R|S|T|C|$U|V]]|W|$5|R|S|T|C|$U|X]]|Y|$5|R|S|T|C|$U|Z]]]]

There's a <a href="https://math.stackexchange.com/questions/97560/numerically-efficient-approximation-of-coss">thread on the Mathematics Stack Exchange forum</a> where the user "J. M. ain't a mathematician" introduced an improved Taylor/Padé idea for approximating the cos and sin functions in the range [-pi,pi]. <a href="https://godbolt.org/z/Yfe61a1Pa" rel="nofollow noreferrer">Here's the sine version</a> translated to C++. This approximation is not as fast as the library std::sin() function, but it might be worth checking whether an SSE/AVX/FMA implementation helps enough with the speed.
I have not tested the ULP error against the library sin() or cos() functions, but according to the <a href="https://github.com/JuliaMath/FunctionAccuracyTests.jl" rel="nofollow noreferrer">Julia Function Accuracy Test</a> tool it looks like an excellent approximation method (add the code below to the runtest.jl module, which belongs to the Julia test suite):
<pre><code>function test_sine(x::AbstractFloat) 
 # Approximate sin(x): evaluate a rational approximation of tan at a
 # halved-down argument, double the angle back up to tan(x/2), then apply the
 # half-angle identity sin(x) = 2t/(1+t^2) with t = tan(x/2).
 # NOTE(review): the literal 0.5 is a Float64, so for Float16/Float32 inputs the
 # arithmetic below is presumably promoted to Float64 - confirm this is intended
 # when interpreting the reported ULP figures.
 f=0.5 
 z=x*0.5
 k=0
 # Keep halving z until abs(z) is at most f; k counts the extra halvings.
 while (abs(z)&gt;f)
 z*=0.5
 k=k+1 
 end 
 z2=z^2; 
 # Rational expression in z; expanded it reads
 # z*(1 - z^2/9 + z^4/945) / (1 - 4*z^2/9 + z^4/63).
 r=z*(1+(z2/105-1)*((z/3)^2))/ 
 (1+(z2/7-4)*((z/3)^2)); 
 # Undo the k halvings with the tangent double-angle formula.
 while(k &gt; 0)
 r = (2*r)/(1-r*r); 
 k=k-1
 end
 return (2*r)/(1+r*r)
 end

function test_cosine(x::AbstractFloat) 
# Approximate cos(x): evaluate a rational approximation of tan at a
# halved-down argument, double the angle back up to tan(x/2), then apply the
# half-angle identity cos(x) = (1-t^2)/(1+t^2) with t = tan(x/2).
# NOTE(review): the literal 0.5 is a Float64, so for Float16/Float32 inputs the
# arithmetic below is presumably promoted to Float64 - confirm this is intended
# when interpreting the reported ULP figures.
f=0.5 
z=x*0.5
k=0
 # Keep halving z until abs(z) is at most f; k counts the extra halvings.
 while (abs(z)&gt;f)
 z*=0.5
 k=k+1 
 end 
 z2=z^2; 
 # Rational expression in z; expanded it reads
 # z*(1 - z^2/9 + z^4/945) / (1 - 4*z^2/9 + z^4/63).
 r=z*(1+(z2/105-1)*((z/3)^2))/ 
 (1+(z2/7-4)*((z/3)^2)); 
 # Undo the k halvings with the tangent double-angle formula.
 while (k &gt; 0)
 r = (2*r)/(1-r*r); 
 k=k-1
 end
 return (1-r*r)/(1+r*r)
end 

 
# Decimal literal for pi; used below as the Val tag that selects the range methods.
pii = 3.141592653589793238462643383279502884

# Endpoints of the test interval, selected by the Val tag and the element type.
# Both the Float16 and the Float32 methods return the same Float32 literal
# (f0 suffix), so the two element types sweep the same range.
MAX_SIN(n::Val{pii}, ::Type{Float16}) = 3.1415926535897932f0
MAX_SIN(n::Val{pii}, ::Type{Float32}) = 3.1415926535897932f0
#MAX_SIN(n::Val{pii}, ::Type{Float64}) = 3.141592653589793238462643383279502884
MIN_SIN(n::Val{pii}, ::Type{Float16}) = -3.1415926535897932f0
MIN_SIN(n::Val{pii}, ::Type{Float32}) = -3.1415926535897932f0
#MIN_SIN(n::Val{pii}, ::Type{Float64}) = -3.141592653589793238462643383279502884

# Run the accuracy test on the library sin/cos and on the two approximations,
# each over 10^6 evenly spaced points between MIN_SIN and MAX_SIN.
# NOTE(review): test_acc is not defined here; presumably it comes from the
# FunctionAccuracyTests.jl test suite referenced in the text - confirm.
for (func, base) in (sin=&gt;Val(pii), test_sine=&gt;Val(pii), cos=&gt;Val(pii), test_cosine=&gt;Val(pii)) 
 for T in (Float16, Float32)
 xx = range(MIN_SIN(base,T), MAX_SIN(base,T), length = 10^6);
 test_acc(func, xx)
 end
end
</code></pre>
Results for the approximations and for the library sin() and cos() in the range [-pi,pi]:
<pre><code>Tol debug failed 0.0% of the time.
sin
ULP max 0.5008857846260071 at x = 2.203355
ULP mean 0.24990503381476237
Test Summary: | Pass Total
Float32 sin | 1 1
Tol debug failed 0.0% of the time.
sin
ULP max 0.5008857846260071 at x = 2.203355
ULP mean 0.24990503381476237
Test Summary: | Pass Total
Float32 sin | 1 1
Tol debug failed 0.0% of the time.
test_sine
ULP max 0.001272978144697845 at x = 2.899093
ULP mean 1.179825295005716e-8
Test Summary: | Pass Total
Float32 test_sine | 1 1
Tol debug failed 0.0% of the time.
test_sine
ULP max 0.001272978144697845 at x = 2.899093
ULP mean 1.179825295005716e-8
Test Summary: | Pass Total
Float32 test_sine | 1 1
Tol debug failed 0.0% of the time.
cos
ULP max 0.5008531212806702 at x = 0.45568538
ULP mean 0.2499933592458589
Test Summary: | Pass Total
Float32 cos | 1 1
Tol debug failed 0.0% of the time.
cos
ULP max 0.5008531212806702 at x = 0.45568538
ULP mean 0.2499933592458589
Test Summary: | Pass Total
Float32 cos | 1 1
Tol debug failed 0.0% of the time.
test_cosine
ULP max 0.0011584102176129818 at x = 1.4495481
ULP mean 1.6793535615395134e-8
Test Summary: | Pass Total
Float32 test_cosine | 1 1
Tol debug failed 0.0% of the time.
test_cosine
ULP max 0.0011584102176129818 at x = 1.4495481
ULP mean 1.6793535615395134e-8
Test Summary: | Pass Total
Float32 test_cosine | 1 1
</code></pre>

I have implemented some approximations for trigonometric functions (sin,cos,arctan) computed with single precision (32 bit floating point) in C. They are accurate to about +/- 2 ulp.
My target device does not support any <code>&lt;cmath&gt;</code> or <code>&lt;math.h&gt;</code> methods. It does not provide a FMA, but a MAC ALU. ALU and LU compute in 32 bit format.
My arctan approximation is actually a modified version of the <a href="https://stackoverflow.com/questions/26692859/best-machine-optimized-polynomial-minimax-approximation-to-arctangent-on-1-1">approximation of N.juffa</a>, which approximates arctan on the full range. Sine and cosine function are accurate up to 2 ulp within the range [-pi,pi].
I am now aiming to provide a larger input range (as large as possible, ideally [FLT_MIN,FLT_MAX]) for sine and cosine, which leads me to argument reduction.
I'm currently reading different papers like <a href="https://www.csee.umbc.edu/%7Ephatak/645/supl/Ng-ArgReduction.pdf" rel="nofollow noreferrer">ARGUMENT REDUCTION FOR HUGE ARGUMENTS:
Good to the Last Bit by K.C.Ng</a> or the paper about this <a href="https://core.ac.uk/download/pdf/189657632.pdf" rel="nofollow noreferrer">new argument reduction algorithm</a>, but I wasn't able to derive an implementation from them.
Also, I want to mention two Stack Overflow questions that refer to related problems: There is an <a href="https://stackoverflow.com/questions/9423516/range-reduction-poor-precision-for-single-precision-floating-point">approach with matlab and c++</a> which is based on the first paper I linked. It actually uses matlab and cmath methods, and it limits the input to [0,20.000]. The other one was already mentioned in the comments. It is an approach to an implementation of sin and cos in C, using various C libraries which are not available to me. Since both posts are already several years old, there might be some new findings.
It seems like the algorithm mostly used in this case is to store the value of 2/pi accurate up to the needed number of bits, to be able to compute the modulo calculation accurately and simultaneously avoid cancellation. My device does not provide a large DMEM, which means large look-up tables with hundreds of bits are not possible. This procedure is actually described on page 70 of <a href="https://www5.in.tum.de/%7Ehuckle/numericalcomputationguide.pdf" rel="nofollow noreferrer">this</a> reference, which by the way provides a lot of useful information about floating point math.
So my question is: Is there another efficient way to reduce the arguments for sine and cosine that achieves single-precision accuracy while avoiding large LUTs? The papers mentioned above actually focus on double precision and use up to 1000 digits, which is not suitable for my use case.
I actually haven't found any implementation in C, nor an implementation aiming at single-precision calculation, so I would be grateful for any sort of hints, links, or examples.

Single precision argument reduction for trigonometric functions in C

翻译质量差，导致语言生硬或混乱。

没有提供实际的解决方法或示例。

解答不清晰，无法理解或解决问题。

页面排版不美观，阅读体验差。

文章

问答

视频

学习中心

腾讯云实验室

直播

竞赛

腾讯云代码分析专区

腾讯iOA零信任安全管理系统专区

腾讯云架构师技术同盟交流圈

腾讯云数据库专区

腾讯云顾问专区

腾讯云原生专区

腾讯混元专区

腾讯云TCE专区

腾讯云Lighthouse专区

腾讯云HAI专区

腾讯云Edgeone专区

腾讯云存储专区

腾讯云智能专区

腾讯轻联专区 

腾讯云开发专区

TAPD专区

腾讯轻量云游戏服专区

腾讯云最具价值专家

腾讯云架构师技术同盟

腾讯云创作之星

腾讯云开发者先锋

腾讯云代码助手

云原生构建

TAPD 敏捷项目管理

Cloud Studio

SDK中心

API中心

命令行工具

涵盖代码开发、场景应用、自动测试全流程，助你从零构建专属AI助手

一站式MCP教程库，解锁AI应用新玩法

用C语言实现了用单精度(32位浮点)计算三角函数(sin，cos，arctan)的一些逼近，它们的精度可达到+/- 2 ulp。我的目标设备不支持任何<cmath>或<math.h>方法。它不提供FMA，但提供MAC ALU。ALU和LU以32位格式计算。我的arctan近似实际上是的一个修改版本，它在整个范围内近似于...

问C中三角函数的单精度变元约简
EN

社区

活动

圈层

关于

腾讯云开发者

热门产品

热门推荐

更多推荐

问C中三角函数的单精度变元约简EN

社区

活动

圈层

关于

腾讯云开发者

热门产品

热门推荐

更多推荐

问C中三角函数的单精度变元约简
EN