-                      redf06e1
+                      rb3796fa
 #  endif
    // OpenCL only has type generic math
+   #define expf exp
    #define erff erf
    #define erfcf erfc
+   // Intel CPU on Mac gives strange values for erf(); uncomment NEED_ERF
+   // below to avoid relying on the built-in version.
+   //#define NEED_ERF
 #else // !USE_OPENCL
 // Use SAS_DOUBLE to force the use of double even for float kernels
 …
 #  define M_E 2.718281828459045091
 #endif
+#ifndef M_SQRT1_2
+#  define M_SQRT1_2 0.70710678118654746
+#endif
 // Non-standard function library

sasmodels/models/lib/sas_erf.c

-                      redf06e1
+                      rb3796fa
 #if FLOAT_SIZE>4  // DOUBLE_PRECISION
+double erf(double x);
+double erfc(double a);
+double cephes_erf(double x);
+double cephes_erfc(double a);
 constant double PD[] = {
 …
 };
 double erfc(double a)
+double cephes_erfc(double a)
+{
     double MAXLOG = 88.72283905206835;
 …
-    /*if (a < 0.0)
-        x = -a;
-    else
-        x = a;*/
     x = fabs(a);
     if (x < 1.0) {
         //The line below is a troublemaker for the GPU, so the sas_erf function
         //is written out explicitly here for the case x < 1.0
         //return (1.0 - sas_erf(a));
+        // The line below causes problems on the GPU, so the erf
+        // computation is inlined here instead, for the case x < 1.0.
+        //return (1.0 - cephes_erf(a));
         z = x * x;
         y = x * polevl(z, TD, 4) / p1evl(z, UD, 5);
 …
 double erf(double x)
+double cephes_erf(double x)
+{
     double y, z;
     if (fabs(x) > 1.0)
         return (1.0 - erfc(x));
+        return (1.0 - cephes_erfc(x));
     z = x * x;
+    #if FLOAT_SIZE>4
+        y = x * polevl(z, TD, 4) / p1evl(z, UD, 5);
+    #else
+        y = x * polevl( z, TF, 6 );
+    #endif
+    y = x * polevl(z, TD, 4) / p1evl(z, UD, 5);
     return y;
 …
 #else // SINGLE PRECISION
 double erff(double x);
 double erfcf(double a);
+float cephes_erff(float x);
+float cephes_erfcf(float a);
 /* erfc(x) = exp(-x^2) P(1/x), 1 < x < 2 */
 constant double PF[] = {
+constant float PF[] = {
 .326819970068386E-002,
     -1.387039388740657E-001,
 …
 /* erfc(x) = exp(-x^2) 1/x P(1/x^2), 2 < x < 14 */
 constant double RF[] = {
+constant float RF[] = {
     -1.047766399936249E+001,
 .297719955372516E+001,
 …
 /* erf(x) = x P(x^2), 0 < x < 1 */
  constant double TF[] = {
+ constant float TF[] = {
 .853861353153693E-005,
     -8.010193625184903E-004,
 …
 float erfcf(float a)
+float cephes_erfcf(float a)
+{
     float MAXLOG = 88.72283905206835;
 …
 float erff(float x)
+float cephes_erff(float x)
+{
     float y, z;
 …
     // TODO: tinycc does not support fabsf
     if (fabs(x) > 1.0)
         return (1.0 - erfcf(x));
+        return (1.0 - cephes_erfcf(x));
     z = x * x;
 …
 #endif // SINGLE_PRECISION
-#endif // NEED_ERF
 #if FLOAT_SIZE>4
+//static double sas_erf(double x) { return erf(x); }
+//static double sas_erfc(double x) { return erfc(x); }
+#define sas_erf cephes_erf
+#define sas_erfc cephes_erfc
+#else
+#define sas_erf cephes_erff
+#define sas_erfc cephes_erfcf
+#endif
+#else // !NEED_ERF
+#if FLOAT_SIZE>4
+//static double sas_erf(double x) { return erf(x); }
+//static double sas_erfc(double x) { return erfc(x); }
 #define sas_erf erf
 #define sas_erfc erfc
 …
 #define sas_erfc erfcf
 #endif
+#endif // !NEED_ERF

Note: See TracChangeset for help on using the changeset viewer.

SasView

Changeset b3796fa in sasmodels

Legend:

sasmodels/kernel_header.c

sasmodels/models/lib/sas_erf.c

Download in other formats: