d2/d11/VDTMath_8h_source.html

 #ifndef vdt_math_h

 #define vdt_math_h


 /*******************************************************************************

  *

  * VDT math library: collection of double precision vectorisable transcendental

  * functions.

  * The c++11 standard is used: remember to enable it for the compilation.

  *

  * The basic idea is to exploit Pade polynomials.

  * A lot of ideas were inspired by the cephes math library (by Stephen L. Moshier

  * moshier@na-net.ornl.gov) as well as actual code for the exp, log, sin, cos,

  * tan, asin, acos and atan functions. The Cephes library can be found here:

  * http://www.netlib.org/cephes/

  *

  ******************************************************************************/


 #include <iostream>

 #include <cmath>

 #include <limits>


 // used to enable some compiler option internally if needed

 // CMS_VECTORIZE expands to nothing; the visible part of this header never references it.
 #define CMS_VECTORIZE

 // CMS_VECTORIZE_VERBOSE is pasted into the vector wrappers further down.
 // The active definition is empty; the commented-out one would expand to a
 // GCC "optimize" attribute requesting verbose vectoriser output.
 //#define CMS_VECTORIZE_VERBOSE __attribute__ ((optimize("-ftree-vectorizer-verbose=7")))

 #define CMS_VECTORIZE_VERBOSE

 // VDT_RESTRICT qualifies the pointer parameters of the vector wrappers.
 // The active definition is empty; the commented-out one maps it to __restrict__.
 //#define VDT_RESTRICT __restrict__

 #define VDT_RESTRICT


 // Prefix used by every inline function of this header: always_inline attribute plus `inline`.
 #define VDT_FORCE_INLINE __attribute__((always_inline)) inline


 namespace vdt {


 // parameters

 // LOG2E scales the argument of fast_exp before rounding to the nearest integer.
 constexpr double LOG2E = 1.4426950408889634073599; // 1/log(2)

 // SQRTH is the threshold below which fast_log doubles the mantissa and
 // decrements the exponent (numerically sqrt(1/2)).
 constexpr double SQRTH = 0.70710678118654752440;


 /*

 Pade polynomial coefficients and constants needed throughout the code.

 The result of constexpr *here* is likely to be the same of const static

 nevertheless we show its power: all the computations will take place at compile

 time

 */


 // exp

 // fast_exp returns +infinity above EXP_LIMIT and 0 below -EXP_LIMIT.
 constexpr double EXP_LIMIT = 708.;

 // PX1exp..PX3exp: coefficients of P(x^2) in fast_exp, highest order first
 // (they are consumed in this order by the Horner scheme there).
 constexpr double PX1exp = 1.26177193074810590878E-4;

 constexpr double PX2exp = 3.02994407707441961300E-2;

 constexpr double PX3exp = 9.99999999999999999910E-1;

 // QX1exp..QX4exp: coefficients of Q(x^2) in fast_exp, highest order first.
 constexpr double QX1exp = 3.00198505138664455042E-6;

 constexpr double QX2exp = 2.52448340349684104192E-3;

 constexpr double QX3exp = 2.27265548208155028766E-1;

 constexpr double QX4exp = 2.00000000000000000009E0;


 // logarithm

 // fast_log returns +infinity for arguments above LOG_UPPER_LIMIT ...
 constexpr double LOG_UPPER_LIMIT = 1e307;

 // ... and -infinity for arguments below LOG_LOWER_LIMIT.
 constexpr double LOG_LOWER_LIMIT = 1e-307;

 // PX1log..PX6log: numerator coefficients used by fast_log, highest order first.
 constexpr double PX1log = 1.01875663804580931796E-4;

 constexpr double PX2log = 4.97494994976747001425E-1;

 constexpr double PX3log = 4.70579119878881725854E0;

 constexpr double PX4log = 1.44989225341610930846E1;

 constexpr double PX5log = 1.79368678507819816313E1;

 constexpr double PX6log = 7.70838733755885391666E0;


 // QX1log..QX5log: denominator coefficients used by fast_log, highest order
 // first. The denominator is monic: fast_log starts its Horner scheme from x
 // itself, so the leading coefficient 1 is implicit.
 constexpr double QX1log = 1.12873587189167450590E1;

 constexpr double QX2log = 4.52279145837532221105E1;

 constexpr double QX3log = 8.29875266912776603211E1;

 constexpr double QX4log = 7.11544750618563894466E1;

 constexpr double QX5log = 2.31251620126765340583E1;


 // Sin and cos

 // DP1sc..DP3sc: three successively smaller terms that fast_sin/fast_cos
 // subtract one after the other, each multiplied by the octant count y
 // ("extended precision modular arithmetic"). Their sum is numerically pi/4.
 constexpr double DP1sc = 7.85398125648498535156E-1;

 constexpr double DP2sc = 3.77489470793079817668E-8;

 constexpr double DP3sc = 2.69515142907905952645E-15;

 // Multiples and fractions of pi, built from the M_PI* macros.
 constexpr double TWOPI = 2.*M_PI;

 constexpr double PI = M_PI;

 constexpr double PIO2 = M_PI_2;

 constexpr double PIO4 = M_PI_4;


 // Sin

 // SIN_UPPER_LIMIT / SIN_LOWER_LIMIT are not referenced in the visible part of this header.
 constexpr double SIN_UPPER_LIMIT = TWOPI;

 constexpr double SIN_LOWER_LIMIT = -SIN_UPPER_LIMIT;

 // C1sin..C6sin: coefficients of the sine polynomial in z^2, highest order first.
 constexpr double C1sin = 1.58962301576546568060E-10;

 constexpr double C2sin =-2.50507477628578072866E-8;

 constexpr double C3sin = 2.75573136213857245213E-6;

 constexpr double C4sin =-1.98412698295895385996E-4;

 constexpr double C5sin = 8.33333333332211858878E-3;

 constexpr double C6sin =-1.66666666666666307295E-1;


 //Cos

 // C1cos..C6cos: coefficients of the cosine polynomial in z^2, highest order first.
 constexpr double C1cos =-1.13585365213876817300E-11;

 constexpr double C2cos = 2.08757008419747316778E-9;

 constexpr double C3cos =-2.75573141792967388112E-7;

 constexpr double C4cos = 2.48015872888517045348E-5;

 constexpr double C5cos =-1.38888888888730564116E-3;

 constexpr double C6cos = 4.16666666666665929218E-2;


 // Asin and acos


 // RX1asin..RX5asin: numerator coefficients of the rational function that
 // fast_asin evaluates in (1 - |x|), highest order first.
 constexpr double RX1asin = 2.967721961301243206100E-3;

 constexpr double RX2asin = -5.634242780008963776856E-1;

 constexpr double RX3asin = 6.968710824104713396794E0;

 constexpr double RX4asin = -2.556901049652824852289E1;

 constexpr double RX5asin = 2.853665548261061424989E1;


 // SX1asin..SX4asin: matching denominator coefficients (monic polynomial,
 // leading coefficient 1 implicit).
 constexpr double SX1asin = -2.194779531642920639778E1;

 constexpr double SX2asin =  1.470656354026814941758E2;

 constexpr double SX3asin = -3.838770957603691357202E2;

 constexpr double SX4asin = 3.424398657913078477438E2;


 // PX1asin..PX6asin: numerator coefficients of the rational function that
 // fast_asin evaluates in x^2 when |x| < 0.625, highest order first.
 constexpr double PX1asin = 4.253011369004428248960E-3;

 constexpr double PX2asin = -6.019598008014123785661E-1;

 constexpr double PX3asin = 5.444622390564711410273E0;

 constexpr double PX4asin = -1.626247967210700244449E1;

 constexpr double PX5asin = 1.956261983317594739197E1;

 constexpr double PX6asin = -8.198089802484824371615E0;


 // QX1asin..QX5asin: matching denominator coefficients (monic polynomial,
 // leading coefficient 1 implicit).
 constexpr double QX1asin = -1.474091372988853791896E1;

 constexpr double QX2asin =  7.049610280856842141659E1;

 constexpr double QX3asin = -1.471791292232726029859E2;

 constexpr double QX4asin = 1.395105614657485689735E2;

 constexpr double QX5asin = -4.918853881490881290097E1;


 //Tan

 // PX1tan..PX3tan: numerator coefficients of the rational function that
 // fast_tan evaluates in z^2, highest order first.
 constexpr double PX1tan=-1.30936939181383777646E4;

 constexpr double PX2tan=1.15351664838587416140E6;

 constexpr double PX3tan=-1.79565251976484877988E7;


 // QX1tan..QX4tan: matching denominator coefficients (monic polynomial,
 // leading coefficient 1 implicit).
 constexpr double QX1tan = 1.36812963470692954678E4;

 constexpr double QX2tan = -1.32089234440210967447E6;

 constexpr double QX3tan = 2.50083801823357915839E7;

 constexpr double QX4tan = -5.38695755929454629881E7;


 // DP1tan..DP3tan: three successively smaller terms that fast_tan subtracts
 // one after the other, each multiplied by y, during its range reduction.
 // Their sum is numerically pi/4.
 constexpr double DP1tan = 7.853981554508209228515625E-1;

 constexpr double DP2tan = 7.94662735614792836714E-9;

 constexpr double DP3tan = 3.06161699786838294307E-17;

 // TAN_LIMIT is not referenced in the visible part of this header.
 constexpr double TAN_LIMIT = TWOPI;


 // Atan

 // T3PO8: arguments above this value are mapped by fast_atan to -1/x
 // (numerically 1 + sqrt(2)).
 constexpr double T3PO8 = 2.41421356237309504880;
 // MOREBITS / MOREBITSO2: small corrections added by fast_atan together with
 // the pi/2 and pi/4 offsets respectively (fast_asin uses MOREBITS as well).
 constexpr double MOREBITS = 6.123233995736765886130E-17;
 constexpr double MOREBITSO2 = MOREBITS/2.;

 // PX1atan..PX5atan: numerator coefficients of the rational function that
 // fast_atan evaluates in x^2, highest order first.
 constexpr double PX1atan = -8.750608600031904122785E-1;
 constexpr double PX2atan = -1.615753718733365076637E1;
 constexpr double PX3atan = -7.500855792314704667340E1;
 constexpr double PX4atan = -1.228866684490136173410E2;
 constexpr double PX5atan = -6.485021904942025371773E1;

 // QX1atan..QX5atan: matching denominator coefficients (monic polynomial,
 // leading coefficient 1 implicit). All of them are positive: QX1atan used to
 // carry a spurious minus sign, which degraded the approximation to roughly
 // 1e-5 absolute accuracy (e.g. at x = 0.5).
 constexpr double QX1atan = 2.485846490142306297962E1;
 constexpr double QX2atan = 1.650270098316988542046E2;
 constexpr double QX3atan = 4.328810604912902668951E2;
 constexpr double QX4atan = 4.853903996359136964868E2;
 constexpr double QX5atan = 1.945506571482613964425E2;

 // ATAN_LIMIT is not referenced in the visible part of this header.
 constexpr double ATAN_LIMIT = 1e307;


 // Inverse Sqrt

 // The iteration count is passed as an argument to fast_isqrt_general instead
 // of being fixed by this (disabled) constant.
 // constexpr unsigned int ISQRT_ITERATIONS = 4;

 // SQRT_LIMIT is not referenced in the visible part of this header.
 constexpr double SQRT_LIMIT = 1e307;


 // Service----------------------------------------------------------------------

 // Declaration only: the definition is not part of this header.
 void print_instructions_info();


 //------------------------------------------------------------------------------


 // Overlay of several views on the same storage, used to reinterpret the bit
 // pattern of a double as integers (and back): one double, two ints, one
 // long long or four unsigned shorts.
 union ieee754 {
   double d;
   int i[2];
   long long ll;
   unsigned short s[4];
 };


 //------------------------------------------------------------------------------


 // Reinterprets the bit pattern x as a double: x is stored through the integer
 // member of an ieee754 union and read back through its double member.
 VDT_FORCE_INLINE double ll2d(unsigned long long x) {
   ieee754 pun;
   pun.ll = x;
   const double as_double = pun.d;
   return as_double;
 }


 //------------------------------------------------------------------------------


 // Returns the bit pattern of the double x as an unsigned long long: x is
 // stored through the double member of an ieee754 union and read back through
 // its integer member.
 VDT_FORCE_INLINE unsigned long long d2ll(double x) {
   ieee754 pun;
   pun.d = x;
   const unsigned long long as_bits = pun.ll;
   return as_bits;
 }


 //------------------------------------------------------------------------------

 // Splits x into mantissa and exponent by direct bit manipulation.
 //   x  : value to decompose
 //   fe : receives the unbiased exponent plus one, stored as a double
 // Returns the 52 fraction bits of x recombined with the sign/exponent bits of
 // 0.5; the sign of x is dropped.
 VDT_FORCE_INLINE double getMantExponent(double x, double& fe){

   const unsigned long long bits = d2ll(x);

   // The 11 exponent bits sit just above the 52 fraction bits; the mask also
   // removes the sign bit. The value is narrowed to int before any arithmetic
   // because sums on unsigned long long do not vectorise.
   const int biased_exponent = (bits >> 52) & 0x7ffLL;

   // Remove the bias (1023); the extra +1 makes the result identical to frexp.
   fe = (biased_exponent - 1023) + 1;

   // Thirteen hex f digits = 52 ones: keep the fraction, clear exponent and sign.
   const unsigned long long fraction = bits & 0xfffffffffffffLL;

   // Install the exponent field of 0.5, which pairs with the +1 applied above.
   const unsigned long long half_bits = d2ll(0.5);
   return ll2d(fraction | half_bits);
 }


 //------------------------------------------------------------------------------

 // Now the mathematical functions are encoded.


 // Exp -------------------------------------------------------------------------

 // Vectorises in a loop without any change in 4.7

 // Exponential function.
 //   x : argument
 // Returns an approximation of e^x; +infinity when x > EXP_LIMIT and 0 when
 // x < -EXP_LIMIT.
 // The body is branch-free up to the two final overrides, so intermediate
 // values are also computed for out-of-range arguments and then discarded.
 VDT_FORCE_INLINE double fast_exp(double x){

     const double initial_x = x;

     // Nearest integer to x/log(2).
     double px = std::floor(LOG2E * x + 0.5);

     int n = px;

     // Subtract n*log(2) in two steps (coarse part first, small remainder second).
     x -= px * 6.93145751953125E-1;
     x -= px * 1.42860682030941723212E-6;

     const double xx = x * x;

     // px = x * P(x**2).
     px = PX1exp;
     px *= xx;
     px += PX2exp;
     px *= xx;
     px += PX3exp;
     px *= x;

     // Evaluate Q(x**2).
     double qx = QX1exp;
     qx *= xx;
     qx += QX2exp;
     qx *= xx;
     qx += QX3exp;
     qx *= xx;
     qx += QX4exp;

     // e**x = 1 + 2x P(x**2)/( Q(x**2) - P(x**2) )
     x = px / (qx - px);
     x = 1.0 + 2.0 * x;

     // Build 2^n in double: the biased exponent goes into bits 52 and above.
     // The shift is done on an unsigned value because n + 1023 is negative for
     // arguments below the lower limit and left-shifting a negative signed
     // integer is undefined behaviour before C++20. The resulting bit pattern
     // is unchanged for every in-range argument.
     n += 1023;
     const double two_to_n = ll2d(static_cast<unsigned long long>(n) << 52);

     double res = x * two_to_n;

     if (initial_x > EXP_LIMIT)
             res = std::numeric_limits<double>::infinity();
     if (initial_x < -EXP_LIMIT)
             res = 0.;

     return res;
 }


 // Log -------------------------------------------------------------------------


 // Natural logarithm.
 //   x : argument
 // Returns an approximation of log(x); +infinity when x > LOG_UPPER_LIMIT and
 // -infinity when x < LOG_LOWER_LIMIT (this includes zero and negative values).
 VDT_FORCE_INLINE double fast_log(double x){

     const double original_arg = x;

     // Decompose the argument: x becomes the mantissa, expo the power of two.
     double expo;
     x = getMantExponent(x,expo);

     // Mantissas below SQRTH are doubled and the exponent lowered to compensate.
     if( x < SQRTH ) {
       expo -= 1;
       x += x;
       }
     x -= 1.0;

     const double x_sq = x*x;

     // Numerator polynomial, Horner scheme in x.
     double num = PX1log;
     num *= x;
     num += PX2log;
     num *= x;
     num += PX3log;
     num *= x;
     num += PX4log;
     num *= x;
     num += PX5log;
     num *= x;
     num += PX6log;
     // Extra factor x * x^2 needed by the final formula.
     num *= x;
     num *= x_sq;

     // Denominator polynomial (monic), Horner scheme in x.
     double den = x;
     den += QX1log;
     den *= x;
     den += QX2log;
     den *= x;
     den += QX3log;
     den *= x;
     den += QX4log;
     den *= x;
     den += QX5log;

     double correction = num / den;

     // The exponent contribution is applied in two pieces (small one here,
     // large one below).
     correction -= expo * 2.121944400546905827679e-4;
     correction -= 0.5 * x_sq;

     double result = x + correction;
     result += expo * 0.693359375;

     if (original_arg > LOG_UPPER_LIMIT)
       result = std::numeric_limits<double>::infinity();
     if (original_arg < LOG_LOWER_LIMIT)
       result = - std::numeric_limits<double>::infinity();

     return result;
   }


 //------------------------------------------------------------------------------

 // Sine.
 //   x : angle in radians; the folding below only covers [-2pi, 2pi].
 // Returns an approximation of sin(x).
 VDT_FORCE_INLINE double fast_sin(double x){

   // sin(-x) = -sin(x)
   int sign = 1;
   if (x < 0){
     x = - x;
     sign = -1;
     }

   // sin(x) = -sin(2pi - x): fold (pi, 2pi] onto [0, pi)
   if( x > PI ){
     x = TWOPI - x;
     sign = - sign;
     }

   // sin(x) = sin(pi - x): fold (pi/2, pi] onto [0, pi/2)
   if( x > PIO2 )
     x = PI - x ;

   // x now lies in [0, pi/2]. Up to pi/4 the sine polynomial is evaluated at
   // x itself (y = 0); above pi/4 the cosine polynomial is evaluated at
   // x - pi/2 (y = 2 multiples of pi/4).
   // The octant used to be derived from int(x/PIO4), which gave y = 1 at
   // exactly x == PIO4 and y = 3 at exactly x == PIO2 and therefore wrong
   // results (about 0 and about 0.707) at those two points.
   int j = 0;
   double y = 0.;
   if (x > PIO4){
      j = 2;
      y = 2.;
      }

   /* Extended precision modular arithmetic */
   double z = ((x - y * DP1sc) - y * DP2sc) - y * DP3sc;

   double zz = z * z;

   double px=0;

   if( j==2 ){
     // cosine polynomial
     px  = C1cos;
     px *= zz;
     px += C2cos;
     px *= zz;
     px += C3cos;
     px *= zz;
     px += C4cos;
     px *= zz;
     px += C5cos;
     px *= zz;
     px += C6cos;
     y = 1.0 - zz * .5 + zz * zz * px;
     }
   else{
     // sine polynomial
     px  = C1sin;
     px *= zz;
     px += C2sin;
     px *= zz;
     px += C3sin;
     px *= zz;
     px += C4sin;
     px *= zz;
     px += C5sin;
     px *= zz;
     px += C6sin;
     y = z  +  z * zz * px;
     }

   y *= sign;

   return y;
   }


 //------------------------------------------------------------------------------


 // Arcsine.
 //   x : argument
 // Returns an approximation of asin(x). Both approximations (the one in
 // 1 - |x| and the one in x^2) are computed unconditionally; the second one
 // replaces the first when |x| < 0.625.
 VDT_FORCE_INLINE double fast_asin(double x){

   int sign=1;
   double a = x; //necessary for linear approx

   // a = |x|, sign remembers the original sign
   if ( x < 0. ){
     sign *= -1;
     a *= -1;
     }

   double p, z, zz;
   double px,qx;

   /* arcsin(1-x) = pi/2 - sqrt(2x)(1+R(x))  */
   zz = 1.0 - a;

   px = RX1asin;
   px*= zz;
   px+= RX2asin;
   px*= zz;
   px+= RX3asin;
   px*= zz;
   px+= RX4asin;
   px*= zz;
   px+= RX5asin;

   qx = zz;
   qx+= SX1asin;
   qx*= zz;
   qx+= SX2asin;
   qx*= zz;
   qx+= SX3asin;
   qx*= zz;
   qx+= SX4asin;

   p =zz* px/qx;

   // pi/2 is added as two halves (PIO4 twice), with MOREBITS folded into the
   // subtracted term.
   zz = std::sqrt(zz+zz);
   z = PIO4 - zz;
   zz = zz * p - MOREBITS;
   z -= zz;
   z += PIO4;

   if( a < 0.625 ){
     zz = a * a;
     px = PX1asin;
     px*= zz;
     px+= PX2asin;
     px*= zz;
     px+= PX3asin;
     px*= zz;
     px+= PX4asin;
     px*= zz;
     px+= PX5asin;
     px*= zz;
     px+= PX6asin;

     qx = zz;
     qx+= QX1asin;
     qx*= zz;
     qx+= QX2asin;
     qx*= zz;
     qx+= QX3asin;
     qx*= zz;
     qx+= QX4asin;
     qx*= zz;
     qx+= QX5asin;

     z = zz*px/qx;

     z = a * z + a;
     }

   z *= sign;

   // Linear approximation asin(x) ~ x for tiny arguments. The signed input x
   // is returned: returning a (= |x|) dropped the sign of small negative
   // arguments.
   if( a < 1.0e-8 )
     z = x;

   return z;
   }


 //------------------------------------------------------------------------------


 // Cosine.
 //   x : angle in radians; the folding below only covers [-2pi, 2pi].
 // Returns an approximation of cos(x).
 VDT_FORCE_INLINE double fast_cos(double x){

   // cos(-x) = cos(x)
   x = std::abs(x);

   // cos(x) = cos(2pi - x): fold (pi, 2pi] onto [0, pi)
   if( x > PI )
     x = TWOPI - x ;

   // cos(x) = -cos(pi - x): fold (pi/2, pi] onto [0, pi/2)
   int sign = 1;
    if( x > PIO2 ){
      x = PI - x;
      sign=-1;
      }

   // x now lies in [0, pi/2]. Up to pi/4 the cosine polynomial is evaluated at
   // x itself (y = 0); above pi/4 the sine polynomial is evaluated at
   // x - pi/2 (y = 2 multiples of pi/4) and the sign is flipped.
   // The octant used to be derived from int(x/PIO4), which gave y = 1 at
   // exactly x == PIO4 and y = 3 at exactly x == PIO2 and therefore wrong
   // results (about 1 and about 0.707) at those two points.
   int j = 0;
   double y = 0.;
   if (x > PIO4){
     j = 2;
     y = 2.;
     sign = -sign;
     }

   /* Extended precision modular arithmetic */
   double z = ((x - y * DP1sc) - y * DP2sc) - y * DP3sc;

   double zz = z * z;

   double px=0;
   if( j==2 ){
     // sine polynomial
     px  = C1sin;
     px *= zz;
     px += C2sin;
     px *= zz;
     px += C3sin;
     px *= zz;
     px += C4sin;
     px *= zz;
     px += C5sin;
     px *= zz;
     px += C6sin;
     y = z  +  z * zz * px;
     }
   else{
     // cosine polynomial
     px  = C1cos;
     px *= zz;
     px += C2cos;
     px *= zz;
     px += C3cos;
     px *= zz;
     px += C4cos;
     px *= zz;
     px += C5cos;
     px *= zz;
     px += C6cos;
     y = 1. - zz * .5 + zz * zz * px;
     }

   y *= sign;

   return y;
   }


 // Acos ------------------------------------------------------------------------

 // Arccosine, computed as 2 * asin( sqrt( (1 - x) / 2 ) ).
 //   x : argument
 // Returns an approximation of acos(x).
 VDT_FORCE_INLINE double fast_acos(double x){
   // std::sqrt is spelled out, as in fast_asin, instead of relying on an
   // unqualified sqrt being visible inside this namespace.
   return 2.0 * fast_asin( std::sqrt(0.5 - 0.5 * x ) ) ;
   }


 // Tangent  --------------------------------------------------------------------

 // Tangent.
 //   x : angle in radians
 // Returns an approximation of tan(x).
 // Most of the range reduction is written as integer arithmetic instead of
 // ifs: according to the original author this allowed vectorisation at the
 // price of some performance.
 VDT_FORCE_INLINE double fast_tan( double x ){

    // Make the argument positive but save the sign. The sign is taken from a
    // comparison: the former x/|x| is 0/0 for x == 0, and converting that NaN
    // to int is undefined. For every non-zero finite x both forms give +-1.
    const double abs_x = std::abs(x);
    int sign = (x < 0.) ? -1 : 1;
    x = abs_x;

    // Remove whole multiples of pi (replaces: if (x > PI) x = x - PI;)
    const int nPI = x / PI;
    x = x - nPI * PI;

    // Reflect (pi/2, pi) onto (0, pi/2) and flip the sign
    // (replaces: if (x > PIO2) { x = PI - x; sign = -sign; })
    const int nPIO2 = x / PIO2;
    const int factor = ( 1 - 2 * nPIO2 );
    x = nPIO2 * PI + factor * x;
    sign *= factor;

    /* compute x mod PIO4 */
    const int nPIO4 = x / PIO4;
    double y = 2 * nPIO4;

    /* Extended precision modular arithmetic: subtract y * pi/4 in three steps */
    const double z = ((x - y * DP1tan) - y * DP2tan) - y * DP3tan;

    const double zz = z * z;

    // For tiny z the tangent is z itself; otherwise add the rational correction.
    y = z;

    if( zz > 1.0e-14 ){
        double px = PX1tan;
        px *= zz;
        px += PX2tan;
        px *= zz;
        px += PX3tan;

        double qx = zz;
        qx += QX1tan;
        qx *= zz;
        qx += QX2tan;
        qx *= zz;
        qx += QX3tan;
        qx *= zz;
        qx += QX4tan;

        y = z + z * zz * px / qx;
    }

    // In the second octant the result is -1/y: y - 1*(y + 1/y) == -1/y.
    // The correction is skipped when nPIO4 == 0, because the unconditional
    // form evaluates 0 * (y + 1/y), which is NaN for y == 0 and made
    // fast_tan(0) return NaN. For nPIO4 != 0 the arithmetic is unchanged.
    if( nPIO4 != 0 )
        y -= nPIO4 * (  y  + 1.0 / y);

    y *= sign;

    return y ;
    }


 // Atan -------------------------------------------------------------------------

 // REMEMBER pi/2 == inf!!

 // Arctangent.
 //   x : argument
 // Returns an approximation of atan(x).
 // Three ranges of |x| are handled: up to 0.66 the argument is used directly,
 // above T3PO8 it is replaced by -1/|x| with offset pi/2, in between by
 // (|x|-1)/(|x|+1) with offset pi/4.
 VDT_FORCE_INLINE double fast_atan(double x){

     /* work on |x| and remember the sign */
     int sign = 1;
     if( x < 0.0 ) {
         x = - x;
         sign = -1;
         }

     const double abs_x = x;

     // Start from the middle range and override it for the two outer ranges;
     // the original author found the if-first alternative to be slower.
     double offset = PIO4;
     double low_bits = MOREBITSO2;
     x = (x-1.0) / (x+1.0);

     if( abs_x > T3PO8 ) {
         offset = PIO2;
         low_bits = MOREBITS;
         x = -1.0 / abs_x ;
         }
     if ( abs_x <= 0.66 ) {
         offset = 0.0;
         x = abs_x;
         low_bits = 0.;
         }

     const double x_sq = x * x;

     // Numerator polynomial in x^2 (Horner scheme).
     double num = PX1atan;
     num *= x_sq;
     num += PX2atan;
     num *= x_sq;
     num += PX3atan;
     num *= x_sq;
     num += PX4atan;
     num *= x_sq;
     num += PX5atan;
     num *= x_sq; // extra factor for the final formula

     // Denominator polynomial in x^2 (monic, Horner scheme).
     double den = x_sq;
     den += QX1atan;
     den *= x_sq;
     den += QX2atan;
     den *= x_sq;
     den += QX3atan;
     den *= x_sq;
     den += QX4atan;
     den *= x_sq;
     den += QX5atan;

     // offset + reduced-argument approximation + small correction term
     const double angle = offset + x * num / den + x + low_bits;

     return sign * angle;
     }


 //------------------------------------------------------------------------------


 // Taken from from quake and remixed :-)


 // Inverse square root: bit-level initial guess refined by a fixed number of
 // iterations.
 //   x                : argument
 //   ISQRT_ITERATIONS : number of refinement steps to apply
 // Returns the refined estimate.
 VDT_FORCE_INLINE double fast_isqrt_general(double x, const unsigned short ISQRT_ITERATIONS) {

   const double half_x = x * 0.5;

   // Initial guess: subtract the halved bit pattern of x from a magic constant.
   const unsigned long long guess_bits = 0x5fe6eb50c7aa19f9  - ( d2ll(x) >> 1 );
   double estimate = ll2d(guess_bits);

   // Refinement: estimate <- estimate * (1.5 - x/2 * estimate^2)
   for (unsigned int step=0; step<ISQRT_ITERATIONS; ++step) {
       estimate *= 1.5 - ( half_x * estimate * estimate ) ;
   }

   return estimate;
 }


 //------------------------------------------------------------------------------


 // Inverse square root with four refinement iterations.
 VDT_FORCE_INLINE double fast_isqrt(double x) {
   const unsigned short n_iterations = 4;
   return fast_isqrt_general(x, n_iterations);
 }


 // Cheaper inverse square root: three refinement iterations (one fewer than
 // fast_isqrt).
 VDT_FORCE_INLINE double fast_approx_isqrt(double x) {
   const unsigned short n_iterations = 3;
   return fast_isqrt_general(x, n_iterations);
 }


 //------------------------------------------------------------------------------


 // Reference inverse square root built on std::sqrt.
 VDT_FORCE_INLINE double std_isqrt (double x) {
   const double root = std::sqrt(x);
   return 1./root;
 }


 //------------------------------------------------------------------------------


 // Reciprocal computed as the square of fast_isqrt(|x|), with the sign of x
 // restored afterwards.
 VDT_FORCE_INLINE double fast_inv (double x) {
     const bool negative = x < 0.0;
     const double sign = negative ? -1 : 1;
     const double magnitude = negative ? -x : x;

     const double inv_root = fast_isqrt(magnitude);
     return inv_root*inv_root*sign;
     }


 // Reciprocal computed as the square of fast_approx_isqrt(|x|), with the sign
 // of x restored afterwards.
 VDT_FORCE_INLINE double fast_approx_inv (double x) {
     const bool negative = x < 0.0;
     const double sign = negative ? -1 : 1;
     const double magnitude = negative ? -x : x;

     const double inv_root = fast_approx_isqrt(magnitude);
     return inv_root*inv_root*sign;
     }


 // Reference reciprocal: plain floating point division.
 VDT_FORCE_INLINE double std_inv (double x) {
   const double reciprocal = 1./x;
   return reciprocal;
 }


 //------------------------------------------------------------------------------

 // Some preprocessor in order to avoid a lot of error prone repetitions

 // CMS_VECTORIZE_VERBOSE is a preprocessor variable in a preprocessor function


 // Fast vector functions

 // FAST_VECT_FUNC(NAME) defines
 //   void NAME_vect(const double* input, double* output, unsigned int arr_size)
 // which stores NAME(input[i]) into output[i] for every i in [0, arr_size).
 // CMS_VECTORIZE_VERBOSE is placed in front of the declaration: in its former
 // position, after the assignment expression, the code stopped compiling as
 // soon as the macro expanded to an attribute. VDT_FORCE_INLINE replaces the
 // hand-written copy of its expansion.
 #define FAST_VECT_FUNC(NAME) CMS_VECTORIZE_VERBOSE VDT_FORCE_INLINE void NAME##_vect(double const * VDT_RESTRICT input , double * VDT_RESTRICT output, const unsigned int arr_size) { \
   for (unsigned int i=0;i<arr_size;++i) \
     output[i] = NAME ( input[i] ); \
     }


 // Declaration only; per its name, a variant of the exp loop for gcc 4.6
 // (the definition is not part of this header).
 void fast_exp_vect_46(double const* input, double* output, const unsigned int arr_size);


 // Each FAST_VECT_FUNC(f) line below defines f_vect(input, output, arr_size),
 // which applies f element by element.
 // NOTE(review): the "Profitability threshold" remarks look like figures
 // reported by the compiler's vectoriser; confirm before relying on them.
 // Profitability threshold = 3

 FAST_VECT_FUNC(fast_exp)


 // Declaration only; per its name, a variant of the log loop for gcc 4.6
 // (the definition is not part of this header).
 void fast_log_vect_46(double const* input, double* output, const unsigned int arr_size);


 // Profitability threshold = 3

 FAST_VECT_FUNC(fast_log)


 // Profitability threshold = 7

 FAST_VECT_FUNC(fast_sin)


 // Profitability threshold = 3

 FAST_VECT_FUNC(fast_asin)


 // Profitability threshold = 7

 FAST_VECT_FUNC(fast_cos)


 // Profitability threshold = 3

 FAST_VECT_FUNC(fast_acos)


 //Profitability threshold = 3

 FAST_VECT_FUNC(fast_tan)


 //Profitability threshold = 3

 FAST_VECT_FUNC(fast_atan)


 //Profitability threshold = 2 (2!!!)

 FAST_VECT_FUNC(fast_isqrt)


 //Profitability threshold = 2 (2!!!)

 FAST_VECT_FUNC(fast_approx_isqrt)


 //Profitability threshold = 2

 FAST_VECT_FUNC(fast_inv)


 //Profitability threshold = 2

 FAST_VECT_FUNC(fast_approx_inv)


 //------------------------------------------------------------------------------

 // Reference vector functions

 // VECT_FUNC(NAME) defines
 //   void std_NAME_vect(const double* input, double* output, unsigned int arr_size)
 // which stores std::NAME(input[i]) into output[i] for every i in [0, arr_size).
 // CMS_VECTORIZE_VERBOSE is placed in front of the declaration: in its former
 // position, after the assignment expression, the code stopped compiling as
 // soon as the macro expanded to an attribute. VDT_FORCE_INLINE replaces the
 // hand-written copy of its expansion.
 #define VECT_FUNC(NAME) CMS_VECTORIZE_VERBOSE VDT_FORCE_INLINE void std_##NAME##_vect(double const * VDT_RESTRICT input , double* VDT_RESTRICT output, const unsigned int arr_size) { \
   for (unsigned int i=0;i<arr_size;++i) \
     output[i] = std::NAME ( input[i] ); \
     }


 // Each VECT_FUNC(f) line below defines std_f_vect(input, output, arr_size),
 // which applies std::f element by element (reference counterparts of the
 // fast_*_vect functions).
 VECT_FUNC(exp)


 VECT_FUNC(log)


 VECT_FUNC(sin)


 VECT_FUNC(asin)


 VECT_FUNC(cos)


 VECT_FUNC(acos)


 VECT_FUNC(tan)


 VECT_FUNC(atan)


 // Applies std_isqrt to each of the first arr_size elements of input and
 // writes the results to the matching positions of output.
 VDT_FORCE_INLINE void std_isqrt_vect(double const * VDT_RESTRICT input ,
                     double* VDT_RESTRICT output,
                     const unsigned int arr_size) CMS_VECTORIZE_VERBOSE{
   //Profitability threshold = 6
   for (unsigned int idx = 0; idx < arr_size; ++idx) {
     const double value = input[idx];
     output[idx] = vdt::std_isqrt(value);
   }
   }


 // Applies std_inv to each of the first arr_size elements of input and
 // writes the results to the matching positions of output.
 VDT_FORCE_INLINE void std_inv_vect(double const * VDT_RESTRICT input ,
                     double* VDT_RESTRICT output,
                     const unsigned int arr_size) CMS_VECTORIZE_VERBOSE{
   //Profitability threshold = 6
   for (unsigned int idx = 0; idx < arr_size; ++idx) {
     const double value = input[idx];
     output[idx] = vdt::std_inv(value);
   }
   }


 //------------------------------------------------------------------------------


 } // end of vdt namespace


 #endif


vdt::PX3tan
constexpr double PX3tan
Definition: VDTMath.h:127

vdt::fast_approx_isqrt
VDT_FORCE_INLINE double fast_approx_isqrt(double x)
Definition: VDTMath.h:768

vdt::QX4log
constexpr double QX4log
Definition: VDTMath.h:68

vdt::QX3log
constexpr double QX3log
Definition: VDTMath.h:67

vdt::QX1asin
constexpr double QX1asin
Definition: VDTMath.h:118

i
int i
Definition: DBlmapReader.cc:9

vdt::PI
constexpr double PI
Definition: VDTMath.h:76

vdt::C5cos
constexpr double C5cos
Definition: VDTMath.h:95

vdt::QX1tan
constexpr double QX1tan
Definition: VDTMath.h:129

vdt::PIO4
constexpr double PIO4
Definition: VDTMath.h:78

vdt::QX4asin
constexpr double QX4asin
Definition: VDTMath.h:121

create_public_lumi_plots.exp
tuple exp
Definition: create_public_lumi_plots.py:1093

vdt::PX1log
constexpr double PX1log
Definition: VDTMath.h:58

vdt::ieee754::d
double d
Definition: VDTMath.h:170

vdt::ieee754::ll
long long ll
Definition: VDTMath.h:172

vdt::QX2asin
constexpr double QX2asin
Definition: VDTMath.h:119

vdt::SQRT_LIMIT
constexpr double SQRT_LIMIT
Definition: VDTMath.h:160

vdt::PX4asin
constexpr double PX4asin
Definition: VDTMath.h:114

vdt::C5sin
constexpr double C5sin
Definition: VDTMath.h:87

vdt::PX2log
constexpr double PX2log
Definition: VDTMath.h:59

vdt::C3cos
constexpr double C3cos
Definition: VDTMath.h:93

vdt::SX2asin
constexpr double SX2asin
Definition: VDTMath.h:107

vdt::PX1asin
constexpr double PX1asin
Definition: VDTMath.h:111

vdt::PX3asin
constexpr double PX3asin
Definition: VDTMath.h:113

LaserDQM_cfg.input
tuple input
Definition: LaserDQM_cfg.py:38

vdt::C6cos
constexpr double C6cos
Definition: VDTMath.h:96

funct::sin
Sin< T >::type sin(const T &t)
Definition: Sin.h:22

vdt::fast_exp_vect_46
void fast_exp_vect_46(double const *input, double *output, const unsigned int arr_size)
Some tweaks to make it vectorise with gcc46.
Definition: VDTMath.cc:63

create_public_lumi_plots.log
log
Definition: create_public_lumi_plots.py:1108

abs
#define abs(x)
Definition: mlp_lapack.h:159

vdt::std_isqrt
VDT_FORCE_INLINE double std_isqrt(double x)
Definition: VDTMath.h:772

vdt::fast_isqrt
VDT_FORCE_INLINE double fast_isqrt(double x)
Definition: VDTMath.h:765

M_PI_2
#define M_PI_2
Definition: CSCGattiFunction.cc:6

vdt::RX5asin
constexpr double RX5asin
Definition: VDTMath.h:104

vdt::DP2tan
constexpr double DP2tan
Definition: VDTMath.h:135

vdt::EXP_LIMIT
constexpr double EXP_LIMIT
Definition: VDTMath.h:46

vdt::QX5asin
constexpr double QX5asin
Definition: VDTMath.h:122

vdt::QX2tan
constexpr double QX2tan
Definition: VDTMath.h:130

vdt::d2ll
VDT_FORCE_INLINE unsigned long long d2ll(double x)
Converts a double to an unsigned long long.
Definition: VDTMath.h:188

vdt::PX2exp
constexpr double PX2exp
Definition: VDTMath.h:48

vdt::TAN_LIMIT
constexpr double TAN_LIMIT
Definition: VDTMath.h:137

vdt::C2sin
constexpr double C2sin
Definition: VDTMath.h:84

vdt::QX3tan
constexpr double QX3tan
Definition: VDTMath.h:131

vdt::DP3tan
constexpr double DP3tan
Definition: VDTMath.h:136

vdt::C3sin
constexpr double C3sin
Definition: VDTMath.h:85

detailsBasic3DVector::z
double double double z
Definition: newBasic3DVector.h:17

FAST_VECT_FUNC
#define FAST_VECT_FUNC(NAME)
Definition: VDTMath.h:802

vdt::SX4asin
constexpr double SX4asin
Definition: VDTMath.h:109

vdt::PX3atan
constexpr double PX3atan
Definition: VDTMath.h:146

vdt::print_instructions_info
void print_instructions_info()
Print the instructions used on screen.
Definition: VDTMath.cc:24

vdt::LOG_UPPER_LIMIT
constexpr double LOG_UPPER_LIMIT
Definition: VDTMath.h:56

vdt::getMantExponent
VDT_FORCE_INLINE double getMantExponent(double x, double &fe)
Like frexp but vectorising and the exponent is a double.
Definition: VDTMath.h:196

vdt::fast_asin
VDT_FORCE_INLINE double fast_asin(double x)
Definition: VDTMath.h:413

vdt::MOREBITSO2
constexpr double MOREBITSO2
Definition: VDTMath.h:142

vdt::fast_exp
VDT_FORCE_INLINE double fast_exp(double x)
Exponential Function.
Definition: VDTMath.h:226

vdt::QX1log
constexpr double QX1log
Definition: VDTMath.h:65

vdt::QX3asin
constexpr double QX3asin
Definition: VDTMath.h:120

vdt::PX2tan
constexpr double PX2tan
Definition: VDTMath.h:126

vdt::RX1asin
constexpr double RX1asin
Definition: VDTMath.h:100

vdt::std_inv_vect
VDT_FORCE_INLINE void std_inv_vect(double const *VDT_RESTRICT input, double *VDT_RESTRICT output, const unsigned int arr_size) CMS_VECTORIZE_VERBOSE
Definition: VDTMath.h:880

vdt::SX1asin
constexpr double SX1asin
Definition: VDTMath.h:106

vdt::SX3asin
constexpr double SX3asin
Definition: VDTMath.h:108

vdt::DP1sc
constexpr double DP1sc
Definition: VDTMath.h:72

mathSSE::sqrt
T sqrt(T t)
Definition: SSEVec.h:46

vdt::std_inv
VDT_FORCE_INLINE double std_inv(double x)
Definition: VDTMath.h:795

vdt::SQRTH
constexpr double SQRTH
Definition: VDTMath.h:36

vdt::LOG_LOWER_LIMIT
constexpr double LOG_LOWER_LIMIT
Definition: VDTMath.h:57

vdt::PX4atan
constexpr double PX4atan
Definition: VDTMath.h:147

funct::cos
Cos< T >::type cos(const T &t)
Definition: Cos.h:22

vdt::QX5log
constexpr double QX5log
Definition: VDTMath.h:69

vdt::std_isqrt_vect
VDT_FORCE_INLINE void std_isqrt_vect(double const *VDT_RESTRICT input, double *VDT_RESTRICT output, const unsigned int arr_size) CMS_VECTORIZE_VERBOSE
Definition: VDTMath.h:872

infinity
const double infinity
Definition: CSCChamberFitter.cc:10

funct::tan
Tan< T >::type tan(const T &t)
Definition: Tan.h:22

j
int j
Definition: DBlmapReader.cc:9

vdt::QX2log
constexpr double QX2log
Definition: VDTMath.h:66

vdt::QX4exp
constexpr double QX4exp
Definition: VDTMath.h:53

vdt::fast_log_vect_46
void fast_log_vect_46(double const *input, double *output, const unsigned int arr_size)
Some tweaks to make it vectorise with gcc46.
Definition: VDTMath.cc:150

vdt::fast_tan
VDT_FORCE_INLINE double fast_tan(double x)
Tan defined between -2pi and 2pi.
Definition: VDTMath.h:579

vdt::SIN_UPPER_LIMIT
constexpr double SIN_UPPER_LIMIT
Definition: VDTMath.h:81

vdt::PX5atan
constexpr double PX5atan
Definition: VDTMath.h:148

vdt::C4sin
constexpr double C4sin
Definition: VDTMath.h:86

vdt::PX1tan
constexpr double PX1tan
Definition: VDTMath.h:125

vdt::PX1atan
constexpr double PX1atan
Definition: VDTMath.h:144

vdt::DP3sc
constexpr double DP3sc
Definition: VDTMath.h:74

vdt::QX4atan
constexpr double QX4atan
Definition: VDTMath.h:153

vdt::QX4tan
constexpr double QX4tan
Definition: VDTMath.h:132

VDT_RESTRICT
#define VDT_RESTRICT
Definition: VDTMath.h:28

vdt::ATAN_LIMIT
constexpr double ATAN_LIMIT
Definition: VDTMath.h:156

vdt::PX1exp
constexpr double PX1exp
Definition: VDTMath.h:47

vdt::RX2asin
constexpr double RX2asin
Definition: VDTMath.h:101

vdt::QX2exp
constexpr double QX2exp
Definition: VDTMath.h:51

VECT_FUNC
#define VECT_FUNC(NAME)
Definition: VDTMath.h:851

vdt::fast_isqrt_general
VDT_FORCE_INLINE double fast_isqrt_general(double x, const unsigned short ISQRT_ITERATIONS)
Definition: VDTMath.h:746

convertSQLitetoXML_cfg.output
tuple output
Definition: convertSQLitetoXML_cfg.py:32

vdt::PX5log
constexpr double PX5log
Definition: VDTMath.h:62

vdt::SIN_LOWER_LIMIT
constexpr double SIN_LOWER_LIMIT
Definition: VDTMath.h:82

M_PI
#define M_PI
Definition: BFit3D.cc:3

vdt::C1cos
constexpr double C1cos
Definition: VDTMath.h:91

detailsBasic3DVector::y
float float y
Definition: newBasic3DVector.h:15

n
int n
Definition: DTDataIntegrityTask.cc:33

vdt::RX3asin
constexpr double RX3asin
Definition: VDTMath.h:102

alignCSCRings.s
list s
Definition: alignCSCRings.py:91

vdt::QX2atan
constexpr double QX2atan
Definition: VDTMath.h:151

compareJSON.const
string const
Definition: compareJSON.py:14

vdt::RX4asin
constexpr double RX4asin
Definition: VDTMath.h:103

vdt::PX2asin
constexpr double PX2asin
Definition: VDTMath.h:112

vdt::fast_cos
VDT_FORCE_INLINE double fast_cos(double x)
Cos defined between -2pi and 2pi.
Definition: VDTMath.h:501

alignCSCRings.e
list e
Definition: alignCSCRings.py:90

vdt::C4cos
constexpr double C4cos
Definition: VDTMath.h:94

vdt::PX2atan
constexpr double PX2atan
Definition: VDTMath.h:145

vdt::fast_sin
VDT_FORCE_INLINE double fast_sin(double x)
Sin defined between -2pi and 2pi.
Definition: VDTMath.h:345

AlCaHLTBitMon_ParallelJobs.p
tuple p
Definition: AlCaHLTBitMon_ParallelJobs.py:152

tmp
std::vector< std::vector< double > > tmp
Definition: MVATrainer.cc:100

vdt::fast_acos
VDT_FORCE_INLINE double fast_acos(double x)
Definition: VDTMath.h:564

vdt::PX3log
constexpr double PX3log
Definition: VDTMath.h:60

vdt::QX1exp
constexpr double QX1exp
Definition: VDTMath.h:50

vdt::PX4log
constexpr double PX4log
Definition: VDTMath.h:61

vdt::PX3exp
constexpr double PX3exp
Definition: VDTMath.h:49

a
double a
Definition: hdecay.h:121

CMS_VECTORIZE_VERBOSE
#define CMS_VECTORIZE_VERBOSE
Definition: VDTMath.h:26

vdt::DP1tan
constexpr double DP1tan
Definition: VDTMath.h:134

vdt::fast_atan
VDT_FORCE_INLINE double fast_atan(double x)
Definition: VDTMath.h:664

vdt::QX3atan
constexpr double QX3atan
Definition: VDTMath.h:152

asciidump.le
int le
Definition: asciidump.py:443

vdt::C1sin
constexpr double C1sin
Definition: VDTMath.h:83

vdt::MOREBITS
constexpr double MOREBITS
Definition: VDTMath.h:141

vdt::TWOPI
constexpr double TWOPI
Definition: VDTMath.h:75

vdt::QX5atan
constexpr double QX5atan
Definition: VDTMath.h:154

vdt::C6sin
constexpr double C6sin
Definition: VDTMath.h:88

vdt::PX6log
constexpr double PX6log
Definition: VDTMath.h:63

vdt::C2cos
constexpr double C2cos
Definition: VDTMath.h:92

vdt::PX5asin
constexpr double PX5asin
Definition: VDTMath.h:115

vdt::DP2sc
constexpr double DP2sc
Definition: VDTMath.h:73

vdt::T3PO8
constexpr double T3PO8
Definition: VDTMath.h:140

x
Definition: DDAxes.h:10

vdt::fast_log
VDT_FORCE_INLINE double fast_log(double x)
Definition: VDTMath.h:279

vdt::PIO2
constexpr double PIO2
Definition: VDTMath.h:77

vdt::PX6asin
constexpr double PX6asin
Definition: VDTMath.h:116

vdt::fast_inv
VDT_FORCE_INLINE double fast_inv(double x)
Definition: VDTMath.h:776

vdt::fast_approx_inv
VDT_FORCE_INLINE double fast_approx_inv(double x)
Definition: VDTMath.h:786

vdt::LOG2E
constexpr double LOG2E
Definition: VDTMath.h:35

constexpr
#define constexpr
Definition: GCC11Compatibility.h:29

vdt::QX3exp
constexpr double QX3exp
Definition: VDTMath.h:52

vdt::QX1atan
constexpr double QX1atan
Definition: VDTMath.h:150

vdt::ll2d
VDT_FORCE_INLINE double ll2d(unsigned long long x)
Converts an unsigned long long to a double.
Definition: VDTMath.h:179

VDT_FORCE_INLINE
#define VDT_FORCE_INLINE
Definition: VDTMath.h:30

vdt::ieee754
Used to switch between different type of interpretations of the data (64 bits)
Definition: VDTMath.h:169