[bb82c03] | 1 | // |
---|
[6e991d6] | 2 | // Cforall Version 1.0.0 Copyright (C) 2016 University of Waterloo |
---|
| 3 | // |
---|
| 4 | // The contents of this file are covered under the licence agreement in the |
---|
| 5 | // file "LICENCE" distributed with Cforall. |
---|
| 6 | // |
---|
[2f5ea69] | 7 | // math.hfa -- |
---|
[bb82c03] | 8 | // |
---|
[6e991d6] | 9 | // Author : Peter A. Buhr |
---|
| 10 | // Created On : Mon Apr 18 23:37:04 2016 |
---|
| 11 | // Last Modified By : Peter A. Buhr |
---|
[95bda0a] | 12 | // Last Modified On : Sat Oct 8 08:40:42 2022 |
---|
| 13 | // Update Count : 136 |
---|
[bb82c03] | 14 | // |
---|
[17e5e2b] | 15 | |
---|
[53a6c2a] | 16 | #pragma once |
---|
[17e5e2b] | 17 | |
---|
[dab7ac7] | 18 | #include <math.h> |
---|
| 19 | #include <complex.h> |
---|
[6e991d6] | 20 | |
---|
[7cfef0d] | 21 | //--------------------------------------- |
---|
[dab7ac7] | 22 | |
---|
[7cfef0d] | 23 | #include "common.hfa" |
---|
[0deeaad] | 24 | #include "bits/debug.hfa" |
---|
[6e991d6] | 25 | |
---|
[7cfef0d] | 26 | //---------------------- General ---------------------- |
---|
[6e991d6] | 27 | |
---|
static inline __attribute__((always_inline)) {
	// Type-specific overloads that forward to the matching C <math.h> routine.  Where no double overload is defined
	// here, the double version is the C library function itself, declared by <math.h>.

	// remainder as an operator (?%?) and by name (fmod)
	float ?%?( float x, float y ) { return fmodf( x, y ); }
	float fmod( float x, float y ) { return fmodf( x, y ); }
	double ?%?( double x, double y ) { return fmod( x, y ); }
	long double ?%?( long double x, long double y ) { return fmodl( x, y ); }
	long double fmod( long double x, long double y ) { return fmodl( x, y ); }

	float remainder( float x, float y ) { return remainderf( x, y ); }
	long double remainder( long double x, long double y ) { return remainderl( x, y ); }

	// C-style remquo: the quotient bits are stored through quo, the remainder is returned
	float remquo( float x, float y, int * quo ) { return remquof( x, y, quo ); }
	long double remquo( long double x, long double y, int * quo ) { return remquol( x, y, quo ); }

	// tuple-style remquo: returns [ quotient bits, remainder ]
	[ int, float ] remquo( float x, float y ) { int q; float rem = remquof( x, y, &q ); return [ q, rem ]; }
	[ int, double ] remquo( double x, double y ) { int q; double rem = remquo( x, y, &q ); return [ q, rem ]; }
	[ int, long double ] remquo( long double x, long double y ) { int q; long double rem = remquol( x, y, &q ); return [ q, rem ]; }

	// floating-point division split by modf: returns [ integral part of x / y, fractional part of x / y ]
	[ float, float ] div( float x, float y ) { float whole; float part = modff( x / y, &whole ); return [ whole, part ]; }
	[ double, double ] div( double x, double y ) { double whole; double part = modf( x / y, &whole ); return [ whole, part ]; }
	[ long double, long double ] div( long double x, long double y ) { long double whole; long double part = modfl( x / y, &whole ); return [ whole, part ]; }

	float fma( float x, float y, float z ) { return fmaf( x, y, z ); }
	long double fma( long double x, long double y, long double z ) { return fmal( x, y, z ); }

	float fdim( float x, float y ) { return fdimf( x, y ); }
	long double fdim( long double x, long double y ) { return fdiml( x, y ); }

	float nan( const char tag[] ) { return nanf( tag ); }
	long double nan( const char tag[] ) { return nanl( tag ); }
} // distribution
---|
[6e991d6] | 63 | |
---|
[dc5376a] | 64 | //---------------------- Exponential ---------------------- |
---|
[6e991d6] | 65 | |
---|
static inline __attribute__((always_inline)) {
	// Overloads that forward to the matching C <math.h> / <complex.h> routine.  Where no double overload is defined
	// here, the double version is the C library function itself, declared by <math.h>.

	// exp: real and complex
	float exp( float x ) { return expf( x ); }
	long double exp( long double x ) { return expl( x ); }
	float _Complex exp( float _Complex x ) { return cexpf( x ); }
	double _Complex exp( double _Complex x ) { return cexp( x ); }
	long double _Complex exp( long double _Complex x ) { return cexpl( x ); }

	// exp2: real only, the complex forwarders below are disabled
	float exp2( float x ) { return exp2f( x ); }
	long double exp2( long double x ) { return exp2l( x ); }
	//float _Complex exp2( float _Complex x ) { return cexp2f( x ); }
	//double _Complex exp2( double _Complex x ) { return cexp2( x ); }
	//long double _Complex exp2( long double _Complex x ) { return cexp2l( x ); }

	float expm1( float x ) { return expm1f( x ); }
	long double expm1( long double x ) { return expm1l( x ); }

	// pow: real and complex
	float pow( float x, float y ) { return powf( x, y ); }
	long double pow( long double x, long double y ) { return powl( x, y ); }
	float _Complex pow( float _Complex x, float _Complex y ) { return cpowf( x, y ); }
	double _Complex pow( double _Complex x, double _Complex y ) { return cpow( x, y ); }
	long double _Complex pow( long double _Complex x, long double _Complex y ) { return cpowl( x, y ); }
} // distribution
---|
[dab7ac7] | 92 | |
---|
| 93 | //---------------------- Logarithm ---------------------- |
---|
| 94 | |
---|
static inline __attribute__((always_inline)) {
	// Overloads that forward to the matching C <math.h> / <complex.h> routine.  Where no double overload is defined
	// here, the double version is the C library function itself, declared by <math.h>.

	float log( float x ) { return logf( x ); }
	long double log( long double x ) { return logl( x ); }
	float _Complex log( float _Complex x ) { return clogf( x ); }
	double _Complex log( double _Complex x ) { return clog( x ); }
	long double _Complex log( long double _Complex x ) { return clogl( x ); }

	// O(1) integer log2, using clz, which returns the number of leading 0-bits, starting at the most significant bit
	// (single instruction on x86).  Returns the index of the highest set bit, or -1 for n == 0 (clz is undefined for
	// 0, so that case is tested first).  The bit width is cast to the signed return type before the subtraction so
	// both arms of the conditional are signed: mixing -1 with an unsigned sizeof expression would convert -1 to a
	// large unsigned value, which is not -1 after widening when size_t is narrower than the return type.
	int log2( unsigned int n ) { return n == 0 ? -1 : (int)(sizeof(n) * __CHAR_BIT__) - 1 - __builtin_clz( n ); }
	long int log2( unsigned long int n ) { return n == 0 ? -1 : (long int)(sizeof(n) * __CHAR_BIT__) - 1 - __builtin_clzl( n ); }
	long long int log2( unsigned long long int n ) { return n == 0 ? -1 : (long long int)(sizeof(n) * __CHAR_BIT__) - 1 - __builtin_clzll( n ); }
	float log2( float x ) { return log2f( x ); }
	long double log2( long double x ) { return log2l( x ); }
	// float _Complex log2( float _Complex x ) { return clog2f( x ); }
	// double _Complex log2( double _Complex x ) { return clog2( x ); }
	// long double _Complex log2( long double _Complex x ) { return clog2l( x ); }

	float log10( float x ) { return log10f( x ); }
	long double log10( long double x ) { return log10l( x ); }
	// float _Complex log10( float _Complex x ) { return clog10f( x ); }
	// double _Complex log10( double _Complex x ) { return clog10( x ); }
	// long double _Complex log10( long double _Complex x ) { return clog10l( x ); }

	float log1p( float x ) { return log1pf( x ); }
	long double log1p( long double x ) { return log1pl( x ); }

	int ilogb( float x ) { return ilogbf( x ); }
	int ilogb( long double x ) { return ilogbl( x ); }

	float logb( float x ) { return logbf( x ); }
	long double logb( long double x ) { return logbl( x ); }

	float sqrt( float x ) { return sqrtf( x ); }
	long double sqrt( long double x ) { return sqrtl( x ); }
	float _Complex sqrt( float _Complex x ) { return csqrtf( x ); }
	double _Complex sqrt( double _Complex x ) { return csqrt( x ); }
	long double _Complex sqrt( long double _Complex x ) { return csqrtl( x ); }

	float cbrt( float x ) { return cbrtf( x ); }
	long double cbrt( long double x ) { return cbrtl( x ); }

	float hypot( float x, float y ) { return hypotf( x, y ); }
	long double hypot( long double x, long double y ) { return hypotl( x, y ); }
} // distribution
---|
[6e991d6] | 149 | |
---|
// Fixed-point log2: returns log2(val) as an unsigned 32.32 value, i.e., the integer part of the logarithm in the upper
// 32 bits and the fractional part in the lower 32 bits.  The fractional part is obtained by quadratic interpolation
// over a 66-entry table of log2(1 + k/64) samples.
// Precondition: val != 0 (count-leading-zeros is undefined for 0).
static inline unsigned long long log2_u32_32( unsigned long long val ) {
	enum {
		TABLE_BITS = 6,
		TABLE_SIZE = (1 << TABLE_BITS) + 2,
	};
	// for(i; TABLE_SIZE) {
	// 	table[i] = (unsigned long long)(log2(1.0 + i / pow(2, TABLE_BITS)) * pow(2, 32));
	// }
	static const unsigned long long table[] = {
		0x0000000000, 0x0005b9e5a1, 0x000b5d69ba, 0x0010eb389f,
		0x001663f6fa, 0x001bc84240, 0x002118b119, 0x002655d3c4,
		0x002b803473, 0x00309857a0, 0x00359ebc5b, 0x003a93dc98,
		0x003f782d72, 0x00444c1f6b, 0x0049101eac, 0x004dc4933a,
		0x005269e12f, 0x00570068e7, 0x005b888736, 0x006002958c,
		0x00646eea24, 0x0068cdd829, 0x006d1fafdc, 0x007164beb4,
		0x00759d4f80, 0x0079c9aa87, 0x007dea15a3, 0x0081fed45c,
		0x0086082806, 0x008a064fd5, 0x008df988f4, 0x0091e20ea1,
		0x0095c01a39, 0x009993e355, 0x009d5d9fd5, 0x00a11d83f4,
		0x00a4d3c25e, 0x00a8808c38, 0x00ac241134, 0x00afbe7fa0,
		0x00b3500472, 0x00b6d8cb53, 0x00ba58feb2, 0x00bdd0c7c9,
		0x00c1404ead, 0x00c4a7ba58, 0x00c80730b0, 0x00cb5ed695,
		0x00ceaecfea, 0x00d1f73f9c, 0x00d53847ac, 0x00d8720935,
		0x00dba4a47a, 0x00ded038e6, 0x00e1f4e517, 0x00e512c6e5,
		0x00e829fb69, 0x00eb3a9f01, 0x00ee44cd59, 0x00f148a170,
		0x00f446359b, 0x00f73da38d, 0x00fa2f045e, 0x00fd1a708b,
		0x0100000000, 0x0102dfca16,
	};
	_Static_assert((sizeof(table) / sizeof(table[0])) == TABLE_SIZE, "TABLE_SIZE should be accurate");
	// starting from val = (2 ** i)*(1 + f) where 0 <= f < 1
	// log identities mean log2(val) = log2((2 ** i)*(1 + f)) = log2(2**i) + log2(1+f)
	//
	// getting i is easy to do using builtin_clz (count leading zero)
	//
	// we want to calculate log2(1+f) independently to have as many bits of precision as possible.
	//     val = (2 ** i)*(1 + f) = 2 ** i + f * 2 ** i
	// isolating f we get
	//     val - 2 ** i = f * 2 ** i
	//     (val - 2 ** i) / 2 ** i = f
	//
	// we want to interpolate from the table to get the values
	// and compromise by doing quadratic interpolation (rather than higher degree interpolation)
	//
	// for the interpolation we want to shift everything so the first sample point
	// of our parabola sits at x = 0
	// this further simplifies the equations
	//
	// the consequence is that we need f in 2 forms:
	//  - finding the index of x0
	//  - finding the distance between f and x0
	//
	// since sample points are equidistant we can significantly simplify the equations

	/* paranoid */ verify( val != 0 );					// clz of 0 is undefined

	// get i; val is unsigned long long, so the "ll" builtin is needed (long may be narrower than long long)
	const unsigned long long bits = sizeof(val) * __CHAR_BIT__;
	const unsigned long long lz = __builtin_clzll(val);
	const unsigned long long i = bits - 1 - lz;

	// get the fractional part as a u32.32: drop the leading 1 bit and keep the next 32 bits
	// the shift is done in two steps because lz + 1 is 64 for val == 1 and shifting by the full width is undefined
	const unsigned long long frac = ((val << lz) << 1) >> 32;

	// get high order bits for the index into the table
	const unsigned long long idx0 = frac >> (32 - TABLE_BITS);

	// get the x offset, i.e., the difference between the first sample point and the actual fractional part
	const long long udx = frac - (idx0 << (32 - TABLE_BITS));
	/* paranoid */ verify((idx0 + 2) < TABLE_SIZE);

	const long long y0 = table[idx0 + 0];
	const long long y1 = table[idx0 + 1];
	const long long y2 = table[idx0 + 2];

	// from there we can quadratically interpolate to get the data, using the Lagrange polynomial
	// normally it would look like:
	//     double r0 = y0 * ((x - x1) / (x0 - x1)) * ((x - x2) / (x0 - x2));
	//     double r1 = y1 * ((x - x0) / (x1 - x0)) * ((x - x2) / (x1 - x2));
	//     double r2 = y2 * ((x - x0) / (x2 - x0)) * ((x - x1) / (x2 - x1));
	// but since the spacing between sample points is fixed, we can simplify it and extract common expressions
	const long long f1 = (y1 - y0);
	const long long f2 = (y2 - y0);
	const long long a = f2 - (f1 * 2l);
	const long long b = (f1 * 2l) - a;

	// Now we can compute it in the form (ax + b)x + c (which avoids repeating steps)
	long long sum = ((a*udx) >> (32 - TABLE_BITS)) + b;
	sum = (sum*udx) >> (32 - TABLE_BITS + 1);
	sum = y0 + sum;

	return (i << 32) + (sum);
}
---|
| 239 | |
---|
[dc5376a] | 240 | //---------------------- Trigonometric ---------------------- |
---|
[6e991d6] | 241 | |
---|
static inline __attribute__((always_inline)) {
	// Overloads that forward to the matching C <math.h> / <complex.h> routine.  Where no double overload is defined
	// here, the double version is the C library function itself, declared by <math.h>.

	float sin( float x ) { return sinf( x ); }
	long double sin( long double x ) { return sinl( x ); }
	float _Complex sin( float _Complex x ) { return csinf( x ); }
	double _Complex sin( double _Complex x ) { return csin( x ); }
	long double _Complex sin( long double _Complex x ) { return csinl( x ); }

	float cos( float x ) { return cosf( x ); }
	long double cos( long double x ) { return cosl( x ); }
	float _Complex cos( float _Complex x ) { return ccosf( x ); }
	double _Complex cos( double _Complex x ) { return ccos( x ); }
	long double _Complex cos( long double _Complex x ) { return ccosl( x ); }

	float tan( float x ) { return tanf( x ); }
	long double tan( long double x ) { return tanl( x ); }
	float _Complex tan( float _Complex x ) { return ctanf( x ); }
	double _Complex tan( double _Complex x ) { return ctan( x ); }
	long double _Complex tan( long double _Complex x ) { return ctanl( x ); }

	float asin( float x ) { return asinf( x ); }
	long double asin( long double x ) { return asinl( x ); }
	float _Complex asin( float _Complex x ) { return casinf( x ); }
	double _Complex asin( double _Complex x ) { return casin( x ); }
	long double _Complex asin( long double _Complex x ) { return casinl( x ); }

	float acos( float x ) { return acosf( x ); }
	long double acos( long double x ) { return acosl( x ); }
	float _Complex acos( float _Complex x ) { return cacosf( x ); }
	double _Complex acos( double _Complex x ) { return cacos( x ); }
	long double _Complex acos( long double _Complex x ) { return cacosl( x ); }

	float atan( float x ) { return atanf( x ); }
	long double atan( long double x ) { return atanl( x ); }
	float _Complex atan( float _Complex x ) { return catanf( x ); }
	double _Complex atan( double _Complex x ) { return catan( x ); }
	long double _Complex atan( long double _Complex x ) { return catanl( x ); }

	// two-argument arc tangent; arguments are passed through to atan2f/atan2l in the order given
	float atan2( float x, float y ) { return atan2f( x, y ); }
	long double atan2( long double x, long double y ) { return atan2l( x, y ); }

	// two-argument atan is an alternative spelling of atan2
	float atan( float x, float y ) { return atan2f( x, y ); }
	double atan( double x, double y ) { return atan2( x, y ); }
	long double atan( long double x, long double y ) { return atan2l( x, y ); }
} // distribution
---|
[6e991d6] | 294 | |
---|
[dc5376a] | 295 | //---------------------- Hyperbolic ---------------------- |
---|
[6e991d6] | 296 | |
---|
static inline __attribute__((always_inline)) {
	// Overloads that forward to the matching C <math.h> / <complex.h> routine.  Where no double overload is defined
	// here, the double version is the C library function itself, declared by <math.h>.

	float sinh( float x ) { return sinhf( x ); }
	long double sinh( long double x ) { return sinhl( x ); }
	float _Complex sinh( float _Complex x ) { return csinhf( x ); }
	double _Complex sinh( double _Complex x ) { return csinh( x ); }
	long double _Complex sinh( long double _Complex x ) { return csinhl( x ); }

	float cosh( float x ) { return coshf( x ); }
	long double cosh( long double x ) { return coshl( x ); }
	float _Complex cosh( float _Complex x ) { return ccoshf( x ); }
	double _Complex cosh( double _Complex x ) { return ccosh( x ); }
	long double _Complex cosh( long double _Complex x ) { return ccoshl( x ); }

	float tanh( float x ) { return tanhf( x ); }
	long double tanh( long double x ) { return tanhl( x ); }
	float _Complex tanh( float _Complex x ) { return ctanhf( x ); }
	double _Complex tanh( double _Complex x ) { return ctanh( x ); }
	long double _Complex tanh( long double _Complex x ) { return ctanhl( x ); }

	float asinh( float x ) { return asinhf( x ); }
	long double asinh( long double x ) { return asinhl( x ); }
	float _Complex asinh( float _Complex x ) { return casinhf( x ); }
	double _Complex asinh( double _Complex x ) { return casinh( x ); }
	long double _Complex asinh( long double _Complex x ) { return casinhl( x ); }

	float acosh( float x ) { return acoshf( x ); }
	long double acosh( long double x ) { return acoshl( x ); }
	float _Complex acosh( float _Complex x ) { return cacoshf( x ); }
	double _Complex acosh( double _Complex x ) { return cacosh( x ); }
	long double _Complex acosh( long double _Complex x ) { return cacoshl( x ); }

	float atanh( float x ) { return atanhf( x ); }
	long double atanh( long double x ) { return atanhl( x ); }
	float _Complex atanh( float _Complex x ) { return catanhf( x ); }
	double _Complex atanh( double _Complex x ) { return catanh( x ); }
	long double _Complex atanh( long double _Complex x ) { return catanhl( x ); }
} // distribution
---|
[dc5376a] | 340 | |
---|
| 341 | //---------------------- Error / Gamma ---------------------- |
---|
| 342 | |
---|
static inline __attribute__((always_inline)) {
	// Overloads that forward to the matching C <math.h> routine.  Where no double overload is defined here, the
	// double version is the C library function itself, declared by <math.h>.

	// erf: real only, the complex prototypes are left disabled
	float erf( float x ) { return erff( x ); }
	long double erf( long double x ) { return erfl( x ); }
	// float _Complex erf( float _Complex );
	// double _Complex erf( double _Complex );
	// long double _Complex erf( long double _Complex );

	// erfc: real only, the complex prototypes are left disabled
	float erfc( float x ) { return erfcf( x ); }
	long double erfc( long double x ) { return erfcl( x ); }
	// float _Complex erfc( float _Complex );
	// double _Complex erfc( double _Complex );
	// long double _Complex erfc( long double _Complex );

	float lgamma( float x ) { return lgammaf( x ); }
	long double lgamma( long double x ) { return lgammal( x ); }

	// lgamma with an extra sign argument forwards to the reentrant *_r routines, which store through sign
	float lgamma( float x, int * sign ) { return lgammaf_r( x, sign ); }
	double lgamma( double x, int * sign ) { return lgamma_r( x, sign ); }
	long double lgamma( long double x, int * sign ) { return lgammal_r( x, sign ); }

	float tgamma( float x ) { return tgammaf( x ); }
	long double tgamma( long double x ) { return tgammal( x ); }
} // distribution
---|
[6e991d6] | 369 | |
---|
[dc5376a] | 370 | //---------------------- Nearest Integer ---------------------- |
---|
| 371 | |
---|
static inline __attribute__((always_inline)) {
	// Integer floor to a multiple: n / align * align using the type's integer division.
	signed char floor( signed char n, signed char align ) { return n / align * align; }
	unsigned char floor( unsigned char n, unsigned char align ) { return n / align * align; }
	short int floor( short int n, short int align ) { return n / align * align; }
	unsigned short int floor( unsigned short int n, unsigned short int align ) { return n / align * align; }
	int floor( int n, int align ) { return n / align * align; }
	unsigned int floor( unsigned int n, unsigned int align ) { return n / align * align; }
	long int floor( long int n, long int align ) { return n / align * align; }
	unsigned long int floor( unsigned long int n, unsigned long int align ) { return n / align * align; }
	long long int floor( long long int n, long long int align ) { return n / align * align; }
	unsigned long long int floor( unsigned long long int n, unsigned long long int align ) { return n / align * align; }

	// forall( T | { T ?/?( T, T ); T ?*?( T, T ); } )
	// T floor( T n, T align ) { return n / align * align; }

	// Integer division rounding up: (n + (align - 1)) / align.
	// NOTE(review): the signed char overload takes align as plain char, unlike every other overload -- confirm
	// whether this is intentional before changing it, as it affects overload resolution.
	signed char ceiling_div( signed char n, char align ) { return (n + (align - 1)) / align; }
	unsigned char ceiling_div( unsigned char n, unsigned char align ) { return (n + (align - 1)) / align; }
	short int ceiling_div( short int n, short int align ) { return (n + (align - 1)) / align; }
	unsigned short int ceiling_div( unsigned short int n, unsigned short int align ) { return (n + (align - 1)) / align; }
	int ceiling_div( int n, int align ) { return (n + (align - 1)) / align; }
	unsigned int ceiling_div( unsigned int n, unsigned int align ) { return (n + (align - 1)) / align; }
	long int ceiling_div( long int n, long int align ) { return (n + (align - 1)) / align; }
	unsigned long int ceiling_div( unsigned long int n, unsigned long int align ) { return (n + (align - 1)) / align; }
	long long int ceiling_div( long long int n, long long int align ) { return (n + (align - 1)) / align; }
	unsigned long long int ceiling_div( unsigned long long int n, unsigned long long int align ) { return (n + (align - 1)) / align; }

	// forall( T | { T ?+?( T, T ); T ?-?( T, T ); T ?%?( T, T ); } )
	// T ceiling_div( T n, T align ) { verify( is_pow2( align ) );return (n + (align - 1)) / align; }

	// Integer ceiling to a multiple: bump n by align - 1 only when it is not already a multiple, then floor.
	// gcc notices the div/mod pair and saves both so only one div.
	signed char ceiling( signed char n, signed char align ) { return floor( n + (n % align != 0 ? align - 1 : 0), align ); }
	unsigned char ceiling( unsigned char n, unsigned char align ) { return floor( n + (n % align != 0 ? align - 1 : 0), align ); }
	short int ceiling( short int n, short int align ) { return floor( n + (n % align != 0 ? align - 1 : 0), align ); }
	unsigned short int ceiling( unsigned short int n, unsigned short int align ) { return floor( n + (n % align != 0 ? align - 1 : 0), align ); }
	int ceiling( int n, int align ) { return floor( n + (n % align != 0 ? align - 1 : 0), align ); }
	unsigned int ceiling( unsigned int n, unsigned int align ) { return floor( n + (n % align != 0 ? align - 1 : 0), align ); }
	long int ceiling( long int n, long int align ) { return floor( n + (n % align != 0 ? align - 1 : 0), align ); }
	unsigned long int ceiling( unsigned long int n, unsigned long int align ) { return floor( n + (n % align != 0 ? align - 1 : 0), align ); }
	long long int ceiling( long long int n, long long int align ) { return floor( n + (n % align != 0 ? align - 1 : 0), align ); }
	unsigned long long int ceiling( unsigned long long int n, unsigned long long int align ) { return floor( n + (n % align != 0 ? align - 1 : 0), align ); }

	// forall( T | { void ?{}( T &, one_t ); T ?+?( T, T ); T ?-?( T, T ); T ?/?( T, T ); } )
	// T ceiling( T n, T align ) { return floor( n + (n % align != 0 ? align - 1 : 0), align ); }

	// Floating-point rounding: overloads forwarding to the matching C <math.h> routine.  Where no double overload is
	// defined here, the double version is the C library function itself, declared by <math.h>.
	float floor( float x ) { return floorf( x ); }
	long double floor( long double x ) { return floorl( x ); }

	float ceil( float x ) { return ceilf( x ); }
	long double ceil( long double x ) { return ceill( x ); }

	float trunc( float x ) { return truncf( x ); }
	long double trunc( long double x ) { return truncl( x ); }

	// rint is additionally overloaded on return type: long int forwards to lrint*, long long int to llrint*
	float rint( float x ) { return rintf( x ); }
	long double rint( long double x ) { return rintl( x ); }
	long int rint( float x ) { return lrintf( x ); }
	long int rint( double x ) { return lrint( x ); }
	long int rint( long double x ) { return lrintl( x ); }
	long long int rint( float x ) { return llrintf( x ); }
	long long int rint( double x ) { return llrint( x ); }
	long long int rint( long double x ) { return llrintl( x ); }

	long int lrint( float x ) { return lrintf( x ); }
	long int lrint( long double x ) { return lrintl( x ); }
	long long int llrint( float x ) { return llrintf( x ); }
	long long int llrint( long double x ) { return llrintl( x ); }

	float nearbyint( float x ) { return nearbyintf( x ); }
	long double nearbyint( long double x ) { return nearbyintl( x ); }

	// round is additionally overloaded on return type: long int forwards to lround*, long long int to llround*
	float round( float x ) { return roundf( x ); }
	long double round( long double x ) { return roundl( x ); }
	long int round( float x ) { return lroundf( x ); }
	long int round( double x ) { return lround( x ); }
	long int round( long double x ) { return lroundl( x ); }
	long long int round( float x ) { return llroundf( x ); }
	long long int round( double x ) { return llround( x ); }
	long long int round( long double x ) { return llroundl( x ); }

	long int lround( float x ) { return lroundf( x ); }
	long int lround( long double x ) { return lroundl( x ); }
	long long int llround( float x ) { return llroundf( x ); }
	long long int llround( long double x ) { return llroundl( x ); }
} // distribution
---|
[6e991d6] | 466 | |
---|
[dc5376a] | 467 | //---------------------- Manipulation ---------------------- |
---|
[6e991d6] | 468 | |
---|
static inline __attribute__((always_inline)) {
	// Overloads that forward to the matching C <math.h> routine.  Where no double overload is defined here, the
	// double version is the C library function itself, declared by <math.h>.

	float copysign( float x, float y ) { return copysignf( x, y ); }
	long double copysign( long double x, long double y ) { return copysignl( x, y ); }

	float frexp( float x, int * ip ) { return frexpf( x, ip ); }
	long double frexp( long double x, int * ip ) { return frexpl( x, ip ); }

	float ldexp( float x, int exp2 ) { return ldexpf( x, exp2 ); }
	long double ldexp( long double x, int exp2 ) { return ldexpl( x, exp2 ); }

	// modf comes in two shapes: the tuple form returns [ integral part, fractional part ], the pointer form stores
	// the integral part through i and returns the fractional part
	[ float, float ] modf( float x ) { float whole; float frac = modff( x, &whole ); return [ whole, frac ]; }
	float modf( float x, float * i ) { return modff( x, i ); }
	[ double, double ] modf( double x ) { double whole; double frac = modf( x, &whole ); return [ whole, frac ]; }
	[ long double, long double ] modf( long double x ) { long double whole; long double frac = modfl( x, &whole ); return [ whole, frac ]; }
	long double modf( long double x, long double * i ) { return modfl( x, i ); }

	float nextafter( float x, float y ) { return nextafterf( x, y ); }
	long double nextafter( long double x, long double y ) { return nextafterl( x, y ); }

	float nexttoward( float x, long double y ) { return nexttowardf( x, y ); }
	long double nexttoward( long double x, long double y ) { return nexttowardl( x, y ); }

	// scalbn with an int exponent forwards to scalbn*, with a long int exponent to scalbln*
	float scalbn( float x, int exp ) { return scalbnf( x, exp ); }
	long double scalbn( long double x, int exp ) { return scalbnl( x, exp ); }
	float scalbn( float x, long int exp ) { return scalblnf( x, exp ); }
	double scalbn( double x, long int exp ) { return scalbln( x, exp ); }
	long double scalbn( long double x, long int exp ) { return scalblnl( x, exp ); }

	float scalbln( float x, long int exp ) { return scalblnf( x, exp ); }
	long double scalbln( long double x, long int exp ) { return scalblnl( x, exp ); }
} // distribution
---|
[0fc52b6] | 508 | |
---|
[6b8b767] | 509 | //--------------------------------------- |
---|
| 510 | |
---|
static inline __attribute__((always_inline)) {
	// Linear interpolation: x weighted by (1 - a) plus y weighted by a.
	forall( T | { void ?{}( T &, one_t ); T ?+?( T, T ); T ?-?( T, T ); T ?*?( T, T ); } )
	T lerp( T x, T y, T a ) {
		return x * ((T){1} - a) + y * a;
	}

	// Step function: 0 when x is below edge, otherwise 1.
	forall( T | { void ?{}( T &, zero_t ); void ?{}( T &, one_t ); int ?<?( T, T ); } )
	T step( T edge, T x ) {
		if ( x < edge ) return (T){0};
		return (T){1};
	}

	// Smooth step: clamp (x - edge0) / (edge1 - edge0) into [0, 1] via the clamp assertion, then evaluate
	// u * u * (3 - 2 * u).
	forall( T | { void ?{}( T &, int ); T clamp( T, T, T ); T ?-?( T, T ); T ?*?( T, T ); T ?/?( T, T ); } )
	T smoothstep( T edge0, T edge1, T x ) {
		T u = clamp( (x - edge0) / (edge1 - edge0), (T){0}, (T){1} );
		return u * u * ((T){3} - (T){2} * u);
	}
} // distribution
---|
[6b8b767] | 521 | |
---|
[6e991d6] | 522 | // Local Variables: // |
---|
| 523 | // mode: c // |
---|
| 524 | // tab-width: 4 // |
---|
| 525 | // End: // |
---|