[bb82c03] | 1 | //
|
---|
[6e991d6] | 2 | // Cforall Version 1.0.0 Copyright (C) 2016 University of Waterloo
|
---|
| 3 | //
|
---|
| 4 | // The contents of this file are covered under the licence agreement in the
|
---|
| 5 | // file "LICENCE" distributed with Cforall.
|
---|
| 6 | //
|
---|
[2f5ea69] | 7 | // math.hfa --
|
---|
[bb82c03] | 8 | //
|
---|
[6e991d6] | 9 | // Author : Peter A. Buhr
|
---|
| 10 | // Created On : Mon Apr 18 23:37:04 2016
|
---|
| 11 | // Last Modified By : Peter A. Buhr
|
---|
[95bda0a] | 12 | // Last Modified On : Sat Oct 8 08:40:42 2022
|
---|
| 13 | // Update Count : 136
|
---|
[bb82c03] | 14 | //
|
---|
[17e5e2b] | 15 |
|
---|
[53a6c2a] | 16 | #pragma once
|
---|
[17e5e2b] | 17 |
|
---|
[dab7ac7] | 18 | #include <math.h>
|
---|
| 19 | #include <complex.h>
|
---|
[6e991d6] | 20 |
|
---|
[7cfef0d] | 21 | //---------------------------------------
|
---|
[dab7ac7] | 22 |
|
---|
[7cfef0d] | 23 | #include "common.hfa"
|
---|
[0deeaad] | 24 | #include "bits/debug.hfa"
|
---|
[6e991d6] | 25 |
|
---|
[7cfef0d] | 26 | //---------------------- General ----------------------
|
---|
[6e991d6] | 27 |
|
---|
[95bda0a] | 28 | static inline __attribute__((always_inline)) {
|
---|
[7cfef0d] | 29 | float ?%?( float x, float y ) { return fmodf( x, y ); }
|
---|
| 30 | float fmod( float x, float y ) { return fmodf( x, y ); }
|
---|
| 31 | double ?%?( double x, double y ) { return fmod( x, y ); }
|
---|
| 32 | // extern "C" { double fmod( double, double ); }
|
---|
| 33 | long double ?%?( long double x, long double y ) { return fmodl( x, y ); }
|
---|
| 34 | long double fmod( long double x, long double y ) { return fmodl( x, y ); }
|
---|
| 35 |
|
---|
| 36 | float remainder( float x, float y ) { return remainderf( x, y ); }
|
---|
| 37 | // extern "C" { double remainder( double, double ); }
|
---|
| 38 | long double remainder( long double x, long double y ) { return remainderl( x, y ); }
|
---|
| 39 |
|
---|
| 40 | float remquo( float x, float y, int * quo ) { return remquof( x, y, quo ); }
|
---|
| 41 | // extern "C" { double remquo( double x, double y, int * quo ); }
|
---|
| 42 | long double remquo( long double x, long double y, int * quo ) { return remquol( x, y, quo ); }
|
---|
| 43 | [ int, float ] remquo( float x, float y ) { int quo; x = remquof( x, y, &quo ); return [ quo, x ]; }
|
---|
| 44 | [ int, double ] remquo( double x, double y ) { int quo; x = remquo( x, y, &quo ); return [ quo, x ]; }
|
---|
| 45 | [ int, long double ] remquo( long double x, long double y ) { int quo; x = remquol( x, y, &quo ); return [ quo, x ]; }
|
---|
| 46 |
|
---|
| 47 | [ float, float ] div( float x, float y ) { y = modff( x / y, &x ); return [ x, y ]; }
|
---|
| 48 | [ double, double ] div( double x, double y ) { y = modf( x / y, &x ); return [ x, y ]; }
|
---|
| 49 | [ long double, long double ] div( long double x, long double y ) { y = modfl( x / y, &x ); return [ x, y ]; }
|
---|
| 50 |
|
---|
| 51 | float fma( float x, float y, float z ) { return fmaf( x, y, z ); }
|
---|
| 52 | // extern "C" { double fma( double, double, double ); }
|
---|
| 53 | long double fma( long double x, long double y, long double z ) { return fmal( x, y, z ); }
|
---|
| 54 |
|
---|
| 55 | float fdim( float x, float y ) { return fdimf( x, y ); }
|
---|
| 56 | // extern "C" { double fdim( double, double ); }
|
---|
| 57 | long double fdim( long double x, long double y ) { return fdiml( x, y ); }
|
---|
| 58 |
|
---|
| 59 | float nan( const char tag[] ) { return nanf( tag ); }
|
---|
| 60 | // extern "C" { double nan( const char [] ); }
|
---|
| 61 | long double nan( const char tag[] ) { return nanl( tag ); }
|
---|
| 62 | } // distribution
|
---|
[6e991d6] | 63 |
|
---|
[dc5376a] | 64 | //---------------------- Exponential ----------------------
|
---|
[6e991d6] | 65 |
|
---|
[95bda0a] | 66 | static inline __attribute__((always_inline)) {
|
---|
[7cfef0d] | 67 | float exp( float x ) { return expf( x ); }
|
---|
| 68 | // extern "C" { double exp( double ); }
|
---|
| 69 | long double exp( long double x ) { return expl( x ); }
|
---|
| 70 | float _Complex exp( float _Complex x ) { return cexpf( x ); }
|
---|
| 71 | double _Complex exp( double _Complex x ) { return cexp( x ); }
|
---|
| 72 | long double _Complex exp( long double _Complex x ) { return cexpl( x ); }
|
---|
| 73 |
|
---|
| 74 | float exp2( float x ) { return exp2f( x ); }
|
---|
| 75 | // extern "C" { double exp2( double ); }
|
---|
| 76 | long double exp2( long double x ) { return exp2l( x ); }
|
---|
| 77 | //float _Complex exp2( float _Complex x ) { return cexp2f( x ); }
|
---|
| 78 | //double _Complex exp2( double _Complex x ) { return cexp2( x ); }
|
---|
| 79 | //long double _Complex exp2( long double _Complex x ) { return cexp2l( x ); }
|
---|
| 80 |
|
---|
| 81 | float expm1( float x ) { return expm1f( x ); }
|
---|
| 82 | // extern "C" { double expm1( double ); }
|
---|
| 83 | long double expm1( long double x ) { return expm1l( x ); }
|
---|
| 84 |
|
---|
| 85 | float pow( float x, float y ) { return powf( x, y ); }
|
---|
| 86 | // extern "C" { double pow( double, double ); }
|
---|
| 87 | long double pow( long double x, long double y ) { return powl( x, y ); }
|
---|
| 88 | float _Complex pow( float _Complex x, float _Complex y ) { return cpowf( x, y ); }
|
---|
| 89 | double _Complex pow( double _Complex x, double _Complex y ) { return cpow( x, y ); }
|
---|
| 90 | long double _Complex pow( long double _Complex x, long double _Complex y ) { return cpowl( x, y ); }
|
---|
| 91 | } // distribution
|
---|
[dab7ac7] | 92 |
|
---|
| 93 | //---------------------- Logarithm ----------------------
|
---|
| 94 |
|
---|
[95bda0a] | 95 | static inline __attribute__((always_inline)) {
|
---|
[7cfef0d] | 96 | float log( float x ) { return logf( x ); }
|
---|
| 97 | // extern "C" { double log( double ); }
|
---|
| 98 | long double log( long double x ) { return logl( x ); }
|
---|
| 99 | float _Complex log( float _Complex x ) { return clogf( x ); }
|
---|
| 100 | double _Complex log( double _Complex x ) { return clog( x ); }
|
---|
| 101 | long double _Complex log( long double _Complex x ) { return clogl( x ); }
|
---|
| 102 |
|
---|
[4c4e444] | 103 | // O(1) polymorphic integer log2, using clz, which returns the number of leading 0-bits, starting at the most
|
---|
| 104 | // significant bit (single instruction on x86)
|
---|
| 105 | int log2( unsigned int n ) { return n == 0 ? -1 : sizeof(n) * __CHAR_BIT__ - 1 - __builtin_clz( n ); }
|
---|
| 106 | long int log2( unsigned long int n ) { return n == 0 ? -1 : sizeof(n) * __CHAR_BIT__ - 1 - __builtin_clzl( n ); }
|
---|
[2f5ea69] | 107 | long long int log2( unsigned long long int n ) { return n == 0 ? -1 : sizeof(n) * __CHAR_BIT__ - 1 - __builtin_clzll( n ); }
|
---|
[7cfef0d] | 108 | float log2( float x ) { return log2f( x ); }
|
---|
| 109 | // extern "C" { double log2( double ); }
|
---|
| 110 | long double log2( long double x ) { return log2l( x ); }
|
---|
| 111 | // float _Complex log2( float _Complex x ) { return clog2f( x ); }
|
---|
| 112 | // double _Complex log2( double _Complex x ) { return clog2( x ); }
|
---|
| 113 | // long double _Complex log2( long double _Complex x ) { return clog2l( x ); }
|
---|
| 114 |
|
---|
| 115 | float log10( float x ) { return log10f( x ); }
|
---|
| 116 | // extern "C" { double log10( double ); }
|
---|
| 117 | long double log10( long double x ) { return log10l( x ); }
|
---|
| 118 | // float _Complex log10( float _Complex x ) { return clog10f( x ); }
|
---|
| 119 | // double _Complex log10( double _Complex x ) { return clog10( x ); }
|
---|
| 120 | // long double _Complex log10( long double _Complex x ) { return clog10l( x ); }
|
---|
| 121 |
|
---|
| 122 | float log1p( float x ) { return log1pf( x ); }
|
---|
| 123 | // extern "C" { double log1p( double ); }
|
---|
| 124 | long double log1p( long double x ) { return log1pl( x ); }
|
---|
| 125 |
|
---|
| 126 | int ilogb( float x ) { return ilogbf( x ); }
|
---|
| 127 | // extern "C" { int ilogb( double ); }
|
---|
| 128 | int ilogb( long double x ) { return ilogbl( x ); }
|
---|
| 129 |
|
---|
| 130 | float logb( float x ) { return logbf( x ); }
|
---|
| 131 | // extern "C" { double logb( double ); }
|
---|
| 132 | long double logb( long double x ) { return logbl( x ); }
|
---|
| 133 |
|
---|
| 134 | float sqrt( float x ) { return sqrtf( x ); }
|
---|
| 135 | // extern "C" { double sqrt( double ); }
|
---|
| 136 | long double sqrt( long double x ) { return sqrtl( x ); }
|
---|
| 137 | float _Complex sqrt( float _Complex x ) { return csqrtf( x ); }
|
---|
| 138 | double _Complex sqrt( double _Complex x ) { return csqrt( x ); }
|
---|
| 139 | long double _Complex sqrt( long double _Complex x ) { return csqrtl( x ); }
|
---|
| 140 |
|
---|
| 141 | float cbrt( float x ) { return cbrtf( x ); }
|
---|
| 142 | // extern "C" { double cbrt( double ); }
|
---|
| 143 | long double cbrt( long double x ) { return cbrtl( x ); }
|
---|
| 144 |
|
---|
| 145 | float hypot( float x, float y ) { return hypotf( x, y ); }
|
---|
| 146 | // extern "C" { double hypot( double, double ); }
|
---|
| 147 | long double hypot( long double x, long double y ) { return hypotl( x, y ); }
|
---|
| 148 | } // distribution
|
---|
[6e991d6] | 149 |
|
---|
[95bda0a] | 150 | static inline unsigned long long log2_u32_32( unsigned long long val ) {
|
---|
| 151 | enum {
|
---|
| 152 | TABLE_BITS = 6,
|
---|
| 153 | TABLE_SIZE = (1 << TABLE_BITS) + 2,
|
---|
| 154 | };
|
---|
| 155 | // for(i; TABLE_SIZE) {
|
---|
| 156 | // table[i] = (unsigned long long)(log2(1.0 + i / pow(2, TABLE_BITS)) * pow(2, 32)));
|
---|
| 157 | // }
|
---|
| 158 | static const unsigned long long table[] = {
|
---|
| 159 | 0x0000000000, 0x0005b9e5a1, 0x000b5d69ba, 0x0010eb389f,
|
---|
| 160 | 0x001663f6fa, 0x001bc84240, 0x002118b119, 0x002655d3c4,
|
---|
| 161 | 0x002b803473, 0x00309857a0, 0x00359ebc5b, 0x003a93dc98,
|
---|
| 162 | 0x003f782d72, 0x00444c1f6b, 0x0049101eac, 0x004dc4933a,
|
---|
| 163 | 0x005269e12f, 0x00570068e7, 0x005b888736, 0x006002958c,
|
---|
| 164 | 0x00646eea24, 0x0068cdd829, 0x006d1fafdc, 0x007164beb4,
|
---|
| 165 | 0x00759d4f80, 0x0079c9aa87, 0x007dea15a3, 0x0081fed45c,
|
---|
| 166 | 0x0086082806, 0x008a064fd5, 0x008df988f4, 0x0091e20ea1,
|
---|
| 167 | 0x0095c01a39, 0x009993e355, 0x009d5d9fd5, 0x00a11d83f4,
|
---|
| 168 | 0x00a4d3c25e, 0x00a8808c38, 0x00ac241134, 0x00afbe7fa0,
|
---|
| 169 | 0x00b3500472, 0x00b6d8cb53, 0x00ba58feb2, 0x00bdd0c7c9,
|
---|
| 170 | 0x00c1404ead, 0x00c4a7ba58, 0x00c80730b0, 0x00cb5ed695,
|
---|
| 171 | 0x00ceaecfea, 0x00d1f73f9c, 0x00d53847ac, 0x00d8720935,
|
---|
| 172 | 0x00dba4a47a, 0x00ded038e6, 0x00e1f4e517, 0x00e512c6e5,
|
---|
| 173 | 0x00e829fb69, 0x00eb3a9f01, 0x00ee44cd59, 0x00f148a170,
|
---|
| 174 | 0x00f446359b, 0x00f73da38d, 0x00fa2f045e, 0x00fd1a708b,
|
---|
| 175 | 0x0100000000, 0x0102dfca16,
|
---|
| 176 | };
|
---|
| 177 | _Static_assert((sizeof(table) / sizeof(table[0])) == TABLE_SIZE, "TABLE_SIZE should be accurate");
|
---|
| 178 | // starting from val = (2 ** i)*(1 + f) where 0 <= f < 1
|
---|
| 179 | // log identities mean log2(val) = log2((2 ** i)*(1 + f)) = log2(2**i) + log2(1+f)
|
---|
| 180 | //
|
---|
| 181 | // getting i is easy to do using builtin_clz (count leading zero)
|
---|
| 182 | //
|
---|
| 183 | // we want to calculate log2(1+f) independently to have a many bits of precision as possible.
|
---|
| 184 | // val = (2 ** i)*(1 + f) = 2 ** i + f * 2 ** i
|
---|
| 185 | // isolating f we get
|
---|
| 186 | // val - 2 ** i = f * 2 ** i
|
---|
| 187 | // (val - 2 ** i) / 2 ** i = f
|
---|
| 188 | //
|
---|
| 189 | // we want to interpolate from the table to get the values
|
---|
| 190 | // and compromise by doing quadratic interpolation (rather than higher degree interpolation)
|
---|
| 191 | //
|
---|
| 192 | // for the interpolation we want to shift everything the fist sample point
|
---|
| 193 | // so our parabola becomes x = 0
|
---|
| 194 | // this further simplifies the equations
|
---|
| 195 | //
|
---|
| 196 | // the consequence is that we need f in 2 forms:
|
---|
| 197 | // - finding the index of x0
|
---|
| 198 | // - finding the distance between f and x0
|
---|
| 199 | //
|
---|
| 200 | // since sample points are equidistant we can significantly simplify the equations
|
---|
| 201 |
|
---|
| 202 | // get i
|
---|
| 203 | const unsigned long long bits = sizeof(val) * __CHAR_BIT__;
|
---|
| 204 | const unsigned long long lz = __builtin_clzl(val);
|
---|
| 205 | const unsigned long long i = bits - 1 - lz;
|
---|
| 206 |
|
---|
| 207 | // get the fractinal part as a u32.32
|
---|
| 208 | const unsigned long long frac = (val << (lz + 1)) >> 32;
|
---|
| 209 |
|
---|
| 210 | // get high order bits for the index into the table
|
---|
| 211 | const unsigned long long idx0 = frac >> (32 - TABLE_BITS);
|
---|
| 212 |
|
---|
| 213 | // get the x offset, i.e., the difference between the first sample point and the actual fractional part
|
---|
| 214 | const long long udx = frac - (idx0 << (32 - TABLE_BITS));
|
---|
| 215 | /* paranoid */ verify((idx0 + 2) < TABLE_SIZE);
|
---|
| 216 |
|
---|
| 217 | const long long y0 = table[idx0 + 0];
|
---|
| 218 | const long long y1 = table[idx0 + 1];
|
---|
| 219 | const long long y2 = table[idx0 + 2];
|
---|
| 220 |
|
---|
| 221 | // from there we can quadraticly interpolate to get the data, using the lagrange polynomial
|
---|
| 222 | // normally it would look like:
|
---|
| 223 | // double r0 = y0 * ((x - x1) / (x0 - x1)) * ((x - x2) / (x0 - x2));
|
---|
| 224 | // double r1 = y1 * ((x - x0) / (x1 - x0)) * ((x - x2) / (x1 - x2));
|
---|
| 225 | // double r2 = y2 * ((x - x0) / (x2 - x0)) * ((x - x1) / (x2 - x1));
|
---|
| 226 | // but since the spacing between sample points is fixed, we can simplify it and extract common expressions
|
---|
| 227 | const long long f1 = (y1 - y0);
|
---|
| 228 | const long long f2 = (y2 - y0);
|
---|
| 229 | const long long a = f2 - (f1 * 2l);
|
---|
| 230 | const long long b = (f1 * 2l) - a;
|
---|
| 231 |
|
---|
| 232 | // Now we can compute it in the form (ax + b)x + c (which avoid repeating steps)
|
---|
| 233 | long long sum = ((a*udx) >> (32 - TABLE_BITS)) + b;
|
---|
| 234 | sum = (sum*udx) >> (32 - TABLE_BITS + 1);
|
---|
| 235 | sum = y0 + sum;
|
---|
| 236 |
|
---|
| 237 | return (i << 32) + (sum);
|
---|
| 238 | }
|
---|
| 239 |
|
---|
[dc5376a] | 240 | //---------------------- Trigonometric ----------------------
|
---|
[6e991d6] | 241 |
|
---|
[95bda0a] | 242 | static inline __attribute__((always_inline)) {
|
---|
[7cfef0d] | 243 | float sin( float x ) { return sinf( x ); }
|
---|
| 244 | // extern "C" { double sin( double ); }
|
---|
| 245 | long double sin( long double x ) { return sinl( x ); }
|
---|
| 246 | float _Complex sin( float _Complex x ) { return csinf( x ); }
|
---|
| 247 | double _Complex sin( double _Complex x ) { return csin( x ); }
|
---|
| 248 | long double _Complex sin( long double _Complex x ) { return csinl( x ); }
|
---|
| 249 |
|
---|
| 250 | float cos( float x ) { return cosf( x ); }
|
---|
| 251 | // extern "C" { double cos( double ); }
|
---|
| 252 | long double cos( long double x ) { return cosl( x ); }
|
---|
| 253 | float _Complex cos( float _Complex x ) { return ccosf( x ); }
|
---|
| 254 | double _Complex cos( double _Complex x ) { return ccos( x ); }
|
---|
| 255 | long double _Complex cos( long double _Complex x ) { return ccosl( x ); }
|
---|
| 256 |
|
---|
| 257 | float tan( float x ) { return tanf( x ); }
|
---|
| 258 | // extern "C" { double tan( double ); }
|
---|
| 259 | long double tan( long double x ) { return tanl( x ); }
|
---|
| 260 | float _Complex tan( float _Complex x ) { return ctanf( x ); }
|
---|
| 261 | double _Complex tan( double _Complex x ) { return ctan( x ); }
|
---|
| 262 | long double _Complex tan( long double _Complex x ) { return ctanl( x ); }
|
---|
| 263 |
|
---|
| 264 | float asin( float x ) { return asinf( x ); }
|
---|
| 265 | // extern "C" { double asin( double ); }
|
---|
| 266 | long double asin( long double x ) { return asinl( x ); }
|
---|
| 267 | float _Complex asin( float _Complex x ) { return casinf( x ); }
|
---|
| 268 | double _Complex asin( double _Complex x ) { return casin( x ); }
|
---|
| 269 | long double _Complex asin( long double _Complex x ) { return casinl( x ); }
|
---|
| 270 |
|
---|
| 271 | float acos( float x ) { return acosf( x ); }
|
---|
| 272 | // extern "C" { double acos( double ); }
|
---|
| 273 | long double acos( long double x ) { return acosl( x ); }
|
---|
| 274 | float _Complex acos( float _Complex x ) { return cacosf( x ); }
|
---|
| 275 | double _Complex acos( double _Complex x ) { return cacos( x ); }
|
---|
| 276 | long double _Complex acos( long double _Complex x ) { return cacosl( x ); }
|
---|
| 277 |
|
---|
| 278 | float atan( float x ) { return atanf( x ); }
|
---|
| 279 | // extern "C" { double atan( double ); }
|
---|
| 280 | long double atan( long double x ) { return atanl( x ); }
|
---|
| 281 | float _Complex atan( float _Complex x ) { return catanf( x ); }
|
---|
| 282 | double _Complex atan( double _Complex x ) { return catan( x ); }
|
---|
| 283 | long double _Complex atan( long double _Complex x ) { return catanl( x ); }
|
---|
| 284 |
|
---|
| 285 | float atan2( float x, float y ) { return atan2f( x, y ); }
|
---|
| 286 | // extern "C" { double atan2( double, double ); }
|
---|
| 287 | long double atan2( long double x, long double y ) { return atan2l( x, y ); }
|
---|
| 288 |
|
---|
| 289 | // alternative name for atan2
|
---|
| 290 | float atan( float x, float y ) { return atan2f( x, y ); }
|
---|
| 291 | double atan( double x, double y ) { return atan2( x, y ); }
|
---|
| 292 | long double atan( long double x, long double y ) { return atan2l( x, y ); }
|
---|
| 293 | } // distribution
|
---|
[6e991d6] | 294 |
|
---|
[dc5376a] | 295 | //---------------------- Hyperbolic ----------------------
|
---|
[6e991d6] | 296 |
|
---|
[95bda0a] | 297 | static inline __attribute__((always_inline)) {
|
---|
[7cfef0d] | 298 | float sinh( float x ) { return sinhf( x ); }
|
---|
| 299 | // extern "C" { double sinh( double ); }
|
---|
| 300 | long double sinh( long double x ) { return sinhl( x ); }
|
---|
| 301 | float _Complex sinh( float _Complex x ) { return csinhf( x ); }
|
---|
| 302 | double _Complex sinh( double _Complex x ) { return csinh( x ); }
|
---|
| 303 | long double _Complex sinh( long double _Complex x ) { return csinhl( x ); }
|
---|
| 304 |
|
---|
| 305 | float cosh( float x ) { return coshf( x ); }
|
---|
| 306 | // extern "C" { double cosh( double ); }
|
---|
| 307 | long double cosh( long double x ) { return coshl( x ); }
|
---|
| 308 | float _Complex cosh( float _Complex x ) { return ccoshf( x ); }
|
---|
| 309 | double _Complex cosh( double _Complex x ) { return ccosh( x ); }
|
---|
| 310 | long double _Complex cosh( long double _Complex x ) { return ccoshl( x ); }
|
---|
| 311 |
|
---|
| 312 | float tanh( float x ) { return tanhf( x ); }
|
---|
| 313 | // extern "C" { double tanh( double ); }
|
---|
| 314 | long double tanh( long double x ) { return tanhl( x ); }
|
---|
| 315 | float _Complex tanh( float _Complex x ) { return ctanhf( x ); }
|
---|
| 316 | double _Complex tanh( double _Complex x ) { return ctanh( x ); }
|
---|
| 317 | long double _Complex tanh( long double _Complex x ) { return ctanhl( x ); }
|
---|
| 318 |
|
---|
| 319 | float asinh( float x ) { return asinhf( x ); }
|
---|
| 320 | // extern "C" { double asinh( double ); }
|
---|
| 321 | long double asinh( long double x ) { return asinhl( x ); }
|
---|
| 322 | float _Complex asinh( float _Complex x ) { return casinhf( x ); }
|
---|
| 323 | double _Complex asinh( double _Complex x ) { return casinh( x ); }
|
---|
| 324 | long double _Complex asinh( long double _Complex x ) { return casinhl( x ); }
|
---|
| 325 |
|
---|
| 326 | float acosh( float x ) { return acoshf( x ); }
|
---|
| 327 | // extern "C" { double acosh( double ); }
|
---|
| 328 | long double acosh( long double x ) { return acoshl( x ); }
|
---|
| 329 | float _Complex acosh( float _Complex x ) { return cacoshf( x ); }
|
---|
| 330 | double _Complex acosh( double _Complex x ) { return cacosh( x ); }
|
---|
| 331 | long double _Complex acosh( long double _Complex x ) { return cacoshl( x ); }
|
---|
| 332 |
|
---|
| 333 | float atanh( float x ) { return atanhf( x ); }
|
---|
| 334 | // extern "C" { double atanh( double ); }
|
---|
| 335 | long double atanh( long double x ) { return atanhl( x ); }
|
---|
| 336 | float _Complex atanh( float _Complex x ) { return catanhf( x ); }
|
---|
| 337 | double _Complex atanh( double _Complex x ) { return catanh( x ); }
|
---|
| 338 | long double _Complex atanh( long double _Complex x ) { return catanhl( x ); }
|
---|
| 339 | } // distribution
|
---|
[dc5376a] | 340 |
|
---|
| 341 | //---------------------- Error / Gamma ----------------------
|
---|
| 342 |
|
---|
[95bda0a] | 343 | static inline __attribute__((always_inline)) {
|
---|
[7cfef0d] | 344 | float erf( float x ) { return erff( x ); }
|
---|
| 345 | // extern "C" { double erf( double ); }
|
---|
| 346 | long double erf( long double x ) { return erfl( x ); }
|
---|
| 347 | // float _Complex erf( float _Complex );
|
---|
| 348 | // double _Complex erf( double _Complex );
|
---|
| 349 | // long double _Complex erf( long double _Complex );
|
---|
| 350 |
|
---|
| 351 | float erfc( float x ) { return erfcf( x ); }
|
---|
| 352 | // extern "C" { double erfc( double ); }
|
---|
| 353 | long double erfc( long double x ) { return erfcl( x ); }
|
---|
| 354 | // float _Complex erfc( float _Complex );
|
---|
| 355 | // double _Complex erfc( double _Complex );
|
---|
| 356 | // long double _Complex erfc( long double _Complex );
|
---|
| 357 |
|
---|
| 358 | float lgamma( float x ) { return lgammaf( x ); }
|
---|
| 359 | // extern "C" { double lgamma( double ); }
|
---|
| 360 | long double lgamma( long double x ) { return lgammal( x ); }
|
---|
| 361 | float lgamma( float x, int * sign ) { return lgammaf_r( x, sign ); }
|
---|
| 362 | double lgamma( double x, int * sign ) { return lgamma_r( x, sign ); }
|
---|
| 363 | long double lgamma( long double x, int * sign ) { return lgammal_r( x, sign ); }
|
---|
| 364 |
|
---|
| 365 | float tgamma( float x ) { return tgammaf( x ); }
|
---|
| 366 | // extern "C" { double tgamma( double ); }
|
---|
| 367 | long double tgamma( long double x ) { return tgammal( x ); }
|
---|
| 368 | } // distribution
|
---|
[6e991d6] | 369 |
|
---|
[dc5376a] | 370 | //---------------------- Nearest Integer ----------------------
|
---|
| 371 |
|
---|
[95bda0a] | 372 | inline __attribute__((always_inline)) static {
|
---|
[7cfef0d] | 373 | signed char floor( signed char n, signed char align ) { return n / align * align; }
|
---|
| 374 | unsigned char floor( unsigned char n, unsigned char align ) { return n / align * align; }
|
---|
| 375 | short int floor( short int n, short int align ) { return n / align * align; }
|
---|
| 376 | unsigned short int floor( unsigned short int n, unsigned short int align ) { return n / align * align; }
|
---|
| 377 | int floor( int n, int align ) { return n / align * align; }
|
---|
| 378 | unsigned int floor( unsigned int n, unsigned int align ) { return n / align * align; }
|
---|
| 379 | long int floor( long int n, long int align ) { return n / align * align; }
|
---|
| 380 | unsigned long int floor( unsigned long int n, unsigned long int align ) { return n / align * align; }
|
---|
| 381 | long long int floor( long long int n, long long int align ) { return n / align * align; }
|
---|
| 382 | unsigned long long int floor( unsigned long long int n, unsigned long long int align ) { return n / align * align; }
|
---|
| 383 |
|
---|
[fd54fef] | 384 | // forall( T | { T ?/?( T, T ); T ?*?( T, T ); } )
|
---|
[7cfef0d] | 385 | // T floor( T n, T align ) { return n / align * align; }
|
---|
| 386 |
|
---|
| 387 | signed char ceiling_div( signed char n, char align ) { return (n + (align - 1)) / align; }
|
---|
| 388 | unsigned char ceiling_div( unsigned char n, unsigned char align ) { return (n + (align - 1)) / align; }
|
---|
| 389 | short int ceiling_div( short int n, short int align ) { return (n + (align - 1)) / align; }
|
---|
| 390 | unsigned short int ceiling_div( unsigned short int n, unsigned short int align ) { return (n + (align - 1)) / align; }
|
---|
| 391 | int ceiling_div( int n, int align ) { return (n + (align - 1)) / align; }
|
---|
| 392 | unsigned int ceiling_div( unsigned int n, unsigned int align ) { return (n + (align - 1)) / align; }
|
---|
| 393 | long int ceiling_div( long int n, long int align ) { return (n + (align - 1)) / align; }
|
---|
| 394 | unsigned long int ceiling_div( unsigned long int n, unsigned long int align ) { return (n + (align - 1)) / align; }
|
---|
| 395 | long long int ceiling_div( long long int n, long long int align ) { return (n + (align - 1)) / align; }
|
---|
| 396 | unsigned long long int ceiling_div( unsigned long long int n, unsigned long long int align ) { return (n + (align - 1)) / align; }
|
---|
| 397 |
|
---|
[fd54fef] | 398 | // forall( T | { T ?+?( T, T ); T ?-?( T, T ); T ?%?( T, T ); } )
|
---|
[7cfef0d] | 399 | // T ceiling_div( T n, T align ) { verify( is_pow2( align ) );return (n + (align - 1)) / align; }
|
---|
[0deeaad] | 400 |
|
---|
[7cfef0d] | 401 | // gcc notices the div/mod pair and saves both so only one div.
|
---|
| 402 | signed char ceiling( signed char n, signed char align ) { return floor( n + (n % align != 0 ? align - 1 : 0), align ); }
|
---|
| 403 | unsigned char ceiling( unsigned char n, unsigned char align ) { return floor( n + (n % align != 0 ? align - 1 : 0), align ); }
|
---|
| 404 | short int ceiling( short int n, short int align ) { return floor( n + (n % align != 0 ? align - 1 : 0), align ); }
|
---|
| 405 | unsigned short int ceiling( unsigned short int n, unsigned short int align ) { return floor( n + (n % align != 0 ? align - 1 : 0), align ); }
|
---|
| 406 | int ceiling( int n, int align ) { return floor( n + (n % align != 0 ? align - 1 : 0), align ); }
|
---|
| 407 | unsigned int ceiling( unsigned int n, unsigned int align ) { return floor( n + (n % align != 0 ? align - 1 : 0), align ); }
|
---|
| 408 | long int ceiling( long int n, long int align ) { return floor( n + (n % align != 0 ? align - 1 : 0), align ); }
|
---|
| 409 | unsigned long int ceiling( unsigned long int n, unsigned long int align ) { return floor( n + (n % align != 0 ? align - 1 : 0) , align); }
|
---|
| 410 | long long int ceiling( long long int n, long long int align ) { return floor( n + (n % align != 0 ? align - 1 : 0), align ); }
|
---|
| 411 | unsigned long long int ceiling( unsigned long long int n, unsigned long long int align ) { return floor( n + (n % align != 0 ? align - 1 : 0), align ); }
|
---|
| 412 |
|
---|
[fd54fef] | 413 | // forall( T | { void ?{}( T &, one_t ); T ?+?( T, T ); T ?-?( T, T ); T ?/?( T, T ); } )
|
---|
[7cfef0d] | 414 | // T ceiling( T n, T align ) { return return floor( n + (n % align != 0 ? align - 1 : 0), align ); *}
|
---|
| 415 |
|
---|
| 416 | float floor( float x ) { return floorf( x ); }
|
---|
| 417 | // extern "C" { double floor( double ); }
|
---|
| 418 | long double floor( long double x ) { return floorl( x ); }
|
---|
| 419 |
|
---|
| 420 | float ceil( float x ) { return ceilf( x ); }
|
---|
| 421 | // extern "C" { double ceil( double ); }
|
---|
| 422 | long double ceil( long double x ) { return ceill( x ); }
|
---|
| 423 |
|
---|
| 424 | float trunc( float x ) { return truncf( x ); }
|
---|
| 425 | // extern "C" { double trunc( double ); }
|
---|
| 426 | long double trunc( long double x ) { return truncl( x ); }
|
---|
| 427 |
|
---|
| 428 | float rint( float x ) { return rintf( x ); }
|
---|
| 429 | // extern "C" { double rint( double x ); }
|
---|
| 430 | long double rint( long double x ) { return rintl( x ); }
|
---|
| 431 | long int rint( float x ) { return lrintf( x ); }
|
---|
| 432 | long int rint( double x ) { return lrint( x ); }
|
---|
| 433 | long int rint( long double x ) { return lrintl( x ); }
|
---|
| 434 | long long int rint( float x ) { return llrintf( x ); }
|
---|
| 435 | long long int rint( double x ) { return llrint( x ); }
|
---|
| 436 | long long int rint( long double x ) { return llrintl( x ); }
|
---|
| 437 |
|
---|
| 438 | long int lrint( float x ) { return lrintf( x ); }
|
---|
| 439 | // extern "C" { long int lrint( double ); }
|
---|
| 440 | long int lrint( long double x ) { return lrintl( x ); }
|
---|
| 441 | long long int llrint( float x ) { return llrintf( x ); }
|
---|
| 442 | // extern "C" { long long int llrint( double ); }
|
---|
| 443 | long long int llrint( long double x ) { return llrintl( x ); }
|
---|
| 444 |
|
---|
| 445 | float nearbyint( float x ) { return nearbyintf( x ); }
|
---|
| 446 | // extern "C" { double nearbyint( double ); }
|
---|
| 447 | long double nearbyint( long double x ) { return nearbyintl( x ); }
|
---|
| 448 |
|
---|
| 449 | float round( float x ) { return roundf( x ); }
|
---|
| 450 | // extern "C" { double round( double x ); }
|
---|
| 451 | long double round( long double x ) { return roundl( x ); }
|
---|
| 452 | long int round( float x ) { return lroundf( x ); }
|
---|
| 453 | long int round( double x ) { return lround( x ); }
|
---|
| 454 | long int round( long double x ) { return lroundl( x ); }
|
---|
| 455 | long long int round( float x ) { return llroundf( x ); }
|
---|
| 456 | long long int round( double x ) { return llround( x ); }
|
---|
| 457 | long long int round( long double x ) { return llroundl( x ); }
|
---|
| 458 |
|
---|
| 459 | long int lround( float x ) { return lroundf( x ); }
|
---|
| 460 | // extern "C" { long int lround( double ); }
|
---|
| 461 | long int lround( long double x ) { return lroundl( x ); }
|
---|
| 462 | long long int llround( float x ) { return llroundf( x ); }
|
---|
| 463 | // extern "C" { long long int llround( double ); }
|
---|
| 464 | long long int llround( long double x ) { return llroundl( x ); }
|
---|
| 465 | } // distribution
|
---|
[6e991d6] | 466 |
|
---|
[dc5376a] | 467 | //---------------------- Manipulation ----------------------
|
---|
[6e991d6] | 468 |
|
---|
[95bda0a] | 469 | static inline __attribute__((always_inline)) {
|
---|
[7cfef0d] | 470 | float copysign( float x, float y ) { return copysignf( x, y ); }
|
---|
| 471 | // extern "C" { double copysign( double, double ); }
|
---|
| 472 | long double copysign( long double x, long double y ) { return copysignl( x, y ); }
|
---|
| 473 |
|
---|
| 474 | float frexp( float x, int * ip ) { return frexpf( x, ip ); }
|
---|
| 475 | // extern "C" { double frexp( double, int * ); }
|
---|
| 476 | long double frexp( long double x, int * ip ) { return frexpl( x, ip ); }
|
---|
| 477 |
|
---|
| 478 | float ldexp( float x, int exp2 ) { return ldexpf( x, exp2 ); }
|
---|
| 479 | // extern "C" { double ldexp( double, int ); }
|
---|
| 480 | long double ldexp( long double x, int exp2 ) { return ldexpl( x, exp2 ); }
|
---|
| 481 |
|
---|
| 482 | [ float, float ] modf( float x ) { float i; x = modff( x, &i ); return [ i, x ]; }
|
---|
| 483 | float modf( float x, float * i ) { return modff( x, i ); }
|
---|
| 484 | [ double, double ] modf( double x ) { double i; x = modf( x, &i ); return [ i, x ]; }
|
---|
| 485 | // extern "C" { double modf( double, double * ); }
|
---|
| 486 | [ long double, long double ] modf( long double x ) { long double i; x = modfl( x, &i ); return [ i, x ]; }
|
---|
| 487 | long double modf( long double x, long double * i ) { return modfl( x, i ); }
|
---|
| 488 |
|
---|
| 489 | float nextafter( float x, float y ) { return nextafterf( x, y ); }
|
---|
| 490 | // extern "C" { double nextafter( double, double ); }
|
---|
| 491 | long double nextafter( long double x, long double y ) { return nextafterl( x, y ); }
|
---|
| 492 |
|
---|
| 493 | float nexttoward( float x, long double y ) { return nexttowardf( x, y ); }
|
---|
| 494 | // extern "C" { double nexttoward( double, long double ); }
|
---|
| 495 | long double nexttoward( long double x, long double y ) { return nexttowardl( x, y ); }
|
---|
| 496 |
|
---|
| 497 | float scalbn( float x, int exp ) { return scalbnf( x, exp ); }
|
---|
| 498 | // extern "C" { double scalbn( double, int ); }
|
---|
| 499 | long double scalbn( long double x, int exp ) { return scalbnl( x, exp ); }
|
---|
| 500 | float scalbn( float x, long int exp ) { return scalblnf( x, exp ); }
|
---|
| 501 | double scalbn( double x, long int exp ) { return scalbln( x, exp ); }
|
---|
| 502 | long double scalbn( long double x, long int exp ) { return scalblnl( x, exp ); }
|
---|
| 503 |
|
---|
| 504 | float scalbln( float x, long int exp ) { return scalblnf( x, exp ); }
|
---|
| 505 | // extern "C" { double scalbln( double, long int ); }
|
---|
| 506 | long double scalbln( long double x, long int exp ) { return scalblnl( x, exp ); }
|
---|
| 507 | } // distribution
|
---|
[0fc52b6] | 508 |
|
---|
[6b8b767] | 509 | //---------------------------------------
|
---|
| 510 |
|
---|
[95bda0a] | 511 | static inline __attribute__((always_inline)) {
|
---|
[fd54fef] | 512 | forall( T | { void ?{}( T &, one_t ); T ?+?( T, T ); T ?-?( T, T );T ?*?( T, T ); } )
|
---|
[7cfef0d] | 513 | T lerp( T x, T y, T a ) { return x * ((T){1} - a) + y * a; }
|
---|
[6b8b767] | 514 |
|
---|
[fd54fef] | 515 | forall( T | { void ?{}( T &, zero_t ); void ?{}( T &, one_t ); int ?<?( T, T ); } )
|
---|
[7cfef0d] | 516 | T step( T edge, T x ) { return x < edge ? (T){0} : (T){1}; }
|
---|
[6b8b767] | 517 |
|
---|
[fd54fef] | 518 | forall( T | { void ?{}( T &, int ); T clamp( T, T, T ); T ?-?( T, T ); T ?*?( T, T ); T ?/?( T, T ); } )
|
---|
[7cfef0d] | 519 | T smoothstep( T edge0, T edge1, T x ) { T t = clamp( (x - edge0) / (edge1 - edge0), (T){0}, (T){1} ); return t * t * ((T){3} - (T){2} * t); }
|
---|
| 520 | } // distribution
|
---|
[6b8b767] | 521 |
|
---|
[6e991d6] | 522 | // Local Variables: //
|
---|
| 523 | // mode: c //
|
---|
| 524 | // tab-width: 4 //
|
---|
| 525 | // End: //
|
---|