|
|
|
|
|
|
|
|
|
#undef NDEBUG |
|
#include <assert.h> |
|
#include <immintrin.h> |
|
#include <math.h> |
|
#include <stdint.h> |
|
|
|
#pragma GCC diagnostic push |
|
#pragma GCC diagnostic ignored "-Wdouble-promotion" |
|
|
|
|
|
inline static uint8_t round_orig(float v0) { return ((int8_t) (round(v0))) + 8; } |
|
|
|
|
|
inline static float silu_orig(float x) { |
|
return x/(1.0 + exp(-x)); |
|
} |
|
|
|
#pragma GCC diagnostic pop |
|
|
|
|
|
inline static uint8_t round_float(float v0) { return (int8_t)roundf(v0) + 8; } |
|
|
|
|
|
inline static float silu_float(float x) { |
|
return x/(1.0f + expf(-x)); |
|
} |
|
|
|
// Exhaustive consistency check between the double-promoting helpers
// (round_orig, silu_orig) and their float-only counterparts
// (round_float, silu_float).
//
// Part 1 walks every 32-bit pattern, so expect a long run time.
// Part 2 is only compiled when the compiler defines __F16C__.
//
// Any mismatch aborts through assert() (NDEBUG is undefined at the top of
// the file so the assertions are always active). Returns 0 when every
// check passed.
int main(void) {
    // Reinterpret the bit pattern through a union. Reading a uint32_t object
    // through a float lvalue (`*(float *)&x`) violates the effective-type
    // (strict aliasing) rules and is undefined behaviour; union punning is
    // well-defined in C.
    union {
        uint32_t bits;
        float    value;
    } pun;

    // Part 1: all 2^32 bit patterns, from UINT32_MAX down to 0.
    uint32_t x = UINT32_MAX;
    do {
        pun.bits = x;
        const float f = pun.value;

        // NaN and infinities are skipped; every finite float must round
        // to the same result in both variants.
        assert(!isfinite(f) || (round_orig(f) == round_float(f)));
    } while (x--);  // post-decrement: pattern 0 is still tested before exit

#ifdef __F16C__
    // Part 2: all 2^16 half-precision bit patterns, widened to float.
    // x is 32 bits wide, so `x <= UINT16_MAX` terminates at 0x10000.
    for (x = 0; x <= UINT16_MAX; x++) {
        const float f = _cvtsh_ss(x);

        const float so = silu_orig(f);
        const float sf = silu_float(f);

        // Accept the pair when both results convert to the same half value,
        // or when they are equal or adjacent single-precision values
        // (one nextafterf() step from one lands exactly on the other).
        assert(   (_cvtss_sh(so, 0) == _cvtss_sh(sf, 0))
               || (nextafterf(so, sf) == sf)
               || (nextafterf(sf, so) == so));
    }
#endif

    return 0;
}
|
|