mirror of
https://github.com/intel/compute-runtime.git
synced 2026-01-03 14:55:24 +08:00
Initial commit
Change-Id: I4bf1707bd3dfeadf2c17b0a7daff372b1925ebbd
This commit is contained in:
157
runtime/helpers/basic_math.h
Normal file
157
runtime/helpers/basic_math.h
Normal file
@@ -0,0 +1,157 @@
|
||||
/*
|
||||
* Copyright (c) 2017, Intel Corporation
|
||||
*
|
||||
* Permission is hereby granted, free of charge, to any person obtaining a
|
||||
* copy of this software and associated documentation files (the "Software"),
|
||||
* to deal in the Software without restriction, including without limitation
|
||||
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
||||
* and/or sell copies of the Software, and to permit persons to whom the
|
||||
* Software is furnished to do so, subject to the following conditions:
|
||||
*
|
||||
* The above copyright notice and this permission notice shall be included
|
||||
* in all copies or substantial portions of the Software.
|
||||
*
|
||||
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
|
||||
* OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
||||
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
||||
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
|
||||
* OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
|
||||
* ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
|
||||
* OTHER DEALINGS IN THE SOFTWARE.
|
||||
*/
|
||||
|
||||
#pragma once
|
||||
#include "runtime/helpers/debug_helpers.h"
|
||||
#include <cstdint>
|
||||
#include <cmath>
|
||||
#include <stdio.h>
|
||||
|
||||
#define KB 1024uLL
|
||||
#define MB (KB * KB)
|
||||
#define GB (KB * MB)
|
||||
|
||||
namespace OCLRT {
|
||||
namespace Math {
|
||||
|
||||
inline uint32_t nextPowerOfTwo(uint32_t value) {
|
||||
--value;
|
||||
value |= value >> 1;
|
||||
value |= value >> 2;
|
||||
value |= value >> 4;
|
||||
value |= value >> 8;
|
||||
value |= value >> 16;
|
||||
++value;
|
||||
return value;
|
||||
}
|
||||
|
||||
inline uint32_t prevPowerOfTwo(uint32_t value) {
|
||||
value |= value >> 1;
|
||||
value |= value >> 2;
|
||||
value |= value >> 4;
|
||||
value |= value >> 8;
|
||||
value |= value >> 16;
|
||||
return (value - (value >> 1));
|
||||
}
|
||||
|
||||
inline uint32_t getMinLsbSet(uint32_t value) {
|
||||
static const int multiplyDeBruijnBitPosition[32] = {
|
||||
0, 1, 28, 2, 29, 14, 24, 3, 30, 22, 20, 15, 25, 17, 4, 8,
|
||||
31, 27, 13, 23, 21, 19, 16, 7, 26, 12, 18, 6, 11, 5, 10, 9};
|
||||
auto invert = -static_cast<int64_t>(value);
|
||||
value &= static_cast<uint32_t>(invert);
|
||||
return multiplyDeBruijnBitPosition[static_cast<uint32_t>(value * 0x077CB531U) >> 27];
|
||||
}
|
||||
|
||||
inline uint32_t log2(uint32_t value) {
|
||||
uint32_t exponent = 0u;
|
||||
uint32_t startVal = value;
|
||||
if (value == 0) {
|
||||
return 32;
|
||||
}
|
||||
startVal >>= 1;
|
||||
startVal &= 0x7fffffffu;
|
||||
while ((startVal & 0xffffffffu) && (exponent < 32)) {
|
||||
exponent = exponent + 1;
|
||||
startVal >>= 1;
|
||||
startVal &= 0x7fffffffu;
|
||||
}
|
||||
return exponent;
|
||||
}
|
||||
|
||||
inline uint64_t log2(uint64_t value) {
|
||||
uint64_t exponent = 0;
|
||||
uint64_t startVal = value;
|
||||
if (value == 0) {
|
||||
return 64;
|
||||
}
|
||||
startVal >>= 1;
|
||||
startVal &= 0x7fffffffffffffff;
|
||||
while ((startVal & 0xffffffffffffffff) && (exponent < 64)) {
|
||||
exponent = exponent + 1;
|
||||
startVal >>= 1;
|
||||
startVal &= 0x7fffffffffffffff;
|
||||
}
|
||||
return exponent;
|
||||
}
|
||||
|
||||
union FloatConversion {
|
||||
uint32_t u;
|
||||
float f;
|
||||
};
|
||||
|
||||
// clang-format off
|
||||
static const FloatConversion PosInfinity = {0x7f800000};
|
||||
static const FloatConversion NegInfinity = {0xff800000};
|
||||
static const FloatConversion Nan = {0x7fc00000};
|
||||
// clang-format on
|
||||
|
||||
inline uint16_t float2Half(float f) {
|
||||
FloatConversion u;
|
||||
u.f = f;
|
||||
|
||||
uint32_t fsign = (u.u >> 16) & 0x8000;
|
||||
float x = std::fabs(f);
|
||||
|
||||
//Nan
|
||||
if (x != x) {
|
||||
u.u >>= (24 - 11);
|
||||
u.u &= 0x7fff;
|
||||
u.u |= 0x0200; //silence the NaN
|
||||
return u.u | fsign;
|
||||
}
|
||||
|
||||
// overflow
|
||||
if (x >= std::ldexp(1.0f, 16)) {
|
||||
if (x == PosInfinity.f)
|
||||
return 0x7c00 | fsign;
|
||||
|
||||
return 0x7bff | fsign;
|
||||
}
|
||||
|
||||
// underflow
|
||||
if (x < std::ldexp(1.0f, -24))
|
||||
return fsign; // The halfway case can return 0x0001 or 0. 0 is even.
|
||||
|
||||
// half denormal
|
||||
if (x < std::ldexp(1.0f, -14)) {
|
||||
x *= std::ldexp(1.0f, 24);
|
||||
return (uint16_t)((int)x | fsign);
|
||||
}
|
||||
|
||||
u.u &= 0xFFFFE000U;
|
||||
u.u -= 0x38000000U;
|
||||
|
||||
return (u.u >> (24 - 11)) | fsign;
|
||||
}
|
||||
|
||||
inline bool isDivisableByPowerOfTwoDivisor(uint32_t number, uint32_t divisor) {
|
||||
DEBUG_BREAK_IF((divisor & (divisor - 1)) != 0);
|
||||
uint32_t mask = 0xffffffff;
|
||||
mask = mask - (divisor - 1);
|
||||
if ((number & mask) == number)
|
||||
return true;
|
||||
else
|
||||
return false;
|
||||
}
|
||||
} // namespace Math
|
||||
} // namespace OCLRT
|
||||
Reference in New Issue
Block a user