add a sign function, for lion
This commit is contained in:
parent
8de29fc364
commit
64bb1ae8d1
|
@ -217,6 +217,14 @@ __device__ __forceinline__ unsigned char quantize_quadrant(int QUADRANT, float *
|
|||
}
|
||||
}
|
||||
|
||||
// Sign helper, used for lion.
// Approach taken from https://stackoverflow.com/a/4609795; it is unclear
// whether CUDA offers a more canonical way to do this.
//
// Returns +1 when `val` compares greater than T(0), -1 when it compares less
// than T(0), and 0 when neither comparison holds (e.g. val == T(0)).
// T must be constructible from 0 and support operator< against itself.
template <typename T>
__device__ int sgn(T val)
{
    const T zero = T(0);

    // Each comparison yields a bool that converts to 0 or 1, so the
    // difference is a branch-free value in {-1, 0, +1}.
    const int above_zero = (zero < val);
    const int below_zero = (val < zero);

    return above_zero - below_zero;
}
|
||||
|
||||
__global__ void kHistogramScatterAdd2D(float* histogram, int *index1, int *index2, float *src, const int maxidx1, const int n)
|
||||
{
|
||||
const int tid = threadIdx.x + (blockDim.x*blockIdx.x);
|
||||
|
|
Loading…
Reference in New Issue
Block a user