forked from mrq/bitsandbytes-rocm
Reduce diff
This commit is contained in:
parent
575aa698fa
commit
025824d29b
|
@ -41,6 +41,14 @@ void quantize(float *code, float *A, unsigned char *out, int n)
|
|||
CUDA_CHECK_RETURN(cudaPeekAtLastError());
|
||||
}
|
||||
|
||||
void dequantize(float *code, unsigned char *A, float *out, int n)
|
||||
{
|
||||
int blocks = n/1024;
|
||||
blocks = n % 1024 == 0 ? blocks : blocks + 1;
|
||||
kDequantize<<<blocks, 1024>>>(code, A, out, n);
|
||||
CUDA_CHECK_RETURN(cudaPeekAtLastError());
|
||||
}
|
||||
|
||||
template <typename T, int STOCHASTIC> void quantizeBlockwise(float * code, T *A, float *absmax, unsigned char *out, float *rand, int rand_offset, const int n)
|
||||
{
|
||||
int blocks = n/4096;
|
||||
|
|
Loading…
Reference in New Issue
Block a user