Added `__launch_bounds__(1024, 1)` to kOptimizerStatic8bit1State to fix the launch resource error for Lion.

This commit is contained in:
Tim Dettmers 2023-04-11 08:37:02 -07:00
parent ed6f3eb146
commit 0b2ebcdab9

View File

@@ -1260,6 +1260,7 @@ kPreconditionOptimizerStatic8bit1State(T* p, T* __restrict__ const g, unsigned c
template<typename T, int OPTIMIZER> template<typename T, int OPTIMIZER>
__global__ void __global__ void
__launch_bounds__(1024, 1)
kOptimizerStatic8bit1State(T* p, T* const g, unsigned char* state1, kOptimizerStatic8bit1State(T* p, T* const g, unsigned char* state1,
const float *unorm, const float max_unorm, const float param_norm, const float *unorm, const float max_unorm, const float param_norm,
const float beta1, const float beta2, const float beta1, const float beta2,