forked from mrq/bitsandbytes-rocm
clearer assertions
This commit is contained in:
parent
e29c5f5c41
commit
fc4a135ed1
|
@@ -232,7 +232,7 @@ class MatMul8bitLt(torch.autograd.Function):
|
||||||
# Cast A to fp16
|
# Cast A to fp16
|
||||||
A_dtype = A.dtype
|
A_dtype = A.dtype
|
||||||
if A_dtype != torch.float16:
|
if A_dtype != torch.float16:
|
||||||
warnings.warn(f"MatMul8bitLt: temporarily casting input matrix from {A_dtype} to float16")
|
warnings.warn(f"MatMul8bitLt: input matrix will be converted from {A_dtype} to float16")
|
||||||
A = A.to(torch.float16)
|
A = A.to(torch.float16)
|
||||||
|
|
||||||
# 1. Quantize A
|
# 1. Quantize A
|
||||||
|
|
Loading…
Reference in New Issue
Block a user