Merge branch 'main' of github.com:facebookresearch/bitsandbytes into main
This commit is contained in:
commit
20294dc0f2
|
@ -21,3 +21,4 @@ Features:
|
||||||
v0.0.24:
|
v0.0.24:
|
||||||
|
|
||||||
- Fixed a bug where a float/half conversion led to a compilation error for CUDA 11.1 on Turing GPUs.
|
- Fixed a bug where a float/half conversion led to a compilation error for CUDA 11.1 on Turing GPUs.
|
||||||
|
- Removed Apex dependency for bnb LAMB.
|
||||||
|
|
1
Makefile
1
Makefile
|
@ -52,6 +52,7 @@ $(BUILD_DIR):
|
||||||
|
|
||||||
$(ROOT_DIR)/dependencies/cub:
|
$(ROOT_DIR)/dependencies/cub:
|
||||||
git clone https://github.com/NVlabs/cub $(ROOT_DIR)/dependencies/cub
|
git clone https://github.com/NVlabs/cub $(ROOT_DIR)/dependencies/cub
|
||||||
|
cd dependencies/cub; git checkout 1.11.0
|
||||||
|
|
||||||
clean:
|
clean:
|
||||||
rm cuda_build/* ./bitsandbytes/libbitsandbytes.so
|
rm cuda_build/* ./bitsandbytes/libbitsandbytes.so
|
||||||
|
|
|
@ -2,7 +2,6 @@
|
||||||
#
|
#
|
||||||
# This source code is licensed under the MIT license found in the
|
# This source code is licensed under the MIT license found in the
|
||||||
# LICENSE file in the root directory of this source tree.
|
# LICENSE file in the root directory of this source tree.
|
||||||
import apex
|
|
||||||
from bitsandbytes.optim.optimizer import Optimizer2State
|
from bitsandbytes.optim.optimizer import Optimizer2State
|
||||||
|
|
||||||
class LAMB(Optimizer2State):
|
class LAMB(Optimizer2State):
|
||||||
|
|
13
deploy.sh
13
deploy.sh
|
@ -1,13 +0,0 @@
|
||||||
#!/bin/bash
|
|
||||||
|
|
||||||
rm -rf dist build
|
|
||||||
make clean
|
|
||||||
CUDA_HOME=/usr/local/cuda-10.2 make
|
|
||||||
CUDA_VERSION=102 python -m build
|
|
||||||
python -m twine upload --repository testpypi dist/* --verbose
|
|
||||||
|
|
||||||
rm -rf dist build
|
|
||||||
make clean
|
|
||||||
CUDA_HOME=/usr/local/cuda-11.1 make
|
|
||||||
CUDA_VERSION=111 python -m build
|
|
||||||
python -m twine upload --repository testpypi dist/* --verbose
|
|
|
@ -10,7 +10,7 @@ module load gcc/7.3.0
|
||||||
CUDA_HOME=/public/apps/cuda/9.2
|
CUDA_HOME=/public/apps/cuda/9.2
|
||||||
make
|
make
|
||||||
CUDA_VERSION=92 python -m build
|
CUDA_VERSION=92 python -m build
|
||||||
python -m twine upload --repository testpypi dist/* --verbose
|
python -m twine upload dist/* --verbose
|
||||||
module unload cuda
|
module unload cuda
|
||||||
|
|
||||||
|
|
||||||
|
@ -21,7 +21,7 @@ module load cuda/10.0
|
||||||
CUDA_HOME=/public/apps/cuda/10.0
|
CUDA_HOME=/public/apps/cuda/10.0
|
||||||
make cuda10x
|
make cuda10x
|
||||||
CUDA_VERSION=100 python -m build
|
CUDA_VERSION=100 python -m build
|
||||||
python -m twine upload --repository testpypi dist/* --verbose
|
python -m twine upload dist/* --verbose
|
||||||
module unload cuda
|
module unload cuda
|
||||||
module unload gcc
|
module unload gcc
|
||||||
module load gcc/8.4
|
module load gcc/8.4
|
||||||
|
@ -33,7 +33,7 @@ module load cuda/10.1
|
||||||
CUDA_HOME=/public/apps/cuda/10.1
|
CUDA_HOME=/public/apps/cuda/10.1
|
||||||
make cuda10x
|
make cuda10x
|
||||||
CUDA_VERSION=101 python -m build
|
CUDA_VERSION=101 python -m build
|
||||||
python -m twine upload --repository testpypi dist/* --verbose
|
python -m twine upload dist/* --verbose
|
||||||
module unload cuda
|
module unload cuda
|
||||||
|
|
||||||
rm -rf dist build
|
rm -rf dist build
|
||||||
|
@ -43,7 +43,7 @@ module load cuda/10.2
|
||||||
CUDA_HOME=/public/apps/cuda/10.2/
|
CUDA_HOME=/public/apps/cuda/10.2/
|
||||||
make cuda10x
|
make cuda10x
|
||||||
CUDA_VERSION=102 python -m build
|
CUDA_VERSION=102 python -m build
|
||||||
python -m twine upload --repository testpypi dist/* --verbose
|
python -m twine upload dist/* --verbose
|
||||||
module unload cuda
|
module unload cuda
|
||||||
|
|
||||||
|
|
||||||
|
@ -54,7 +54,7 @@ module load cuda/11.0
|
||||||
CUDA_HOME=/public/apps/cuda/11.0
|
CUDA_HOME=/public/apps/cuda/11.0
|
||||||
make cuda110
|
make cuda110
|
||||||
CUDA_VERSION=110 python -m build
|
CUDA_VERSION=110 python -m build
|
||||||
python -m twine upload --repository testpypi dist/* --verbose
|
python -m twine upload dist/* --verbose
|
||||||
module unload cuda
|
module unload cuda
|
||||||
|
|
||||||
rm -rf dist build
|
rm -rf dist build
|
||||||
|
@ -64,7 +64,7 @@ module load cuda/11.1
|
||||||
CUDA_HOME=/public/apps/cuda/11.1
|
CUDA_HOME=/public/apps/cuda/11.1
|
||||||
make cuda11x
|
make cuda11x
|
||||||
CUDA_VERSION=111 python -m build
|
CUDA_VERSION=111 python -m build
|
||||||
python -m twine upload --repository testpypi dist/* --verbose
|
python -m twine upload dist/* --verbose
|
||||||
module unload cuda
|
module unload cuda
|
||||||
|
|
||||||
rm -rf dist build
|
rm -rf dist build
|
||||||
|
@ -74,7 +74,7 @@ module load cuda/11.2
|
||||||
CUDA_HOME=/public/apps/cuda/11.2
|
CUDA_HOME=/public/apps/cuda/11.2
|
||||||
make cuda11x
|
make cuda11x
|
||||||
CUDA_VERSION=112 python -m build
|
CUDA_VERSION=112 python -m build
|
||||||
python -m twine upload --repository testpypi dist/* --verbose
|
python -m twine upload dist/* --verbose
|
||||||
module unload cuda
|
module unload cuda
|
||||||
|
|
||||||
rm -rf dist build
|
rm -rf dist build
|
||||||
|
@ -82,5 +82,5 @@ make clean
|
||||||
make cleaneggs
|
make cleaneggs
|
||||||
CUDA_HOME=/private/home/timdettmers/git/autoswap/local/cuda-11.3 make cuda11x
|
CUDA_HOME=/private/home/timdettmers/git/autoswap/local/cuda-11.3 make cuda11x
|
||||||
CUDA_VERSION=113 python -m build
|
CUDA_VERSION=113 python -m build
|
||||||
python -m twine upload --repository testpypi dist/* --verbose
|
python -m twine upload dist/* --verbose
|
||||||
module unload cuda
|
module unload cuda
|
||||||
|
|
10
setup.py
10
setup.py
|
@ -13,19 +13,19 @@ def read(fname):
|
||||||
|
|
||||||
setup(
|
setup(
|
||||||
name = f"bitsandbytes-cuda{os.environ['CUDA_VERSION']}",
|
name = f"bitsandbytes-cuda{os.environ['CUDA_VERSION']}",
|
||||||
version = "0.0.23",
|
version = "0.0.24",
|
||||||
author = "Tim Dettmers",
|
author = "Tim Dettmers",
|
||||||
author_email = "tim.dettmers@gmail.com",
|
author_email = "dettmers@cs.washington.edu",
|
||||||
description = ("Numpy-like library for GPUs."),
|
description = ("8-bit optimizers and quantization routines."),
|
||||||
license = "MIT",
|
license = "MIT",
|
||||||
keywords = "gpu",
|
keywords = "gpu optimizers optimization 8-bit quantization compression",
|
||||||
url = "http://packages.python.org/bitsandbytes",
|
url = "http://packages.python.org/bitsandbytes",
|
||||||
packages=find_packages(),
|
packages=find_packages(),
|
||||||
package_data={'': ['libbitsandbytes.so']},
|
package_data={'': ['libbitsandbytes.so']},
|
||||||
long_description=read('README.md'),
|
long_description=read('README.md'),
|
||||||
long_description_content_type = 'text/markdown',
|
long_description_content_type = 'text/markdown',
|
||||||
classifiers=[
|
classifiers=[
|
||||||
"Development Status :: 1 - Planning",
|
"Development Status :: 4 - Beta",
|
||||||
'Topic :: Scientific/Engineering :: Artificial Intelligence'
|
'Topic :: Scientific/Engineering :: Artificial Intelligence'
|
||||||
],
|
],
|
||||||
)
|
)
|
||||||
|
|
Loading…
Reference in New Issue
Block a user