Update peft + transformers + accelerate + bnb + safetensors (huggingface#1646)
kdamaszk · Apr 25, 2024 · 86c5ce5 · 86c5ce5
1 parent 7809825
commit 86c5ce5
Show file tree

Hide file tree

Showing 5 changed files with 176 additions and 630 deletions.
diff --git a/Dockerfile b/Dockerfile
@@ -31,7 +31,7 @@ COPY launcher launcher
 RUN cargo build --release
 
 # Text Generation Inference base image
-FROM vault.habana.ai/gaudi-docker/1.14.0/ubuntu22.04/habanalabs/pytorch-installer-2.1.1:latest as base
+FROM vault.habana.ai/gaudi-docker/1.15.0/ubuntu22.04/habanalabs/pytorch-installer-2.2.0:latest as base
 
 # Text Generation Inference base env
 ENV HUGGINGFACE_HUB_CACHE=/data \
@@ -58,7 +58,7 @@ COPY server/Makefile server/Makefile
 RUN cd server && \
     make gen-server && \
     pip install -r requirements.txt && \
-    pip install git+https://github.com/HabanaAI/DeepSpeed.git@1.14.0 && \
+    pip install git+https://github.com/HabanaAI/DeepSpeed.git@1.15.0 && \
     pip install . --no-cache-dir
 
 # Install benchmarker

diff --git a/server/Makefile b/server/Makefile
@@ -22,8 +22,8 @@ install-megablocks:
 
 install: gen-server
 	pip install pip --upgrade
-	pip install -r requirements_cuda.txt
-	pip install -e ".[bnb, accelerate, quantize, peft, outlines]"
+	pip install -r requirements.txt
+	pip install -e "."
 
 run-dev:
 	SAFETENSORS_FAST_GPU=1 python -m torch.distributed.run --nproc_per_node=2 text_generation_server/cli.py serve bigscience/bloom-560m --sharded