Skip to content

Commit

Permalink
Update peft + transformers + accelerate + bnb + safetensors (huggingf…
Browse files Browse the repository at this point in the history
  • Loading branch information
abhishekkrthakur authored and kdamaszk committed Apr 25, 2024
1 parent 7809825 commit 86c5ce5
Show file tree
Hide file tree
Showing 5 changed files with 176 additions and 630 deletions.
4 changes: 2 additions & 2 deletions Dockerfile
Original file line number Diff line number Diff line change
Expand Up @@ -31,7 +31,7 @@ COPY launcher launcher
RUN cargo build --release

# Text Generation Inference base image
-FROM vault.habana.ai/gaudi-docker/1.14.0/ubuntu22.04/habanalabs/pytorch-installer-2.1.1:latest as base
+FROM vault.habana.ai/gaudi-docker/1.15.0/ubuntu22.04/habanalabs/pytorch-installer-2.2.0:latest as base

# Text Generation Inference base env
ENV HUGGINGFACE_HUB_CACHE=/data \
Expand All @@ -58,7 +58,7 @@ COPY server/Makefile server/Makefile
RUN cd server && \
make gen-server && \
pip install -r requirements.txt && \
-pip install git+https://github.com/HabanaAI/DeepSpeed.git@1.14.0 && \
+pip install git+https://github.com/HabanaAI/DeepSpeed.git@1.15.0 && \
pip install . --no-cache-dir

# Install benchmarker
Expand Down
4 changes: 2 additions & 2 deletions server/Makefile
Original file line number Diff line number Diff line change
Expand Up @@ -22,8 +22,8 @@ install-megablocks:

install: gen-server
pip install pip --upgrade
-pip install -r requirements_cuda.txt
-pip install -e ".[bnb, accelerate, quantize, peft, outlines]"
+pip install -r requirements.txt
+pip install -e "."

run-dev:
SAFETENSORS_FAST_GPU=1 python -m torch.distributed.run --nproc_per_node=2 text_generation_server/cli.py serve bigscience/bloom-560m --sharded
Expand Down
Loading

0 comments on commit 86c5ce5

Please sign in to comment.