Skip to content

Commit b4bd29d

Browse files
committed
Don't include bitsandbytes by default, update accelerate version
1 parent b8efdaa commit b4bd29d

File tree

3 files changed: 60 additions and 17 deletions

3 files changed: 60 additions and 17 deletions

Dockerfile

Lines changed: 1 addition & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -253,9 +253,7 @@ COPY --from=flash-att-v2-cache /usr/src/flash-attention-v2/build/lib.linux-x86_6
253253
# Install server
254254
COPY proto proto
255255
COPY server server
256-
RUN cd server && \
257-
make gen-server && \
258-
pip install ".[bnb, accelerate, onnx-gpu]" --no-cache-dir
256+
RUN cd server && make gen-server && pip install ".[accelerate, onnx-gpu]" --no-cache-dir
259257

260258
# Patch codegen model changes into transformers 4.31
261259
RUN cp server/transformers_patch/modeling_codegen.py \

server/poetry.lock

Lines changed: 55 additions & 11 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

server/pyproject.toml

Lines changed: 4 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -8,14 +8,15 @@ authors = ["Olivier Dehaene <[email protected]>"]
88
text-generation-server = 'text_generation_server.cli:app'
99

1010
[tool.poetry.dependencies]
11-
python = "^3.9"
11+
python = ">=3.9.0,<3.13"
1212
protobuf = "^4.24.3"
1313
grpcio = "^1.58.0"
1414
grpcio-reflection = "^1.58.0"
1515
loguru = "^0.7.0"
1616
typer = "^0.9.0"
17-
accelerate = { version = "0.20.3", optional = true }
17+
accelerate = { version = "0.23.0", optional = true }
1818
bitsandbytes = { version = "^0.41.0", optional = true }
19+
scipy = { version = "^1.11.2", optional = true }
1920
safetensors = "^0.3.3"
2021
sentencepiece = "^0.1.99"
2122
transformers = "4.33.1"
@@ -33,7 +34,7 @@ cryptography = ">=41.0.3"
3334

3435
[tool.poetry.extras]
3536
accelerate = ["accelerate"]
36-
bnb = ["bitsandbytes"]
37+
bnb = ["bitsandbytes", "scipy"] # BNB doesn't declare a dep on scipy https://github.com/TimDettmers/bitsandbytes/pull/525
3738
onnx = ["optimum", "onnxruntime", "onnx"]
3839
onnx-gpu = ["optimum", "onnxruntime-gpu", "onnx"]
3940

0 commit comments

Comments
 (0)