Skip to content

Commit 1e0f9fc

Browse files
committed
Now it's working.
1 parent a90e0f1 commit 1e0f9fc

File tree

3 files changed

+10
-15
lines changed

3 files changed

+10
-15
lines changed

Cargo.lock

Lines changed: 1 addition & 2 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

Cargo.toml

Lines changed: 6 additions & 10 deletions
Original file line number | Diff line number | Diff line change
@@ -46,31 +46,27 @@ serde_json = "1.0"
4646
thiserror = "1.0"
4747
rand = "0.9"
4848
serial_test = "2.0.0"
49-
# cudarc = { version = "0.13" , features =["cuda-12020"]}
50-
cudarc = { git = "https://github.com/Narsil/cudarc" , rev = "61a028a3d3cac8acd8f71921293a43c2fe4f1b47", features = ["cuda-12020"]}
51-
intel-mkl-src = { version = "0.8" }
49+
cudarc = { version = "0.13" , features =["cuda-12020"], default-features = false}
50+
intel-mkl-src = { version = "0.8"}
5251
candle = { version = "0.8", package = "candle-core" }
5352
candle-nn = { version = "0.8", package = "candle-nn" }
5453
candle-transformers = { version = "0.8", package = "candle-transformers" }
5554
candle-flash-attn = { version = "0.8", package = "candle-flash-attn" }
5655
half = { version = "2.3.1", features = ["num-traits"] }
5756

5857
[patch.crates-io]
59-
cudarc = { git = "https://github.com/Narsil/cudarc" , rev = "61a028a3d3cac8acd8f71921293a43c2fe4f1b47"}
58+
cudarc = { git = "https://github.com/Narsil/cudarc" , rev = "b2d6443329e559e9580204b55ecaf44cd6fb6d90"}
6059
candle = { git = "https://github.com/huggingface/candle", rev = "ec6d7ca7738f4052b6613edc8f4d2bb6866a7539", package = "candle-core" }
6160
candle-nn = { git = "https://github.com/huggingface/candle", rev = "ec6d7ca7738f4052b6613edc8f4d2bb6866a7539", package = "candle-nn" }
6261
candle-transformers = { git = "https://github.com/huggingface/candle", rev = "ec6d7ca7738f4052b6613edc8f4d2bb6866a7539", package = "candle-transformers" }
6362
candle-flash-attn = { git = "https://github.com/huggingface/candle", rev = "ec6d7ca7738f4052b6613edc8f4d2bb6866a7539", package = "candle-flash-attn" }
64-
# candle = { path = "../candle/candle-core", package = "candle-core" }
65-
# candle-nn = { path = "../candle/candle-nn" }
66-
# candle-flash-attn = { path = "../candle/candle-flash-attn" }
6763

6864
[profile.release]
6965
debug = 0
70-
# lto = "fat"
66+
lto = "fat"
7167
opt-level = 3
72-
# codegen-units = 1
73-
# strip = "symbols"
68+
codegen-units = 1
69+
strip = "symbols"
7470
panic = "abort"
7571

7672
[profile.release-debug]

router/Cargo.toml

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -88,9 +88,9 @@ accelerate = ["text-embeddings-backend/accelerate"]
8888
python = ["text-embeddings-backend/python"]
8989
ort = ["text-embeddings-backend/ort"]
9090
candle = ["text-embeddings-backend/candle"]
91-
candle-cuda = ["candle", "text-embeddings-backend/flash-attn"]
92-
candle-cuda-turing = ["candle", "text-embeddings-backend/flash-attn-v1"]
93-
candle-cuda-volta = ["candle", "text-embeddings-backend/cuda"]
91+
candle-cuda = ["candle", "text-embeddings-backend/flash-attn", "dep:cudarc"]
92+
candle-cuda-turing = ["candle", "text-embeddings-backend/flash-attn-v1", "dep:cudarc"]
93+
candle-cuda-volta = ["candle", "text-embeddings-backend/cuda", "dep:cudarc"]
9494
static-linking = ["cudarc?/static-linking", "intel-mkl-src?/mkl-static-lp64-iomp"]
9595
dynamic-linking = ["cudarc?/dynamic-linking", "intel-mkl-src?/mkl-dynamic-lp64-iomp"]
9696
google = []

0 commit comments

Comments
 (0)