Skip to content

Commit 5a3dca4

Browse files
committed
Fix the mkl-dynamic forking.
1 parent 2906b5e commit 5a3dca4

File tree

5 files changed

+16
-22
lines changed

5 files changed

+16
-22
lines changed

Cargo.lock

Lines changed: 6 additions & 14 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

Cargo.toml

Lines changed: 5 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -46,8 +46,7 @@ serde_json = "1.0"
46 46   thiserror = "1.0"
47 47   rand = "0.9"
48 48   serial_test = "2.0.0"
49    - # cudarc = { version = "0.13" , features =["cuda-version-from-build-system"]}
50    - cudarc = { git = "https://github.com/Narsil/cudarc" , rev = "1956436aeddea1da04fc3226282bc07c07eeaa35", features =["cuda-12020"]}
   49 + cudarc = { version = "0.13" , features =["cuda-12020"]}
51 50   candle = { version = "0.8", package = "candle-core" }
52 51   candle-nn = { version = "0.8", package = "candle-nn" }
53 52   candle-transformers = { version = "0.8", package = "candle-transformers" }
@@ -60,6 +59,10 @@ half = { version = "2.3.1", features = ["num-traits"] }
60 59
61 60   [patch.crates-io]
62 61   cudarc = { git = "https://github.com/Narsil/cudarc" , rev = "1956436aeddea1da04fc3226282bc07c07eeaa35"}
   62 + candle = { git = "https://github.com/Narsil/candle", rev = "2e273ddf31b1b796d3cfcd181ccb98deaa48466e", package = "candle-core" }
   63 + candle-nn = { git = "https://github.com/Narsil/candle", rev = "2e273ddf31b1b796d3cfcd181ccb98deaa48466e", package = "candle-nn" }
   64 + candle-transformers = { git = "https://github.com/Narsil/candle", rev = "2e273ddf31b1b796d3cfcd181ccb98deaa48466e", package = "candle-transformers" }
   65 + candle-flash-attn = { git = "https://github.com/Narsil/candle", rev = "2e273ddf31b1b796d3cfcd181ccb98deaa48466e", package = "candle-flash-attn" }
63 66
64 67   [profile.release]
65 68   debug = 0

backends/Cargo.toml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -25,7 +25,7 @@ candle = ["dep:text-embeddings-backend-candle"]
25 25   cuda = ["text-embeddings-backend-candle?/cuda"]
26 26   metal = ["text-embeddings-backend-candle?/metal"]
27 27   mkl = ["text-embeddings-backend-candle?/mkl"]
28    - # mkl-dynamic = ["text-embeddings-backend-candle?/mkl-dynamic"]
   28 + mkl-dynamic = ["text-embeddings-backend-candle?/mkl-dynamic"]
29 29   accelerate = ["text-embeddings-backend-candle?/accelerate"]
30 30   # static-linking = ["text-embeddings-backend-candle?/static-linking"]
31 31   flash-attn = ["text-embeddings-backend-candle?/flash-attn"]

backends/candle/Cargo.toml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -40,8 +40,8 @@ anyhow = { version = "1", features = ["backtrace"] }
40 40   [features]
41 41   accelerate = ["dep:accelerate-src", "candle/accelerate", "candle-nn/accelerate"]
42 42   metal = ["candle/metal", "candle-nn/metal"]
43    - mkl = ["dep:intel-mkl-src", "intel-mkl-src/mkl-static-lp64-iomp", "candle/mkl", "candle-nn/mkl"]
44    - # mkl-dynamic = ["dep:intel-mkl-src", "intel-mkl-src/mkl-dynamic-lp64-iomp", "candle/mkl-dynamic", "candle-nn/mkl-dynamic"]
   43 + mkl = ["dep:intel-mkl-src", "intel-mkl-src/mkl-static-lp64-iomp", "candle/mkl"]
   44 + mkl-dynamic = ["dep:intel-mkl-src", "intel-mkl-src/mkl-dynamic-lp64-iomp", "candle/mkl"]
45 45   cuda = ["candle/cuda", "candle-nn/cuda", "dep:candle-cublaslt", "dep:candle-layer-norm", "dep:candle-rotary"]
46 46   flash-attn-v1 = ["dep:candle-flash-attn-v1", "cuda"]
47 47   flash-attn = ["dep:candle-flash-attn", "cuda"]

router/Cargo.toml

Lines changed: 2 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -57,7 +57,6 @@ tonic-health = { version = "0.11.0", optional = true }
57 57   tonic-reflection = { version = "0.11.0", optional = true }
58 58   tokio-stream = { version = "0.1.14", optional = true }
59 59   cudarc = { workspace = true }
60    - intel-mkl-src = { version = "0.8.1", default-features = false, optional = true }
61 60
62 61   # Malloc trim hack for linux
63 62   [target.'cfg(target_os = "linux")'.dependencies]
@@ -81,8 +80,8 @@ default = ["candle", "http"]
81 80   http = ["dep:axum", "dep:axum-tracing-opentelemetry", "dep:base64", "dep:tower-http", "dep:utoipa", "dep:utoipa-swagger-ui"]
82 81   grpc = ["metrics-exporter-prometheus/http-listener", "dep:prost", "dep:tonic", "dep:tonic-health", "dep:tonic-reflection", "dep:tonic-build", "dep:async-stream", "dep:tokio-stream"]
83 82   metal = ["text-embeddings-backend/metal"]
84    - mkl = ["dep:intel-mkl-src", "intel-mkl-src/mkl-static-lp64-iomp"]
85    - mkl-dynamic = ["dep:intel-mkl-src", "intel-mkl-src/mkl-dynamic-lp64-iomp"]
   83 + mkl = ["text-embeddings-backend/mkl"]
   84 + mkl-dynamic = ["text-embeddings-backend/mkl-dynamic"]
86 85   accelerate = ["text-embeddings-backend/accelerate"]
87 86   python = ["text-embeddings-backend/python"]
88 87   ort = ["text-embeddings-backend/ort"]

0 commit comments

Comments
 (0)