Unverified commit 448e79a6, authored by Anant Sharma and committed by GitHub
Browse files

build: update cudarc dependency to crate version (#815)

parent 0e4fffbc
...@@ -677,7 +677,7 @@ dependencies = [ ...@@ -677,7 +677,7 @@ dependencies = [
"byteorder", "byteorder",
"candle-kernels 0.8.0", "candle-kernels 0.8.0",
"candle-metal-kernels", "candle-metal-kernels",
"cudarc 0.13.9 (registry+https://github.com/rust-lang/crates.io-index)", "cudarc 0.13.9",
"float8", "float8",
"gemm 0.17.1", "gemm 0.17.1",
"half", "half",
...@@ -702,7 +702,7 @@ checksum = "06ccf5ee3532e66868516d9b315f73aec9f34ea1a37ae98514534d458915dbf1" ...@@ -702,7 +702,7 @@ checksum = "06ccf5ee3532e66868516d9b315f73aec9f34ea1a37ae98514534d458915dbf1"
dependencies = [ dependencies = [
"byteorder", "byteorder",
"candle-kernels 0.8.4", "candle-kernels 0.8.4",
"cudarc 0.13.9 (registry+https://github.com/rust-lang/crates.io-index)", "cudarc 0.13.9",
"gemm 0.17.1", "gemm 0.17.1",
"half", "half",
"memmap2", "memmap2",
...@@ -1151,8 +1151,9 @@ dependencies = [ ...@@ -1151,8 +1151,9 @@ dependencies = [
[[package]] [[package]]
name = "cudarc" name = "cudarc"
version = "0.13.9" version = "0.16.2"
source = "git+https://github.com/coreylowman/cudarc.git?rev=8c52e735b55bf8e979e1a16bd85e3dfe4f87c9fe#8c52e735b55bf8e979e1a16bd85e3dfe4f87c9fe" source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "e4ed411343abcb4dd6fd1fbc32db3533d76c2af0fd40735a9e5e39e778a81254"
dependencies = [ dependencies = [
"libloading", "libloading",
] ]
...@@ -1612,7 +1613,7 @@ dependencies = [ ...@@ -1612,7 +1613,7 @@ dependencies = [
"bytes", "bytes",
"candle-core 0.8.4", "candle-core 0.8.4",
"chrono", "chrono",
"cudarc 0.13.9 (git+https://github.com/coreylowman/cudarc.git?rev=8c52e735b55bf8e979e1a16bd85e3dfe4f87c9fe)", "cudarc 0.16.2",
"derive-getters", "derive-getters",
"derive_builder", "derive_builder",
"dynamo-runtime", "dynamo-runtime",
...@@ -2064,7 +2065,7 @@ version = "0.2.1" ...@@ -2064,7 +2065,7 @@ version = "0.2.1"
source = "registry+https://github.com/rust-lang/crates.io-index" source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "dee36245af1dccf978103fcd393582806db2a1d0bcd2f38c663cdbb4a363a01c" checksum = "dee36245af1dccf978103fcd393582806db2a1d0bcd2f38c663cdbb4a363a01c"
dependencies = [ dependencies = [
"cudarc 0.13.9 (registry+https://github.com/rust-lang/crates.io-index)", "cudarc 0.13.9",
"half", "half",
"num-traits", "num-traits",
"rand 0.9.0", "rand 0.9.0",
...@@ -6805,7 +6806,7 @@ version = "0.1.0" ...@@ -6805,7 +6806,7 @@ version = "0.1.0"
source = "registry+https://github.com/rust-lang/crates.io-index" source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "50758486d7941f8b0a636ba7e29455c07071f41590beac1fd307ec893e8db69a" checksum = "50758486d7941f8b0a636ba7e29455c07071f41590beac1fd307ec893e8db69a"
dependencies = [ dependencies = [
"cudarc 0.13.9 (registry+https://github.com/rust-lang/crates.io-index)", "cudarc 0.13.9",
"half", "half",
"serde", "serde",
"thiserror 1.0.69", "thiserror 1.0.69",
......
...@@ -37,9 +37,9 @@ keywords = ["llm", "genai", "inference", "nvidia", "distributed", "dynamo"] ...@@ -37,9 +37,9 @@ keywords = ["llm", "genai", "inference", "nvidia", "distributed", "dynamo"]
[workspace.dependencies] [workspace.dependencies]
# Local crates # Local crates
dynamo-runtime = { path = "lib/runtime" } dynamo-runtime = { path = "lib/runtime", version = "0.1.1" }
dynamo-llm = { path = "lib/llm" } dynamo-llm = { path = "lib/llm", version = "0.1.1" }
dynamo-tokens = { path = "lib/tokens" } dynamo-tokens = { path = "lib/tokens", version = "0.1.1" }
# External dependencies # External dependencies
anyhow = { version = "1" } anyhow = { version = "1" }
......
...@@ -70,7 +70,7 @@ regex = "1" ...@@ -70,7 +70,7 @@ regex = "1"
rayon = "1" rayon = "1"
# kv_cuda # kv_cuda
cudarc = { git = "https://github.com/coreylowman/cudarc.git", rev = "8c52e735b55bf8e979e1a16bd85e3dfe4f87c9fe", features = ["cuda-12040"], optional = true } cudarc = { version = "0.16.2", features = ["cuda-12040"], optional = true }
ndarray = { version = "0.16", optional = true } ndarray = { version = "0.16", optional = true }
# protocols # protocols
......
...@@ -205,8 +205,9 @@ impl DeviceStorageOwned { ...@@ -205,8 +205,9 @@ impl DeviceStorageOwned {
} }
pub fn device_ptr(&self) -> *const c_void { pub fn device_ptr(&self) -> *const c_void {
let ptr = self.cuda_slice.device_ptr(); let stream = self.cuda_device.default_stream();
(*ptr) as *const c_void let (ptr, _) = self.cuda_slice.device_ptr(&stream);
ptr as *const c_void
} }
pub fn context(&self) -> Arc<CudaContext> { pub fn context(&self) -> Arc<CudaContext> {
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment