From b92e3165b96aebe11623dcb1cc8d0ec0512585ff Mon Sep 17 00:00:00 2001 From: Eric Buehler <65165915+EricLBuehler@users.noreply.github.com> Date: Sun, 24 Nov 2024 05:29:53 -0500 Subject: [PATCH] Support fp8 on Metal (#930) --- Cargo.lock | 10 +++++----- Cargo.toml | 4 ++-- mistralrs-core/Cargo.toml | 2 +- 3 files changed, 8 insertions(+), 8 deletions(-) diff --git a/Cargo.lock b/Cargo.lock index 543aa5c3b..580107233 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -393,7 +393,7 @@ checksum = "9ac0150caa2ae65ca5bd83f25c7de183dea78d4d366469f148435e2acfbad0da" [[package]] name = "candle-core" version = "0.8.0" -source = "git+https://github.com/EricLBuehler/candle.git?rev=e97177b#e97177bd21215968d28073ff7b805e51321230e4" +source = "git+https://github.com/EricLBuehler/candle.git?rev=6b10eac#6b10eacc58d7e0ad71f296142f6b176005d8c61c" dependencies = [ "accelerate-src", "byteorder", @@ -424,7 +424,7 @@ dependencies = [ [[package]] name = "candle-flash-attn" version = "0.8.0" -source = "git+https://github.com/EricLBuehler/candle.git?rev=e97177b#e97177bd21215968d28073ff7b805e51321230e4" +source = "git+https://github.com/EricLBuehler/candle.git?rev=6b10eac#6b10eacc58d7e0ad71f296142f6b176005d8c61c" dependencies = [ "anyhow", "bindgen_cuda 0.1.5", @@ -435,7 +435,7 @@ dependencies = [ [[package]] name = "candle-kernels" version = "0.8.0" -source = "git+https://github.com/EricLBuehler/candle.git?rev=e97177b#e97177bd21215968d28073ff7b805e51321230e4" +source = "git+https://github.com/EricLBuehler/candle.git?rev=6b10eac#6b10eacc58d7e0ad71f296142f6b176005d8c61c" dependencies = [ "bindgen_cuda 0.1.5", ] @@ -443,7 +443,7 @@ dependencies = [ [[package]] name = "candle-metal-kernels" version = "0.8.0" -source = "git+https://github.com/EricLBuehler/candle.git?rev=e97177b#e97177bd21215968d28073ff7b805e51321230e4" +source = "git+https://github.com/EricLBuehler/candle.git?rev=6b10eac#6b10eacc58d7e0ad71f296142f6b176005d8c61c" dependencies = [ "metal 0.27.0", "once_cell", @@ -454,7 +454,7 @@ dependencies = [ [[package]] name = "candle-nn" version = "0.8.0" -source = "git+https://github.com/EricLBuehler/candle.git?rev=e97177b#e97177bd21215968d28073ff7b805e51321230e4" +source = "git+https://github.com/EricLBuehler/candle.git?rev=6b10eac#6b10eacc58d7e0ad71f296142f6b176005d8c61c" dependencies = [ "accelerate-src", "candle-core", diff --git a/Cargo.toml b/Cargo.toml index ca15568f1..7143b0ff2 100644 --- a/Cargo.toml +++ b/Cargo.toml @@ -25,8 +25,8 @@ license = "MIT" [workspace.dependencies] anyhow = "1.0.80" -candle-core = { git = "https://github.com/EricLBuehler/candle.git", version = "0.8.0", rev = "e97177b" } -candle-nn = { git = "https://github.com/EricLBuehler/candle.git", version = "0.8.0", rev = "e97177b" } +candle-core = { git = "https://github.com/EricLBuehler/candle.git", version = "0.8.0", rev = "6b10eac" } +candle-nn = { git = "https://github.com/EricLBuehler/candle.git", version = "0.8.0", rev = "6b10eac" } serde = "1.0.197" serde_json = "1.0.114" indexmap = { version = "2.2.5", features = ["serde"] } diff --git a/mistralrs-core/Cargo.toml b/mistralrs-core/Cargo.toml index b8cff1eca..06ebc9751 100644 --- a/mistralrs-core/Cargo.toml +++ b/mistralrs-core/Cargo.toml @@ -17,7 +17,7 @@ candle-core.workspace = true candle-nn.workspace = true serde.workspace = true serde_json.workspace = true -candle-flash-attn = { git = "https://github.com/EricLBuehler/candle.git", version = "0.8.0", rev = "e97177b", optional = true } +candle-flash-attn = { git = "https://github.com/EricLBuehler/candle.git", version = "0.8.0", rev = "6b10eac", optional = true } dirs = "5.0.1" hf-hub = "0.3.2" thiserror = "1.0.57"