Skip to content

Commit

Permalink
Quantized support for v2-zephyr.
Browse files (browse the repository at this point in the history)
  • Loading branch information
LaurentMazare committed Feb 4, 2024
1 parent 0b83dce commit 70e0769
Showing 1 changed file with 8 additions and 2 deletions.
10 changes: 8 additions & 2 deletions candle-examples/examples/stable-lm/main.rs
Original file line number Diff line number Diff line change
Expand Up @@ -162,7 +162,7 @@ struct Args {
seed: u64,

/// The length of the sample to generate (in tokens).
- #[arg(long, short = 'n', default_value_t = 100)]
+ #[arg(long, short = 'n', default_value_t = 1000)]
sample_len: usize,

#[arg(long)]
Expand Down Expand Up @@ -261,7 +261,13 @@ fn main() -> Result<()> {
.get("stablelm-2-1_6b-q4k.gguf")?;
vec![gguf]
}
- (Which::V1Zephyr | Which::V2Zephyr | Which::Code, true) => {
+ (Which::V2Zephyr, true) => {
+ let gguf = api
+ .model("lmz/candle-stablelm".to_string())
+ .get("stablelm-2-zephyr-1_6b-q4k.gguf")?;
+ vec![gguf]
+ }
+ (Which::V1Zephyr | Which::Code, true) => {
anyhow::bail!("Quantized {:?} variant not supported.", args.which)
}
(Which::V1Orig | Which::V1 | Which::V1Zephyr | Which::V2 | Which::V2Zephyr, false) => {
Expand Down

0 comments on commit 70e0769

Please sign in to comment.