From 6148daf2a261717b37d99f1cbbc873b98293acb0 Mon Sep 17 00:00:00 2001 From: Eric Buehler Date: Mon, 24 Feb 2025 06:53:22 -0500 Subject: [PATCH] Add todos in metal/cuda --- candle-core/src/quantized/cuda.rs | 3 +++ candle-core/src/quantized/metal.rs | 3 +++ 2 files changed, 6 insertions(+) diff --git a/candle-core/src/quantized/cuda.rs b/candle-core/src/quantized/cuda.rs index 1a3d72c0fd..e84e1e65e5 100644 --- a/candle-core/src/quantized/cuda.rs +++ b/candle-core/src/quantized/cuda.rs @@ -435,6 +435,9 @@ impl QCudaStorage { GgmlDType::Q5K => deq::(&buffer, block_len, &mut out)?, GgmlDType::Q6K => deq::(&buffer, block_len, &mut out)?, GgmlDType::Q8K => deq::(&buffer, block_len, &mut out)?, + GgmlDType::Iq4Xs | GgmlDType::Iq4Nl => { + todo!("CUDA does not support Iq4Xs or Iq4Nl yet.") + } } self.device diff --git a/candle-core/src/quantized/metal.rs b/candle-core/src/quantized/metal.rs index f7f5b68ac2..8dda650f19 100644 --- a/candle-core/src/quantized/metal.rs +++ b/candle-core/src/quantized/metal.rs @@ -225,6 +225,9 @@ impl From for candle_metal_kernels::GgmlDType { GgmlDType::Q8K => candle_metal_kernels::GgmlDType::Q8K, GgmlDType::F16 => candle_metal_kernels::GgmlDType::F16, GgmlDType::F32 => candle_metal_kernels::GgmlDType::F32, + GgmlDType::Iq4Xs | GgmlDType::Iq4Nl => { + todo!("Metal does not support Iq4Xs or Iq4Nl yet.") + } } } }