We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 2992769 commit 5201002 · Copy full SHA for 5201002
examples/llama-3/sft.yaml
@@ -1,6 +1,4 @@
1
-base_model: "nm-testing/llama2.c-stories42M-gsm8k-sparse-only-uncompressed"
2
-# TODO: change to
3
-# base_model: neuralmagic/Sparse-Llama-3.1-8B-2of4
+base_model: neuralmagic/Sparse-Llama-3.1-8B-2of4
4
5
plugins:
6
- axolotl.integrations.llmcompressor_sft.SFTPlugin
@@ -27,7 +25,7 @@ wandb_watch:
27
25
wandb_name:
28
26
wandb_log_model:
29
30
-# gradient_accumulation_steps: 8
+gradient_accumulation_steps: 8
31
micro_batch_size: 1
32
num_epochs: 1
33
optimizer: paged_adamw_8bit
0 commit comments