Skip to content

Commit 06652c1

Browse files
authored
Merge pull request axolotl-ai-cloud#196 from OpenAccess-AI-Collective/openllama-ft-config
tweak config to work
2 parents 068fc48 + 2ba4ae8 commit 06652c1

File tree

1 file changed

+6
-5
lines changed

1 file changed

+6
-5
lines changed

examples/openllama-3b/config.yml

+6 -5
Original file line number | Diff line number | Diff line change
@@ -26,17 +26,18 @@ wandb_watch:
2626
wandb_run_id:
2727
wandb_log_model:
2828
output_dir: ./openllama-out
29-
batch_size: 16
30-
micro_batch_size: 4
29+
gradient_accumulation_steps: 1
30+
micro_batch_size: 1
3131
num_epochs: 3
3232
optimizer: adamw_bnb_8bit
3333
torchdistx_path:
3434
lr_scheduler: cosine
35-
learning_rate: 0.0002
35+
learning_rate: 0.00001
3636
train_on_inputs: false
3737
group_by_length: false
38+
float16: true
3839
bf16: false
39-
fp16: true
40+
fp16: false
4041
tf32: false
4142
gradient_checkpointing: true
4243
early_stopping_patience:
@@ -52,7 +53,7 @@ eval_steps: 50
5253
save_steps:
5354
debug:
5455
deepspeed:
55-
weight_decay: 0.0
56+
weight_decay: 0.1
5657
fsdp:
5758
fsdp_config:
5859
special_tokens:

0 commit comments

Comments
 (0)