File tree: 2 files changed (+21 -0 lines changed)
Original file line number | Diff line number | Diff line change
@@ -1663,6 +1663,26 @@ def norm_class(self) -> Type:
1663
1663
intermediate_size = 28672 ,
1664
1664
)
1665
1665
)
1666
+ configs .append (
1667
+ # https://huggingface.co/mistralai/Mistral-Large-Instruct-2411/blob/main/config.json
1668
+ dict (
1669
+ name = "Mistral-Large-Instruct-2411" ,
1670
+ hf_config = dict (org = "mistralai" , name = "Mistral-Large-Instruct-2411" ),
1671
+ padded_vocab_size = 32768 ,
1672
+ block_size = 32768 ,
1673
+ n_layer = 88 ,
1674
+ n_head = 96 ,
1675
+ n_embd = 12288 ,
1676
+ n_query_groups = 8 ,
1677
+ rotary_percentage = 1.0 ,
1678
+ parallel_residual = False ,
1679
+ bias = False ,
1680
+ norm_class_name = "RMSNorm" ,
1681
+ norm_eps = 1e-05 ,
1682
+ mlp_class_name = "LLaMAMLP" ,
1683
+ intermediate_size = 28672 ,
1684
+ )
1685
+ )
1666
1686
1667
1687
1668
1688
############
Original file line number | Diff line number | Diff line change
@@ -171,6 +171,7 @@ mistralai/Mistral-7B-Instruct-v0.3
171
171
mistralai/Mistral-7B-v0.1
172
172
mistralai/Mistral-7B-v0.3
173
173
mistralai/Mistral-Large-Instruct-2407
174
+ mistralai/Mistral-Large-Instruct-2411
174
175
mistralai/Mixtral-8x7B-Instruct-v0.1
175
176
mistralai/Mixtral-8x7B-v0.1
176
177
mistralai/Mixtral-8x22B-Instruct-v0.1
You can’t perform that action at this time.
0 commit comments