|
12 | 12 | _GENERATION_MODELS = {
|
13 | 13 | "AquilaModel": ("llama", "LlamaForCausalLM"),
|
14 | 14 | "AquilaForCausalLM": ("llama", "LlamaForCausalLM"), # AquilaChat2
|
| 15 | + "ArcticForCausalLM": ("arctic", "ArcticForCausalLM"), |
15 | 16 | "BaiChuanForCausalLM": ("baichuan", "BaiChuanForCausalLM"), # baichuan-7b
|
16 | 17 | "BaichuanForCausalLM": ("baichuan", "BaichuanForCausalLM"), # baichuan-13b
|
17 | 18 | "BloomForCausalLM": ("bloom", "BloomForCausalLM"),
|
|
30 | 31 | "GPTBigCodeForCausalLM": ("gpt_bigcode", "GPTBigCodeForCausalLM"),
|
31 | 32 | "GPTJForCausalLM": ("gpt_j", "GPTJForCausalLM"),
|
32 | 33 | "GPTNeoXForCausalLM": ("gpt_neox", "GPTNeoXForCausalLM"),
|
| 34 | + "GraniteForCausalLM": ("granite", "GraniteForCausalLM"), |
33 | 35 | "InternLMForCausalLM": ("llama", "LlamaForCausalLM"),
|
34 | 36 | "InternLM2ForCausalLM": ("internlm2", "InternLM2ForCausalLM"),
|
35 | 37 | "JAISLMHeadModel": ("jais", "JAISLMHeadModel"),
|
| 38 | + "JambaForCausalLM": ("jamba", "JambaForCausalLM"), |
36 | 39 | "LlamaForCausalLM": ("llama", "LlamaForCausalLM"),
|
37 | 40 | # For decapoda-research/llama-*
|
38 | 41 | "LLaMAForCausalLM": ("llama", "LlamaForCausalLM"),
|
|
52 | 55 | "PersimmonForCausalLM": ("persimmon", "PersimmonForCausalLM"),
|
53 | 56 | "PhiForCausalLM": ("phi", "PhiForCausalLM"),
|
54 | 57 | "Phi3ForCausalLM": ("phi3", "Phi3ForCausalLM"),
|
| 58 | + "Phi3SmallForCausalLM": ("phi3_small", "Phi3SmallForCausalLM"), |
55 | 59 | "PhiMoEForCausalLM": ("phimoe", "PhiMoEForCausalLM"),
|
56 | 60 | "Qwen2ForCausalLM": ("qwen2", "Qwen2ForCausalLM"),
|
57 | 61 | "Qwen2MoeForCausalLM": ("qwen2_moe", "Qwen2MoeForCausalLM"),
|
|
62 | 66 | "StableLmForCausalLM": ("stablelm", "StablelmForCausalLM"),
|
63 | 67 | "Starcoder2ForCausalLM": ("starcoder2", "Starcoder2ForCausalLM"),
|
64 | 68 | "SolarForCausalLM": ("solar", "SolarForCausalLM"),
|
65 |
| - "ArcticForCausalLM": ("arctic", "ArcticForCausalLM"), |
66 | 69 | "XverseForCausalLM": ("xverse", "XverseForCausalLM"),
|
67 |
| - "Phi3SmallForCausalLM": ("phi3_small", "Phi3SmallForCausalLM"), |
| 70 | + # NOTE: The below models are for speculative decoding only |
68 | 71 | "MedusaModel": ("medusa", "Medusa"),
|
69 | 72 | "EAGLEModel": ("eagle", "EAGLE"),
|
70 | 73 | "MLPSpeculatorPreTrainedModel": ("mlp_speculator", "MLPSpeculator"),
|
71 |
| - "JambaForCausalLM": ("jamba", "JambaForCausalLM"), |
72 |
| - "GraniteForCausalLM": ("granite", "GraniteForCausalLM") |
73 | 74 | }
|
74 | 75 |
|
75 | 76 | _EMBEDDING_MODELS = {
|
|
0 commit comments