|
12 | 12 | _GENERATION_MODELS = { |
13 | 13 | "AquilaModel": ("llama", "LlamaForCausalLM"), |
14 | 14 | "AquilaForCausalLM": ("llama", "LlamaForCausalLM"), # AquilaChat2 |
| 15 | + "ArcticForCausalLM": ("arctic", "ArcticForCausalLM"), |
15 | 16 | "BaiChuanForCausalLM": ("baichuan", "BaiChuanForCausalLM"), # baichuan-7b |
16 | 17 | "BaichuanForCausalLM": ("baichuan", "BaichuanForCausalLM"), # baichuan-13b |
17 | 18 | "BloomForCausalLM": ("bloom", "BloomForCausalLM"), |
|
30 | 31 | "GPTBigCodeForCausalLM": ("gpt_bigcode", "GPTBigCodeForCausalLM"), |
31 | 32 | "GPTJForCausalLM": ("gpt_j", "GPTJForCausalLM"), |
32 | 33 | "GPTNeoXForCausalLM": ("gpt_neox", "GPTNeoXForCausalLM"), |
| 34 | + "GraniteForCausalLM": ("granite", "GraniteForCausalLM"), |
33 | 35 | "InternLMForCausalLM": ("llama", "LlamaForCausalLM"), |
34 | 36 | "InternLM2ForCausalLM": ("internlm2", "InternLM2ForCausalLM"), |
35 | 37 | "JAISLMHeadModel": ("jais", "JAISLMHeadModel"), |
| 38 | + "JambaForCausalLM": ("jamba", "JambaForCausalLM"), |
36 | 39 | "LlamaForCausalLM": ("llama", "LlamaForCausalLM"), |
37 | 40 | # For decapoda-research/llama-* |
38 | 41 | "LLaMAForCausalLM": ("llama", "LlamaForCausalLM"), |
|
52 | 55 | "PersimmonForCausalLM": ("persimmon", "PersimmonForCausalLM"), |
53 | 56 | "PhiForCausalLM": ("phi", "PhiForCausalLM"), |
54 | 57 | "Phi3ForCausalLM": ("phi3", "Phi3ForCausalLM"), |
| 58 | + "Phi3SmallForCausalLM": ("phi3_small", "Phi3SmallForCausalLM"), |
55 | 59 | "PhiMoEForCausalLM": ("phimoe", "PhiMoEForCausalLM"), |
56 | 60 | "Qwen2ForCausalLM": ("qwen2", "Qwen2ForCausalLM"), |
57 | 61 | "Qwen2MoeForCausalLM": ("qwen2_moe", "Qwen2MoeForCausalLM"), |
|
62 | 66 | "StableLmForCausalLM": ("stablelm", "StablelmForCausalLM"), |
63 | 67 | "Starcoder2ForCausalLM": ("starcoder2", "Starcoder2ForCausalLM"), |
64 | 68 | "SolarForCausalLM": ("solar", "SolarForCausalLM"), |
65 | | - "ArcticForCausalLM": ("arctic", "ArcticForCausalLM"), |
66 | 69 | "XverseForCausalLM": ("xverse", "XverseForCausalLM"), |
67 | | - "Phi3SmallForCausalLM": ("phi3_small", "Phi3SmallForCausalLM"), |
| 70 | + # NOTE: The below models are for speculative decoding only |
68 | 71 | "MedusaModel": ("medusa", "Medusa"), |
69 | 72 | "EAGLEModel": ("eagle", "EAGLE"), |
70 | 73 | "MLPSpeculatorPreTrainedModel": ("mlp_speculator", "MLPSpeculator"), |
71 | | - "JambaForCausalLM": ("jamba", "JambaForCausalLM"), |
72 | | - "GraniteForCausalLM": ("granite", "GraniteForCausalLM") |
73 | 74 | } |
74 | 75 |
|
75 | 76 | _EMBEDDING_MODELS = { |
|
0 commit comments