@@ -57,10 +57,13 @@ turbomind_chat_model:
5757 - deepseek-ai/deepseek-coder-1.3b-instruct
5858 - codellama/CodeLlama-7b-Instruct-hf
5959 - THUDM/glm-4-9b-chat
60+ - openbmb/MiniCPM-Llama3-V-2_5
61+ - openbmb/MiniCPM-V-2_6
6062
6163pytorch_chat_model :
6264 - meta-llama/Meta-Llama-3-8B-Instruct
6365 - meta-llama/Meta-Llama-3-1-8B-Instruct
66+ - meta-llama/Llama-3.2-1B-Instruct
6467 - meta-llama/Llama-2-7b-chat-hf
6568 - internlm/internlm2_5-7b-chat
6669 - internlm/internlm2_5-20b-chat
@@ -71,6 +74,7 @@ pytorch_chat_model:
7174 - OpenGVLab/InternVL2-8B
7275 - OpenGVLab/InternVL2-26B
7376 - OpenGVLab/InternVL2-40B
77+ - OpenGVLab/InternVL-Chat-V1-5
7478 - baichuan-inc/Baichuan2-7B-Chat
7579 - baichuan-inc/Baichuan2-13B-Chat
7680 - 01-ai/Yi-6B-Chat
@@ -94,9 +98,9 @@ pytorch_chat_model:
9498 - THUDM/cogvlm2-llama3-chinese-chat-19B
9599 - THUDM/glm-4v-9b
96100 - THUDM/glm-4-9b-chat
101+ - THUDM/cogvlm-chat-hf
97102 - microsoft/Phi-3-mini-4k-instruct
98103 - microsoft/Phi-3-vision-128k-instruct
99- - bigcode/starcoder2-7b
100104
101105turbomind_base_model :
102106 - internlm/internlm2_5-7b
@@ -109,6 +113,7 @@ pytorch_base_model:
109113 - internlm/internlm2_5-7b
110114 - internlm/internlm2_5-1_8b
111115 - internlm/internlm2_5-20b
116+ - bigcode/starcoder2-7b
112117
113118vl_model :
114119 - Qwen/Qwen-VL-Chat
@@ -125,81 +130,27 @@ vl_model:
125130 - OpenGVLab/InternVL2-40B
126131 - Qwen/Qwen2-VL-2B-Instruct
127132 - Qwen/Qwen2-VL-7B-Instruct
128- - internlm/internlm-xcomposer2-vl-7b
129133 - internlm/internlm-xcomposer2d5-7b
130134 - internlm/internlm-xcomposer2-4khd-7b
131135 - THUDM/cogvlm-chat-hf
132136 - THUDM/cogvlm2-llama3-chinese-chat-19B
133137 - THUDM/glm-4v-9b
138+ - microsoft/Phi-3-mini-4k-instruct
134139 - microsoft/Phi-3-vision-128k-instruct
135140 - openbmb/MiniCPM-Llama3-V-2_5
136141 - openbmb/MiniCPM-V-2_6
137142
138143turbomind_quatization :
139- awq :
140- - meta-llama/Meta-Llama-3-1-8B-Instruct
141- - meta-llama/Meta-Llama-3-8B-Instruct
142- - meta-llama/Llama-2-7b-chat-hf
143- - internlm/internlm2_5-7b-chat
144- - internlm/internlm2_5-7b
145- - internlm/internlm2_5-20b-chat
146- - internlm/internlm2-chat-20b
147- - internlm/internlm2_5-20b
148- - internlm/internlm-chat-20b
149- - internlm/internlm-xcomposer2-4khd-7b
150- - internlm/internlm-xcomposer2d5-7b
151- - OpenGVLab/InternVL-Chat-V1-5
152- - OpenGVLab/Mini-InternVL-Chat-2B-V1-5
153- - OpenGVLab/InternVL2-2B
154- - OpenGVLab/InternVL2-8B
155- - OpenGVLab/InternVL2-26B
156- - OpenGVLab/InternVL2-40B
157- - Qwen/Qwen1.5-7B-Chat
158- - Qwen/Qwen2-7B-Instruct
159- - Qwen/Qwen2-1.5B-Instruct
160- - Qwen/Qwen2.5-7B-Instruct
161- - Qwen/Qwen-VL-Chat
162- - liuhaotian/llava-v1.5-13b
163- - liuhaotian/llava-v1.6-vicuna-7b
164- - 01-ai/Yi-VL-6B
165- - 01-ai/Yi-6B-Chat
166- - deepseek-ai/deepseek-vl-1.3b-chat
167- - baichuan-inc/Baichuan2-7B-Chat
168- - codellama/CodeLlama-7b-hf
169- - openbmb/MiniCPM-Llama3-V-2_5
170- - THUDM/glm-4-9b-chat
171- gptq :
172- - internlm/internlm2_5-7b-chat
173- kvint :
174- - meta-llama/Meta-Llama-3-1-8B-Instruct
175- - meta-llama/Meta-Llama-3-8B-Instruct
176- - meta-llama/Llama-2-7b-chat-hf
177- - internlm/internlm2_5-7b-chat
178- - internlm/internlm2_5-20b-chat
179- - internlm/internlm2-chat-20b
180- - internlm/internlm2-chat-20b-4bits
181- - internlm/internlm-chat-20b
182- - internlm/internlm-xcomposer2-4khd-7b
183- - internlm/internlm-xcomposer2d5-7b
184- - OpenGVLab/InternVL-Chat-V1-5
185- - Qwen/Qwen2-7B-Instruct
186- - Qwen/Qwen2-7B-Instruct-AWQ
187- - Qwen/Qwen2-1.5B-Instruct
188- - Qwen/Qwen1.5-7B-Chat
189- - Qwen/Qwen1.5-4B-Chat-AWQ
190- - Qwen/Qwen-VL-Chat
144+ no_awq :
145+ - Qwen/Qwen2-VL-2B-Instruct
146+ - Qwen/Qwen2-VL-7B-Instruct
147+ - mistralai/Mistral-7B-Instruct-v0.1
191148 - mistralai/Mistral-7B-Instruct-v0.2
192149 - mistralai/Mistral-7B-Instruct-v0.3
193- - lmdeploy/llama2-chat-7b-w4
194- - baichuan-inc/Baichuan2-7B-Chat
195- - 01-ai/Yi-6B-Chat
196- - 01-ai/Yi-VL-6B
197- - liuhaotian/llava-v1.5-13b
198- - liuhaotian/llava-v1.6-vicuna-7b
199- - deepseek-ai/deepseek-vl-1.3b-chat
200150 - deepseek-ai/deepseek-coder-1.3b-instruct
201151 - codellama/CodeLlama-7b-Instruct-hf
202- - THUDM/glm-4-9b-chat
152+ gptq :
153+ - internlm/internlm2_5-7b-chat
203154
204155pytorch_quatization :
205156 awq :
@@ -211,6 +162,7 @@ pytorch_quatization:
211162 - internlm/internlm2-chat-20b
212163 - OpenGVLab/InternVL-Chat-V1-5
213164 - 01-ai/Yi-6B-Chat
165+ - Qwen/Qwen1.5-7B-Chat
214166 - Qwen/Qwen2-7B-Instruct
215167 - Qwen/Qwen2-1.5B-Instruct
216168 - microsoft/Phi-3-mini-4k-instruct
@@ -223,6 +175,13 @@ pytorch_quatization:
223175 - 01-ai/Yi-6B-Chat
224176 - internlm/internlm2_5-20b
225177 - internlm/internlm2_5-7b
178+ no_kvint4 :
179+ - OpenGVLab/InternVL2-4B
180+ - deepseek-ai/DeepSeek-V2-Lite-Chat
181+ - microsoft/Phi-3-mini-4k-instruct
182+ - microsoft/Phi-3-vision-128k-instruct
183+ no_kvint8 :
184+ - deepseek-ai/DeepSeek-V2-Lite-Chat
226185
227186
228187longtext_model :
0 commit comments