|
70 | 70 | "q4f32_1": "Hermes-3-Llama-3.1-8B-q4f32_1-MLC", |
71 | 71 | } |
72 | 72 | }, |
| 73 | + "Hermes-3-Llama-3.2": { |
| 74 | + "3B": { |
| 75 | + "q0f16": "Hermes-3-Llama-3.2-3B-q0f16-MLC", |
| 76 | + "q4f16_1": "Hermes-3-Llama-3.2-3B-q4f16_1-MLC", |
| 77 | + "q4f32_1": "Hermes-3-Llama-3.2-3B-q4f32_1-MLC", |
| 78 | + } |
| 79 | + }, |
73 | 80 | "Phi-3-mini": { |
74 | 81 | "128k": { |
75 | 82 | "q0f16": "Phi-3-mini-128k-instruct-q0f16-MLC", |
|
240 | 247 | "q4f32_1": "Qwen2.5-Math-72B-Instruct-q4f32_1-MLC", |
241 | 248 | }, |
242 | 249 | }, |
| 250 | + "DeepSeek-R1-Distill-Llama": { |
| 251 | + "70B": { |
| 252 | + "q0f16": "DeepSeek-R1-Distill-Llama-70B-q0f16-MLC", |
| 253 | + "q4f16_1": "DeepSeek-R1-Distill-Llama-70B-q4f16_1-MLC", |
| 254 | + "q4f32_1": "DeepSeek-R1-Distill-Llama-70B-q4f32_1-MLC", |
| 255 | + }, |
| 256 | + "8B": { |
| 257 | + "q0f16": "DeepSeek-R1-Distill-Llama-8B-q0f16-MLC", |
| 258 | + "q4f16_1": "DeepSeek-R1-Distill-Llama-8B-q4f16_1-MLC", |
| 259 | + "q4f32_1": "DeepSeek-R1-Distill-Llama-8B-q4f32_1-MLC", |
| 260 | + }, |
| 261 | + }, |
| 262 | + "DeepSeek-R1-Distill-Qwen": { |
| 263 | + "1.5B": { |
| 264 | + "q0f16": "DeepSeek-R1-Distill-Qwen-1.5B-q0f16-MLC", |
| 265 | + "q4f16_1": "DeepSeek-R1-Distill-Qwen-1.5B-q4f16_1-MLC", |
| 266 | + "q4f32_1": "DeepSeek-R1-Distill-Qwen-1.5B-q4f32_1-MLC", |
| 267 | + }, |
| 268 | + "14B": { |
| 269 | + "q0f16": "DeepSeek-R1-Distill-Qwen-14B-q0f16-MLC", |
| 270 | + "q4f16_1": "DeepSeek-R1-Distill-Qwen-14B-q4f16_1-MLC", |
| 271 | + "q4f32_1": "DeepSeek-R1-Distill-Qwen-14B-q4f32_1-MLC", |
| 272 | + }, |
| 273 | + "32B": { |
| 274 | + "q0f16": "DeepSeek-R1-Distill-Qwen-32B-q0f16-MLC", |
| 275 | + "q4f16_1": "DeepSeek-R1-Distill-Qwen-32B-q4f16_1-MLC", |
| 276 | + "q4f32_1": "DeepSeek-R1-Distill-Qwen-32B-q4f32_1-MLC", |
| 277 | + }, |
| 278 | + "7B": { |
| 279 | + "q0f16": "DeepSeek-R1-Distill-Qwen-7B-q0f16-MLC", |
| 280 | + "q4f16_1": "DeepSeek-R1-Distill-Qwen-7B-q4f16_1-MLC", |
| 281 | + "q4f32_1": "DeepSeek-R1-Distill-Qwen-7B-q4f32_1-MLC", |
| 282 | + }, |
| 283 | + }, |
243 | 284 | "DeepSeek-V2-Lite-Chat": { |
244 | 285 | "-": { |
245 | 286 | "q0f16": "DeepSeek-V2-Lite-Chat-q0f16-MLC", |
|
260 | 301 | "q0f32": "SmolLM-1.7B-Instruct-q0f32-MLC", |
261 | 302 | "q4f16_1": "SmolLM-1.7B-Instruct-q4f16_1-MLC", |
262 | 303 | "q4f32_1": "SmolLM-1.7B-Instruct-q4f32_1-MLC", |
263 | | - } |
264 | | - }, |
265 | | - "SmolLM-135M-Instruct": { |
266 | | - "-": { |
| 304 | + }, |
| 305 | + "135M": { |
267 | 306 | "q0f16": "SmolLM-135M-Instruct-q0f16-MLC", |
268 | 307 | "q0f32": "SmolLM-135M-Instruct-q0f32-MLC", |
269 | 308 | "q4f16_1": "SmolLM-135M-Instruct-q4f16_1-MLC", |
270 | 309 | "q4f32_1": "SmolLM-135M-Instruct-q4f32_1-MLC", |
271 | | - } |
272 | | - }, |
273 | | - "SmolLM-360M-Instruct": { |
274 | | - "-": { |
| 310 | + }, |
| 311 | + "360M": { |
275 | 312 | "q0f16": "SmolLM-360M-Instruct-q0f16-MLC", |
276 | 313 | "q0f32": "SmolLM-360M-Instruct-q0f32-MLC", |
277 | 314 | "q4f16_1": "SmolLM-360M-Instruct-q4f16_1-MLC", |
278 | 315 | "q4f32_1": "SmolLM-360M-Instruct-q4f32_1-MLC", |
279 | | - } |
| 316 | + }, |
280 | 317 | }, |
281 | 318 | "SmolLM2": { |
282 | 319 | "1.7B": { |
283 | 320 | "q0f16": "SmolLM2-1.7B-Instruct-q0f16-MLC", |
284 | 321 | "q4f16_1": "SmolLM2-1.7B-Instruct-q4f16_1-MLC", |
285 | 322 | "q4f32_1": "SmolLM2-1.7B-Instruct-q4f32_1-MLC", |
286 | | - } |
287 | | - }, |
288 | | - "SmolLM2-135M-Instruct": { |
289 | | - "-": { |
| 323 | + }, |
| 324 | + "135M": { |
290 | 325 | "q0f16": "SmolLM2-135M-Instruct-q0f16-MLC", |
291 | 326 | "q0f32": "SmolLM2-135M-Instruct-q0f32-MLC", |
292 | 327 | "q4f16_1": "SmolLM2-135M-Instruct-q4f16_1-MLC", |
293 | 328 | "q4f32_1": "SmolLM2-135M-Instruct-q4f32_1-MLC", |
294 | | - } |
295 | | - }, |
296 | | - "SmolLM2-360M-Instruct": { |
297 | | - "-": { |
| 329 | + }, |
| 330 | + "360M": { |
298 | 331 | "q0f16": "SmolLM2-360M-Instruct-q0f16-MLC", |
299 | 332 | "q0f32": "SmolLM2-360M-Instruct-q0f32-MLC", |
300 | 333 | "q4f16_1": "SmolLM2-360M-Instruct-q4f16_1-MLC", |
301 | 334 | "q4f32_1": "SmolLM2-360M-Instruct-q4f32_1-MLC", |
302 | | - } |
| 335 | + }, |
303 | 336 | }, |
304 | 337 | "gemma-2": { |
305 | 338 | "27b": { |
|
0 commit comments