|
15 | 15 | "supports_prompt_caching": true, |
16 | 16 | "supports_response_schema": true, |
17 | 17 | "supports_system_messages": true, |
| 18 | + "supports_web_search": true, |
| 19 | + "search_context_cost_per_query": { |
| 20 | + "search_context_size_low": 0.0000, |
| 21 | + "search_context_size_medium": 0.0000, |
| 22 | + "search_context_size_high": 0.0000 |
| 23 | + }, |
18 | 24 | "deprecation_date": "date when the model becomes deprecated in the format YYYY-MM-DD" |
19 | 25 | }, |
20 | 26 | "omni-moderation-latest": { |
|
74 | 80 | "supports_vision": true, |
75 | 81 | "supports_prompt_caching": true, |
76 | 82 | "supports_system_messages": true, |
77 | | - "supports_tool_choice": true |
| 83 | + "supports_tool_choice": true, |
| 84 | + "supports_web_search": true, |
| 85 | + "search_context_cost_per_query": { |
| 86 | + "search_context_size_low": 0.030, |
| 87 | + "search_context_size_medium": 0.035, |
| 88 | + "search_context_size_high": 0.050 |
| 89 | + } |
| 90 | + }, |
| 91 | + "gpt-4o-search-preview-2025-03-11": { |
| 92 | + "max_tokens": 16384, |
| 93 | + "max_input_tokens": 128000, |
| 94 | + "max_output_tokens": 16384, |
| 95 | + "input_cost_per_token": 0.0000025, |
| 96 | + "output_cost_per_token": 0.000010, |
| 97 | + "input_cost_per_token_batches": 0.00000125, |
| 98 | + "output_cost_per_token_batches": 0.00000500, |
| 99 | + "cache_read_input_token_cost": 0.00000125, |
| 100 | + "litellm_provider": "openai", |
| 101 | + "mode": "chat", |
| 102 | + "supports_function_calling": true, |
| 103 | + "supports_parallel_function_calling": true, |
| 104 | + "supports_response_schema": true, |
| 105 | + "supports_vision": true, |
| 106 | + "supports_prompt_caching": true, |
| 107 | + "supports_system_messages": true, |
| 108 | + "supports_tool_choice": true, |
| 109 | + "supports_web_search": true, |
| 110 | + "search_context_cost_per_query": { |
| 111 | + "search_context_size_low": 0.030, |
| 112 | + "search_context_size_medium": 0.035, |
| 113 | + "search_context_size_high": 0.050 |
| 114 | + } |
| 115 | + }, |
| 116 | + "gpt-4o-search-preview": { |
| 117 | + "max_tokens": 16384, |
| 118 | + "max_input_tokens": 128000, |
| 119 | + "max_output_tokens": 16384, |
| 120 | + "input_cost_per_token": 0.0000025, |
| 121 | + "output_cost_per_token": 0.000010, |
| 122 | + "input_cost_per_token_batches": 0.00000125, |
| 123 | + "output_cost_per_token_batches": 0.00000500, |
| 124 | + "cache_read_input_token_cost": 0.00000125, |
| 125 | + "litellm_provider": "openai", |
| 126 | + "mode": "chat", |
| 127 | + "supports_function_calling": true, |
| 128 | + "supports_parallel_function_calling": true, |
| 129 | + "supports_response_schema": true, |
| 130 | + "supports_vision": true, |
| 131 | + "supports_prompt_caching": true, |
| 132 | + "supports_system_messages": true, |
| 133 | + "supports_tool_choice": true, |
| 134 | + "supports_web_search": true, |
| 135 | + "search_context_cost_per_query": { |
| 136 | + "search_context_size_low": 0.030, |
| 137 | + "search_context_size_medium": 0.035, |
| 138 | + "search_context_size_high": 0.050 |
| 139 | + } |
78 | 140 | }, |
79 | 141 | "gpt-4.5-preview": { |
80 | 142 | "max_tokens": 16384, |
|
199 | 261 | "supports_vision": true, |
200 | 262 | "supports_prompt_caching": true, |
201 | 263 | "supports_system_messages": true, |
202 | | - "supports_tool_choice": true |
| 264 | + "supports_tool_choice": true, |
| 265 | + "supports_web_search": true, |
| 266 | + "search_context_cost_per_query": { |
| 267 | + "search_context_size_low": 0.025, |
| 268 | + "search_context_size_medium": 0.0275, |
| 269 | + "search_context_size_high": 0.030 |
| 270 | + } |
| 271 | + }, |
| 272 | + "gpt-4o-mini-search-preview-2025-03-11": { |
| 273 | + "max_tokens": 16384, |
| 274 | + "max_input_tokens": 128000, |
| 275 | + "max_output_tokens": 16384, |
| 276 | + "input_cost_per_token": 0.00000015, |
| 277 | + "output_cost_per_token": 0.00000060, |
| 278 | + "input_cost_per_token_batches": 0.000000075, |
| 279 | + "output_cost_per_token_batches": 0.00000030, |
| 280 | + "cache_read_input_token_cost": 0.000000075, |
| 281 | + "litellm_provider": "openai", |
| 282 | + "mode": "chat", |
| 283 | + "supports_function_calling": true, |
| 284 | + "supports_parallel_function_calling": true, |
| 285 | + "supports_response_schema": true, |
| 286 | + "supports_vision": true, |
| 287 | + "supports_prompt_caching": true, |
| 288 | + "supports_system_messages": true, |
| 289 | + "supports_tool_choice": true, |
| 290 | + "supports_web_search": true, |
| 291 | + "search_context_cost_per_query": { |
| 292 | + "search_context_size_low": 0.025, |
| 293 | + "search_context_size_medium": 0.0275, |
| 294 | + "search_context_size_high": 0.030 |
| 295 | + } |
| 296 | + }, |
| 297 | + "gpt-4o-mini-search-preview": { |
| 298 | + "max_tokens": 16384, |
| 299 | + "max_input_tokens": 128000, |
| 300 | + "max_output_tokens": 16384, |
| 301 | + "input_cost_per_token": 0.00000015, |
| 302 | + "output_cost_per_token": 0.00000060, |
| 303 | + "input_cost_per_token_batches": 0.000000075, |
| 304 | + "output_cost_per_token_batches": 0.00000030, |
| 305 | + "cache_read_input_token_cost": 0.000000075, |
| 306 | + "litellm_provider": "openai", |
| 307 | + "mode": "chat", |
| 308 | + "supports_function_calling": true, |
| 309 | + "supports_parallel_function_calling": true, |
| 310 | + "supports_response_schema": true, |
| 311 | + "supports_vision": true, |
| 312 | + "supports_prompt_caching": true, |
| 313 | + "supports_system_messages": true, |
| 314 | + "supports_tool_choice": true, |
| 315 | + "supports_web_search": true, |
| 316 | + "search_context_cost_per_query": { |
| 317 | + "search_context_size_low": 0.025, |
| 318 | + "search_context_size_medium": 0.0275, |
| 319 | + "search_context_size_high": 0.030 |
| 320 | + } |
203 | 321 | }, |
204 | 322 | "gpt-4o-mini-2024-07-18": { |
205 | 323 | "max_tokens": 16384, |
|
218 | 336 | "supports_vision": true, |
219 | 337 | "supports_prompt_caching": true, |
220 | 338 | "supports_system_messages": true, |
221 | | - "supports_tool_choice": true |
| 339 | + "supports_tool_choice": true, |
| 340 | + "search_context_cost_per_query": { |
| 341 | + "search_context_size_low": 0.025, |
| 342 | + "search_context_size_medium": 0.0275, |
| 343 | + "search_context_size_high": 0.030 |
| 344 | + } |
| 345 | + }, |
| 346 | + "o1-pro": { |
| 347 | + "max_tokens": 100000, |
| 348 | + "max_input_tokens": 200000, |
| 349 | + "max_output_tokens": 100000, |
| 350 | + "input_cost_per_token": 0.00015, |
| 351 | + "output_cost_per_token": 0.0006, |
| 352 | + "input_cost_per_token_batches": 0.000075, |
| 353 | + "output_cost_per_token_batches": 0.0003, |
| 354 | + "litellm_provider": "openai", |
| 355 | + "mode": "responses", |
| 356 | + "supports_function_calling": true, |
| 357 | + "supports_parallel_function_calling": true, |
| 358 | + "supports_vision": true, |
| 359 | + "supports_prompt_caching": true, |
| 360 | + "supports_system_messages": true, |
| 361 | + "supports_response_schema": true, |
| 362 | + "supports_tool_choice": true, |
| 363 | + "supports_native_streaming": false, |
| 364 | + "supported_modalities": ["text", "image"], |
| 365 | + "supported_endpoints": ["/v1/responses", "/v1/batch"] |
| 366 | + }, |
| 367 | + "o1-pro-2025-03-19": { |
| 368 | + "max_tokens": 100000, |
| 369 | + "max_input_tokens": 200000, |
| 370 | + "max_output_tokens": 100000, |
| 371 | + "input_cost_per_token": 0.00015, |
| 372 | + "output_cost_per_token": 0.0006, |
| 373 | + "input_cost_per_token_batches": 0.000075, |
| 374 | + "output_cost_per_token_batches": 0.0003, |
| 375 | + "litellm_provider": "openai", |
| 376 | + "mode": "responses", |
| 377 | + "supports_function_calling": true, |
| 378 | + "supports_parallel_function_calling": true, |
| 379 | + "supports_vision": true, |
| 380 | + "supports_prompt_caching": true, |
| 381 | + "supports_system_messages": true, |
| 382 | + "supports_response_schema": true, |
| 383 | + "supports_tool_choice": true, |
| 384 | + "supports_native_streaming": false, |
| 385 | + "supported_modalities": ["text", "image"], |
| 386 | + "supported_endpoints": ["/v1/responses", "/v1/batch"] |
222 | 387 | }, |
223 | 388 | "o1": { |
224 | 389 | "max_tokens": 100000, |
|
383 | 548 | "supports_vision": true, |
384 | 549 | "supports_prompt_caching": true, |
385 | 550 | "supports_system_messages": true, |
386 | | - "supports_tool_choice": true |
| 551 | + "supports_tool_choice": true, |
| 552 | + "supports_web_search": true, |
| 553 | + "search_context_cost_per_query": { |
| 554 | + "search_context_size_low": 0.030, |
| 555 | + "search_context_size_medium": 0.035, |
| 556 | + "search_context_size_high": 0.050 |
| 557 | + } |
387 | 558 | }, |
388 | 559 | "gpt-4o-2024-11-20": { |
389 | 560 | "max_tokens": 16384, |
|
1384 | 1555 | "supports_vision": false, |
1385 | 1556 | "supports_prompt_caching": true |
1386 | 1557 | }, |
| 1558 | + "azure/gpt-4.5-preview": { |
| 1559 | + "max_tokens": 16384, |
| 1560 | + "max_input_tokens": 128000, |
| 1561 | + "max_output_tokens": 16384, |
| 1562 | + "input_cost_per_token": 0.000075, |
| 1563 | + "output_cost_per_token": 0.00015, |
| 1564 | + "input_cost_per_token_batches": 0.0000375, |
| 1565 | + "output_cost_per_token_batches": 0.000075, |
| 1566 | + "cache_read_input_token_cost": 0.0000375, |
| 1567 | + "litellm_provider": "azure", |
| 1568 | + "mode": "chat", |
| 1569 | + "supports_function_calling": true, |
| 1570 | + "supports_parallel_function_calling": true, |
| 1571 | + "supports_response_schema": true, |
| 1572 | + "supports_vision": true, |
| 1573 | + "supports_prompt_caching": true, |
| 1574 | + "supports_system_messages": true, |
| 1575 | + "supports_tool_choice": true |
| 1576 | + }, |
1387 | 1577 | "azure/gpt-4o": { |
1388 | | - "max_tokens": 4096, |
| 1578 | + "max_tokens": 16384, |
1389 | 1579 | "max_input_tokens": 128000, |
1390 | | - "max_output_tokens": 4096, |
1391 | | - "input_cost_per_token": 0.000005, |
1392 | | - "output_cost_per_token": 0.000015, |
| 1580 | + "max_output_tokens": 16384, |
| 1581 | + "input_cost_per_token": 0.0000025, |
| 1582 | + "output_cost_per_token": 0.00001, |
| 1583 | + "cache_read_input_token_cost": 0.00000125, |
| 1584 | + "litellm_provider": "azure", |
| 1585 | + "mode": "chat", |
| 1586 | + "supports_function_calling": true, |
| 1587 | + "supports_parallel_function_calling": true, |
| 1588 | + "supports_response_schema": true, |
| 1589 | + "supports_vision": true, |
| 1590 | + "supports_prompt_caching": true, |
| 1591 | + "supports_tool_choice": true |
| 1592 | + }, |
| 1593 | + "azure/global/gpt-4o-2024-11-20": { |
| 1594 | + "max_tokens": 16384, |
| 1595 | + "max_input_tokens": 128000, |
| 1596 | + "max_output_tokens": 16384, |
| 1597 | + "input_cost_per_token": 0.0000025, |
| 1598 | + "output_cost_per_token": 0.00001, |
1393 | 1599 | "cache_read_input_token_cost": 0.00000125, |
1394 | 1600 | "litellm_provider": "azure", |
1395 | 1601 | "mode": "chat", |
1396 | 1602 | "supports_function_calling": true, |
1397 | 1603 | "supports_parallel_function_calling": true, |
| 1604 | + "supports_response_schema": true, |
1398 | 1605 | "supports_vision": true, |
1399 | 1606 | "supports_prompt_caching": true, |
1400 | 1607 | "supports_tool_choice": true |
|
1403 | 1610 | "max_tokens": 16384, |
1404 | 1611 | "max_input_tokens": 128000, |
1405 | 1612 | "max_output_tokens": 16384, |
1406 | | - "input_cost_per_token": 0.00000275, |
1407 | | - "output_cost_per_token": 0.000011, |
| 1613 | + "input_cost_per_token": 0.0000025, |
| 1614 | + "output_cost_per_token": 0.00001, |
| 1615 | + "cache_read_input_token_cost": 0.00000125, |
| 1616 | + "litellm_provider": "azure", |
| 1617 | + "mode": "chat", |
| 1618 | + "supports_function_calling": true, |
| 1619 | + "supports_parallel_function_calling": true, |
| 1620 | + "supports_response_schema": true, |
| 1621 | + "supports_vision": true, |
| 1622 | + "supports_prompt_caching": true, |
| 1623 | + "supports_tool_choice": true |
| 1624 | + }, |
| 1625 | + "azure/global/gpt-4o-2024-08-06": { |
| 1626 | + "max_tokens": 16384, |
| 1627 | + "max_input_tokens": 128000, |
| 1628 | + "max_output_tokens": 16384, |
| 1629 | + "input_cost_per_token": 0.0000025, |
| 1630 | + "output_cost_per_token": 0.00001, |
1408 | 1631 | "cache_read_input_token_cost": 0.00000125, |
1409 | 1632 | "litellm_provider": "azure", |
1410 | 1633 | "mode": "chat", |
|
1421 | 1644 | "max_output_tokens": 16384, |
1422 | 1645 | "input_cost_per_token": 0.00000275, |
1423 | 1646 | "output_cost_per_token": 0.000011, |
| 1647 | + "cache_read_input_token_cost": 0.00000125, |
1424 | 1648 | "litellm_provider": "azure", |
1425 | 1649 | "mode": "chat", |
1426 | 1650 | "supports_function_calling": true, |
1427 | 1651 | "supports_parallel_function_calling": true, |
1428 | 1652 | "supports_response_schema": true, |
1429 | 1653 | "supports_vision": true, |
| 1654 | + "supports_prompt_caching": true, |
1430 | 1655 | "supports_tool_choice": true |
1431 | 1656 | }, |
1432 | 1657 | "azure/us/gpt-4o-2024-11-20": { |
|
2014 | 2239 | "mode": "chat", |
2015 | 2240 | "supports_tool_choice": true |
2016 | 2241 | }, |
| 2242 | + "azure_ai/mistral-small-2503": { |
| 2243 | + "max_tokens": 128000, |
| 2244 | + "max_input_tokens": 128000, |
| 2245 | + "max_output_tokens": 128000, |
| 2246 | + "input_cost_per_token": 0.000001, |
| 2247 | + "output_cost_per_token": 0.000003, |
| 2248 | + "litellm_provider": "azure_ai", |
| 2249 | + "mode": "chat", |
| 2250 | + "supports_function_calling": true, |
| 2251 | + "supports_vision": true, |
| 2252 | + "supports_tool_choice": true |
| 2253 | + }, |
2017 | 2254 | "azure_ai/mistral-large-2407": { |
2018 | 2255 | "max_tokens": 4096, |
2019 | 2256 | "max_input_tokens": 128000, |
|
0 commit comments