Skip to content
This repository was archived by the owner on Jun 5, 2025. It is now read-only.

Commit 17fab51

Browse files
Update model_prices_and_context_window.json to version generated on 2025-03-23 (#1308)
Co-authored-by: github-actions[bot] <github-actions[bot]@users.noreply.github.com>
1 parent aa650bf commit 17fab51

File tree

1 file changed: +247 -10 lines changed

model_cost_data/model_prices_and_context_window.json

Lines changed: 247 additions & 10 deletions
Original file line number | Diff line number | Diff line change
@@ -15,6 +15,12 @@
1515
"supports_prompt_caching": true,
1616
"supports_response_schema": true,
1717
"supports_system_messages": true,
18+
"supports_web_search": true,
19+
"search_context_cost_per_query": {
20+
"search_context_size_low": 0.0000,
21+
"search_context_size_medium": 0.0000,
22+
"search_context_size_high": 0.0000
23+
},
1824
"deprecation_date": "date when the model becomes deprecated in the format YYYY-MM-DD"
1925
},
2026
"omni-moderation-latest": {
@@ -74,7 +80,63 @@
7480
"supports_vision": true,
7581
"supports_prompt_caching": true,
7682
"supports_system_messages": true,
77-
"supports_tool_choice": true
83+
"supports_tool_choice": true,
84+
"supports_web_search": true,
85+
"search_context_cost_per_query": {
86+
"search_context_size_low": 0.030,
87+
"search_context_size_medium": 0.035,
88+
"search_context_size_high": 0.050
89+
}
90+
},
91+
"gpt-4o-search-preview-2025-03-11": {
92+
"max_tokens": 16384,
93+
"max_input_tokens": 128000,
94+
"max_output_tokens": 16384,
95+
"input_cost_per_token": 0.0000025,
96+
"output_cost_per_token": 0.000010,
97+
"input_cost_per_token_batches": 0.00000125,
98+
"output_cost_per_token_batches": 0.00000500,
99+
"cache_read_input_token_cost": 0.00000125,
100+
"litellm_provider": "openai",
101+
"mode": "chat",
102+
"supports_function_calling": true,
103+
"supports_parallel_function_calling": true,
104+
"supports_response_schema": true,
105+
"supports_vision": true,
106+
"supports_prompt_caching": true,
107+
"supports_system_messages": true,
108+
"supports_tool_choice": true,
109+
"supports_web_search": true,
110+
"search_context_cost_per_query": {
111+
"search_context_size_low": 0.030,
112+
"search_context_size_medium": 0.035,
113+
"search_context_size_high": 0.050
114+
}
115+
},
116+
"gpt-4o-search-preview": {
117+
"max_tokens": 16384,
118+
"max_input_tokens": 128000,
119+
"max_output_tokens": 16384,
120+
"input_cost_per_token": 0.0000025,
121+
"output_cost_per_token": 0.000010,
122+
"input_cost_per_token_batches": 0.00000125,
123+
"output_cost_per_token_batches": 0.00000500,
124+
"cache_read_input_token_cost": 0.00000125,
125+
"litellm_provider": "openai",
126+
"mode": "chat",
127+
"supports_function_calling": true,
128+
"supports_parallel_function_calling": true,
129+
"supports_response_schema": true,
130+
"supports_vision": true,
131+
"supports_prompt_caching": true,
132+
"supports_system_messages": true,
133+
"supports_tool_choice": true,
134+
"supports_web_search": true,
135+
"search_context_cost_per_query": {
136+
"search_context_size_low": 0.030,
137+
"search_context_size_medium": 0.035,
138+
"search_context_size_high": 0.050
139+
}
78140
},
79141
"gpt-4.5-preview": {
80142
"max_tokens": 16384,
@@ -199,7 +261,63 @@
199261
"supports_vision": true,
200262
"supports_prompt_caching": true,
201263
"supports_system_messages": true,
202-
"supports_tool_choice": true
264+
"supports_tool_choice": true,
265+
"supports_web_search": true,
266+
"search_context_cost_per_query": {
267+
"search_context_size_low": 0.025,
268+
"search_context_size_medium": 0.0275,
269+
"search_context_size_high": 0.030
270+
}
271+
},
272+
"gpt-4o-mini-search-preview-2025-03-11": {
273+
"max_tokens": 16384,
274+
"max_input_tokens": 128000,
275+
"max_output_tokens": 16384,
276+
"input_cost_per_token": 0.00000015,
277+
"output_cost_per_token": 0.00000060,
278+
"input_cost_per_token_batches": 0.000000075,
279+
"output_cost_per_token_batches": 0.00000030,
280+
"cache_read_input_token_cost": 0.000000075,
281+
"litellm_provider": "openai",
282+
"mode": "chat",
283+
"supports_function_calling": true,
284+
"supports_parallel_function_calling": true,
285+
"supports_response_schema": true,
286+
"supports_vision": true,
287+
"supports_prompt_caching": true,
288+
"supports_system_messages": true,
289+
"supports_tool_choice": true,
290+
"supports_web_search": true,
291+
"search_context_cost_per_query": {
292+
"search_context_size_low": 0.025,
293+
"search_context_size_medium": 0.0275,
294+
"search_context_size_high": 0.030
295+
}
296+
},
297+
"gpt-4o-mini-search-preview": {
298+
"max_tokens": 16384,
299+
"max_input_tokens": 128000,
300+
"max_output_tokens": 16384,
301+
"input_cost_per_token": 0.00000015,
302+
"output_cost_per_token": 0.00000060,
303+
"input_cost_per_token_batches": 0.000000075,
304+
"output_cost_per_token_batches": 0.00000030,
305+
"cache_read_input_token_cost": 0.000000075,
306+
"litellm_provider": "openai",
307+
"mode": "chat",
308+
"supports_function_calling": true,
309+
"supports_parallel_function_calling": true,
310+
"supports_response_schema": true,
311+
"supports_vision": true,
312+
"supports_prompt_caching": true,
313+
"supports_system_messages": true,
314+
"supports_tool_choice": true,
315+
"supports_web_search": true,
316+
"search_context_cost_per_query": {
317+
"search_context_size_low": 0.025,
318+
"search_context_size_medium": 0.0275,
319+
"search_context_size_high": 0.030
320+
}
203321
},
204322
"gpt-4o-mini-2024-07-18": {
205323
"max_tokens": 16384,
@@ -218,7 +336,54 @@
218336
"supports_vision": true,
219337
"supports_prompt_caching": true,
220338
"supports_system_messages": true,
221-
"supports_tool_choice": true
339+
"supports_tool_choice": true,
340+
"search_context_cost_per_query": {
341+
"search_context_size_low": 0.025,
342+
"search_context_size_medium": 0.0275,
343+
"search_context_size_high": 0.030
344+
}
345+
},
346+
"o1-pro": {
347+
"max_tokens": 100000,
348+
"max_input_tokens": 200000,
349+
"max_output_tokens": 100000,
350+
"input_cost_per_token": 0.00015,
351+
"output_cost_per_token": 0.0006,
352+
"input_cost_per_token_batches": 0.000075,
353+
"output_cost_per_token_batches": 0.0003,
354+
"litellm_provider": "openai",
355+
"mode": "responses",
356+
"supports_function_calling": true,
357+
"supports_parallel_function_calling": true,
358+
"supports_vision": true,
359+
"supports_prompt_caching": true,
360+
"supports_system_messages": true,
361+
"supports_response_schema": true,
362+
"supports_tool_choice": true,
363+
"supports_native_streaming": false,
364+
"supported_modalities": ["text", "image"],
365+
"supported_endpoints": ["/v1/responses", "/v1/batch"]
366+
},
367+
"o1-pro-2025-03-19": {
368+
"max_tokens": 100000,
369+
"max_input_tokens": 200000,
370+
"max_output_tokens": 100000,
371+
"input_cost_per_token": 0.00015,
372+
"output_cost_per_token": 0.0006,
373+
"input_cost_per_token_batches": 0.000075,
374+
"output_cost_per_token_batches": 0.0003,
375+
"litellm_provider": "openai",
376+
"mode": "responses",
377+
"supports_function_calling": true,
378+
"supports_parallel_function_calling": true,
379+
"supports_vision": true,
380+
"supports_prompt_caching": true,
381+
"supports_system_messages": true,
382+
"supports_response_schema": true,
383+
"supports_tool_choice": true,
384+
"supports_native_streaming": false,
385+
"supported_modalities": ["text", "image"],
386+
"supported_endpoints": ["/v1/responses", "/v1/batch"]
222387
},
223388
"o1": {
224389
"max_tokens": 100000,
@@ -383,7 +548,13 @@
383548
"supports_vision": true,
384549
"supports_prompt_caching": true,
385550
"supports_system_messages": true,
386-
"supports_tool_choice": true
551+
"supports_tool_choice": true,
552+
"supports_web_search": true,
553+
"search_context_cost_per_query": {
554+
"search_context_size_low": 0.030,
555+
"search_context_size_medium": 0.035,
556+
"search_context_size_high": 0.050
557+
}
387558
},
388559
"gpt-4o-2024-11-20": {
389560
"max_tokens": 16384,
@@ -1384,17 +1555,53 @@
13841555
"supports_vision": false,
13851556
"supports_prompt_caching": true
13861557
},
1558+
"azure/gpt-4.5-preview": {
1559+
"max_tokens": 16384,
1560+
"max_input_tokens": 128000,
1561+
"max_output_tokens": 16384,
1562+
"input_cost_per_token": 0.000075,
1563+
"output_cost_per_token": 0.00015,
1564+
"input_cost_per_token_batches": 0.0000375,
1565+
"output_cost_per_token_batches": 0.000075,
1566+
"cache_read_input_token_cost": 0.0000375,
1567+
"litellm_provider": "azure",
1568+
"mode": "chat",
1569+
"supports_function_calling": true,
1570+
"supports_parallel_function_calling": true,
1571+
"supports_response_schema": true,
1572+
"supports_vision": true,
1573+
"supports_prompt_caching": true,
1574+
"supports_system_messages": true,
1575+
"supports_tool_choice": true
1576+
},
13871577
"azure/gpt-4o": {
1388-
"max_tokens": 4096,
1578+
"max_tokens": 16384,
13891579
"max_input_tokens": 128000,
1390-
"max_output_tokens": 4096,
1391-
"input_cost_per_token": 0.000005,
1392-
"output_cost_per_token": 0.000015,
1580+
"max_output_tokens": 16384,
1581+
"input_cost_per_token": 0.0000025,
1582+
"output_cost_per_token": 0.00001,
1583+
"cache_read_input_token_cost": 0.00000125,
1584+
"litellm_provider": "azure",
1585+
"mode": "chat",
1586+
"supports_function_calling": true,
1587+
"supports_parallel_function_calling": true,
1588+
"supports_response_schema": true,
1589+
"supports_vision": true,
1590+
"supports_prompt_caching": true,
1591+
"supports_tool_choice": true
1592+
},
1593+
"azure/global/gpt-4o-2024-11-20": {
1594+
"max_tokens": 16384,
1595+
"max_input_tokens": 128000,
1596+
"max_output_tokens": 16384,
1597+
"input_cost_per_token": 0.0000025,
1598+
"output_cost_per_token": 0.00001,
13931599
"cache_read_input_token_cost": 0.00000125,
13941600
"litellm_provider": "azure",
13951601
"mode": "chat",
13961602
"supports_function_calling": true,
13971603
"supports_parallel_function_calling": true,
1604+
"supports_response_schema": true,
13981605
"supports_vision": true,
13991606
"supports_prompt_caching": true,
14001607
"supports_tool_choice": true
@@ -1403,8 +1610,24 @@
14031610
"max_tokens": 16384,
14041611
"max_input_tokens": 128000,
14051612
"max_output_tokens": 16384,
1406-
"input_cost_per_token": 0.00000275,
1407-
"output_cost_per_token": 0.000011,
1613+
"input_cost_per_token": 0.0000025,
1614+
"output_cost_per_token": 0.00001,
1615+
"cache_read_input_token_cost": 0.00000125,
1616+
"litellm_provider": "azure",
1617+
"mode": "chat",
1618+
"supports_function_calling": true,
1619+
"supports_parallel_function_calling": true,
1620+
"supports_response_schema": true,
1621+
"supports_vision": true,
1622+
"supports_prompt_caching": true,
1623+
"supports_tool_choice": true
1624+
},
1625+
"azure/global/gpt-4o-2024-08-06": {
1626+
"max_tokens": 16384,
1627+
"max_input_tokens": 128000,
1628+
"max_output_tokens": 16384,
1629+
"input_cost_per_token": 0.0000025,
1630+
"output_cost_per_token": 0.00001,
14081631
"cache_read_input_token_cost": 0.00000125,
14091632
"litellm_provider": "azure",
14101633
"mode": "chat",
@@ -1421,12 +1644,14 @@
14211644
"max_output_tokens": 16384,
14221645
"input_cost_per_token": 0.00000275,
14231646
"output_cost_per_token": 0.000011,
1647+
"cache_read_input_token_cost": 0.00000125,
14241648
"litellm_provider": "azure",
14251649
"mode": "chat",
14261650
"supports_function_calling": true,
14271651
"supports_parallel_function_calling": true,
14281652
"supports_response_schema": true,
14291653
"supports_vision": true,
1654+
"supports_prompt_caching": true,
14301655
"supports_tool_choice": true
14311656
},
14321657
"azure/us/gpt-4o-2024-11-20": {
@@ -2014,6 +2239,18 @@
20142239
"mode": "chat",
20152240
"supports_tool_choice": true
20162241
},
2242+
"azure_ai/mistral-small-2503": {
2243+
"max_tokens": 128000,
2244+
"max_input_tokens": 128000,
2245+
"max_output_tokens": 128000,
2246+
"input_cost_per_token": 0.000001,
2247+
"output_cost_per_token": 0.000003,
2248+
"litellm_provider": "azure_ai",
2249+
"mode": "chat",
2250+
"supports_function_calling": true,
2251+
"supports_vision": true,
2252+
"supports_tool_choice": true
2253+
},
20172254
"azure_ai/mistral-large-2407": {
20182255
"max_tokens": 4096,
20192256
"max_input_tokens": 128000,

0 commit comments

Comments
 (0)