14121412 "deprecation_date" : " 2025-03-31" ,
14131413 "supports_tool_choice" : true
14141414 },
1415+ "azure/gpt-3.5-turbo-0125" : {
1416+ "max_tokens" : 4096 ,
1417+ "max_input_tokens" : 16384 ,
1418+ "max_output_tokens" : 4096 ,
1419+ "input_cost_per_token" : 0.0000005 ,
1420+ "output_cost_per_token" : 0.0000015 ,
1421+ "litellm_provider" : " azure" ,
1422+ "mode" : " chat" ,
1423+ "supports_function_calling" : true ,
1424+ "supports_parallel_function_calling" : true ,
1425+ "deprecation_date" : " 2025-03-31" ,
1426+ "supports_tool_choice" : true
1427+ },
14151428 "azure/gpt-35-turbo-16k" : {
14161429 "max_tokens" : 4096 ,
14171430 "max_input_tokens" : 16385 ,
14331446 "supports_function_calling" : true ,
14341447 "supports_tool_choice" : true
14351448 },
1449+ "azure/gpt-3.5-turbo" : {
1450+ "max_tokens" : 4096 ,
1451+ "max_input_tokens" : 4097 ,
1452+ "max_output_tokens" : 4096 ,
1453+ "input_cost_per_token" : 0.0000005 ,
1454+ "output_cost_per_token" : 0.0000015 ,
1455+ "litellm_provider" : " azure" ,
1456+ "mode" : " chat" ,
1457+ "supports_function_calling" : true ,
1458+ "supports_tool_choice" : true
1459+ },
14361460 "azure/gpt-3.5-turbo-instruct-0914" : {
14371461 "max_tokens" : 4097 ,
14381462 "max_input_tokens" : 4097 ,
36343658 "source" : " https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" ,
36353659 "supports_tool_choice" : true
36363660 },
3661+ "gemini-2.0-pro-exp-02-05" : {
3662+ "max_tokens" : 8192 ,
3663+ "max_input_tokens" : 2097152 ,
3664+ "max_output_tokens" : 8192 ,
3665+ "max_images_per_prompt" : 3000 ,
3666+ "max_videos_per_prompt" : 10 ,
3667+ "max_video_length" : 1 ,
3668+ "max_audio_length_hours" : 8.4 ,
3669+ "max_audio_per_prompt" : 1 ,
3670+ "max_pdf_size_mb" : 30 ,
3671+ "input_cost_per_image" : 0 ,
3672+ "input_cost_per_video_per_second" : 0 ,
3673+ "input_cost_per_audio_per_second" : 0 ,
3674+ "input_cost_per_token" : 0 ,
3675+ "input_cost_per_character" : 0 ,
3676+ "input_cost_per_token_above_128k_tokens" : 0 ,
3677+ "input_cost_per_character_above_128k_tokens" : 0 ,
3678+ "input_cost_per_image_above_128k_tokens" : 0 ,
3679+ "input_cost_per_video_per_second_above_128k_tokens" : 0 ,
3680+ "input_cost_per_audio_per_second_above_128k_tokens" : 0 ,
3681+ "output_cost_per_token" : 0 ,
3682+ "output_cost_per_character" : 0 ,
3683+ "output_cost_per_token_above_128k_tokens" : 0 ,
3684+ "output_cost_per_character_above_128k_tokens" : 0 ,
3685+ "litellm_provider" : " vertex_ai-language-models" ,
3686+ "mode" : " chat" ,
3687+ "supports_system_messages" : true ,
3688+ "supports_function_calling" : true ,
3689+ "supports_vision" : true ,
3690+ "supports_audio_input" : true ,
3691+ "supports_video_input" : true ,
3692+ "supports_pdf_input" : true ,
3693+ "supports_response_schema" : true ,
3694+ "supports_tool_choice" : true ,
3695+ "source" : " https://cloud.google.com/vertex-ai/generative-ai/pricing"
3696+ },
36373697 "gemini-2.0-flash-exp" : {
36383698 "max_tokens" : 8192 ,
36393699 "max_input_tokens" : 1048576 ,
70357095 "input_cost_per_token" : 0.00000072 ,
70367096 "output_cost_per_token" : 0.00000072 ,
70377097 "litellm_provider" : " bedrock_converse" ,
7038- "mode" : " chat"
7098+ "mode" : " chat" ,
7099+ "supports_function_calling" : true ,
7100+ "supports_tool_choice" : false
70397101 },
70407102 "meta.llama2-13b-chat-v1" : {
70417103 "max_tokens" : 4096 ,
73757437 "supports_function_calling" : true ,
73767438 "supports_tool_choice" : false
73777439 },
7440+ "us.meta.llama3-3-70b-instruct-v1:0" : {
7441+ "max_tokens" : 4096 ,
7442+ "max_input_tokens" : 128000 ,
7443+ "max_output_tokens" : 4096 ,
7444+ "input_cost_per_token" : 0.00000072 ,
7445+ "output_cost_per_token" : 0.00000072 ,
7446+ "litellm_provider" : " bedrock_converse" ,
7447+ "mode" : " chat" ,
7448+ "supports_function_calling" : true ,
7449+ "supports_tool_choice" : false
7450+ },
73787451 "512-x-512/50-steps/stability.stable-diffusion-xl-v0" : {
73797452 "max_tokens" : 77 ,
73807453 "max_input_tokens" : 77 ,
80848157 "input_cost_per_token" : 0.00000035 ,
80858158 "output_cost_per_token" : 0.00000140 ,
80868159 "litellm_provider" : " perplexity" ,
8087- "mode" : " chat" ,
8088- "supports_tool_choice" : true
8160+ "mode" : " chat"
80898161 },
80908162 "perplexity/codellama-70b-instruct" : {
80918163 "max_tokens" : 16384 ,
80948166 "input_cost_per_token" : 0.00000070 ,
80958167 "output_cost_per_token" : 0.00000280 ,
80968168 "litellm_provider" : " perplexity" ,
8097- "mode" : " chat" ,
8098- "supports_tool_choice" : true
8169+ "mode" : " chat"
80998170 },
81008171 "perplexity/llama-3.1-70b-instruct" : {
81018172 "max_tokens" : 131072 ,
81048175 "input_cost_per_token" : 0.000001 ,
81058176 "output_cost_per_token" : 0.000001 ,
81068177 "litellm_provider" : " perplexity" ,
8107- "mode" : " chat" ,
8108- "supports_tool_choice" : true
8178+ "mode" : " chat"
81098179 },
81108180 "perplexity/llama-3.1-8b-instruct" : {
81118181 "max_tokens" : 131072 ,
81148184 "input_cost_per_token" : 0.0000002 ,
81158185 "output_cost_per_token" : 0.0000002 ,
81168186 "litellm_provider" : " perplexity" ,
8117- "mode" : " chat" ,
8118- "supports_tool_choice" : true
8187+ "mode" : " chat"
81198188 },
81208189 "perplexity/llama-3.1-sonar-huge-128k-online" : {
81218190 "max_tokens" : 127072 ,
81258194 "output_cost_per_token" : 0.000005 ,
81268195 "litellm_provider" : " perplexity" ,
81278196 "mode" : " chat" ,
8128- "deprecation_date" : " 2025-02-22" ,
8129- "supports_tool_choice" : true
8197+ "deprecation_date" : " 2025-02-22"
81308198 },
81318199 "perplexity/llama-3.1-sonar-large-128k-online" : {
81328200 "max_tokens" : 127072 ,
81368204 "output_cost_per_token" : 0.000001 ,
81378205 "litellm_provider" : " perplexity" ,
81388206 "mode" : " chat" ,
8139- "deprecation_date" : " 2025-02-22" ,
8140- "supports_tool_choice" : true
8207+ "deprecation_date" : " 2025-02-22"
81418208 },
81428209 "perplexity/llama-3.1-sonar-large-128k-chat" : {
81438210 "max_tokens" : 131072 ,
81478214 "output_cost_per_token" : 0.000001 ,
81488215 "litellm_provider" : " perplexity" ,
81498216 "mode" : " chat" ,
8150- "deprecation_date" : " 2025-02-22" ,
8151- "supports_tool_choice" : true
8217+ "deprecation_date" : " 2025-02-22"
81528218 },
81538219 "perplexity/llama-3.1-sonar-small-128k-chat" : {
81548220 "max_tokens" : 131072 ,
81588224 "output_cost_per_token" : 0.0000002 ,
81598225 "litellm_provider" : " perplexity" ,
81608226 "mode" : " chat" ,
8161- "deprecation_date" : " 2025-02-22" ,
8162- "supports_tool_choice" : true
8227+ "deprecation_date" : " 2025-02-22"
81638228 },
81648229 "perplexity/llama-3.1-sonar-small-128k-online" : {
81658230 "max_tokens" : 127072 ,
81698234 "output_cost_per_token" : 0.0000002 ,
81708235 "litellm_provider" : " perplexity" ,
81718236 "mode" : " chat" ,
8172- "deprecation_date" : " 2025-02-22" ,
8173- "supports_tool_choice" : true
8237+ "deprecation_date" : " 2025-02-22"
8238+ },
8239+ "perplexity/sonar" : {
8240+ "max_tokens" : 127072 ,
8241+ "max_input_tokens" : 127072 ,
8242+ "max_output_tokens" : 127072 ,
8243+ "input_cost_per_token" : 0.000001 ,
8244+ "output_cost_per_token" : 0.000001 ,
8245+ "litellm_provider" : " perplexity" ,
8246+ "mode" : " chat"
8247+ },
8248+ "perplexity/sonar-pro" : {
8249+ "max_tokens" : 200000 ,
8250+ "max_input_tokens" : 200000 ,
8251+ "max_output_tokens" : 8096 ,
8252+ "input_cost_per_token" : 0.000003 ,
8253+ "output_cost_per_token" : 0.000015 ,
8254+ "litellm_provider" : " perplexity" ,
8255+ "mode" : " chat"
8256+ },
8257+ "perplexity/sonar" : {
8258+ "max_tokens" : 127072 ,
8259+ "max_input_tokens" : 127072 ,
8260+ "max_output_tokens" : 127072 ,
8261+ "input_cost_per_token" : 0.000001 ,
8262+ "output_cost_per_token" : 0.000001 ,
8263+ "litellm_provider" : " perplexity" ,
8264+ "mode" : " chat"
8265+ },
8266+ "perplexity/sonar-pro" : {
8267+ "max_tokens" : 200000 ,
8268+ "max_input_tokens" : 200000 ,
8269+ "max_output_tokens" : 8096 ,
8270+ "input_cost_per_token" : 0.000003 ,
8271+ "output_cost_per_token" : 0.000015 ,
8272+ "litellm_provider" : " perplexity" ,
8273+ "mode" : " chat"
81748274 },
81758275 "perplexity/pplx-7b-chat" : {
81768276 "max_tokens" : 8192 ,
81798279 "input_cost_per_token" : 0.00000007 ,
81808280 "output_cost_per_token" : 0.00000028 ,
81818281 "litellm_provider" : " perplexity" ,
8182- "mode" : " chat" ,
8183- "supports_tool_choice" : true
8282+ "mode" : " chat"
81848283 },
81858284 "perplexity/pplx-70b-chat" : {
81868285 "max_tokens" : 4096 ,
81898288 "input_cost_per_token" : 0.00000070 ,
81908289 "output_cost_per_token" : 0.00000280 ,
81918290 "litellm_provider" : " perplexity" ,
8192- "mode" : " chat" ,
8193- "supports_tool_choice" : true
8291+ "mode" : " chat"
81948292 },
81958293 "perplexity/pplx-7b-online" : {
81968294 "max_tokens" : 4096 ,
82008298 "output_cost_per_token" : 0.00000028 ,
82018299 "input_cost_per_request" : 0.005 ,
82028300 "litellm_provider" : " perplexity" ,
8203- "mode" : " chat" ,
8204- "supports_tool_choice" : true
8301+ "mode" : " chat"
82058302 },
82068303 "perplexity/pplx-70b-online" : {
82078304 "max_tokens" : 4096 ,
82118308 "output_cost_per_token" : 0.00000280 ,
82128309 "input_cost_per_request" : 0.005 ,
82138310 "litellm_provider" : " perplexity" ,
8214- "mode" : " chat" ,
8215- "supports_tool_choice" : true
8311+ "mode" : " chat"
82168312 },
82178313 "perplexity/llama-2-70b-chat" : {
82188314 "max_tokens" : 4096 ,
82218317 "input_cost_per_token" : 0.00000070 ,
82228318 "output_cost_per_token" : 0.00000280 ,
82238319 "litellm_provider" : " perplexity" ,
8224- "mode" : " chat" ,
8225- "supports_tool_choice" : true
8320+ "mode" : " chat"
82268321 },
82278322 "perplexity/mistral-7b-instruct" : {
82288323 "max_tokens" : 4096 ,
82318326 "input_cost_per_token" : 0.00000007 ,
82328327 "output_cost_per_token" : 0.00000028 ,
82338328 "litellm_provider" : " perplexity" ,
8234- "mode" : " chat" ,
8235- "supports_tool_choice" : true
8329+ "mode" : " chat"
82368330 },
82378331 "perplexity/mixtral-8x7b-instruct" : {
82388332 "max_tokens" : 4096 ,
82418335 "input_cost_per_token" : 0.00000007 ,
82428336 "output_cost_per_token" : 0.00000028 ,
82438337 "litellm_provider" : " perplexity" ,
8244- "mode" : " chat" ,
8245- "supports_tool_choice" : true
8338+ "mode" : " chat"
82468339 },
82478340 "perplexity/sonar-small-chat" : {
82488341 "max_tokens" : 16384 ,
82518344 "input_cost_per_token" : 0.00000007 ,
82528345 "output_cost_per_token" : 0.00000028 ,
82538346 "litellm_provider" : " perplexity" ,
8254- "mode" : " chat" ,
8255- "supports_tool_choice" : true
8347+ "mode" : " chat"
82568348 },
82578349 "perplexity/sonar-small-online" : {
82588350 "max_tokens" : 12000 ,
82628354 "output_cost_per_token" : 0.00000028 ,
82638355 "input_cost_per_request" : 0.005 ,
82648356 "litellm_provider" : " perplexity" ,
8265- "mode" : " chat" ,
8266- "supports_tool_choice" : true
8357+ "mode" : " chat"
82678358 },
82688359 "perplexity/sonar-medium-chat" : {
82698360 "max_tokens" : 16384 ,
82728363 "input_cost_per_token" : 0.0000006 ,
82738364 "output_cost_per_token" : 0.0000018 ,
82748365 "litellm_provider" : " perplexity" ,
8275- "mode" : " chat" ,
8276- "supports_tool_choice" : true
8366+ "mode" : " chat"
82778367 },
82788368 "perplexity/sonar-medium-online" : {
82798369 "max_tokens" : 12000 ,
82838373 "output_cost_per_token" : 0.0000018 ,
82848374 "input_cost_per_request" : 0.005 ,
82858375 "litellm_provider" : " perplexity" ,
8286- "mode" : " chat" ,
8287- "supports_tool_choice" : true
8376+ "mode" : " chat"
82888377 },
82898378 "fireworks_ai/accounts/fireworks/models/llama-v3p2-1b-instruct" : {
82908379 "max_tokens" : 16384 ,
90449133 "output_cost_per_second" : 0.00 ,
90459134 "litellm_provider" : " assemblyai"
90469135 }
9047- }
9136+ }
0 commit comments