88 "input_cache_read_cost_per_mil_tokens" : 0.025 ,
99 "displayName" : " GPT-5 mini" ,
1010 "reasoning" : true ,
11- "max_input_tokens" : 400000 ,
11+ "max_input_tokens" : 272000 ,
1212 "max_output_tokens" : 128000
1313 },
1414 "gpt-5-mini-2025-08-07" : {
2121 "displayName" : " GPT-5 mini (2025-08-07)" ,
2222 "reasoning" : true ,
2323 "parent" : " gpt-5-mini" ,
24- "max_input_tokens" : 400000 ,
24+ "max_input_tokens" : 272000 ,
2525 "max_output_tokens" : 128000
2626 },
2727 "gpt-5" : {
3333 "input_cache_read_cost_per_mil_tokens" : 0.125 ,
3434 "displayName" : " GPT-5" ,
3535 "reasoning" : true ,
36- "max_input_tokens" : 400000 ,
36+ "max_input_tokens" : 272000 ,
3737 "max_output_tokens" : 128000
3838 },
3939 "gpt-5-2025-08-07" : {
4646 "displayName" : " GPT-5 (2025-08-07)" ,
4747 "reasoning" : true ,
4848 "parent" : " gpt-5" ,
49- "max_input_tokens" : 400000 ,
49+ "max_input_tokens" : 272000 ,
5050 "max_output_tokens" : 128000
5151 },
5252 "gpt-5-pro" : {
5757 "output_cost_per_mil_tokens" : 120 ,
5858 "displayName" : " GPT-5 Pro" ,
5959 "reasoning" : true ,
60- "max_input_tokens" : 400000 ,
60+ "max_input_tokens" : 128000 ,
6161 "max_output_tokens" : 272000
6262 },
6363 "gpt-5-pro-2025-10-06" : {
6868 "output_cost_per_mil_tokens" : 120 ,
6969 "reasoning" : true ,
7070 "parent" : " gpt-5-pro" ,
71- "max_input_tokens" : 400000 ,
71+ "max_input_tokens" : 128000 ,
7272 "max_output_tokens" : 272000
7373 },
7474 "gpt-5-codex" : {
8080 "input_cache_read_cost_per_mil_tokens" : 0.125 ,
8181 "displayName" : " GPT-5 Codex" ,
8282 "reasoning" : true ,
83- "max_input_tokens" : 400000 ,
83+ "max_input_tokens" : 272000 ,
8484 "max_output_tokens" : 128000
8585 },
8686 "gpt-5-nano" : {
9292 "input_cache_read_cost_per_mil_tokens" : 0.005 ,
9393 "displayName" : " GPT-5 nano" ,
9494 "reasoning" : true ,
95- "max_input_tokens" : 400000 ,
95+ "max_input_tokens" : 272000 ,
9696 "max_output_tokens" : 128000
9797 },
9898 "gpt-5-nano-2025-08-07" : {
105105 "displayName" : " GPT-5 nano (2025-08-07)" ,
106106 "reasoning" : true ,
107107 "parent" : " gpt-5-nano" ,
108- "max_input_tokens" : 400000 ,
108+ "max_input_tokens" : 272000 ,
109109 "max_output_tokens" : 128000
110110 },
111111 "gpt-5-chat-latest" : {
117117 "input_cache_read_cost_per_mil_tokens" : 0.125 ,
118118 "displayName" : " GPT-5 chat" ,
119119 "reasoning" : true ,
120- "max_input_tokens" : 400000 ,
120+ "max_input_tokens" : 128000 ,
121121 "max_output_tokens" : 16384
122122 },
123123 "gpt-4o" : {
850850 "reasoning_budget" : true ,
851851 "deprecation_date" : " 2025-06-01" ,
852852 "max_input_tokens" : 200000 ,
853- "max_output_tokens" : 128000
853+ "max_output_tokens" : 64000
854854 },
855855 "claude-3-7-sonnet-20250219" : {
856856 "format" : " anthropic" ,
865865 "deprecation_date" : " 2026-02-19" ,
866866 "parent" : " claude-3-7-sonnet-latest" ,
867867 "max_input_tokens" : 200000 ,
868- "max_output_tokens" : 128000
868+ "max_output_tokens" : 64000
869869 },
870870 "claude-haiku-4-5" : {
871871 "format" : " anthropic" ,
974974 "displayName" : " Claude 4.6 Opus" ,
975975 "reasoning" : true ,
976976 "reasoning_budget" : true ,
977- "max_input_tokens" : 200000 ,
977+ "max_input_tokens" : 1000000 ,
978978 "max_output_tokens" : 128000
979979 },
980980 "claude-opus-4-5" : {
23632363 "displayName" : " Gemini 3 Pro (Preview)" ,
23642364 "reasoning" : true ,
23652365 "reasoning_budget" : true ,
2366+ "deprecation_date" : " 2026-03-26" ,
23662367 "max_input_tokens" : 1048576 ,
23672368 "max_output_tokens" : 65535
23682369 },
25612562 "output_cost_per_mil_tokens" : 0.4 ,
25622563 "input_cache_read_cost_per_mil_tokens" : 0.025 ,
25632564 "displayName" : " Gemini 2.0 Flash Latest" ,
2564- "deprecation_date" : " 2026-03-31 " ,
2565+ "deprecation_date" : " 2026-06-01 " ,
25652566 "max_input_tokens" : 1048576 ,
25662567 "max_output_tokens" : 8192
25672568 },
25722573 "input_cost_per_mil_tokens" : 0.15 ,
25732574 "output_cost_per_mil_tokens" : 0.6 ,
25742575 "input_cache_read_cost_per_mil_tokens" : 0.0375 ,
2575- "deprecation_date" : " 2026-03-31 " ,
2576+ "deprecation_date" : " 2026-06-01 " ,
25762577 "parent" : " gemini-2.0-flash" ,
25772578 "max_input_tokens" : 1048576 ,
25782579 "max_output_tokens" : 8192
25852586 "output_cost_per_mil_tokens" : 0.3 ,
25862587 "input_cache_read_cost_per_mil_tokens" : 0.01875 ,
25872588 "displayName" : " Gemini 2.0 Flash-Lite" ,
2588- "deprecation_date" : " 2026-03-31 " ,
2589+ "deprecation_date" : " 2026-06-01 " ,
25892590 "max_input_tokens" : 1048576 ,
25902591 "max_output_tokens" : 8192
25912592 },
25962597 "input_cost_per_mil_tokens" : 0.075 ,
25972598 "output_cost_per_mil_tokens" : 0.3 ,
25982599 "input_cache_read_cost_per_mil_tokens" : 0.01875 ,
2599- "deprecation_date" : " 2026-03-31 " ,
2600+ "deprecation_date" : " 2026-06-01 " ,
26002601 "parent" : " gemini-2.0-flash-lite" ,
26012602 "max_input_tokens" : 1048576 ,
26022603 "max_output_tokens" : 8192
29752976 "output_cost_per_mil_tokens" : 0.5 ,
29762977 "input_cache_read_cost_per_mil_tokens" : 0.075 ,
29772978 "reasoning" : true ,
2979+ "deprecation_date" : " 2026-02-28" ,
29782980 "max_input_tokens" : 131072 ,
29792981 "max_output_tokens" : 131072
29802982 },
29952997 "output_cost_per_mil_tokens" : 0.5 ,
29962998 "input_cache_read_cost_per_mil_tokens" : 0.075 ,
29972999 "reasoning" : true ,
3000+ "deprecation_date" : " 2026-02-28" ,
29983001 "max_input_tokens" : 131072 ,
29993002 "max_output_tokens" : 131072
30003003 },
30723075 "multimodal" : true ,
30733076 "input_cost_per_mil_tokens" : 2 ,
30743077 "output_cost_per_mil_tokens" : 10 ,
3078+ "deprecation_date" : " 2026-02-28" ,
30753079 "parent" : " grok-2-vision" ,
30763080 "max_input_tokens" : 32768 ,
30773081 "max_output_tokens" : 32768
33913395 "input_cache_read_cost_per_mil_tokens" : 0.3 ,
33923396 "input_cache_write_cost_per_mil_tokens" : 3.75 ,
33933397 "displayName" : " Claude 3.5 Sonnet v2" ,
3394- "max_input_tokens" : 200000 ,
3398+ "max_input_tokens" : 1000000 ,
33953399 "max_output_tokens" : 8192
33963400 },
33973401 "us.anthropic.claude-3-5-sonnet-20241022-v2:0" : {
34263430 "multimodal" : true ,
34273431 "input_cost_per_mil_tokens" : 3 ,
34283432 "output_cost_per_mil_tokens" : 15 ,
3433+ "input_cache_read_cost_per_mil_tokens" : 0.3 ,
3434+ "input_cache_write_cost_per_mil_tokens" : 3.75 ,
34293435 "displayName" : " Claude 3.5 Sonnet" ,
3430- "max_input_tokens" : 200000 ,
3436+ "max_input_tokens" : 1000000 ,
34313437 "max_output_tokens" : 4096
34323438 },
34333439 "us.anthropic.claude-3-5-sonnet-20240620-v1:0" : {
34363442 "multimodal" : true ,
34373443 "input_cost_per_mil_tokens" : 3 ,
34383444 "output_cost_per_mil_tokens" : 15 ,
3445+ "input_cache_read_cost_per_mil_tokens" : 0.3 ,
3446+ "input_cache_write_cost_per_mil_tokens" : 3.75 ,
34393447 "displayName" : " US Claude 3.5 Sonnet" ,
34403448 "parent" : " anthropic.claude-3-5-sonnet-20240620-v1:0" ,
34413449 "max_input_tokens" : 200000 ,
34473455 "multimodal" : true ,
34483456 "input_cost_per_mil_tokens" : 3 ,
34493457 "output_cost_per_mil_tokens" : 15 ,
3458+ "input_cache_read_cost_per_mil_tokens" : 0.3 ,
3459+ "input_cache_write_cost_per_mil_tokens" : 3.75 ,
34503460 "displayName" : " APAC Claude 3.5 Sonnet" ,
34513461 "parent" : " anthropic.claude-3-5-sonnet-20240620-v1:0" ,
34523462 "max_input_tokens" : 200000 ,
34583468 "multimodal" : true ,
34593469 "input_cost_per_mil_tokens" : 3 ,
34603470 "output_cost_per_mil_tokens" : 15 ,
3471+ "input_cache_read_cost_per_mil_tokens" : 0.3 ,
3472+ "input_cache_write_cost_per_mil_tokens" : 3.75 ,
34613473 "displayName" : " EU Claude 3.5 Sonnet" ,
34623474 "parent" : " anthropic.claude-3-5-sonnet-20240620-v1:0" ,
34633475 "max_input_tokens" : 200000 ,
35813593 "multimodal" : true ,
35823594 "input_cost_per_mil_tokens" : 15 ,
35833595 "output_cost_per_mil_tokens" : 75 ,
3596+ "input_cache_read_cost_per_mil_tokens" : 1.5 ,
3597+ "input_cache_write_cost_per_mil_tokens" : 18.75 ,
35843598 "displayName" : " Claude 3 Opus" ,
35853599 "max_input_tokens" : 200000 ,
35863600 "max_output_tokens" : 4096
35913605 "multimodal" : true ,
35923606 "input_cost_per_mil_tokens" : 15 ,
35933607 "output_cost_per_mil_tokens" : 75 ,
3608+ "input_cache_read_cost_per_mil_tokens" : 1.5 ,
3609+ "input_cache_write_cost_per_mil_tokens" : 18.75 ,
35943610 "displayName" : " US Claude 3 Opus" ,
35953611 "parent" : " anthropic.claude-3-opus-20240229-v1:0" ,
35963612 "max_input_tokens" : 200000 ,
36023618 "multimodal" : true ,
36033619 "input_cost_per_mil_tokens" : 3 ,
36043620 "output_cost_per_mil_tokens" : 15 ,
3621+ "input_cache_read_cost_per_mil_tokens" : 0.3 ,
3622+ "input_cache_write_cost_per_mil_tokens" : 3.75 ,
36053623 "displayName" : " Claude 3 Sonnet" ,
36063624 "max_input_tokens" : 200000 ,
36073625 "max_output_tokens" : 4096
36123630 "multimodal" : true ,
36133631 "input_cost_per_mil_tokens" : 3 ,
36143632 "output_cost_per_mil_tokens" : 15 ,
3633+ "input_cache_read_cost_per_mil_tokens" : 0.3 ,
3634+ "input_cache_write_cost_per_mil_tokens" : 3.75 ,
36153635 "displayName" : " US Claude 3 Sonnet" ,
36163636 "parent" : " anthropic.claude-3-sonnet-20240229-v1:0" ,
36173637 "max_input_tokens" : 200000 ,
36233643 "multimodal" : true ,
36243644 "input_cost_per_mil_tokens" : 3 ,
36253645 "output_cost_per_mil_tokens" : 15 ,
3646+ "input_cache_read_cost_per_mil_tokens" : 0.3 ,
3647+ "input_cache_write_cost_per_mil_tokens" : 3.75 ,
36263648 "displayName" : " APAC Claude 3 Sonnet" ,
36273649 "parent" : " anthropic.claude-3-sonnet-20240229-v1:0" ,
36283650 "max_input_tokens" : 200000 ,
36343656 "multimodal" : true ,
36353657 "input_cost_per_mil_tokens" : 3 ,
36363658 "output_cost_per_mil_tokens" : 15 ,
3659+ "input_cache_read_cost_per_mil_tokens" : 0.3 ,
3660+ "input_cache_write_cost_per_mil_tokens" : 3.75 ,
36373661 "displayName" : " EU Claude 3 Sonnet" ,
36383662 "parent" : " anthropic.claude-3-sonnet-20240229-v1:0" ,
36393663 "max_input_tokens" : 200000 ,
36453669 "multimodal" : true ,
36463670 "input_cost_per_mil_tokens" : 0.25 ,
36473671 "output_cost_per_mil_tokens" : 1.25 ,
3672+ "input_cache_read_cost_per_mil_tokens" : 0.025 ,
3673+ "input_cache_write_cost_per_mil_tokens" : 0.3125 ,
36483674 "displayName" : " Claude 3 Haiku" ,
36493675 "max_input_tokens" : 200000 ,
36503676 "max_output_tokens" : 4096
36553681 "multimodal" : true ,
36563682 "input_cost_per_mil_tokens" : 0.25 ,
36573683 "output_cost_per_mil_tokens" : 1.25 ,
3684+ "input_cache_read_cost_per_mil_tokens" : 0.025 ,
3685+ "input_cache_write_cost_per_mil_tokens" : 0.3125 ,
36583686 "displayName" : " US Claude 3 Haiku" ,
36593687 "parent" : " anthropic.claude-3-haiku-20240307-v1:0" ,
36603688 "max_input_tokens" : 200000 ,
36663694 "multimodal" : true ,
36673695 "input_cost_per_mil_tokens" : 0.25 ,
36683696 "output_cost_per_mil_tokens" : 1.25 ,
3697+ "input_cache_read_cost_per_mil_tokens" : 0.025 ,
3698+ "input_cache_write_cost_per_mil_tokens" : 0.3125 ,
36693699 "displayName" : " APAC Claude 3 Haiku" ,
36703700 "parent" : " anthropic.claude-3-haiku-20240307-v1:0" ,
36713701 "max_input_tokens" : 200000 ,
36773707 "multimodal" : true ,
36783708 "input_cost_per_mil_tokens" : 0.25 ,
36793709 "output_cost_per_mil_tokens" : 1.25 ,
3710+ "input_cache_read_cost_per_mil_tokens" : 0.025 ,
3711+ "input_cache_write_cost_per_mil_tokens" : 0.3125 ,
36803712 "displayName" : " EU Claude 3 Haiku" ,
36813713 "parent" : " anthropic.claude-3-haiku-20240307-v1:0" ,
36823714 "max_input_tokens" : 200000 ,
39583990 "displayName" : " Gemini 3 Pro Preview" ,
39593991 "reasoning" : true ,
39603992 "reasoning_budget" : true ,
3961- "locations" : [" global" ],
3993+ "locations" : [
3994+ " global"
3995+ ],
39623996 "max_input_tokens" : 1048576 ,
39633997 "max_output_tokens" : 65535
39643998 },
39724006 "displayName" : " Gemini 3 Flash Preview" ,
39734007 "reasoning" : true ,
39744008 "reasoning_budget" : true ,
3975- "locations" : [" global" ],
4009+ "locations" : [
4010+ " global"
4011+ ],
39764012 "max_input_tokens" : 1048576 ,
39774013 "max_output_tokens" : 65535
39784014 },
47114747 "input_cost_per_mil_tokens" : 1.2 ,
47124748 "output_cost_per_mil_tokens" : 1.2 ,
47134749 "input_cache_read_cost_per_mil_tokens" : 0.1 ,
4714- "reasoning" : true ,
47154750 "displayName" : " Kimi K2.5" ,
4751+ "reasoning" : true ,
47164752 "max_input_tokens" : 131072 ,
47174753 "max_output_tokens" : 131072
47184754 },
50165052 "input_cost_per_mil_tokens" : 0.22 ,
50175053 "output_cost_per_mil_tokens" : 0.88 ,
50185054 "displayName" : " Qwen3 235B A22B Instruct 2507" ,
5055+ "locations" : [
5056+ " global" ,
5057+ " us-south1"
5058+ ],
50195059 "max_input_tokens" : 262144 ,
5020- "max_output_tokens" : 16384 ,
5021- "locations" : [" global" , " us-south1" ]
5060+ "max_output_tokens" : 16384
50225061 },
50235062 "accounts/fireworks/models/deepseek-v3p2" : {
50245063 "format" : " openai" ,
50485087 "max_input_tokens" : 131072 ,
50495088 "max_output_tokens" : 131072
50505089 }
5051- }
5090+ }
0 commit comments