Skip to content

Commit ee0ea6d

Browse files
authored
Update model_list.json (#406)
Doing an update with the existing script before I update the script to add providers to model_list.json. This way the two changes are separated.
1 parent cb9a4a5 commit ee0ea6d

2 files changed

Lines changed: 65 additions & 26 deletions

File tree

packages/proxy/schema/model_list.json

Lines changed: 63 additions & 24 deletions
Original file line number | Diff line number | Diff line change
@@ -8,7 +8,7 @@
88
"input_cache_read_cost_per_mil_tokens": 0.025,
99
"displayName": "GPT-5 mini",
1010
"reasoning": true,
11-
"max_input_tokens": 400000,
11+
"max_input_tokens": 272000,
1212
"max_output_tokens": 128000
1313
},
1414
"gpt-5-mini-2025-08-07": {
@@ -21,7 +21,7 @@
2121
"displayName": "GPT-5 mini (2025-08-07)",
2222
"reasoning": true,
2323
"parent": "gpt-5-mini",
24-
"max_input_tokens": 400000,
24+
"max_input_tokens": 272000,
2525
"max_output_tokens": 128000
2626
},
2727
"gpt-5": {
@@ -33,7 +33,7 @@
3333
"input_cache_read_cost_per_mil_tokens": 0.125,
3434
"displayName": "GPT-5",
3535
"reasoning": true,
36-
"max_input_tokens": 400000,
36+
"max_input_tokens": 272000,
3737
"max_output_tokens": 128000
3838
},
3939
"gpt-5-2025-08-07": {
@@ -46,7 +46,7 @@
4646
"displayName": "GPT-5 (2025-08-07)",
4747
"reasoning": true,
4848
"parent": "gpt-5",
49-
"max_input_tokens": 400000,
49+
"max_input_tokens": 272000,
5050
"max_output_tokens": 128000
5151
},
5252
"gpt-5-pro": {
@@ -57,7 +57,7 @@
5757
"output_cost_per_mil_tokens": 120,
5858
"displayName": "GPT-5 Pro",
5959
"reasoning": true,
60-
"max_input_tokens": 400000,
60+
"max_input_tokens": 128000,
6161
"max_output_tokens": 272000
6262
},
6363
"gpt-5-pro-2025-10-06": {
@@ -68,7 +68,7 @@
6868
"output_cost_per_mil_tokens": 120,
6969
"reasoning": true,
7070
"parent": "gpt-5-pro",
71-
"max_input_tokens": 400000,
71+
"max_input_tokens": 128000,
7272
"max_output_tokens": 272000
7373
},
7474
"gpt-5-codex": {
@@ -80,7 +80,7 @@
8080
"input_cache_read_cost_per_mil_tokens": 0.125,
8181
"displayName": "GPT-5 Codex",
8282
"reasoning": true,
83-
"max_input_tokens": 400000,
83+
"max_input_tokens": 272000,
8484
"max_output_tokens": 128000
8585
},
8686
"gpt-5-nano": {
@@ -92,7 +92,7 @@
9292
"input_cache_read_cost_per_mil_tokens": 0.005,
9393
"displayName": "GPT-5 nano",
9494
"reasoning": true,
95-
"max_input_tokens": 400000,
95+
"max_input_tokens": 272000,
9696
"max_output_tokens": 128000
9797
},
9898
"gpt-5-nano-2025-08-07": {
@@ -105,7 +105,7 @@
105105
"displayName": "GPT-5 nano (2025-08-07)",
106106
"reasoning": true,
107107
"parent": "gpt-5-nano",
108-
"max_input_tokens": 400000,
108+
"max_input_tokens": 272000,
109109
"max_output_tokens": 128000
110110
},
111111
"gpt-5-chat-latest": {
@@ -117,7 +117,7 @@
117117
"input_cache_read_cost_per_mil_tokens": 0.125,
118118
"displayName": "GPT-5 chat",
119119
"reasoning": true,
120-
"max_input_tokens": 400000,
120+
"max_input_tokens": 128000,
121121
"max_output_tokens": 16384
122122
},
123123
"gpt-4o": {
@@ -850,7 +850,7 @@
850850
"reasoning_budget": true,
851851
"deprecation_date": "2025-06-01",
852852
"max_input_tokens": 200000,
853-
"max_output_tokens": 128000
853+
"max_output_tokens": 64000
854854
},
855855
"claude-3-7-sonnet-20250219": {
856856
"format": "anthropic",
@@ -865,7 +865,7 @@
865865
"deprecation_date": "2026-02-19",
866866
"parent": "claude-3-7-sonnet-latest",
867867
"max_input_tokens": 200000,
868-
"max_output_tokens": 128000
868+
"max_output_tokens": 64000
869869
},
870870
"claude-haiku-4-5": {
871871
"format": "anthropic",
@@ -974,7 +974,7 @@
974974
"displayName": "Claude 4.6 Opus",
975975
"reasoning": true,
976976
"reasoning_budget": true,
977-
"max_input_tokens": 200000,
977+
"max_input_tokens": 1000000,
978978
"max_output_tokens": 128000
979979
},
980980
"claude-opus-4-5": {
@@ -2389,6 +2389,7 @@
23892389
"displayName": "Gemini 3 Pro (Preview)",
23902390
"reasoning": true,
23912391
"reasoning_budget": true,
2392+
"deprecation_date": "2026-03-26",
23922393
"max_input_tokens": 1048576,
23932394
"max_output_tokens": 65535
23942395
},
@@ -2587,7 +2588,7 @@
25872588
"output_cost_per_mil_tokens": 0.4,
25882589
"input_cache_read_cost_per_mil_tokens": 0.025,
25892590
"displayName": "Gemini 2.0 Flash Latest",
2590-
"deprecation_date": "2026-03-31",
2591+
"deprecation_date": "2026-06-01",
25912592
"max_input_tokens": 1048576,
25922593
"max_output_tokens": 8192
25932594
},
@@ -2598,7 +2599,7 @@
25982599
"input_cost_per_mil_tokens": 0.15,
25992600
"output_cost_per_mil_tokens": 0.6,
26002601
"input_cache_read_cost_per_mil_tokens": 0.0375,
2601-
"deprecation_date": "2026-03-31",
2602+
"deprecation_date": "2026-06-01",
26022603
"parent": "gemini-2.0-flash",
26032604
"max_input_tokens": 1048576,
26042605
"max_output_tokens": 8192
@@ -2611,7 +2612,7 @@
26112612
"output_cost_per_mil_tokens": 0.3,
26122613
"input_cache_read_cost_per_mil_tokens": 0.01875,
26132614
"displayName": "Gemini 2.0 Flash-Lite",
2614-
"deprecation_date": "2026-03-31",
2615+
"deprecation_date": "2026-06-01",
26152616
"max_input_tokens": 1048576,
26162617
"max_output_tokens": 8192
26172618
},
@@ -2622,7 +2623,7 @@
26222623
"input_cost_per_mil_tokens": 0.075,
26232624
"output_cost_per_mil_tokens": 0.3,
26242625
"input_cache_read_cost_per_mil_tokens": 0.01875,
2625-
"deprecation_date": "2026-03-31",
2626+
"deprecation_date": "2026-06-01",
26262627
"parent": "gemini-2.0-flash-lite",
26272628
"max_input_tokens": 1048576,
26282629
"max_output_tokens": 8192
@@ -3001,6 +3002,7 @@
30013002
"output_cost_per_mil_tokens": 0.5,
30023003
"input_cache_read_cost_per_mil_tokens": 0.075,
30033004
"reasoning": true,
3005+
"deprecation_date": "2026-02-28",
30043006
"max_input_tokens": 131072,
30053007
"max_output_tokens": 131072
30063008
},
@@ -3021,6 +3023,7 @@
30213023
"output_cost_per_mil_tokens": 0.5,
30223024
"input_cache_read_cost_per_mil_tokens": 0.075,
30233025
"reasoning": true,
3026+
"deprecation_date": "2026-02-28",
30243027
"max_input_tokens": 131072,
30253028
"max_output_tokens": 131072
30263029
},
@@ -3098,6 +3101,7 @@
30983101
"multimodal": true,
30993102
"input_cost_per_mil_tokens": 2,
31003103
"output_cost_per_mil_tokens": 10,
3104+
"deprecation_date": "2026-02-28",
31013105
"parent": "grok-2-vision",
31023106
"max_input_tokens": 32768,
31033107
"max_output_tokens": 32768
@@ -3417,7 +3421,7 @@
34173421
"input_cache_read_cost_per_mil_tokens": 0.3,
34183422
"input_cache_write_cost_per_mil_tokens": 3.75,
34193423
"displayName": "Claude 3.5 Sonnet v2",
3420-
"max_input_tokens": 200000,
3424+
"max_input_tokens": 1000000,
34213425
"max_output_tokens": 8192
34223426
},
34233427
"us.anthropic.claude-3-5-sonnet-20241022-v2:0": {
@@ -3452,8 +3456,10 @@
34523456
"multimodal": true,
34533457
"input_cost_per_mil_tokens": 3,
34543458
"output_cost_per_mil_tokens": 15,
3459+
"input_cache_read_cost_per_mil_tokens": 0.3,
3460+
"input_cache_write_cost_per_mil_tokens": 3.75,
34553461
"displayName": "Claude 3.5 Sonnet",
3456-
"max_input_tokens": 200000,
3462+
"max_input_tokens": 1000000,
34573463
"max_output_tokens": 4096
34583464
},
34593465
"us.anthropic.claude-3-5-sonnet-20240620-v1:0": {
@@ -3462,6 +3468,8 @@
34623468
"multimodal": true,
34633469
"input_cost_per_mil_tokens": 3,
34643470
"output_cost_per_mil_tokens": 15,
3471+
"input_cache_read_cost_per_mil_tokens": 0.3,
3472+
"input_cache_write_cost_per_mil_tokens": 3.75,
34653473
"displayName": "US Claude 3.5 Sonnet",
34663474
"parent": "anthropic.claude-3-5-sonnet-20240620-v1:0",
34673475
"max_input_tokens": 200000,
@@ -3473,6 +3481,8 @@
34733481
"multimodal": true,
34743482
"input_cost_per_mil_tokens": 3,
34753483
"output_cost_per_mil_tokens": 15,
3484+
"input_cache_read_cost_per_mil_tokens": 0.3,
3485+
"input_cache_write_cost_per_mil_tokens": 3.75,
34763486
"displayName": "APAC Claude 3.5 Sonnet",
34773487
"parent": "anthropic.claude-3-5-sonnet-20240620-v1:0",
34783488
"max_input_tokens": 200000,
@@ -3484,6 +3494,8 @@
34843494
"multimodal": true,
34853495
"input_cost_per_mil_tokens": 3,
34863496
"output_cost_per_mil_tokens": 15,
3497+
"input_cache_read_cost_per_mil_tokens": 0.3,
3498+
"input_cache_write_cost_per_mil_tokens": 3.75,
34873499
"displayName": "EU Claude 3.5 Sonnet",
34883500
"parent": "anthropic.claude-3-5-sonnet-20240620-v1:0",
34893501
"max_input_tokens": 200000,
@@ -3607,6 +3619,8 @@
36073619
"multimodal": true,
36083620
"input_cost_per_mil_tokens": 15,
36093621
"output_cost_per_mil_tokens": 75,
3622+
"input_cache_read_cost_per_mil_tokens": 1.5,
3623+
"input_cache_write_cost_per_mil_tokens": 18.75,
36103624
"displayName": "Claude 3 Opus",
36113625
"max_input_tokens": 200000,
36123626
"max_output_tokens": 4096
@@ -3617,6 +3631,8 @@
36173631
"multimodal": true,
36183632
"input_cost_per_mil_tokens": 15,
36193633
"output_cost_per_mil_tokens": 75,
3634+
"input_cache_read_cost_per_mil_tokens": 1.5,
3635+
"input_cache_write_cost_per_mil_tokens": 18.75,
36203636
"displayName": "US Claude 3 Opus",
36213637
"parent": "anthropic.claude-3-opus-20240229-v1:0",
36223638
"max_input_tokens": 200000,
@@ -3628,6 +3644,8 @@
36283644
"multimodal": true,
36293645
"input_cost_per_mil_tokens": 3,
36303646
"output_cost_per_mil_tokens": 15,
3647+
"input_cache_read_cost_per_mil_tokens": 0.3,
3648+
"input_cache_write_cost_per_mil_tokens": 3.75,
36313649
"displayName": "Claude 3 Sonnet",
36323650
"max_input_tokens": 200000,
36333651
"max_output_tokens": 4096
@@ -3638,6 +3656,8 @@
36383656
"multimodal": true,
36393657
"input_cost_per_mil_tokens": 3,
36403658
"output_cost_per_mil_tokens": 15,
3659+
"input_cache_read_cost_per_mil_tokens": 0.3,
3660+
"input_cache_write_cost_per_mil_tokens": 3.75,
36413661
"displayName": "US Claude 3 Sonnet",
36423662
"parent": "anthropic.claude-3-sonnet-20240229-v1:0",
36433663
"max_input_tokens": 200000,
@@ -3649,6 +3669,8 @@
36493669
"multimodal": true,
36503670
"input_cost_per_mil_tokens": 3,
36513671
"output_cost_per_mil_tokens": 15,
3672+
"input_cache_read_cost_per_mil_tokens": 0.3,
3673+
"input_cache_write_cost_per_mil_tokens": 3.75,
36523674
"displayName": "APAC Claude 3 Sonnet",
36533675
"parent": "anthropic.claude-3-sonnet-20240229-v1:0",
36543676
"max_input_tokens": 200000,
@@ -3660,6 +3682,8 @@
36603682
"multimodal": true,
36613683
"input_cost_per_mil_tokens": 3,
36623684
"output_cost_per_mil_tokens": 15,
3685+
"input_cache_read_cost_per_mil_tokens": 0.3,
3686+
"input_cache_write_cost_per_mil_tokens": 3.75,
36633687
"displayName": "EU Claude 3 Sonnet",
36643688
"parent": "anthropic.claude-3-sonnet-20240229-v1:0",
36653689
"max_input_tokens": 200000,
@@ -3671,6 +3695,8 @@
36713695
"multimodal": true,
36723696
"input_cost_per_mil_tokens": 0.25,
36733697
"output_cost_per_mil_tokens": 1.25,
3698+
"input_cache_read_cost_per_mil_tokens": 0.025,
3699+
"input_cache_write_cost_per_mil_tokens": 0.3125,
36743700
"displayName": "Claude 3 Haiku",
36753701
"max_input_tokens": 200000,
36763702
"max_output_tokens": 4096
@@ -3681,6 +3707,8 @@
36813707
"multimodal": true,
36823708
"input_cost_per_mil_tokens": 0.25,
36833709
"output_cost_per_mil_tokens": 1.25,
3710+
"input_cache_read_cost_per_mil_tokens": 0.025,
3711+
"input_cache_write_cost_per_mil_tokens": 0.3125,
36843712
"displayName": "US Claude 3 Haiku",
36853713
"parent": "anthropic.claude-3-haiku-20240307-v1:0",
36863714
"max_input_tokens": 200000,
@@ -3692,6 +3720,8 @@
36923720
"multimodal": true,
36933721
"input_cost_per_mil_tokens": 0.25,
36943722
"output_cost_per_mil_tokens": 1.25,
3723+
"input_cache_read_cost_per_mil_tokens": 0.025,
3724+
"input_cache_write_cost_per_mil_tokens": 0.3125,
36953725
"displayName": "APAC Claude 3 Haiku",
36963726
"parent": "anthropic.claude-3-haiku-20240307-v1:0",
36973727
"max_input_tokens": 200000,
@@ -3703,6 +3733,8 @@
37033733
"multimodal": true,
37043734
"input_cost_per_mil_tokens": 0.25,
37053735
"output_cost_per_mil_tokens": 1.25,
3736+
"input_cache_read_cost_per_mil_tokens": 0.025,
3737+
"input_cache_write_cost_per_mil_tokens": 0.3125,
37063738
"displayName": "EU Claude 3 Haiku",
37073739
"parent": "anthropic.claude-3-haiku-20240307-v1:0",
37083740
"max_input_tokens": 200000,
@@ -4012,7 +4044,9 @@
40124044
"displayName": "Gemini 3 Pro Preview",
40134045
"reasoning": true,
40144046
"reasoning_budget": true,
4015-
"locations": ["global"],
4047+
"locations": [
4048+
"global"
4049+
],
40164050
"max_input_tokens": 1048576,
40174051
"max_output_tokens": 65535
40184052
},
@@ -4026,7 +4060,9 @@
40264060
"displayName": "Gemini 3 Flash Preview",
40274061
"reasoning": true,
40284062
"reasoning_budget": true,
4029-
"locations": ["global"],
4063+
"locations": [
4064+
"global"
4065+
],
40304066
"max_input_tokens": 1048576,
40314067
"max_output_tokens": 65535
40324068
},
@@ -4765,8 +4801,8 @@
47654801
"input_cost_per_mil_tokens": 1.2,
47664802
"output_cost_per_mil_tokens": 1.2,
47674803
"input_cache_read_cost_per_mil_tokens": 0.1,
4768-
"reasoning": true,
47694804
"displayName": "Kimi K2.5",
4805+
"reasoning": true,
47704806
"max_input_tokens": 131072,
47714807
"max_output_tokens": 131072
47724808
},
@@ -5070,9 +5106,12 @@
50705106
"input_cost_per_mil_tokens": 0.22,
50715107
"output_cost_per_mil_tokens": 0.88,
50725108
"displayName": "Qwen3 235B A22B Instruct 2507",
5109+
"locations": [
5110+
"global",
5111+
"us-south1"
5112+
],
50735113
"max_input_tokens": 262144,
5074-
"max_output_tokens": 16384,
5075-
"locations": ["global", "us-south1"]
5114+
"max_output_tokens": 16384
50765115
},
50775116
"accounts/fireworks/models/deepseek-v3p2": {
50785117
"format": "openai",

packages/proxy/scripts/sync_models.ts

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1195,7 +1195,7 @@ async function updateModelsCommand(argv: any) {
11951195

11961196
await fs.promises.writeFile(
11971197
LOCAL_MODEL_LIST_PATH,
1198-
JSON.stringify(orderedModelsToWrite, null, 2), // Use the reordered models
1198+
JSON.stringify(orderedModelsToWrite, null, 2) + "\n", // Use the reordered models
11991199
);
12001200
console.log(
12011201
`\nLocal model_list.json has been updated with new model information (pricing, token limits) and keys ordered according to schema.`,
@@ -1414,7 +1414,7 @@ async function addModelsCommand(argv: any) {
14141414

14151415
await fs.promises.writeFile(
14161416
LOCAL_MODEL_LIST_PATH,
1417-
JSON.stringify(orderedModelsToWrite, null, 2),
1417+
JSON.stringify(orderedModelsToWrite, null, 2) + "\n",
14181418
);
14191419
console.log(
14201420
`\n✅ Successfully added ${missingInLocal.length} models to ${LOCAL_MODEL_LIST_PATH}`,

0 commit comments

Comments
 (0)