Skip to content

Commit 12cbac7

Browse files
Merge pull request #15210 from uc4w6c/feat/add_global_cross_region
feat: add Global Cross-Region Inference
2 parents 077b5e1 + ba0dcfc commit 12cbac7

File tree

3 files changed

+169
-49
lines changed

3 files changed

+169
-49
lines changed

litellm/llms/bedrock/common_utils.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -440,7 +440,7 @@ def _supported_cross_region_inference_region() -> List[str]:
440440
"""
441441
Abbreviations of regions AWS Bedrock supports for cross region inference
442442
"""
443-
return ["us", "eu", "apac", "jp"]
443+
return ["global", "us", "eu", "apac", "jp"]
444444

445445
@staticmethod
446446
def get_bedrock_route(

litellm/model_prices_and_context_window_backup.json

Lines changed: 84 additions & 24 deletions
Original file line numberDiff line numberDiff line change
@@ -7838,19 +7838,19 @@
78387838
"tool_use_system_prompt_tokens": 159
78397839
},
78407840
"eu.anthropic.claude-sonnet-4-5-20250929-v1:0": {
7841-
"cache_creation_input_token_cost": 3.75e-06,
7842-
"cache_read_input_token_cost": 3e-07,
7843-
"input_cost_per_token": 3e-06,
7844-
"input_cost_per_token_above_200k_tokens": 6e-06,
7845-
"output_cost_per_token_above_200k_tokens": 2.25e-05,
7846-
"cache_creation_input_token_cost_above_200k_tokens": 7.5e-06,
7847-
"cache_read_input_token_cost_above_200k_tokens": 6e-07,
7841+
"cache_creation_input_token_cost": 4.125e-06,
7842+
"cache_read_input_token_cost": 3.3e-07,
7843+
"input_cost_per_token": 3.3e-06,
7844+
"input_cost_per_token_above_200k_tokens": 6.6e-06,
7845+
"output_cost_per_token_above_200k_tokens": 2.475e-05,
7846+
"cache_creation_input_token_cost_above_200k_tokens": 8.25e-06,
7847+
"cache_read_input_token_cost_above_200k_tokens": 6.6e-07,
78487848
"litellm_provider": "bedrock_converse",
78497849
"max_input_tokens": 200000,
78507850
"max_output_tokens": 64000,
78517851
"max_tokens": 200000,
78527852
"mode": "chat",
7853-
"output_cost_per_token": 1.5e-05,
7853+
"output_cost_per_token": 1.65e-05,
78547854
"search_context_cost_per_query": {
78557855
"search_context_size_high": 0.01,
78567856
"search_context_size_low": 0.01,
@@ -11820,6 +11820,66 @@
1182011820
"video"
1182111821
]
1182211822
},
11823+
"global.anthropic.claude-sonnet-4-5-20250929-v1:0": {
11824+
"cache_creation_input_token_cost": 3.75e-06,
11825+
"cache_read_input_token_cost": 3e-07,
11826+
"input_cost_per_token": 3e-06,
11827+
"input_cost_per_token_above_200k_tokens": 6e-06,
11828+
"output_cost_per_token_above_200k_tokens": 2.25e-05,
11829+
"cache_creation_input_token_cost_above_200k_tokens": 7.5e-06,
11830+
"cache_read_input_token_cost_above_200k_tokens": 6e-07,
11831+
"litellm_provider": "bedrock_converse",
11832+
"max_input_tokens": 200000,
11833+
"max_output_tokens": 64000,
11834+
"max_tokens": 200000,
11835+
"mode": "chat",
11836+
"output_cost_per_token": 1.5e-05,
11837+
"search_context_cost_per_query": {
11838+
"search_context_size_high": 0.01,
11839+
"search_context_size_low": 0.01,
11840+
"search_context_size_medium": 0.01
11841+
},
11842+
"supports_assistant_prefill": true,
11843+
"supports_computer_use": true,
11844+
"supports_function_calling": true,
11845+
"supports_pdf_input": true,
11846+
"supports_prompt_caching": true,
11847+
"supports_reasoning": true,
11848+
"supports_response_schema": true,
11849+
"supports_tool_choice": true,
11850+
"supports_vision": true,
11851+
"tool_use_system_prompt_tokens": 346
11852+
},
11853+
"global.anthropic.claude-sonnet-4-20250514-v1:0": {
11854+
"cache_creation_input_token_cost": 3.75e-06,
11855+
"cache_read_input_token_cost": 3e-07,
11856+
"input_cost_per_token": 3e-06,
11857+
"input_cost_per_token_above_200k_tokens": 6e-06,
11858+
"output_cost_per_token_above_200k_tokens": 2.25e-05,
11859+
"cache_creation_input_token_cost_above_200k_tokens": 7.5e-06,
11860+
"cache_read_input_token_cost_above_200k_tokens": 6e-07,
11861+
"litellm_provider": "bedrock_converse",
11862+
"max_input_tokens": 1000000,
11863+
"max_output_tokens": 64000,
11864+
"max_tokens": 64000,
11865+
"mode": "chat",
11866+
"output_cost_per_token": 1.5e-05,
11867+
"search_context_cost_per_query": {
11868+
"search_context_size_high": 0.01,
11869+
"search_context_size_low": 0.01,
11870+
"search_context_size_medium": 0.01
11871+
},
11872+
"supports_assistant_prefill": true,
11873+
"supports_computer_use": true,
11874+
"supports_function_calling": true,
11875+
"supports_pdf_input": true,
11876+
"supports_prompt_caching": true,
11877+
"supports_reasoning": true,
11878+
"supports_response_schema": true,
11879+
"supports_tool_choice": true,
11880+
"supports_vision": true,
11881+
"tool_use_system_prompt_tokens": 159
11882+
},
1182311883
"gpt-3.5-turbo": {
1182411884
"input_cost_per_token": 0.5e-06,
1182511885
"litellm_provider": "openai",
@@ -14219,19 +14279,19 @@
1421914279
"output_cost_per_token": 1.8e-08
1422014280
},
1422114281
"jp.anthropic.claude-sonnet-4-5-20250929-v1:0": {
14222-
"cache_creation_input_token_cost": 3.75e-06,
14223-
"cache_read_input_token_cost": 3e-07,
14224-
"input_cost_per_token": 3e-06,
14225-
"input_cost_per_token_above_200k_tokens": 6e-06,
14226-
"output_cost_per_token_above_200k_tokens": 2.25e-05,
14227-
"cache_creation_input_token_cost_above_200k_tokens": 7.5e-06,
14228-
"cache_read_input_token_cost_above_200k_tokens": 6e-07,
14282+
"cache_creation_input_token_cost": 4.125e-06,
14283+
"cache_read_input_token_cost": 3.3e-07,
14284+
"input_cost_per_token": 3.3e-06,
14285+
"input_cost_per_token_above_200k_tokens": 6.6e-06,
14286+
"output_cost_per_token_above_200k_tokens": 2.475e-05,
14287+
"cache_creation_input_token_cost_above_200k_tokens": 8.25e-06,
14288+
"cache_read_input_token_cost_above_200k_tokens": 6.6e-07,
1422914289
"litellm_provider": "bedrock_converse",
1423014290
"max_input_tokens": 200000,
1423114291
"max_output_tokens": 64000,
1423214292
"max_tokens": 200000,
1423314293
"mode": "chat",
14234-
"output_cost_per_token": 1.5e-05,
14294+
"output_cost_per_token": 1.65e-05,
1423514295
"search_context_cost_per_query": {
1423614296
"search_context_size_high": 0.01,
1423714297
"search_context_size_low": 0.01,
@@ -19848,19 +19908,19 @@
1984819908
"tool_use_system_prompt_tokens": 159
1984919909
},
1985019910
"us.anthropic.claude-sonnet-4-5-20250929-v1:0": {
19851-
"cache_creation_input_token_cost": 3.75e-06,
19852-
"cache_read_input_token_cost": 3e-07,
19853-
"input_cost_per_token": 3e-06,
19854-
"input_cost_per_token_above_200k_tokens": 6e-06,
19855-
"output_cost_per_token_above_200k_tokens": 2.25e-05,
19856-
"cache_creation_input_token_cost_above_200k_tokens": 7.5e-06,
19857-
"cache_read_input_token_cost_above_200k_tokens": 6e-07,
19911+
"cache_creation_input_token_cost": 4.125e-06,
19912+
"cache_read_input_token_cost": 3.3e-07,
19913+
"input_cost_per_token": 3.3e-06,
19914+
"input_cost_per_token_above_200k_tokens": 6.6e-06,
19915+
"output_cost_per_token_above_200k_tokens": 2.475e-05,
19916+
"cache_creation_input_token_cost_above_200k_tokens": 8.25e-06,
19917+
"cache_read_input_token_cost_above_200k_tokens": 6.6e-07,
1985819918
"litellm_provider": "bedrock_converse",
1985919919
"max_input_tokens": 200000,
1986019920
"max_output_tokens": 64000,
1986119921
"max_tokens": 200000,
1986219922
"mode": "chat",
19863-
"output_cost_per_token": 1.5e-05,
19923+
"output_cost_per_token": 1.65e-05,
1986419924
"search_context_cost_per_query": {
1986519925
"search_context_size_high": 0.01,
1986619926
"search_context_size_low": 0.01,

model_prices_and_context_window.json

Lines changed: 84 additions & 24 deletions
Original file line numberDiff line numberDiff line change
@@ -7838,19 +7838,19 @@
78387838
"tool_use_system_prompt_tokens": 159
78397839
},
78407840
"eu.anthropic.claude-sonnet-4-5-20250929-v1:0": {
7841-
"cache_creation_input_token_cost": 3.75e-06,
7842-
"cache_read_input_token_cost": 3e-07,
7843-
"input_cost_per_token": 3e-06,
7844-
"input_cost_per_token_above_200k_tokens": 6e-06,
7845-
"output_cost_per_token_above_200k_tokens": 2.25e-05,
7846-
"cache_creation_input_token_cost_above_200k_tokens": 7.5e-06,
7847-
"cache_read_input_token_cost_above_200k_tokens": 6e-07,
7841+
"cache_creation_input_token_cost": 4.125e-06,
7842+
"cache_read_input_token_cost": 3.3e-07,
7843+
"input_cost_per_token": 3.3e-06,
7844+
"input_cost_per_token_above_200k_tokens": 6.6e-06,
7845+
"output_cost_per_token_above_200k_tokens": 2.475e-05,
7846+
"cache_creation_input_token_cost_above_200k_tokens": 8.25e-06,
7847+
"cache_read_input_token_cost_above_200k_tokens": 6.6e-07,
78487848
"litellm_provider": "bedrock_converse",
78497849
"max_input_tokens": 200000,
78507850
"max_output_tokens": 64000,
78517851
"max_tokens": 200000,
78527852
"mode": "chat",
7853-
"output_cost_per_token": 1.5e-05,
7853+
"output_cost_per_token": 1.65e-05,
78547854
"search_context_cost_per_query": {
78557855
"search_context_size_high": 0.01,
78567856
"search_context_size_low": 0.01,
@@ -11820,6 +11820,66 @@
1182011820
"video"
1182111821
]
1182211822
},
11823+
"global.anthropic.claude-sonnet-4-5-20250929-v1:0": {
11824+
"cache_creation_input_token_cost": 3.75e-06,
11825+
"cache_read_input_token_cost": 3e-07,
11826+
"input_cost_per_token": 3e-06,
11827+
"input_cost_per_token_above_200k_tokens": 6e-06,
11828+
"output_cost_per_token_above_200k_tokens": 2.25e-05,
11829+
"cache_creation_input_token_cost_above_200k_tokens": 7.5e-06,
11830+
"cache_read_input_token_cost_above_200k_tokens": 6e-07,
11831+
"litellm_provider": "bedrock_converse",
11832+
"max_input_tokens": 200000,
11833+
"max_output_tokens": 64000,
11834+
"max_tokens": 200000,
11835+
"mode": "chat",
11836+
"output_cost_per_token": 1.5e-05,
11837+
"search_context_cost_per_query": {
11838+
"search_context_size_high": 0.01,
11839+
"search_context_size_low": 0.01,
11840+
"search_context_size_medium": 0.01
11841+
},
11842+
"supports_assistant_prefill": true,
11843+
"supports_computer_use": true,
11844+
"supports_function_calling": true,
11845+
"supports_pdf_input": true,
11846+
"supports_prompt_caching": true,
11847+
"supports_reasoning": true,
11848+
"supports_response_schema": true,
11849+
"supports_tool_choice": true,
11850+
"supports_vision": true,
11851+
"tool_use_system_prompt_tokens": 346
11852+
},
11853+
"global.anthropic.claude-sonnet-4-20250514-v1:0": {
11854+
"cache_creation_input_token_cost": 3.75e-06,
11855+
"cache_read_input_token_cost": 3e-07,
11856+
"input_cost_per_token": 3e-06,
11857+
"input_cost_per_token_above_200k_tokens": 6e-06,
11858+
"output_cost_per_token_above_200k_tokens": 2.25e-05,
11859+
"cache_creation_input_token_cost_above_200k_tokens": 7.5e-06,
11860+
"cache_read_input_token_cost_above_200k_tokens": 6e-07,
11861+
"litellm_provider": "bedrock_converse",
11862+
"max_input_tokens": 1000000,
11863+
"max_output_tokens": 64000,
11864+
"max_tokens": 64000,
11865+
"mode": "chat",
11866+
"output_cost_per_token": 1.5e-05,
11867+
"search_context_cost_per_query": {
11868+
"search_context_size_high": 0.01,
11869+
"search_context_size_low": 0.01,
11870+
"search_context_size_medium": 0.01
11871+
},
11872+
"supports_assistant_prefill": true,
11873+
"supports_computer_use": true,
11874+
"supports_function_calling": true,
11875+
"supports_pdf_input": true,
11876+
"supports_prompt_caching": true,
11877+
"supports_reasoning": true,
11878+
"supports_response_schema": true,
11879+
"supports_tool_choice": true,
11880+
"supports_vision": true,
11881+
"tool_use_system_prompt_tokens": 159
11882+
},
1182311883
"gpt-3.5-turbo": {
1182411884
"input_cost_per_token": 0.5e-06,
1182511885
"litellm_provider": "openai",
@@ -14266,19 +14326,19 @@
1426614326
"output_cost_per_token": 1.8e-08
1426714327
},
1426814328
"jp.anthropic.claude-sonnet-4-5-20250929-v1:0": {
14269-
"cache_creation_input_token_cost": 3.75e-06,
14270-
"cache_read_input_token_cost": 3e-07,
14271-
"input_cost_per_token": 3e-06,
14272-
"input_cost_per_token_above_200k_tokens": 6e-06,
14273-
"output_cost_per_token_above_200k_tokens": 2.25e-05,
14274-
"cache_creation_input_token_cost_above_200k_tokens": 7.5e-06,
14275-
"cache_read_input_token_cost_above_200k_tokens": 6e-07,
14329+
"cache_creation_input_token_cost": 4.125e-06,
14330+
"cache_read_input_token_cost": 3.3e-07,
14331+
"input_cost_per_token": 3.3e-06,
14332+
"input_cost_per_token_above_200k_tokens": 6.6e-06,
14333+
"output_cost_per_token_above_200k_tokens": 2.475e-05,
14334+
"cache_creation_input_token_cost_above_200k_tokens": 8.25e-06,
14335+
"cache_read_input_token_cost_above_200k_tokens": 6.6e-07,
1427614336
"litellm_provider": "bedrock_converse",
1427714337
"max_input_tokens": 200000,
1427814338
"max_output_tokens": 64000,
1427914339
"max_tokens": 200000,
1428014340
"mode": "chat",
14281-
"output_cost_per_token": 1.5e-05,
14341+
"output_cost_per_token": 1.65e-05,
1428214342
"search_context_cost_per_query": {
1428314343
"search_context_size_high": 0.01,
1428414344
"search_context_size_low": 0.01,
@@ -19943,19 +20003,19 @@
1994320003
"tool_use_system_prompt_tokens": 159
1994420004
},
1994520005
"us.anthropic.claude-sonnet-4-5-20250929-v1:0": {
19946-
"cache_creation_input_token_cost": 3.75e-06,
19947-
"cache_read_input_token_cost": 3e-07,
19948-
"input_cost_per_token": 3e-06,
19949-
"input_cost_per_token_above_200k_tokens": 6e-06,
19950-
"output_cost_per_token_above_200k_tokens": 2.25e-05,
19951-
"cache_creation_input_token_cost_above_200k_tokens": 7.5e-06,
19952-
"cache_read_input_token_cost_above_200k_tokens": 6e-07,
20006+
"cache_creation_input_token_cost": 4.125e-06,
20007+
"cache_read_input_token_cost": 3.3e-07,
20008+
"input_cost_per_token": 3.3e-06,
20009+
"input_cost_per_token_above_200k_tokens": 6.6e-06,
20010+
"output_cost_per_token_above_200k_tokens": 2.475e-05,
20011+
"cache_creation_input_token_cost_above_200k_tokens": 8.25e-06,
20012+
"cache_read_input_token_cost_above_200k_tokens": 6.6e-07,
1995320013
"litellm_provider": "bedrock_converse",
1995420014
"max_input_tokens": 200000,
1995520015
"max_output_tokens": 64000,
1995620016
"max_tokens": 200000,
1995720017
"mode": "chat",
19958-
"output_cost_per_token": 1.5e-05,
20018+
"output_cost_per_token": 1.65e-05,
1995920019
"search_context_cost_per_query": {
1996020020
"search_context_size_high": 0.01,
1996120021
"search_context_size_low": 0.01,

0 commit comments

Comments
 (0)