Anirudh Esthuri committed on
Commit
9b52469
·
1 Parent(s): 4a34f6e

Read inference profile ARNs from environment variables (secrets)

Browse files
Files changed (1) hide show
  1. model_config.py +18 -5
model_config.py CHANGED
@@ -33,8 +33,21 @@ MODEL_DISPLAY_NAMES = {
33
  MODEL_CHOICES = [model for models in PROVIDER_MODEL_MAP.values() for model in models]
34
 
35
  # Inference profile ARNs for provisioned throughput models
36
- MODEL_TO_INFERENCE_PROFILE_ARN = {
37
- "anthropic.claude-haiku-4-5-20251001-v1:0": "arn:aws:bedrock:us-east-1:850995563530:inference-profile/global.anthropic.claude-haiku-4-5-20251001-v1:0",
38
- "anthropic.claude-sonnet-4-5-20250929-v1:0": "arn:aws:bedrock:us-east-1:850995563530:inference-profile/global.anthropic.claude-sonnet-4-5-20250929-v1:0",
39
- "anthropic.claude-opus-4-20250514-v1:0": "arn:aws:bedrock:us-east-1:850995563530:inference-profile/global.anthropic.claude-sonnet-4-20250514-v1:0",
40
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  MODEL_CHOICES = [model for models in PROVIDER_MODEL_MAP.values() for model in models]
34
 
35
  # Inference profile ARNs for provisioned throughput models
36
+ # Read from environment variables (Hugging Face secrets)
37
+ import os
38
+
39
+ MODEL_TO_INFERENCE_PROFILE_ARN = {}
40
+ # Claude Haiku 4.5
41
+ haiku_arn = os.getenv("BEDROCK_HAIKU_4_5_ARN", "").strip()
42
+ if haiku_arn:
43
+ MODEL_TO_INFERENCE_PROFILE_ARN["anthropic.claude-haiku-4-5-20251001-v1:0"] = haiku_arn
44
+
45
+ # Claude Sonnet 4.5
46
+ sonnet_arn = os.getenv("BEDROCK_SONNET_4_5_ARN", "").strip()
47
+ if sonnet_arn:
48
+ MODEL_TO_INFERENCE_PROFILE_ARN["anthropic.claude-sonnet-4-5-20250929-v1:0"] = sonnet_arn
49
+
50
+ # Claude Opus 4
51
+ opus_arn = os.getenv("BEDROCK_OPUS_4_ARN", "").strip()
52
+ if opus_arn:
53
+ MODEL_TO_INFERENCE_PROFILE_ARN["anthropic.claude-opus-4-20250514-v1:0"] = opus_arn