File size: 599 Bytes
b521314
 
 
 
 
984e3c2
b521314
 
984e3c2
1a6672d
b521314
984e3c2
b521314
1a6672d
984e3c2
b521314
 
984e3c2
b521314
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
# Primary: Qwen2.5-Coder-32B via HuggingFace (AMD hackathon Qwen prize eligible)
# NOTE(review): USE_QWEN presumably switches this backend on/off — confirm against the config loader.
USE_QWEN=true
# Placeholder value: replace with your own Hugging Face access token. Never commit a real token.
QWEN_API_KEY=hf_your_token_here
# Model ID. The same ID is embedded in QWEN_BASE_URL below, so change both together.
QWEN_MODEL=Qwen/Qwen2.5-Coder-32B-Instruct
# NOTE(review): the /v1 suffix suggests an OpenAI-compatible endpoint — verify that this
# host and path are still the ones Hugging Face serves before relying on them.
QWEN_BASE_URL=https://api-inference.huggingface.co/models/Qwen/Qwen2.5-Coder-32B-Instruct/v1

# Fallback: Groq LLaMA (when Qwen unavailable)
# NOTE(review): how "unavailable" is detected is not visible in this file — confirm in the client code.
# Placeholder value: replace with your own Groq API key. Never commit a real key.
GROQ_API_KEY=your_groq_key
# Model name requested from Groq when the fallback is used.
GROQ_MODEL=llama-3.3-70b-versatile

# AMD DevCloud production (vLLM on MI300X)
# Disabled by default: uncomment the three lines below and replace the
# placeholder host "your-amd-cloud" with the real server address to enable.
# NOTE(review): precedence relative to USE_QWEN is not visible here — confirm in the config loader.
# USE_VLLM=true
# VLLM_BASE_URL=http://your-amd-cloud:8000/v1
# VLLM_MODEL=Qwen/Qwen2.5-Coder-32B-Instruct

# ROCm toolchain
# NOTE(review): ROCM_AVAILABLE presumably tells the app whether ROCm tools are installed
# on this machine — confirm how it is read, and what happens when it is not "true".
ROCM_AVAILABLE=true
# Both values below are bare command names with no directory component.
# NOTE(review): presumably resolved via PATH; use an absolute path if the tools are
# installed elsewhere — confirm against the code that invokes them.
HIPCC_PATH=hipcc
ROCPROF_PATH=rocprof