{ "backend": "llama.cpp", "model_type": "qwen2", "context_length": 2048, "threads": 4, "mobile_optimized": true }