Spaces:
Running
Running
Refactor settings.py: Add OpenChat 3.5 model configuration, enhancing capabilities and documentation
Browse files
- config/settings.py +44 -0
config/settings.py
CHANGED
|
@@ -300,6 +300,50 @@ MODELS = {
|
|
| 300 |
"documentation": "https://huggingface.co/mistralai/Mixtral-8x7B-Instruct-v0.1"
|
| 301 |
}
|
| 302 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 303 |
}
|
| 304 |
|
| 305 |
# Update MODELS configuration
|
|
|
|
| 300 |
"documentation": "https://huggingface.co/mistralai/Mixtral-8x7B-Instruct-v0.1"
|
| 301 |
}
|
| 302 |
},
|
| 303 |
+
"openchat-3.5": {
|
| 304 |
+
"id": "openchat/openchat-3.5",
|
| 305 |
+
"name": "OpenChat 3.5",
|
| 306 |
+
"description": "Open-source alternative to ChatGPT with comparable performance",
|
| 307 |
+
"type": "base",
|
| 308 |
+
"parameters": {
|
| 309 |
+
"max_length": 4096,
|
| 310 |
+
"temperature": 0.7,
|
| 311 |
+
"top_p": 0.9,
|
| 312 |
+
"repetition_penalty": 1.1,
|
| 313 |
+
},
|
| 314 |
+
"training": {
|
| 315 |
+
"base_model_path": "openchat/openchat-3.5",
|
| 316 |
+
"fine_tuned_path": os.path.join(TRAINING_OUTPUT_DIR, "openchat-3.5-tuned"),
|
| 317 |
+
"lora_config": {
|
| 318 |
+
"r": 16,
|
| 319 |
+
"lora_alpha": 32,
|
| 320 |
+
"lora_dropout": 0.05,
|
| 321 |
+
"target_modules": ["q_proj", "v_proj", "k_proj", "o_proj"]
|
| 322 |
+
}
|
| 323 |
+
},
|
| 324 |
+
"details": {
|
| 325 |
+
"full_name": "OpenChat 3.5",
|
| 326 |
+
"capabilities": [
|
| 327 |
+
"Strong performance comparable to GPT-3.5",
|
| 328 |
+
"Excellent instruction following",
|
| 329 |
+
"Good multilingual support",
|
| 330 |
+
"Strong reasoning capabilities",
|
| 331 |
+
"Free and open source"
|
| 332 |
+
],
|
| 333 |
+
"limitations": [
|
| 334 |
+
"May require more specific prompting",
|
| 335 |
+
"Less specialized in legal domain",
|
| 336 |
+
"Requires more computational resources"
|
| 337 |
+
],
|
| 338 |
+
"use_cases": [
|
| 339 |
+
"Legal consultation",
|
| 340 |
+
"Document analysis",
|
| 341 |
+
"Complex reasoning tasks",
|
| 342 |
+
"Multilingual support"
|
| 343 |
+
],
|
| 344 |
+
"documentation": "https://huggingface.co/openchat/openchat-3.5"
|
| 345 |
+
}
|
| 346 |
+
}
|
| 347 |
}
|
| 348 |
|
| 349 |
# Update MODELS configuration
|