Rulga committed on
Commit
3b79d57
·
1 Parent(s): aa9498f

Refactor settings.py: Add OpenChat 3.5 model configuration, enhancing capabilities and documentation

Browse files
Files changed (1) hide show
  1. config/settings.py +44 -0
config/settings.py CHANGED
@@ -300,6 +300,50 @@ MODELS = {
300
  "documentation": "https://huggingface.co/mistralai/Mixtral-8x7B-Instruct-v0.1"
301
  }
302
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
303
  }
304
 
305
  # Update MODELS configuration
 
300
  "documentation": "https://huggingface.co/mistralai/Mixtral-8x7B-Instruct-v0.1"
301
  }
302
  },
303
+ "openchat-3.5": {
304
+ "id": "openchat/openchat-3.5",
305
+ "name": "OpenChat 3.5",
306
+ "description": "Open-source alternative to ChatGPT with comparable performance",
307
+ "type": "base",
308
+ "parameters": {
309
+ "max_length": 4096,
310
+ "temperature": 0.7,
311
+ "top_p": 0.9,
312
+ "repetition_penalty": 1.1,
313
+ },
314
+ "training": {
315
+ "base_model_path": "openchat/openchat-3.5",
316
+ "fine_tuned_path": os.path.join(TRAINING_OUTPUT_DIR, "openchat-3.5-tuned"),
317
+ "lora_config": {
318
+ "r": 16,
319
+ "lora_alpha": 32,
320
+ "lora_dropout": 0.05,
321
+ "target_modules": ["q_proj", "v_proj", "k_proj", "o_proj"]
322
+ }
323
+ },
324
+ "details": {
325
+ "full_name": "OpenChat 3.5",
326
+ "capabilities": [
327
+ "Strong performance comparable to GPT-3.5",
328
+ "Excellent instruction following",
329
+ "Good multilingual support",
330
+ "Strong reasoning capabilities",
331
+ "Free and open source"
332
+ ],
333
+ "limitations": [
334
+ "May require more specific prompting",
335
+ "Less specialized in legal domain",
336
+ "Requires more computational resources"
337
+ ],
338
+ "use_cases": [
339
+ "Legal consultation",
340
+ "Document analysis",
341
+ "Complex reasoning tasks",
342
+ "Multilingual support"
343
+ ],
344
+ "documentation": "https://huggingface.co/openchat/openchat-3.5"
345
+ }
346
+ }
347
  }
348
 
349
  # Update MODELS configuration