Rulga committed on
Commit
3a0af00
·
1 Parent(s): ad89110

Refactor settings.py: Update Llama 7B model configuration to TinyLlama 1.1B and replace OpenChat 3.5 with Microsoft Phi-2, enhancing performance details and documentation

Browse files
Files changed (1) hide show
  1. config/settings.py +23 -66
config/settings.py CHANGED
@@ -127,7 +127,7 @@ MODELS = {
127
  "documentation": "https://huggingface.co/HuggingFaceH4/zephyr-7b-beta"
128
  }
129
  },
130
- "llama-7b": { # оставляем ключ тот же для совместимости
131
  "id": "TinyLlama/TinyLlama-1.1B-Chat-v1.0",
132
  "name": "TinyLlama 1.1B Chat",
133
  "description": "Lightweight chat model with excellent performance for its size",
@@ -174,50 +174,6 @@ MODELS = {
174
  "documentation": "https://huggingface.co/TinyLlama/TinyLlama-1.1B-Chat-v1.0"
175
  }
176
  },
177
- "mistral-7b": {
178
- "id": "mistralai/Mistral-7B-Instruct-v0.2", # Меняем на стандартную версию
179
- "name": "Mistral 7B Instruct",
180
- "description": "High-performance instruction-tuned 7B model with strong multilingual capabilities",
181
- "type": "base",
182
- "parameters": {
183
- "max_length": 2048,
184
- "temperature": 0.7,
185
- "top_p": 0.9,
186
- "repetition_penalty": 1.1,
187
- },
188
- "training": {
189
- "base_model_path": "mistralai/Mistral-7B-Instruct-v0.2",
190
- "fine_tuned_path": os.path.join(TRAINING_OUTPUT_DIR, "mistral-7b-instruct-tuned"),
191
- "lora_config": {
192
- "r": 16,
193
- "lora_alpha": 32,
194
- "lora_dropout": 0.05,
195
- "target_modules": ["q_proj", "v_proj", "k_proj", "o_proj"]
196
- }
197
- },
198
- "details": {
199
- "full_name": "Mistral 7B Instruct v0.2",
200
- "capabilities": [
201
- "Strong multilingual support",
202
- "Excellent instruction following",
203
- "Advanced reasoning capabilities",
204
- "High-quality text generation",
205
- "Free for commercial use"
206
- ],
207
- "limitations": [
208
- "Requires more RAM than GGUF version",
209
- "May need GPU for optimal performance",
210
- "Knowledge cutoff before latest developments"
211
- ],
212
- "use_cases": [
213
- "Complex legal analysis",
214
- "Multilingual consultation",
215
- "Document processing",
216
- "General assistance"
217
- ],
218
- "documentation": "https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2"
219
- }
220
- },
221
  "mixtral-8x7b": {
222
  "id": "mistralai/Mixtral-8x7B-Instruct-v0.1",
223
  "name": "Mixtral 8x7B Instruct",
@@ -261,20 +217,20 @@ MODELS = {
261
  "documentation": "https://huggingface.co/mistralai/Mixtral-8x7B-Instruct-v0.1"
262
  }
263
  },
264
- "openchat-3.5": {
265
- "id": "openchat/openchat_3.5", # Исправленный ID модели
266
- "name": "OpenChat 3.5",
267
- "description": "Open-source alternative to ChatGPT with comparable performance",
268
  "type": "base",
269
  "parameters": {
270
- "max_length": 4096,
271
  "temperature": 0.7,
272
  "top_p": 0.9,
273
  "repetition_penalty": 1.1,
274
  },
275
  "training": {
276
- "base_model_path": "openchat/openchat-3.5",
277
- "fine_tuned_path": os.path.join(TRAINING_OUTPUT_DIR, "openchat-3.5-tuned"),
278
  "lora_config": {
279
  "r": 16,
280
  "lora_alpha": 32,
@@ -283,29 +239,30 @@ MODELS = {
283
  }
284
  },
285
  "details": {
286
- "full_name": "OpenChat 3.5",
287
  "capabilities": [
288
- "Strong performance comparable to GPT-3.5",
289
- "Excellent instruction following",
290
- "Good multilingual support",
291
- "Strong reasoning capabilities",
292
- "Free and open source"
 
293
  ],
294
  "limitations": [
295
- "May require more specific prompting",
296
  "Less specialized in legal domain",
297
- "Requires more computational resources"
298
  ],
299
  "use_cases": [
300
- "Legal consultation",
301
  "Document analysis",
302
- "Complex reasoning tasks",
303
- "Multilingual support"
304
  ],
305
- "documentation": "https://huggingface.co/openchat/openchat-3.5"
306
  }
307
- },
308
- }
309
 
310
  # Update MODELS configuration
311
  for model in MODELS.values():
 
127
  "documentation": "https://huggingface.co/HuggingFaceH4/zephyr-7b-beta"
128
  }
129
  },
130
+ "llama-7b": {
131
  "id": "TinyLlama/TinyLlama-1.1B-Chat-v1.0",
132
  "name": "TinyLlama 1.1B Chat",
133
  "description": "Lightweight chat model with excellent performance for its size",
 
174
  "documentation": "https://huggingface.co/TinyLlama/TinyLlama-1.1B-Chat-v1.0"
175
  }
176
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
177
  "mixtral-8x7b": {
178
  "id": "mistralai/Mixtral-8x7B-Instruct-v0.1",
179
  "name": "Mixtral 8x7B Instruct",
 
217
  "documentation": "https://huggingface.co/mistralai/Mixtral-8x7B-Instruct-v0.1"
218
  }
219
  },
220
+ "phi-2": {
221
+ "id": "microsoft/phi-2",
222
+ "name": "Phi-2",
223
+ "description": "Compact yet powerful 2.7B model with strong reasoning capabilities",
224
  "type": "base",
225
  "parameters": {
226
+ "max_length": 2048,
227
  "temperature": 0.7,
228
  "top_p": 0.9,
229
  "repetition_penalty": 1.1,
230
  },
231
  "training": {
232
+ "base_model_path": "microsoft/phi-2",
233
+ "fine_tuned_path": os.path.join(TRAINING_OUTPUT_DIR, "phi-2-tuned"),
234
  "lora_config": {
235
  "r": 16,
236
  "lora_alpha": 32,
 
239
  }
240
  },
241
  "details": {
242
+ "full_name": "Microsoft Phi-2",
243
  "capabilities": [
244
+ "Strong reasoning abilities",
245
+ "Excellent code understanding",
246
+ "Compact size (2.7B parameters)",
247
+ "Good performance-to-size ratio",
248
+ "Efficient resource usage",
249
+ "Research and commercial use allowed"
250
  ],
251
  "limitations": [
252
+ "Smaller context window than larger models",
253
  "Less specialized in legal domain",
254
+ "Limited multilingual capabilities"
255
  ],
256
  "use_cases": [
257
+ "Quick legal consultations",
258
  "Document analysis",
259
+ "Code-related legal questions",
260
+ "Resource-efficient deployments"
261
  ],
262
+ "documentation": "https://huggingface.co/microsoft/phi-2"
263
  }
264
+ }
265
+ }
266
 
267
  # Update MODELS configuration
268
  for model in MODELS.values():