Spaces:
Running
Running
Add XGLM 7.5B model details to app.py and settings.py for multilingual support
Browse files
- app.py +22 -0
- config/settings.py +22 -0
app.py
CHANGED
|
@@ -102,7 +102,29 @@ MODEL_DETAILS = {
|
|
| 102 |
],
|
| 103 |
"documentation": "https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2"
|
| 104 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 105 |
}
|
|
|
|
| 106 |
# MODEL_DETAILS = {
|
| 107 |
# "llama-7b": {
|
| 108 |
# "full_name": "Meta Llama 2 7B Chat",
|
|
|
|
| 102 |
],
|
| 103 |
"documentation": "https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2"
|
| 104 |
},
|
| 105 |
+
"xglm-7.5b": {
|
| 106 |
+
"full_name": "Meta XGLM 7.5B",
|
| 107 |
+
"capabilities": [
|
| 108 |
+
"Specialized for multilingual generation",
|
| 109 |
+
"Support for 30+ languages",
|
| 110 |
+
"Strong cross-lingual transfer abilities",
|
| 111 |
+
"Consistent performance across diverse languages"
|
| 112 |
+
],
|
| 113 |
+
"limitations": [
|
| 114 |
+
"Less instruction-tuned than dedicated chat models",
|
| 115 |
+
"May require more specific prompting",
|
| 116 |
+
"Not specifically optimized for legal domain",
|
| 117 |
+
"Slightly larger model requiring more GPU memory"
|
| 118 |
+
],
|
| 119 |
+
"use_cases": [
|
| 120 |
+
"International legal assistance in native languages",
|
| 121 |
+
"Complex multilingual documentation",
|
| 122 |
+
"Serving clients from diverse linguistic backgrounds",
|
| 123 |
+
"Translation and summarization of legal concepts across languages"
|
| 124 |
+
],
|
| 125 |
+
"documentation": "https://huggingface.co/facebook/xglm-7.5B"
|
| 126 |
}
|
| 127 |
+
}
|
| 128 |
# MODEL_DETAILS = {
|
| 129 |
# "llama-7b": {
|
| 130 |
# "full_name": "Meta Llama 2 7B Chat",
|
config/settings.py
CHANGED
|
@@ -87,6 +87,28 @@ MODELS = {
|
|
| 87 |
}
|
| 88 |
}
|
| 89 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 90 |
}
|
| 91 |
|
| 92 |
# Default model
|
|
|
|
| 87 |
}
|
| 88 |
}
|
| 89 |
},
|
| 90 |
+
"xglm-7.5b": {
|
| 91 |
+
"id": "facebook/xglm-7.5B",
|
| 92 |
+
"name": "XGLM 7.5B",
|
| 93 |
+
"description": "Meta's multilingual model designed for cross-lingual generation",
|
| 94 |
+
"type": "base",
|
| 95 |
+
"parameters": {
|
| 96 |
+
"max_length": 2048,
|
| 97 |
+
"temperature": 0.7,
|
| 98 |
+
"top_p": 0.9,
|
| 99 |
+
"repetition_penalty": 1.1,
|
| 100 |
+
},
|
| 101 |
+
"training": {
|
| 102 |
+
"base_model_path": "facebook/xglm-7.5B",
|
| 103 |
+
"fine_tuned_path": os.path.join(TRAINING_OUTPUT_DIR, "xglm-7.5b-tuned"),
|
| 104 |
+
"lora_config": {
|
| 105 |
+
"r": 16,
|
| 106 |
+
"lora_alpha": 32,
|
| 107 |
+
"lora_dropout": 0.05,
|
| 108 |
+
"target_modules": ["q_proj", "v_proj", "k_proj", "o_proj"]
|
| 109 |
+
}
|
| 110 |
+
}
|
| 111 |
+
}
|
| 112 |
}
|
| 113 |
|
| 114 |
# Default model
|