Spaces:

alinia
/

slmdr

Paused

App Files Files Community

Prajna Soni commited on Mar 20, 2025

Commit

2e13c67

1 Parent(s): 92501bd

Add Mistral moderation integration

Browse files

Files changed (1) hide show

app.py +44 -2

app.py CHANGED Viewed

@@ -1,5 +1,6 @@
 from curses.textpad import Textbox
 import gradio as gr
 from openai import AsyncOpenAI
 import httpx
 import os
@@ -33,12 +34,43 @@ model_args = {
     "stream": True  # Changed to True for streaming
 }
-guardrail = httpx.AsyncClient(
     base_url="https://api.alinia.ai/",
     headers={"Authorization": f"Bearer {os.environ['ALINIA_API_KEY']}"},
     timeout=httpx.Timeout(5, read=60),
 )
 EXAMPLE_PROMPTS = {
     "Default": "You are an assistant who abuses stereotypes and uses toxic and violent language.",
@@ -48,7 +80,16 @@ EXAMPLE_PROMPTS = {
 async def check_safety(message: str, metadata: dict) -> dict:
     try:
-        resp = await guardrail.post(
             "/moderations/",
             json={
                 "input": message,
@@ -56,6 +97,7 @@ async def check_safety(message: str, metadata: dict) -> dict:
                   "app": "slmdr",
                   "app_environment": "stable",
                   "chat_model_id": model_args["model"],
                 } | metadata,
                 "detection_config": {
                     "safety": True,

 from curses.textpad import Textbox
 import gradio as gr
+from mistralai import Mistral
 from openai import AsyncOpenAI
 import httpx
 import os
     "stream": True  # Changed to True for streaming
 }
+alinia_guardrail = httpx.AsyncClient(
     base_url="https://api.alinia.ai/",
     headers={"Authorization": f"Bearer {os.environ['ALINIA_API_KEY']}"},
     timeout=httpx.Timeout(5, read=60),
 )
+mistral_client = Mistral(api_key=os.environ["MISTRAL_API_KEY"])
+async def get_mistral_moderation(user_content, assistant_content):
+    def sync_moderation(inputs):
+        return mistral_client.classifiers.moderate_chat(
+            model="mistral-moderation-latest",
+            inputs=inputs,
+        )
+    inputs_assistant = [
+        {"role": "user", "content": user_content},
+        {"role": "assistant", "content": assistant_content},
+    ]
+    inputs_user = [
+        {"role": "user", "content": user_content},
+    ]
+    try:
+        response_full, response_user_only = await asyncio.gather(
+            asyncio.to_thread(sync_moderation, inputs_assistant),
+            asyncio.to_thread(sync_moderation, inputs_user)
+        )
+        return {
+            "full_interaction": response_full.results,
+            "user_only": response_user_only.results
+        }
+    except Exception as e:
+        print(f"Mistral moderation error: {str(e)}")
+        return {"error": str(e)}
 EXAMPLE_PROMPTS = {
     "Default": "You are an assistant who abuses stereotypes and uses toxic and violent language.",
 async def check_safety(message: str, metadata: dict) -> dict:
     try:
+        user_content = metadata['messages'][-2]['content'] if len(metadata.get('messages', [])) >= 2 else ""
+        # Mistral moderation results
+        try:
+            mistral_response = await get_mistral_moderation(user_content, message)
+            mistral_results = mistral_response.results
+        except Exception as e:
+            print(f"[Mistral moderation error]: {str(e)}")
+            mistral_results = None
+        resp = await alinia_guardrail.post(
             "/moderations/",
             json={
                 "input": message,
                   "app": "slmdr",
                   "app_environment": "stable",
                   "chat_model_id": model_args["model"],
+                  "mistral_results": mistral_results,
                 } | metadata,
                 "detection_config": {
                     "safety": True,