Spaces:
Runtime error
Runtime error
Commit
·
d5b706b
1
Parent(s):
acbfa77
Change embedding model
Browse files
- app.py +21 -15
- compose.yml +1 -1
- populate_db.py +4 -4
app.py
CHANGED
|
@@ -41,8 +41,8 @@ else:
|
|
| 41 |
main()
|
| 42 |
milvus_client.load_collection(collection_name=collection_name)
|
| 43 |
|
| 44 |
-
embedding_model = SentenceTransformer("BAAI/bge-small-en-v1.5")
|
| 45 |
-
|
| 46 |
# Initialize LLM
|
| 47 |
model = ChatNebius(
|
| 48 |
model="Qwen/Qwen3-14B",
|
|
@@ -129,26 +129,24 @@ def setup_rag_chain():
|
|
| 129 |
"context": doc_objects,
|
| 130 |
"history": cl.user_session.get("messages", [])
|
| 131 |
}
|
| 132 |
-
system_prompt = """You are a helpful assistant specialising in disability support, reasonable adjustments, and equality legislation.
|
| 133 |
|
| 134 |
When answering questions, you should:
|
| 135 |
1. Use the provided context documents to inform your response
|
| 136 |
2. Be accurate and helpful
|
| 137 |
-
3.
|
| 138 |
-
4.
|
| 139 |
-
5.
|
| 140 |
-
6.
|
| 141 |
-
7.
|
| 142 |
-
8.
|
| 143 |
-
9.
|
| 144 |
-
10. Do not overemphasize disability in your responses, but rather focus on the support and adjustments that can be made to ensure equality and inclusivity.
|
| 145 |
-
11. If the user asks about a specific disability, provide general information and resources, but do not make assumptions about the individual's experience or needs.
|
| 146 |
-
12. If the user query explicitly asks for a disability-related topic, provide a well-informed response based on the context documents.
|
| 147 |
|
| 148 |
Context documents:
|
| 149 |
{context}
|
| 150 |
|
| 151 |
-
Please provide a clear response using the above context
|
|
|
|
| 152 |
|
| 153 |
# Get the current settings to check if Think mode is enabled
|
| 154 |
settings = cl.user_session.get("settings", {})
|
|
@@ -236,7 +234,7 @@ async def on_chat_start():
|
|
| 236 |
|
| 237 |
@cl.on_settings_update
|
| 238 |
async def setup_agent(settings):
|
| 239 |
-
print("on_settings_update", settings)
|
| 240 |
# Store the settings in the user session so they can be accessed in setup_rag_chain
|
| 241 |
cl.user_session.set("settings", settings)
|
| 242 |
|
|
@@ -259,7 +257,15 @@ async def on_chat_resume(thread: ThreadDict):
|
|
| 259 |
|
| 260 |
cl.user_session.set("messages", messages)
|
| 261 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 262 |
|
|
|
|
|
|
|
|
|
|
| 263 |
chain = setup_rag_chain()
|
| 264 |
cl.user_session.set("chain", chain)
|
| 265 |
|
|
|
|
| 41 |
main()
|
| 42 |
milvus_client.load_collection(collection_name=collection_name)
|
| 43 |
|
| 44 |
+
# embedding_model = SentenceTransformer("BAAI/bge-small-en-v1.5")
|
| 45 |
+
embedding_model = SentenceTransformer("Qwen/Qwen3-Embedding-0.6B")
|
| 46 |
# Initialize LLM
|
| 47 |
model = ChatNebius(
|
| 48 |
model="Qwen/Qwen3-14B",
|
|
|
|
| 129 |
"context": doc_objects,
|
| 130 |
"history": cl.user_session.get("messages", [])
|
| 131 |
}
|
| 132 |
+
system_prompt = """You are a helpful assistant specialising in developing non-discriminatory competence standards and disability support, reasonable adjustments, and equality legislation.
|
| 133 |
|
| 134 |
When answering questions, you should:
|
| 135 |
1. Use the provided context documents to inform your response
|
| 136 |
2. Be accurate and helpful
|
| 137 |
+
3. If the context doesn't contain relevant information, say so clearly
|
| 138 |
+
4. Always reply in English
|
| 139 |
+
5. Provide clear recommendations and examples wherever applicable
|
| 140 |
+
6. Do not make assumptions about the user's knowledge or background
|
| 141 |
+
7. If the user asks for a specific law or regulation, provide a brief explanation and cite relevant documents if available.
|
| 142 |
+
8. Do not overemphasize disability in your responses, but rather focus on the support and adjustments that can be made to ensure equality and inclusivity.
|
| 143 |
+
9. If the user query explicitly asks for a disability-related topic, provide a well-informed response based on the context documents.
|
|
|
|
|
|
|
|
|
|
| 144 |
|
| 145 |
Context documents:
|
| 146 |
{context}
|
| 147 |
|
| 148 |
+
Please provide a clear response using the above context
|
| 149 |
+
"""
|
| 150 |
|
| 151 |
# Get the current settings to check if Think mode is enabled
|
| 152 |
settings = cl.user_session.get("settings", {})
|
|
|
|
| 234 |
|
| 235 |
@cl.on_settings_update
|
| 236 |
async def setup_agent(settings):
|
| 237 |
+
# print("on_settings_update", settings)
|
| 238 |
# Store the settings in the user session so they can be accessed in setup_rag_chain
|
| 239 |
cl.user_session.set("settings", settings)
|
| 240 |
|
|
|
|
| 257 |
|
| 258 |
cl.user_session.set("messages", messages)
|
| 259 |
|
| 260 |
+
settings = await cl.ChatSettings(
|
| 261 |
+
[
|
| 262 |
+
Switch(id="Think", label="Use Deep Thinking", initial=True),
|
| 263 |
+
]
|
| 264 |
+
).send()
|
| 265 |
|
| 266 |
+
# Store initial settings
|
| 267 |
+
cl.user_session.set("settings", {"Think": True}) # Set the default value
|
| 268 |
+
# TODO: # Reinitialize the chain with the current settings
|
| 269 |
chain = setup_rag_chain()
|
| 270 |
cl.user_session.set("chain", chain)
|
| 271 |
|
compose.yml
CHANGED
|
@@ -78,7 +78,7 @@ services:
|
|
| 78 |
- CHAINLIT_AUTH_SECRET=${CHAINLIT_AUTH_SECRET}
|
| 79 |
- OAUTH_GOOGLE_CLIENT_ID=${OAUTH_GOOGLE_CLIENT_ID}
|
| 80 |
- OAUTH_GOOGLE_CLIENT_SECRET=${OAUTH_GOOGLE_CLIENT_SECRET}
|
| 81 |
-
|
| 82 |
depends_on:
|
| 83 |
- standalone
|
| 84 |
|
|
|
|
| 78 |
- CHAINLIT_AUTH_SECRET=${CHAINLIT_AUTH_SECRET}
|
| 79 |
- OAUTH_GOOGLE_CLIENT_ID=${OAUTH_GOOGLE_CLIENT_ID}
|
| 80 |
- OAUTH_GOOGLE_CLIENT_SECRET=${OAUTH_GOOGLE_CLIENT_SECRET}
|
| 81 |
+
|
| 82 |
depends_on:
|
| 83 |
- standalone
|
| 84 |
|
populate_db.py
CHANGED
|
@@ -14,8 +14,8 @@ milvus_client = MilvusClient(uri=MILVUS_URI)
|
|
| 14 |
collection_name = "my_rag_collection"
|
| 15 |
|
| 16 |
# Initialize embedding model
|
| 17 |
-
embedding_model = SentenceTransformer("BAAI/bge-small-en-v1.5")
|
| 18 |
-
|
| 19 |
def emb_text(text):
|
| 20 |
"""Generate embeddings for text using the sentence transformer model."""
|
| 21 |
return embedding_model.encode([text], normalize_embeddings=True).tolist()[0]
|
|
@@ -29,8 +29,8 @@ def create_collection():
|
|
| 29 |
# Create Milvus collection schema
|
| 30 |
schema = milvus_client.create_schema(auto_id=False, enable_dynamic_field=False)
|
| 31 |
schema.add_field(field_name="id", datatype=DataType.INT64, is_primary=True)
|
| 32 |
-
schema.add_field(field_name="vector", datatype=DataType.FLOAT_VECTOR, dim=384)
|
| 33 |
-
schema.add_field(field_name="text", datatype=DataType.VARCHAR)
|
| 34 |
schema.add_field(field_name="metadata", datatype=DataType.JSON)
|
| 35 |
|
| 36 |
# Create index for vector search
|
|
|
|
| 14 |
collection_name = "my_rag_collection"
|
| 15 |
|
| 16 |
# Initialize embedding model
|
| 17 |
+
# embedding_model = SentenceTransformer("BAAI/bge-small-en-v1.5")
|
| 18 |
+
embedding_model = SentenceTransformer("Qwen/Qwen3-Embedding-0.6B")
|
| 19 |
def emb_text(text):
|
| 20 |
"""Generate embeddings for text using the sentence transformer model."""
|
| 21 |
return embedding_model.encode([text], normalize_embeddings=True).tolist()[0]
|
|
|
|
| 29 |
# Create Milvus collection schema
|
| 30 |
schema = milvus_client.create_schema(auto_id=False, enable_dynamic_field=False)
|
| 31 |
schema.add_field(field_name="id", datatype=DataType.INT64, is_primary=True)
|
| 32 |
+
schema.add_field(field_name="vector", datatype=DataType.FLOAT_VECTOR, dim=1024) # Qwen/Qwen3-Embedding-0.6B dimension
|
| 33 |
+
schema.add_field(field_name="text", datatype=DataType.VARCHAR) # 32KB max
|
| 34 |
schema.add_field(field_name="metadata", datatype=DataType.JSON)
|
| 35 |
|
| 36 |
# Create index for vector search
|