Spaces:

sds-ai
/

Yee-R1-Demo

Sleeping

App Files Files Community

Shining-Data committed on Jun 4, 2025

Commit

f17b0c4

verified ·

1 Parent(s): d46278b

Update app.py

Browse files

Files changed (1) hide show

app.py +7 -12

app.py CHANGED Viewed

@@ -80,7 +80,7 @@ def load_pipeline(model_name):
     Tries bfloat16, falls back to float16 or float32 if unsupported.
     """
     global PIPELINES
-    if model_name in PIPELINES:
         return PIPELINES[model_name]
     repo = MODELS[model_name]["repo_id"]
     tokenizer = AutoTokenizer.from_pretrained(repo)
@@ -148,13 +148,6 @@ def chat_response(user_msg, chat_history, system_prompt,
         debug = 'Web search disabled.'
     try:
-        # merge any fetched search results into the system prompt
-        if search_results:
-            enriched = system_prompt.strip() + "\n\nRelevant context:\n" + "\n".join(search_results)
-        else:
-            enriched = system_prompt
         # wait up to 1s for snippets, then replace debug with them
         if enable_search:
             thread_search.join(timeout=float(search_timeout))
@@ -165,16 +158,18 @@ def chat_response(user_msg, chat_history, system_prompt,
             else:
                 debug = "*No web search results found.*"
-        # merge fetched snippets into the system prompt
-        if search_results:
-            enriched = system_prompt.strip() + "\n\nRelevant context:\n" + "\n".join(search_results)
         else:
             enriched = system_prompt
         pipe = load_pipeline(model_name)
         prompt = format_conversation(history, enriched, pipe["tokenizer"])
         prompt_debug = f"\n\n--- Prompt Preview ---\n```\n{prompt}\n```"
-        streamer = TextIteratorStreamer(pipe["tokenizer"],
                                         skip_prompt=True,
                                         skip_special_tokens=True)
         generation_config = dict(

     Tries bfloat16, falls back to float16 or float32 if unsupported.
     """
     global PIPELINES
+    if model_name in PIPELINES.keys():
         return PIPELINES[model_name]
     repo = MODELS[model_name]["repo_id"]
     tokenizer = AutoTokenizer.from_pretrained(repo)
         debug = 'Web search disabled.'
     try:
         # wait up to 1s for snippets, then replace debug with them
         if enable_search:
             thread_search.join(timeout=float(search_timeout))
             else:
                 debug = "*No web search results found.*"
+            # merge fetched snippets into the system prompt
+            if search_results:
+                enriched = system_prompt.strip() + "\n\nRelevant context:\n" + "\n".join(search_results)
+            else:
+                enriched = system_prompt
         else:
             enriched = system_prompt
         pipe = load_pipeline(model_name)
         prompt = format_conversation(history, enriched, pipe["tokenizer"])
         prompt_debug = f"\n\n--- Prompt Preview ---\n```\n{prompt}\n```"
+        streamer = TextIterStreamer(pipe["tokenizer"],
                                         skip_prompt=True,
                                         skip_special_tokens=True)
         generation_config = dict(