FinLLaVA

Runtime error

TobyYang7 committed on Aug 28, 2024

Commit

cec0b15

verified ·

1 Parent(s): ea37c27

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -24,7 +24,6 @@ tokenizer, llava_model, image_processor, context_len = load_pretrained_model(
     device=device
 )
 @spaces.GPU
 def bot_streaming(message, history):
     print(message)
@@ -53,20 +52,39 @@ def bot_streaming(message, history):
     # Generate the prompt for the model
     prompt = message['text']
-    # Call the chat_llava function to generate the output
-    output = chat_llava(
-        args=None,
-        image_file=image,
-        text=prompt,
-        tokenizer=tokenizer,
-        model=llava_model,
-        image_processor=image_processor,
-        context_len=context_len
-    )
     # Stream the output
     buffer = ""
-    for new_text in output:
         buffer += new_text
         yield buffer

     device=device
 )
 @spaces.GPU
 def bot_streaming(message, history):
     print(message)
     # Generate the prompt for the model
     prompt = message['text']
+    # Use a streamer to generate the output in a streaming fashion
+    streamer = []
+    # Define a function to call chat_llava in a separate thread
+    def generate_output():
+        output = chat_llava(
+            args=None,
+            image_file=image,
+            text=prompt,
+            tokenizer=tokenizer,
+            model=llava_model,
+            image_processor=image_processor,
+            context_len=context_len
+        )
+        for new_text in output:
+            streamer.append(new_text)
+    # Start the generation in a separate thread
+    thread = Thread(target=generate_output)
+    thread.start()
     # Stream the output
     buffer = ""
+    while thread.is_alive() or streamer:
+        while streamer:
+            new_text = streamer.pop(0)
+            buffer += new_text
+            yield buffer
+        time.sleep(0.1)
+    # Ensure any remaining text is yielded after the thread completes
+    while streamer:
+        new_text = streamer.pop(0)
         buffer += new_text
         yield buffer