Update app.py
app.py CHANGED
@@ -28,7 +28,7 @@ class ChatClient:
         self.model = AutoModelForCausalLM.from_pretrained(model_path).to(self.device)
         self.model.eval()  # set to evaluation mode
 
-    async def chat_completion(self, messages, max_tokens, stream=False, temperature=1.0, top_p=1.0):
+    def chat_completion(self, messages, max_tokens, stream=False, temperature=1.0, top_p=1.0):
         """
         Generate a chat reply.
         """
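The code that builds `inputs` and `gen_kwargs` falls between this hunk and the next and is not part of the diff. Purely as a hypothetical sketch of what that elided setup typically looks like with transformers (none of these exact lines appear in the commit):

import torch
from transformers import AutoTokenizer

# Hypothetical illustration only: the commit does not show how
# `inputs` and `gen_kwargs` are actually constructed.
tokenizer = AutoTokenizer.from_pretrained("model/v3/")
messages = [{"role": "user", "content": "Hello!"}]

prompt = tokenizer.apply_chat_template(messages, tokenize=False, add_generation_prompt=True)
inputs = tokenizer(prompt, return_tensors="pt")  # input_ids + attention_mask
gen_kwargs = {"max_new_tokens": 512, "do_sample": True, "temperature": 1.0, "top_p": 1.0}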
@@ -47,17 +47,15 @@ class ChatClient:
         }
 
         # use a generator to produce the text
-        output_sequences = self.model.generate(**inputs, **gen_kwargs)
+        # output_sequences = self.model.generate(**inputs, **gen_kwargs)
 
         # decode the generated text
         # result_text = self.tokenizer.decode(output_sequences[0], skip_special_tokens=True)
         # yield result_text
 
-        #
-        for
-
-            await anyio.sleep(0)  # Yield control, simulating asynchronous operation
-            yield result_text
+        # claude 3.5
+        for token in self.model.generate(**inputs, **gen_kwargs, streamer=None):
+            yield self.tokenizer.decode(token, skip_special_tokens=True)
 
 # create a client instance, specifying the model path
 model_path = 'model/v3/'
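A note on the new loop above: `model.generate()` returns a tensor of finished sequences, so `for token in self.model.generate(...)` iterates over batch elements and yields one fully decoded sequence per batch entry, not a token-by-token stream (and `streamer=None` is already the default). If incremental streaming is the goal, the usual transformers pattern is a `TextIteratorStreamer` fed by `generate()` on a worker thread. A minimal standalone sketch, not part of this commit:

from threading import Thread

from transformers import TextIteratorStreamer

def stream_chat(model, tokenizer, prompt, **gen_kwargs):
    """Yield text chunks incrementally as the model generates."""
    inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
    streamer = TextIteratorStreamer(tokenizer, skip_prompt=True, skip_special_tokens=True)
    # generate() blocks until completion, so run it on a worker thread
    # and consume the streamer on this one.
    thread = Thread(target=model.generate, kwargs={**inputs, **gen_kwargs, "streamer": streamer})
    thread.start()
    for chunk in streamer:
        yield chunk
    thread.join()

Inside `ChatClient.chat_completion`, the same pattern would use `self.model`, `self.tokenizer`, and the existing `gen_kwargs`.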
@@ -68,7 +66,7 @@ client = ChatClient(model_path)
 
 
 
-async def respond(
+def respond(
     message,
     history: list[tuple[str, str]],
     system_message,
@@ -91,21 +89,19 @@ async def respond(
 
     response = ""
 
-    async for message in client.chat_completion(
+    for message in client.chat_completion(
         messages,
         max_tokens=max_tokens,
         stream=True,
         temperature=temperature,
         top_p=top_p,
     ):
-
-
-        #
-
-        # response += token
-        # yield response
+        print(message)
+        token = message
+        #token = message.choices[0].delta.content
 
-
+        response += token
+        yield response
 
 """
 For information on how to customize the ChatInterface, peruse the gradio docs: https://www.gradio.app/docs/chatinterface
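With `respond` converted to a plain synchronous generator, `gr.ChatInterface` can still stream it: Gradio renders each yielded `response` as a progressive update. A sketch of the wiring the docstring refers to, assuming the usual template components (labels and default values here are assumptions, not taken from this diff):

import gradio as gr

demo = gr.ChatInterface(
    respond,
    additional_inputs=[
        # assumed labels/defaults; the actual component setup is outside the diff's visible range
        gr.Textbox(value="You are a friendly Chatbot.", label="System message"),
        gr.Slider(minimum=1, maximum=2048, value=512, step=1, label="Max new tokens"),
        gr.Slider(minimum=0.1, maximum=4.0, value=0.7, step=0.1, label="Temperature"),
        gr.Slider(minimum=0.1, maximum=1.0, value=0.95, step=0.05, label="Top-p (nucleus sampling)"),
    ],
)

if __name__ == "__main__":
    demo.launch()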