pr0methium committed on
Commit
8d2ac5a
·
verified ·
1 Parent(s): de9f38e

Update main.py

Browse files
Files changed (1) hide show
  1. main.py +7 -1
main.py CHANGED
@@ -2,6 +2,7 @@ from fastapi import FastAPI
2
  from pydantic import BaseModel
3
  from huggingface_hub import InferenceClient
4
  import uvicorn
 
5
  from typing import List
6
 
7
  app = FastAPI()
@@ -42,6 +43,11 @@ def generate(item: Item):
42
 
43
  for response in stream:
44
  output += response.token.text
 
 
 
 
 
45
  return output
46
 
47
  @app.get("/generate/")
@@ -63,4 +69,4 @@ async def generate_text(
63
  top_p=top_p,
64
  repetition_penalty=repetition_penalty
65
  )
66
- return {"response": generate(item)}
 
2
  from pydantic import BaseModel
3
  from huggingface_hub import InferenceClient
4
  import uvicorn
5
+ import re
6
  from typing import List
7
 
8
  app = FastAPI()
 
43
 
44
  for response in stream:
45
  output += response.token.text
46
+
47
+ # Remove unwanted sequences or patterns (e.g., <s>, [/INST], etc.)
48
+ output = re.sub(r'<[^>]+>', '', output) # Remove any HTML-like tags
49
+ output = re.sub(r'\s+', ' ', output).strip() # Clean up extra whitespace
50
+
51
  return output
52
 
53
  @app.get("/generate/")
 
69
  top_p=top_p,
70
  repetition_penalty=repetition_penalty
71
  )
72
+ return {"response": generate(item)}