Rsnarsna committed on
Commit
b9da2c5
·
verified ·
1 Parent(s): 28e126b

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +0 -2
app.py CHANGED
@@ -8,10 +8,8 @@ app = FastAPI()
8
  llm = Llama.from_pretrained(
9
  repo_id="microsoft/Phi-3-mini-4k-instruct-gguf",
10
  filename="Phi-3-mini-4k-instruct-q4.gguf",
11
- cache_dir='/content/cache',
12
  )
13
 
14
-
15
  @app.post("/chat")
16
  async def chat(request: Request):
17
  try:
 
8
  llm = Llama.from_pretrained(
9
  repo_id="microsoft/Phi-3-mini-4k-instruct-gguf",
10
  filename="Phi-3-mini-4k-instruct-q4.gguf",
 
11
  )
12
 
 
13
  @app.post("/chat")
14
  async def chat(request: Request):
15
  try: