kouki321 committed on
Commit
5fb8929
·
verified ·
1 Parent(s): b17c82e

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +18 -15
app.py CHANGED
@@ -1,16 +1,19 @@
1
- from transformers import pipeline
2
- from fastapi import FastAPI, Request, HTTPException
3
 
4
- app = FastAPI()
5
-
6
- generator = pipeline('text2text-generation', model='google/flan-t5-small')
7
-
8
- @app.post("/")
9
- async def generate(request: Request):
10
- try:
11
- data = await request.json()
12
- text = data["text"]
13
- output = generator(text)
14
- return {"output": output[0]["generated_text"]}
15
- except Exception as e:
16
- raise HTTPException(status_code=500, detail=str(e))
 
 
 
 
1
+ from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
2
+ import torch
3
 
4
+ model_id = "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B"
5
+
6
+ tokenizer = AutoTokenizer.from_pretrained(model_id, trust_remote_code=True)
7
+ model = AutoModelForCausalLM.from_pretrained(
8
+ model_id,
9
+ torch_dtype=torch.float16,
10
+ device_map="auto",
11
+ trust_remote_code=True
12
+ )
13
+
14
+ pipe = pipeline("text-generation", model=model, tokenizer=tokenizer)
15
+
16
+ def generate(prompt):
17
+ return pipe(prompt, max_new_tokens=100)[0]["generated_text"]
18
+
19
+ # Launch your app (Gradio, FastAPI, etc.)