ProfessorCEO committed on
Commit
785d8df
·
verified ·
1 Parent(s): 2c53a91

Create app.py

Browse files
Files changed (1) hide show
  1. app.py +38 -0
app.py ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from fastapi import FastAPI
2
+ from pydantic import BaseModel
3
+ from transformers import AutoTokenizer, AutoModelForCausalLM
4
+ import torch
5
+
6
# Identifier of the pretrained checkpoint handed to both loaders below.
model_name = "deepseek-ai/deepseek-coder-1.3b-instruct"

# Tokenizer and weights are loaded once, at import time, and shared by every
# request handler in this module.
tokenizer = AutoTokenizer.from_pretrained(model_name)
model = AutoModelForCausalLM.from_pretrained(
    model_name,
    torch_dtype=torch.float32,
)

# FastAPI application object that the route decorators in this file register on.
app = FastAPI()
11
+
12
class CodeRequest(BaseModel):
    """Request body accepted by the ``/complete`` endpoint."""

    # Source text the model is asked to continue (required).
    code: str
    # Language name interpolated into the prompt.
    language: str = "python"
    # Passed to generation as the cap on newly generated tokens.
    max_tokens: int = 128
16
+
17
@app.get("/")
def root():
    """Return a fixed status payload for ``GET /``."""
    payload = {"status": "DevOS AI is running"}
    return payload
20
+
21
@app.post("/complete")
def complete_code(request: CodeRequest):
    """Generate a continuation for the code snippet carried by ``request``.

    The snippet is wrapped in a one-line instruction prompt, tokenized with
    the module-level ``tokenizer`` and sampled from the module-level ``model``
    at a low temperature (0.2).

    Args:
        request: Supplies the source ``code``, the ``language`` named in the
            prompt, and ``max_tokens``, the cap on newly generated tokens.

    Returns:
        A dict ``{"suggestion": <text>}`` holding only the newly generated
        text, with surrounding whitespace stripped.
    """
    prompt = f"Continue the following {request.language} code:\n{request.code}"
    inputs = tokenizer(prompt, return_tensors="pt")
    # Number of prompt tokens; generate() returns them ahead of the new ones.
    prompt_length = inputs["input_ids"].shape[1]

    with torch.no_grad():
        outputs = model.generate(
            **inputs,
            max_new_tokens=request.max_tokens,
            temperature=0.2,
            do_sample=True,
            pad_token_id=tokenizer.eos_token_id,
        )

    # Drop the prompt by token count instead of by len(prompt) characters:
    # decoded text is not guaranteed to reproduce the prompt character for
    # character, so a character slice can cut into the completion or leave
    # part of the prompt behind.
    new_tokens = outputs[0][prompt_length:]
    suggestion = tokenizer.decode(new_tokens, skip_special_tokens=True)

    return {"suggestion": suggestion.strip()}