ElPremOoO commited on
Commit
066236e
·
verified ·
1 Parent(s): e803dc8

Update main.py

Browse files
Files changed (1) hide show
  1. main.py +8 -8
main.py CHANGED
@@ -4,23 +4,23 @@ import torch
4
 
5
  app = Flask(__name__)
6
 
7
- # Load model and tokenizer
8
- model_name = "mistralai/Mistral-7B-v0.1"
9
 
10
- # Enable quantization for better performance on free-tier Spaces
 
11
  model = AutoModelForCausalLM.from_pretrained(
12
  model_name,
13
- torch_dtype=torch.float16,
14
- device_map="auto"
15
  )
16
 
17
- tokenizer = AutoTokenizer.from_pretrained(model_name)
18
 
19
  @app.route("/")
20
  def home():
21
  return request.url
22
 
23
- @app.route("/generate")
24
  def generate_text():
25
  data = request.get_json()
26
  prompt = data.get("prompt", "")
@@ -28,7 +28,7 @@ def generate_text():
28
  if not prompt:
29
  return jsonify({"error": "No prompt provided"}), 400
30
 
31
- inputs = tokenizer(prompt, return_tensors="pt").to("cuda")
32
  outputs = model.generate(**inputs, max_length=200)
33
  response_text = tokenizer.decode(outputs[0], skip_special_tokens=True)
34
 
 
4
 
5
  app = Flask(__name__)
6
 
7
+ # Use CodeLlama-7B (No authentication needed)
8
+ model_name = "codellama/CodeLlama-7B"
9
 
10
+ # Load model and tokenizer
11
+ tokenizer = AutoTokenizer.from_pretrained(model_name)
12
  model = AutoModelForCausalLM.from_pretrained(
13
  model_name,
14
+ torch_dtype=torch.float16, # Use float16 for efficiency
15
+ device_map="auto" # Automatically use GPU if available
16
  )
17
 
 
18
 
19
  @app.route("/")
20
  def home():
21
  return request.url
22
 
23
+ @app.route("/generate", methods=["POST"])
24
  def generate_text():
25
  data = request.get_json()
26
  prompt = data.get("prompt", "")
 
28
  if not prompt:
29
  return jsonify({"error": "No prompt provided"}), 400
30
 
31
+ inputs = tokenizer(prompt, return_tensors="pt").to("cuda" if torch.cuda.is_available() else "cpu")
32
  outputs = model.generate(**inputs, max_length=200)
33
  response_text = tokenizer.decode(outputs[0], skip_special_tokens=True)
34