DMID23 commited on
Commit
b34953c
·
verified ·
1 Parent(s): 9a8f367

Create app.py

Browse files
Files changed (1) hide show
  1. app.py +62 -0
app.py ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import gradio as gr
2
+ from transformers import AutoModelForCausalLM, AutoTokenizer, pipeline
3
+ import os
4
+ import subprocess
5
+ import torch
6
+
7
+ # ---------- STEP 1: Fine-tuned 모델 Git에서 clone ----------
8
+ repo_url = "https://github.com/yourusername/your-finetuned-model"
9
+ local_dir = "./finetuned_model"
10
+
11
+ if not os.path.exists(local_dir):
12
+ subprocess.run(["git", "clone", repo_url, local_dir])
13
+
14
+ # ---------- STEP 2: Tokenizer와 모델 로드 ----------
15
+ base_model = "mistralai/Mistral-7B-Instruct-v0.2"
16
+
17
+ tokenizer = AutoTokenizer.from_pretrained(base_model)
18
+
19
+ model = AutoModelForCausalLM.from_pretrained(
20
+ local_dir,
21
+ torch_dtype=torch.float32,
22
+ )
23
+ model = model.to("cpu")
24
+
25
+ pipe = pipeline("text-generation", model=model, tokenizer=tokenizer, device=-1)
26
+
27
+ # ---------- STEP 3: Gradio 함수 정의 ----------
28
+ def generate_response(prompt, max_length=256, temperature=0.7):
29
+ # max_length를 제한하여 속도를 빠르게 함
30
+ outputs = pipe(
31
+ prompt,
32
+ max_length=max_length,
33
+ temperature=temperature,
34
+ do_sample=True,
35
+ top_p=0.9,
36
+ num_return_sequences=1,
37
+ pad_token_id=tokenizer.eos_token_id,
38
+ )
39
+ return outputs[0]["generated_text"]
40
+
41
+ # ---------- STEP 4: Gradio UI ----------
42
+ with gr.Blocks() as demo:
43
+ gr.Markdown("# 🚀 Fine-tuned Mistral-7B (CPU Optimized)")
44
+
45
+ with gr.Row():
46
+ prompt_input = gr.Textbox(label="Input Prompt", placeholder="Type your prompt here...", lines=4)
47
+
48
+ with gr.Row():
49
+ max_len_slider = gr.Slider(64, 512, value=256, step=16, label="Max Length (lower = faster)")
50
+ temp_slider = gr.Slider(0.1, 1.5, value=0.7, step=0.1, label="Temperature")
51
+
52
+ generate_button = gr.Button("Generate")
53
+ output_box = gr.Textbox(label="Generated Output", lines=10)
54
+
55
+ generate_button.click(
56
+ fn=generate_response,
57
+ inputs=[prompt_input, max_len_slider, temp_slider],
58
+ outputs=output_box,
59
+ )
60
+
61
+ # ---------- STEP 5: Launch ----------
62
+ demo.launch()