Javedalam committed on
Commit
8af4634
·
verified ·
1 Parent(s): dab0a34

Create Zapp.py

Browse files
Files changed (1) hide show
  1. Zapp.py +23 -0
Zapp.py ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import gradio as gr
2
+ from transformers import AutoModelForCausalLM, AutoTokenizer
3
+
4
# Hugging Face Hub repository id of the checkpoint this app serves.
model_id = "EssentialAI/rnj-1-instruct"

# Both objects are created once at import time and shared by every request.
tokenizer = AutoTokenizer.from_pretrained(model_id)
# "auto" lets the library pick the dtype and the device placement.
model = AutoModelForCausalLM.from_pretrained(model_id, torch_dtype="auto", device_map="auto")
11
+
12
def chat(prompt):
    """Generate text for ``prompt`` using the module-level tokenizer and model.

    Args:
        prompt: Text supplied by the user; it is tokenized as-is.

    Returns:
        The first generated sequence decoded to a string, with special
        tokens removed.
    """
    # NOTE(review): the prompt is tokenized raw, without any chat template.
    # Confirm that is intended for an "instruct" checkpoint.
    #
    # The model is loaded with device_map="auto", so it may live on an
    # accelerator. Move the encoded inputs to the model's device so that
    # generate() does not fail with a device mismatch.
    inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
    output = model.generate(
        **inputs,
        max_new_tokens=4096,  # long output
        # Greedy decoding. The former temperature=0.2 argument was removed:
        # it has no effect when do_sample=False and only triggers a warning.
        do_sample=False,
    )
    # NOTE(review): output[0] presumably contains the prompt tokens followed
    # by the newly generated ones, so the returned text echoes the prompt.
    # Confirm whether the echo is wanted in the UI.
    return tokenizer.decode(output[0], skip_special_tokens=True)
21
+
22
# Minimal Gradio UI: one text input routed through chat(), one text output.
iface = gr.Interface(
    fn=chat,
    inputs="text",
    outputs="text",
)
# Start serving the interface as soon as the module is executed.
iface.launch()