AddieFoote committed on
Commit
16766ba
·
1 Parent(s): d7848e5

bfloat and less tokens

Browse files
Files changed (1) hide show
  1. app.py +3 -2
app.py CHANGED
@@ -1,13 +1,14 @@
1
  import gradio as gr
2
  from transformers import AutoModelForCausalLM, AutoTokenizer
 
3
 
4
  model_name = "AddieFoote0/arithmetic-300M-reference"
5
- model = AutoModelForCausalLM.from_pretrained(model_name)
6
  tokenizer = AutoTokenizer.from_pretrained(model_name)
7
 
8
  def generate_response(prompt):
9
  inputs = tokenizer(prompt, return_tensors="pt")
10
- outputs = model.generate(**inputs, max_new_tokens=50, temperature=0.7)
11
  return tokenizer.decode(outputs[0], skip_special_tokens=True)
12
 
13
  iface = gr.Interface(
 
1
  import gradio as gr
2
  from transformers import AutoModelForCausalLM, AutoTokenizer
3
+ import torch
4
 
5
  model_name = "AddieFoote0/arithmetic-300M-reference"
6
+ model = AutoModelForCausalLM.from_pretrained(model_name, torch_dtype=torch.bfloat16)
7
  tokenizer = AutoTokenizer.from_pretrained(model_name)
8
 
9
  def generate_response(prompt):
10
  inputs = tokenizer(prompt, return_tensors="pt")
11
+ outputs = model.generate(**inputs, max_new_tokens=20, temperature=1.0)
12
  return tokenizer.decode(outputs[0], skip_special_tokens=True)
13
 
14
  iface = gr.Interface(