Changing model datatype to int8
Browse files
app.py
CHANGED
|
@@ -1,9 +1,10 @@
|
|
| 1 |
import gradio as gr
|
| 2 |
import time
|
| 3 |
from transformers import pipeline
|
|
|
|
| 4 |
|
| 5 |
# Load the TinyLlama text generation pipeline
|
| 6 |
-
pipe = pipeline("text-generation", model="TinyLlama/TinyLlama-1.1B-Chat-v1.0")
|
| 7 |
|
| 8 |
# Define the inference function
|
| 9 |
def generate_text(prompt):
|
|
|
|
import gradio as gr
import time
from transformers import pipeline
import torch

# Load the TinyLlama text-generation pipeline with reduced-precision weights
# to cut memory use.
#
# NOTE(review): the commit's original `torch_dtype=torch.int8` cannot work --
# transformers refuses to instantiate a model under a non-floating-point
# dtype and raises ValueError ("... is not a floating point dtype"). Real
# int8 inference needs a quantization backend instead, e.g.:
#     from transformers import BitsAndBytesConfig
#     pipeline(..., model_kwargs={"quantization_config":
#                                 BitsAndBytesConfig(load_in_8bit=True)})
# which requires the `bitsandbytes` package. float16 is used here as the
# dependency-free way to halve memory while keeping the model loadable.
pipe = pipeline(
    "text-generation",
    model="TinyLlama/TinyLlama-1.1B-Chat-v1.0",
    torch_dtype=torch.float16,
)
| 8 |
|
| 9 |
# Define the inference function
|
| 10 |
def generate_text(prompt):
|