Spaces:
Build error
Build error
Commit
·
7592fb5
1
Parent(s):
3618983
Switched back to running on GPU
Browse files
app.py
CHANGED
|
@@ -6,8 +6,7 @@ import torch
|
|
| 6 |
@st.cache_resource
|
| 7 |
def load_model_and_tokenizer(model_name):
|
| 8 |
tokenizer = AutoTokenizer.from_pretrained(model_name)
|
| 9 |
-
|
| 10 |
-
model = AutoModelForCausalLM.from_pretrained(model_name, device_map="cpu", load_in_8bit=True)
|
| 11 |
return model, tokenizer
|
| 12 |
|
| 13 |
model_8b, tokenizer_8b = load_model_and_tokenizer("huggyllama/llama-3.1-8b")
|
|
@@ -19,15 +18,13 @@ def generate_text(model, tokenizer, prompt, max_length=100):
|
|
| 19 |
outputs = model.generate(**inputs, max_length=max_length, num_return_sequences=1)
|
| 20 |
return tokenizer.decode(outputs[0], skip_special_tokens=True)
|
| 21 |
|
| 22 |
-
st.title("LLaMA-3.1-8B vs LLaMA-3.1-8B-Instruct Comparison
|
| 23 |
|
| 24 |
prompt = st.text_area("Enter your prompt:", height=100)
|
| 25 |
max_length = st.slider("Max output length:", min_value=50, max_value=500, value=100)
|
| 26 |
|
| 27 |
if st.button("Generate"):
|
| 28 |
if prompt:
|
| 29 |
-
st.warning("Generation may take several minutes. Please be patient.")
|
| 30 |
-
|
| 31 |
col1, col2 = st.columns(2)
|
| 32 |
|
| 33 |
with col1:
|
|
|
|
| 6 |
@st.cache_resource
|
| 7 |
def load_model_and_tokenizer(model_name):
|
| 8 |
tokenizer = AutoTokenizer.from_pretrained(model_name)
|
| 9 |
+
model = AutoModelForCausalLM.from_pretrained(model_name)
|
|
|
|
| 10 |
return model, tokenizer
|
| 11 |
|
| 12 |
model_8b, tokenizer_8b = load_model_and_tokenizer("huggyllama/llama-3.1-8b")
|
|
|
|
| 18 |
outputs = model.generate(**inputs, max_length=max_length, num_return_sequences=1)
|
| 19 |
return tokenizer.decode(outputs[0], skip_special_tokens=True)
|
| 20 |
|
| 21 |
+
st.title("LLaMA-3.1-8B vs LLaMA-3.1-8B-Instruct Comparison")
|
| 22 |
|
| 23 |
prompt = st.text_area("Enter your prompt:", height=100)
|
| 24 |
max_length = st.slider("Max output length:", min_value=50, max_value=500, value=100)
|
| 25 |
|
| 26 |
if st.button("Generate"):
|
| 27 |
if prompt:
|
|
|
|
|
|
|
| 28 |
col1, col2 = st.columns(2)
|
| 29 |
|
| 30 |
with col1:
|