Spaces:

Kush1
/

LLAMA-2

Runtime error

Kush1 committed on Oct 3, 2023

Commit

c2b376f

1 Parent(s): d1edbc7

Changes in app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -13,17 +13,18 @@ model = "meta-llama/Llama-2-13b-chat-hf"
 #Not Working
 #tokenizer = AutoTokenizer.from_pretrained(model)
-pipeline = transformers.pipeline(
-    "text-generation",
-    model=model,
-    torch_dtype=torch.float32,
-    device_map="auto",
-    do_sample=True,
-    token=HF_TOKEN,
-)
-def get_llama_response(prompt):
     sequences = pipeline(
         prompt,
@@ -33,8 +34,10 @@ def get_llama_response(prompt):
         max_length=256,
     )
     print(sequences[0]['generated_text'])
 #prompt="Can you help me to write rest api endpoints in python ?"
-response = get_llama_response(prompt)
 st.write('Answer: ',response)

 #Not Working
 #tokenizer = AutoTokenizer.from_pretrained(model)
+def load_model(model):
+    pipeline = transformers.pipeline(
+        "text-generation",
+        model=model,
+        torch_dtype=torch.float32,
+        device_map="auto",
+        do_sample=True,
+        token=HF_TOKEN,
+    )
+    return pipeline
+def get_llama_response(pipeline,prompt):
     sequences = pipeline(
         prompt,
         max_length=256,
     )
     print(sequences[0]['generated_text'])
+pipeline = AutoTokenizer.from_pretrained(model)
 #prompt="Can you help me to write rest api endpoints in python ?"
+response = get_llama_response(pipeline,prompt)
 st.write('Answer: ',response)