HackWeasel committed on
Commit
3e2e5dc
·
verified ·
1 Parent(s): f833dd1

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +64 -0
README.md CHANGED
@@ -24,6 +24,70 @@ Ask questions about movies which have been rated on IMDB
24
 
25
  Use the code below to get started with the model.
26
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
27
  ### Training Data
28
 
29
  mteb/imdb/tree/main/test.jsonl
 
24
 
25
  Use the code below to get started with the model.
26
 
27
+ ```python
28
# --- Setup: load the tokenizer, the 4-bit base model, and the LoRA adapter ---
from peft import PeftModel
from transformers import AutoModelForCausalLM, AutoTokenizer
import torch

# Run on the GPU when one is available, otherwise fall back to the CPU.
device = "cuda" if torch.cuda.is_available() else "cpu"

BASE_MODEL_ID = "unsloth/llama-3.2-1b-instruct-bnb-4bit"
ADAPTER_ID = "HackWeasel/llama-3.2-1b-QLORA-IMDB"

print("Loading models...")
tokenizer = AutoTokenizer.from_pretrained(BASE_MODEL_ID)
foundation = AutoModelForCausalLM.from_pretrained(BASE_MODEL_ID).to(device)
# Attach the QLoRA adapter weights on top of the (frozen) base model.
model = PeftModel.from_pretrained(foundation, ADAPTER_ID).to(device)
model.eval()  # inference mode: disables dropout etc.
print("Models loaded!")
42
+
43
def generate_response(prompt, max_length=4096, temperature=0.7):
    """Generate a completion for *prompt* with the fine-tuned model.

    Args:
        prompt: Text fed to the model verbatim.
        max_length: Upper bound on the total token count (prompt + completion).
        temperature: Sampling temperature; higher values give more varied output.

    Returns:
        The full decoded sequence (the prompt is echoed back), with special
        tokens stripped.
    """
    # Inference only — no gradients needed.
    with torch.no_grad():
        encoded = tokenizer(prompt, return_tensors="pt").to(device)  # Move inputs to GPU
        generated = model.generate(
            **encoded,
            max_length=max_length,
            temperature=temperature,
            do_sample=True,  # sample (rather than greedy decode) so temperature has effect
            pad_token_id=tokenizer.eos_token_id,
        )
        return tokenizer.decode(generated[0], skip_special_tokens=True)
54
+
55
def main():
    """Interactive chat loop: read user input, generate a reply, repeat until 'quit'."""
    conversation_history = ""
    print("\nWelcome! Start chatting with the model (type 'quit' to exit)")

    while True:
        user_input = input("\nYou: ").strip()
        if user_input.lower() == 'quit':
            print("Goodbye!")
            break

        # Fold prior turns into the prompt so the model sees the whole dialogue.
        prefix = f"{conversation_history}\n" if conversation_history else ""
        full_prompt = f"{prefix}Human: {user_input}\nAssistant:"

        try:
            response = generate_response(full_prompt)

            # The model echoes the prompt; keep only the text after the last
            # "Assistant:" marker — that is the newly generated reply.
            new_response = response.split("Assistant:")[-1].strip()

            # Remember this exchange for the next turn.
            conversation_history = f"{conversation_history}\nHuman: {user_input}\nAssistant: {new_response}"

            print("\nAssistant:", new_response)
        except Exception as e:  # best-effort: keep the chat session alive on any failure
            print(f"An error occurred: {e}")
            print("Continuing conversation...")


if __name__ == "__main__":
    main()
89
+ ```
90
+
91
  ### Training Data
92
 
93
  mteb/imdb/tree/main/test.jsonl