Ellight
/

gemma-2b-bnb-4bit

Text Generation

text-generation-inference

Model card Files and versions

Ellight committed on May 7, 2024

Commit

41d1dbb

·

verified ·

1 Parent(s): 9361b08

Update README.md

Files changed (1) hide show

README.md +4 -2

README.md CHANGED Viewed

@@ -36,18 +36,20 @@ model, tokenizer = FastLanguageModel.from_pretrained(
 )
 FastLanguageModel.for_inference(model) # Enable native 2x faster inference
-alpaca_prompt = """
 ### Instruction:
 {}
 ### Response:
 {}"""
 inputs = tokenizer(
 [
-    alpaca_prompt.format(
         "शतरंज बोर्ड पर कितने वर्ग होते हैं?", # instruction
         "", # output - leave this blank for generation!
     )
 ], return_tensors = "pt").to("cuda")
 outputs = model.generate(**inputs, max_new_tokens = 64, use_cache = True)

 )
 FastLanguageModel.for_inference(model) # Enable native 2x faster inference
+prompt = """
 ### Instruction:
 {}
 ### Response:
 {}"""
 inputs = tokenizer(
 [
+    prompt.format(
         "शतरंज बोर्ड पर कितने वर्ग होते हैं?", # instruction
         "", # output - leave this blank for generation!
     )
 ], return_tensors = "pt").to("cuda")
 outputs = model.generate(**inputs, max_new_tokens = 64, use_cache = True)