bigcode
/

astraios-1b-lora

terryyz committed on Dec 18, 2023

Commit

e3a45fb

1 Parent(s): 78e607a

Upload README.md with huggingface_hub

Files changed (1) hide show

README.md CHANGED Viewed

@@ -1,3 +1,4 @@
 ---
 license: bigcode-openrail-m
 datasets:
@@ -86,7 +87,9 @@ tags:
 ## Intended use
-The model follows instructions provided in the input. You should always preface your input with "Question: " and finish it with "Answer:", for example: "Question: Please write a function in Python that performs bubble sort.\n\nAnswer:"
 **Feel free to share your generations in the Community tab!**
@@ -97,7 +100,7 @@ The model follows instructions provided in the input. You should always preface
 from peft import PeftModel
 from transformers import AutoModelForCausalLM, AutoTokenizer
-peft_checkpoint = "bigcode/astraios-1b-lora"
 checkpoint = "bigcode/starcoderbase-1b"
 model = AutoModelForCausalLM.from_pretrained(checkpoint)
 model = PeftModel.from_pretrained(model, peft_checkpoint)
@@ -106,7 +109,9 @@ device = "cuda" # for GPU usage or "cpu" for CPU usage
 tokenizer = AutoTokenizer.from_pretrained(checkpoint)
 model = AutoModelForCausalLM.from_pretrained(checkpoint).to(device)
-inputs = tokenizer.encode("Question: Please write a function in Python that performs bubble sort.\n\nAnswer:", return_tensors="pt").to(device)
 outputs = model.generate(inputs)
 print(tokenizer.decode(outputs[0]))
 ```
@@ -135,4 +140,4 @@ print(tokenizer.decode(outputs[0]))
 # Citation
 ```bibtex
-```

 ---
 license: bigcode-openrail-m
 datasets:
 ## Intended use
+The model follows instructions provided in the input. You should always preface your input with "Question: " and finish it with "Answer:", for example: "Question: Please write a function in Python that performs bubble sort.\n\nAnswer:"
 **Feel free to share your generations in the Community tab!**
 from peft import PeftModel
 from transformers import AutoModelForCausalLM, AutoTokenizer
+peft_checkpoint = "bigcode/astraios-1b-lora"
 checkpoint = "bigcode/starcoderbase-1b"
 model = AutoModelForCausalLM.from_pretrained(checkpoint)
 model = PeftModel.from_pretrained(model, peft_checkpoint)
 tokenizer = AutoTokenizer.from_pretrained(checkpoint)
 model = AutoModelForCausalLM.from_pretrained(checkpoint).to(device)
+inputs = tokenizer.encode("Question: Please write a function in Python that performs bubble sort.\n\nAnswer:", return_tensors="pt").to(device)
 outputs = model.generate(inputs)
 print(tokenizer.decode(outputs[0]))
 ```
 # Citation
 ```bibtex
+```