nisten
/

bigdoc-c34b-python-v1

Model card Files Files and versions

nisten committed on Aug 27, 2023

Commit

ae5ecc1

·

1 Parent(s): f63c8cd

Update README.md

Files changed (1) hide show

README.md +6 -6

README.md CHANGED Viewed

@@ -2,7 +2,8 @@
 library_name: peft
 license: mit
 ---
-## Training procedure (only 2000/5000 complete)
 The following `bitsandbytes` quantization config was used during training:
@@ -37,14 +38,14 @@ import torch
 from peft import PeftModel
 from transformers import AutoModelForCausalLM, AutoTokenizer, LlamaTokenizer, StoppingCriteria, StoppingCriteriaList, TextIteratorStreamer
-model_name = "TheBloke/CodeLlama-34B-Python-fp16"
 adapters_name = 'nisten/bigdoc-c34b-python-v1'
 print(f"Starting to load the model {model_name} into memory")
 m = AutoModelForCausalLM.from_pretrained(
     model_name,
-    load_in_4bit=True, #19GB in 4bit, 38GB with load_in_8bit, 67GB in full f16 if you just delete this line
     torch_dtype=torch.bfloat16,
     device_map={"": 0}
 )
@@ -62,12 +63,11 @@ print(f"Successfully loaded the model {model_name} into memory")
 ```
-### And now for the UI
 ```
-# Setup the gradio Demo.
 import datetime
 import os
 from threading import Event, Thread

 library_name: peft
 license: mit
 ---
+## Training (only 2000/5000 complete)
 The following `bitsandbytes` quantization config was used during training:
 from peft import PeftModel
 from transformers import AutoModelForCausalLM, AutoTokenizer, LlamaTokenizer, StoppingCriteria, StoppingCriteriaList, TextIteratorStreamer
+model_name = "TheBloke/CodeLlama-34B-Instruct-fp16"
 adapters_name = 'nisten/bigdoc-c34b-python-v1'
 print(f"Starting to load the model {model_name} into memory")
 m = AutoModelForCausalLM.from_pretrained(
     model_name,
+    # load_in_4bit=True,  # uncomment for 4-bit (19GB); load_in_8bit needs 38GB; full 16-bit, as loaded now, needs 67GB
     torch_dtype=torch.bfloat16,
     device_map={"": 0}
 )
 ```
+### The Gradio UI
 ```
+# Should all work in one click
 import datetime
 import os
 from threading import Event, Thread