varshithkumar committed on
Commit
92e762c
·
1 Parent(s): 6964968

Added app.py and requirements.txt

Browse files
Files changed (1) hide show
  1. app.py +5 -4
app.py CHANGED
@@ -19,11 +19,12 @@ print("Using device:", device)
19
  print("Loading base model...")
20
  base_model = AutoModelForCausalLM.from_pretrained(
21
  BASE_MODEL,
22
- device_map=None,
 
 
23
  low_cpu_mem_usage=True,
24
- torch_dtype=torch.float16 if device == "cuda" else torch.float32,
25
- token=HF_TOKEN
26
- ).to(device)
27
 
28
  print("Loading tokenizer...")
29
  tokenizer = AutoTokenizer.from_pretrained(
 
19
  print("Loading base model...")
20
  base_model = AutoModelForCausalLM.from_pretrained(
21
  BASE_MODEL,
22
+ device_map="auto",
23
+ load_in_8bit=True,
24
+ torch_dtype=torch.float16,
25
  low_cpu_mem_usage=True,
26
+ use_auth_token=HF_TOKEN
27
+ )
 
28
 
29
  print("Loading tokenizer...")
30
  tokenizer = AutoTokenizer.from_pretrained(