PyaeSoneK committed on
Commit
5ed70b1
·
1 Parent(s): 9042ed9

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +7 -6
app.py CHANGED
@@ -6,20 +6,21 @@ from transformers import AutoModel
6
  import torch
7
  import transformers
8
  from transformers import AutoTokenizer, AutoModelForCausalLM
 
9
 
10
  # App framework
11
  st.title('🦜Seon\'s Legal QA For Dummies 🔗 ')
12
 
13
-
14
-
15
- offload_folder = 'C:\model_weights'
16
-
17
- model = AutoModelForCausalLM.from_pretrained("PyaeSoneK/LlamaV2LegalFineTuned",
18
  device_map='auto',
19
  torch_dtype=torch.float16,
20
  use_auth_token= st.secrets['hf_access_token'],
21
- offload_folder=offload_folder,
22
  )
 
 
 
 
23
  # load_in_4bit=True
24
 
25
  tokenizer = AutoTokenizer.from_pretrained("PyaeSoneK/LlamaV2LegalFineTuned",
 
6
  import torch
7
  import transformers
8
  from transformers import AutoTokenizer, AutoModelForCausalLM
9
+ from accelerate import init_empty_weights, load_checkpoint_and_dispatch
10
 
11
  # App framework
12
  st.title('🦜Seon\'s Legal QA For Dummies 🔗 ')
13
 
14
+ with init_empty_weights():
15
+ model = AutoModelForCausalLM.from_pretrained("PyaeSoneK/LlamaV2LegalFineTuned",
 
 
 
16
  device_map='auto',
17
  torch_dtype=torch.float16,
18
  use_auth_token= st.secrets['hf_access_token'],
 
19
  )
20
+
21
+ model = load_checkpoint_and_dispatch(
22
+ model, checkpoint=checkpoint_file, device_map="auto"
23
+ )
24
  # load_in_4bit=True
25
 
26
  tokenizer = AutoTokenizer.from_pretrained("PyaeSoneK/LlamaV2LegalFineTuned",