Monimoy committed on
Commit
94b45bd
·
verified ·
1 Parent(s): 98fafc0

Upload app.py

Browse files
Files changed (1) hide show
  1. app.py +6 -6
app.py CHANGED
@@ -40,13 +40,13 @@ def load_model():
40
  vocab_size = 50257
41
 
42
  device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
43
- model = SmolLM(vocab_size, embed_dim, num_heads, num_layers, max_seq_len).to(device)
44
 
45
- model.load_state_dict(torch.load(checkpoint_path, map_location=torch.device('cpu')))
46
- #checkpoint = torch.load(checkpoint_path, map_location=device)
47
- #config = checkpoint['config']
48
- #model = GPT(config)
49
- #model.load_state_dict(checkpoint['model_state_dict'])
50
  model.to(device)
51
  model.eval() # Set to evaluation mode
52
 
 
40
  vocab_size = 50257
41
 
42
  device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
43
+ #model = SmolLM(vocab_size, embed_dim, num_heads, num_layers, max_seq_len).to(device)
44
 
45
+ #model.load_state_dict(torch.load(checkpoint_path, map_location=torch.device('cpu')))
46
+ checkpoint = torch.load(checkpoint_path, map_location=device)
47
+ config = checkpoint['config']
48
+ model = SmolLM(vocab_size, embed_dim, num_heads, num_layers, max_seq_len)
49
+ model.load_state_dict(checkpoint['model_state_dict'])
50
  model.to(device)
51
  model.eval() # Set to evaluation mode
52