Upload app.py
Browse files
app.py
CHANGED
|
@@ -40,13 +40,13 @@ def load_model():
|
|
| 40 |
vocab_size = 50257
|
| 41 |
|
| 42 |
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
|
| 43 |
-
model = SmolLM(vocab_size, embed_dim, num_heads, num_layers, max_seq_len).to(device)
|
| 44 |
|
| 45 |
-
model.load_state_dict(torch.load(checkpoint_path, map_location=torch.device('cpu')))
|
| 46 |
-
|
| 47 |
-
|
| 48 |
-
|
| 49 |
-
|
| 50 |
model.to(device)
|
| 51 |
model.eval() # Set to evaluation mode
|
| 52 |
|
|
|
|
| 40 |
vocab_size = 50257
|
| 41 |
|
| 42 |
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
|
| 43 |
+
#model = SmolLM(vocab_size, embed_dim, num_heads, num_layers, max_seq_len).to(device)
|
| 44 |
|
| 45 |
+
#model.load_state_dict(torch.load(checkpoint_path, map_location=torch.device('cpu')))
|
| 46 |
+
checkpoint = torch.load(checkpoint_path, map_location=device)
|
| 47 |
+
config = checkpoint['config']
|
| 48 |
+
model = SmolLM(vocab_size, embed_dim, num_heads, num_layers, max_seq_len)
|
| 49 |
+
model.load_state_dict(checkpoint['model_state_dict'])
|
| 50 |
model.to(device)
|
| 51 |
model.eval() # Set to evaluation mode
|
| 52 |
|