Spaces:

satyanayak
/

transformer-basic

Build error

satyanayak committed on Jan 15, 2025

Commit

852e307

1 Parent(s): 2bb12cf

model source file name changed

Files changed (3) hide show

app.py CHANGED Viewed

@@ -3,7 +3,7 @@ import torch
 import torch.nn.functional as F
 import tiktoken
 from huggingface_hub import hf_hub_download
-from transformer-basic import GPT, GPTConfig  # Import your model class
 # Load the model from Hugging Face Hub
 device = 'cuda' if torch.cuda.is_available() else 'cpu'

 import torch.nn.functional as F
 import tiktoken
 from huggingface_hub import hf_hub_download
+from transformer import GPT, GPTConfig  # Import your model class
 # Load the model from Hugging Face Hub
 device = 'cuda' if torch.cuda.is_available() else 'cpu'

input.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

transformer-basic.py → transformer.py RENAMED Viewed

@@ -269,7 +269,7 @@ best_loss = float('inf')
 step = 0
 losses = []  # Keep track of losses for monitoring
 last_time = time.time()
-interval = 10  # Print every 10 steps
 while step < total_steps and best_loss > 0.099999:
     x, y = train_loader.next_batch()
@@ -317,8 +317,6 @@ print(f'Average of last 100 losses: {sum(losses[-100:]) / min(len(losses), 100):
 save_path = 'trained_model.pt'
 torch.save({
     'model_state_dict': model.state_dict(),
-    'optimizer_state_dict': optimizer.state_dict(),
-    'scheduler_state_dict': scheduler.state_dict(),
     'best_loss': best_loss,
     'config': model.config,
 }, save_path)

 step = 0
 losses = []  # Keep track of losses for monitoring
 last_time = time.time()
+interval = 2  # Print every 10 steps
 while step < total_steps and best_loss > 0.099999:
     x, y = train_loader.next_batch()
 save_path = 'trained_model.pt'
 torch.save({
     'model_state_dict': model.state_dict(),
     'best_loss': best_loss,
     'config': model.config,
 }, save_path)