edwjin committed
Commit 5ad679c · verified · 1 Parent(s): 28aad06

Update constants.py

Files changed (1)
  1. constants.py +3 -3
constants.py CHANGED
@@ -4,8 +4,8 @@ seed = 42
 """ Hyperparameters to use for training to roughly match
 the numbers mentioned in the assignment description """
 batch_size = 16 # Number of independent sequences we will process in parallel
-block_size = 128 # Maximum context length for predictions
-learning_rate = 1e-4 # Learning rate for the optimizer , OG: 1e-3
+block_size = max([16,32,48,64,80]) # Maximum context length for predictions
+learning_rate = 1e-3 # Learning rate for the optimizer , OG: 1e-3
 n_embd = 512 # Embedding dimension
 n_head = 8 # Number of attention heads
 n_layer = 6 # Number of transformer encoder layers
@@ -18,4 +18,4 @@ feed_forward = 2048
 n_input = 512 # Input size for the classifier, should match the embedding size of the transformer
 n_hidden = 100 # Hidden size for the classifier
 n_output = 46 # Output size for the classifier, we have 46 presidents
-epochs_CLS = 5 # epochs for classifier training
+epochs_CLS = 7 # epochs for classifier training
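
For context (not part of the commit): the constants above read like the config for a small transformer encoder with an MLP classifier head on top. The sketch below is a hedged assumption about how constants.py might be consumed; the class name SpeechClassifier, the mean-pooling readout, the placeholder vocab size, and the Adam optimizer are illustrative choices, not code from this repo. Only the hyperparameter values come from constants.py.

# Hypothetical usage sketch, assuming a standard PyTorch encoder + classifier head.
import torch
import torch.nn as nn

import constants  # the file changed in this commit


class SpeechClassifier(nn.Module):
    """Assumed encoder + MLP head sized from constants.py (names are illustrative)."""

    def __init__(self, vocab_size: int):
        super().__init__()
        self.token_emb = nn.Embedding(vocab_size, constants.n_embd)           # 512-dim token embeddings
        self.pos_emb = nn.Embedding(constants.block_size, constants.n_embd)   # one embedding per position
        layer = nn.TransformerEncoderLayer(
            d_model=constants.n_embd,                # 512
            nhead=constants.n_head,                  # 8 attention heads
            dim_feedforward=constants.feed_forward,  # 2048
            batch_first=True,
        )
        self.encoder = nn.TransformerEncoder(layer, num_layers=constants.n_layer)  # 6 layers
        self.head = nn.Sequential(
            nn.Linear(constants.n_input, constants.n_hidden),   # 512 -> 100
            nn.ReLU(),
            nn.Linear(constants.n_hidden, constants.n_output),  # 100 -> 46 presidents
        )

    def forward(self, idx: torch.Tensor) -> torch.Tensor:
        # idx: (batch, seq_len) token ids, with seq_len <= constants.block_size
        pos = torch.arange(idx.size(1), device=idx.device)
        x = self.token_emb(idx) + self.pos_emb(pos)
        x = self.encoder(x)          # (batch, seq_len, n_embd)
        x = x.mean(dim=1)            # mean-pool over the sequence
        return self.head(x)          # (batch, n_output) logits


if __name__ == "__main__":
    torch.manual_seed(constants.seed)
    model = SpeechClassifier(vocab_size=10_000)  # vocab size is a placeholder
    optimizer = torch.optim.Adam(model.parameters(), lr=constants.learning_rate)  # 1e-3 after this commit
    dummy = torch.randint(0, 10_000, (constants.batch_size, constants.block_size))
    print(model(dummy).shape)  # torch.Size([16, 46])

After this commit, block_size resolves to max([16, 32, 48, 64, 80]) = 80, so positional embeddings are sized for the largest context length in that list; learning_rate moves from 1e-4 to 1e-3, and the classifier trains for 7 epochs instead of 5.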