Update train.py
Browse files
train.py
CHANGED
|
@@ -12,6 +12,7 @@ from util import generate_text
|
|
| 12 |
# Configuration Parameters
|
| 13 |
# ============================
|
| 14 |
dataset_path = 'flpelerin/tinystories-100k'
|
|
|
|
| 15 |
|
| 16 |
num_epochs = 1
|
| 17 |
batch_size = 4
|
|
@@ -102,9 +103,18 @@ print(f"Model has {parameters_count:,} parameters")
|
|
| 102 |
# ============================
|
| 103 |
|
| 104 |
## TODO: Add naming of the run, from: "[MODEL_NAME]-[RANDOM_HEX]" (like: mingru-a14b)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 105 |
# Credentials must not live in source control: with no explicit key,
# wandb resolves it from the WANDB_API_KEY environment variable or a
# previously stored login.
wandb.login()
|
| 106 |
wandb.init(
|
| 107 |
-
project="minGRU-Training",
|
|
|
|
| 108 |
config={
|
| 109 |
"dataset_path": dataset_path,
|
| 110 |
|
|
|
|
| 12 |
# Configuration Parameters
|
| 13 |
# ============================
|
| 14 |
dataset_path = 'flpelerin/tinystories-100k'
|
| 15 |
+
run_name = generate_name()
|
| 16 |
|
| 17 |
num_epochs = 1
|
| 18 |
batch_size = 4
|
|
|
|
| 103 |
# ============================
|
| 104 |
|
| 105 |
## Run naming: "[MODEL_NAME]-[RANDOM_HEX]" (like: mingru-a14b)
|
| 106 |
+
|
| 107 |
+
def generate_name(prefix="mingru"):
    """Build a run name of the form "<prefix>-<4 hex digits>", e.g. "mingru-a14b".

    Args:
        prefix: Text placed before the dash; defaults to "mingru".

    Returns:
        The prefix, a dash, and four lowercase hexadecimal digits.
    """
    # Imported locally so the helper does not depend on the module's imports.
    import secrets

    # token_hex(2) yields exactly four hex digits from the OS entropy source,
    # so the suffix is unaffected by any seeding of the global `random`
    # generator and repeated runs still get distinct names.
    return f"{prefix}-{secrets.token_hex(2)}"
|
| 113 |
+
|
| 114 |
# Credentials must not live in source control: with no explicit key,
# wandb resolves it from the WANDB_API_KEY environment variable or a
# previously stored login.
wandb.login()
|
| 115 |
wandb.init(
|
| 116 |
+
project="minGRU-Training",
|
| 117 |
+
name=run_name,
|
| 118 |
config={
|
| 119 |
"dataset_path": dataset_path,
|
| 120 |
|