k23064919 commited on
Commit
7316afe
·
2 Parent(s): e7b127b20050ad

checkpoint

Browse files
Files changed (1) hide show
  1. trainingModel/run_training.py +30 -6
trainingModel/run_training.py CHANGED
@@ -1,15 +1,18 @@
1
  import os
2
  import numpy as np
3
-
4
  from clearml import Task, Dataset
5
  from datasets import load_dataset
6
- from dataPrep.helpers.transforms_loaders import make_dataset_loaders
7
 
8
- import torch
9
- from models.modelOne import modelOne
10
- from trainingModel.Training import train_model
 
11
 
 
 
 
12
 
 
13
  # -------------- Load Data --------------
14
 
15
  all_tasks = Task.get_tasks(project_name="Small Group Project")
@@ -25,6 +28,12 @@ latest_task = max(dp_tasks, key=lambda t: t.id)
25
  DYNAMIC_TASK_ID = latest_task.id
26
  DATA_PREP = Task.get_task(task_id=DYNAMIC_TASK_ID)
27
 
 
 
 
 
 
 
28
  # Dataset ID
29
  config_objects = DATA_PREP.get_configuration_objects()
30
  raw_meta = config_objects["Dataset Metadata"]
@@ -34,7 +43,12 @@ dataset_id = raw_meta.split("=")[1].strip().replace('"', "")
34
  subset_clearml = Dataset.get(dataset_id=dataset_id)
35
  local_folder = subset_clearml.get_local_copy()
36
 
 
37
  subset_indices = np.load(os.path.join(local_folder, "subset_indices.npy"))
 
 
 
 
38
 
39
  # Load Dataset Parameters
40
  data_params = DATA_PREP.get_parameters()
@@ -116,8 +130,15 @@ device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
116
 
117
  # ------- Train the model (on subset for now) -------
118
 
 
119
  print("\n--- Starting Model Training on Subset ---")
120
  training_metrics = train_model(
 
 
 
 
 
 
121
  model=model,
122
  train_loader=subset_loaders['train'],
123
  val_loader=subset_loaders['val'],
@@ -126,6 +147,7 @@ training_metrics = train_model(
126
  lr=training_config["learning_rate"],
127
  save_path=training_config["save_path"],
128
  )
 
129
 
130
 
131
  # ----------- Log metrics to ClearML -----------
@@ -146,4 +168,6 @@ training_logger.report_single_value("best_val_accuracy", training_metrics["best_
146
  training_task.upload_artifact("best_model", training_config["save_path"])
147
 
148
  print("\nTraining complete.")
149
- training_task.close()
 
 
 
1
  import os
2
  import numpy as np
 
3
  from clearml import Task, Dataset
4
  from datasets import load_dataset
 
5
 
6
+ # Latest Data Prep Task
7
+ all_tasks = Task.get_tasks(project_name="Small Group Project")
8
+ if not all_tasks:
9
+ raise RuntimeError("No tasks found in project 'Small Group Project'")
10
 
11
+ dp_tasks = [t for t in all_tasks if t.name == "Data Preparation"]
12
+ if not dp_tasks:
13
+ raise RuntimeError("No 'Data Preparation' tasks found in this project!")
14
 
15
+ <<<<<<< HEAD
16
  # -------------- Load Data --------------
17
 
18
  all_tasks = Task.get_tasks(project_name="Small Group Project")
 
28
  DYNAMIC_TASK_ID = latest_task.id
29
  DATA_PREP = Task.get_task(task_id=DYNAMIC_TASK_ID)
30
 
31
+ =======
32
+ latest_task = max(dp_tasks, key=lambda t: t.id)
33
+ DYNAMIC_TASK_ID = latest_task.id
34
+ DATA_PREP = Task.get_task(task_id=DYNAMIC_TASK_ID)
35
+
36
+ >>>>>>> 20050ad82ebca27a376e15837a7abf79fca23e98
37
  # Dataset ID
38
  config_objects = DATA_PREP.get_configuration_objects()
39
  raw_meta = config_objects["Dataset Metadata"]
 
43
  subset_clearml = Dataset.get(dataset_id=dataset_id)
44
  local_folder = subset_clearml.get_local_copy()
45
 
46
+ <<<<<<< HEAD
47
  subset_indices = np.load(os.path.join(local_folder, "subset_indices.npy"))
48
+ =======
49
+ subset_indices_path = os.path.join(local_folder, "subset_indices.npy")
50
+ subset_indices = np.load(subset_indices_path)
51
+ >>>>>>> 20050ad82ebca27a376e15837a7abf79fca23e98
52
 
53
  # Load Dataset Parameters
54
  data_params = DATA_PREP.get_parameters()
 
130
 
131
  # ------- Train the model (on subset for now) -------
132
 
133
+ <<<<<<< HEAD
134
  print("\n--- Starting Model Training on Subset ---")
135
  training_metrics = train_model(
136
+ =======
137
+ #When calling this function, the model should be trained on the given dataset
138
+
139
+ print("\n--- Starting Model Training on Subset ---")
140
+ train_model(
141
+ >>>>>>> 20050ad82ebca27a376e15837a7abf79fca23e98
142
  model=model,
143
  train_loader=subset_loaders['train'],
144
  val_loader=subset_loaders['val'],
 
147
  lr=training_config["learning_rate"],
148
  save_path=training_config["save_path"],
149
  )
150
+ <<<<<<< HEAD
151
 
152
 
153
  # ----------- Log metrics to ClearML -----------
 
168
  training_task.upload_artifact("best_model", training_config["save_path"])
169
 
170
  print("\nTraining complete.")
171
+ training_task.close()
172
+ =======
173
+ >>>>>>> 20050ad82ebca27a376e15837a7abf79fca23e98