Updates batch job configuration and model path
Browse files
Updates the batch job configuration file to use the 'amdgpu' partition and increases the time limit to 24 hours.
Changes the model save path to a new versioned directory. This ensures that the training process saves the model to the correct location.
- hoho_gpu_class.batch +2 -2
- train_pnet_class_cluster.py +1 -1
hoho_gpu_class.batch
CHANGED
|
@@ -3,10 +3,10 @@
|
|
| 3 |
#SBATCH --ntasks-per-node=1 # 1 tasks per node
|
| 4 |
#SBATCH --cpus-per-task=16 # 6 CPUS per task = 12 CPUS per node
|
| 5 |
#SBATCH --mem-per-cpu=10G # 8GB per CPU = 96GB per node
|
| 6 |
-
#SBATCH --time=
|
| 7 |
#SBATCH --error=hoho_gpu_class.err # standard error file
|
| 8 |
#SBATCH --output=hoho_gpu_class.out # standard output file
|
| 9 |
-
#SBATCH --partition=
|
| 10 |
#SBATCH --mail-user=skvrnjan@fel.cvut.cz # where send info about job
|
| 11 |
#SBATCH --mail-type=ALL # what to send, valid type values are NONE, BEGIN, END, FAIL, REQUEUE, ALL
|
| 12 |
#SBATCH --gres=gpu:1
|
|
|
|
| 3 |
#SBATCH --ntasks-per-node=1 # 1 tasks per node
|
| 4 |
#SBATCH --cpus-per-task=16 # 6 CPUS per task = 12 CPUS per node
|
| 5 |
#SBATCH --mem-per-cpu=10G # 8GB per CPU = 96GB per node
|
| 6 |
+
#SBATCH --time=24:00:00 # time limit: 24 hours
|
| 7 |
#SBATCH --error=hoho_gpu_class.err # standard error file
|
| 8 |
#SBATCH --output=hoho_gpu_class.out # standard output file
|
| 9 |
+
#SBATCH --partition=amdgpu # partition name
|
| 10 |
#SBATCH --mail-user=skvrnjan@fel.cvut.cz # where send info about job
|
| 11 |
#SBATCH --mail-type=ALL # what to send, valid type values are NONE, BEGIN, END, FAIL, REQUEUE, ALL
|
| 12 |
#SBATCH --gres=gpu:1
|
train_pnet_class_cluster.py
CHANGED
|
@@ -5,7 +5,7 @@ if __name__ == "__main__":
|
|
| 5 |
|
| 6 |
# Load the dataset
|
| 7 |
dataset_path = "/mnt/personal/skvrnjan/hohocustom_edges/"
|
| 8 |
-
model_save_path = "/mnt/personal/skvrnjan/
|
| 9 |
|
| 10 |
os.makedirs(model_save_path, exist_ok=True)
|
| 11 |
|
|
|
|
| 5 |
|
| 6 |
# Load the dataset
|
| 7 |
dataset_path = "/mnt/personal/skvrnjan/hohocustom_edges/"
|
| 8 |
+
model_save_path = "/mnt/personal/skvrnjan/hoho_pnet_edges_v2/initial.pth"
|
| 9 |
|
| 10 |
os.makedirs(model_save_path, exist_ok=True)
|
| 11 |
|