jskvrna committed on
Commit
5d8d206
·
1 Parent(s): 25d87ae

Updates batch job configuration and model path

Browse files

Updates the batch job configuration file to use the 'amdgpu' partition (previously 'amdgpufast') and increases the time limit from 4 to 24 hours.

Changes the model save path to a new versioned directory ('hoho_pnet_edges_v2'), so that the training process saves the model there rather than in the previous 'hoho_pnet_edges' directory.

hoho_gpu_class.batch CHANGED
@@ -3,10 +3,10 @@
3
  #SBATCH --ntasks-per-node=1 # 1 tasks per node
4
  #SBATCH --cpus-per-task=16 # 6 CPUS per task = 12 CPUS per node
5
  #SBATCH --mem-per-cpu=10G # 8GB per CPU = 96GB per node
6
- #SBATCH --time=4:00:00 # time limits: 1 hour
7
  #SBATCH --error=hoho_gpu_class.err # standard error file
8
  #SBATCH --output=hoho_gpu_class.out # standard output file
9
- #SBATCH --partition=amdgpufast # partition name
10
  #SBATCH --mail-user=skvrnjan@fel.cvut.cz # where send info about job
11
  #SBATCH --mail-type=ALL # what to send, valid type values are NONE, BEGIN, END, FAIL, REQUEUE, ALL
12
  #SBATCH --gres=gpu:1
 
3
  #SBATCH --ntasks-per-node=1 # 1 tasks per node
4
  #SBATCH --cpus-per-task=16 # 6 CPUS per task = 12 CPUS per node
5
  #SBATCH --mem-per-cpu=10G # 8GB per CPU = 96GB per node
6
+ #SBATCH --time=24:00:00 # time limit: 24 hours
7
  #SBATCH --error=hoho_gpu_class.err # standard error file
8
  #SBATCH --output=hoho_gpu_class.out # standard output file
9
+ #SBATCH --partition=amdgpu # partition name
10
  #SBATCH --mail-user=skvrnjan@fel.cvut.cz # where send info about job
11
  #SBATCH --mail-type=ALL # what to send, valid type values are NONE, BEGIN, END, FAIL, REQUEUE, ALL
12
  #SBATCH --gres=gpu:1
train_pnet_class_cluster.py CHANGED
@@ -5,7 +5,7 @@ if __name__ == "__main__":
5
 
6
  # Load the dataset
7
  dataset_path = "/mnt/personal/skvrnjan/hohocustom_edges/"
8
- model_save_path = "/mnt/personal/skvrnjan/hoho_pnet_edges/initial.pth"
9
 
10
  os.makedirs(model_save_path, exist_ok=True)
11
 
 
5
 
6
  # Load the dataset
7
  dataset_path = "/mnt/personal/skvrnjan/hohocustom_edges/"
8
+ model_save_path = "/mnt/personal/skvrnjan/hoho_pnet_edges_v2/initial.pth"
9
 
10
  os.makedirs(model_save_path, exist_ok=True)
11