ho22joshua commited on
Commit
eb039b5
·
1 Parent(s): 0296317

git profiling tools

Browse files
root_gnn_dgl/configs/stats_100K/ttH_CP_even_vs_odd_batch_size_2048.yaml ADDED
@@ -0,0 +1,57 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Training_Name: ttH_CP_even_vs_odd_batch_size_2048
2
+ Training_Directory: trainings/stats_100K/ttH_CP_even_vs_odd_batch_size_2048
3
+ Model:
4
+ module: models.GCN
5
+ class: Edge_Network
6
+ args:
7
+ hid_size: 64
8
+ in_size: 7
9
+ out_size: 1
10
+ n_layers: 4
11
+ n_proc_steps: 4
12
+ dropout: 0
13
+ Training:
14
+ epochs: 500
15
+ batch_size: 2048
16
+ learning_rate: 0.0001
17
+ gamma: 0.99
18
+ Datasets:
19
+ ttH_CP_even: &dataset_defn
20
+ module: root_gnn_base.dataset
21
+ class: LazyDataset
22
+ shuffle_chunks: 3
23
+ batch_size: 2048
24
+ padding_mode: NONE #one of STEPS, FIXED, or NONE
25
+ args: &dataset_args
26
+ name: ttH_CP_even
27
+ label: 0
28
+ # weight_var: weight
29
+ chunks: 3
30
+ buffer_size: 2
31
+ file_names: ttH_NLO.root
32
+ tree_name: output
33
+ fold_var: Number
34
+ raw_dir: /global/cfs/projectdirs/trn007/lbl_atlas/data/stats_100K/
35
+ save_dir: /global/cfs/projectdirs/trn007/lbl_atlas/data/processed_graphs/stats_100K/ttH_CP_even_vs_odd_batch_size_2048/
36
+ node_branch_names:
37
+ - [jet_pt, ele_pt, mu_pt, ph_pt, MET_met]
38
+ - [jet_eta, ele_eta, mu_eta, ph_eta, 0]
39
+ - [jet_phi, ele_phi, mu_phi, ph_phi, MET_phi]
40
+ - CALC_E
41
+ - [jet_btag, 0, 0, 0, 0]
42
+ - [0, ele_charge, mu_charge, 0, 0]
43
+ - NODE_TYPE
44
+ node_branch_types: [vector, vector, vector, vector, single]
45
+ node_feature_scales: [1e-1, 1, 1, 1e-1, 1, 1, 1]
46
+ folding:
47
+ n_folds: 4
48
+ test: [0]
49
+ # validation: 1
50
+ train: [1, 2, 3]
51
+ ttH_CP_odd:
52
+ <<: *dataset_defn
53
+ args:
54
+ <<: *dataset_args
55
+ name: ttH_CP_odd
56
+ label: 1
57
+ file_names: ttH_CPodd.root
root_gnn_dgl/configs/stats_100K/ttH_CP_even_vs_odd_batch_size_4096.yaml ADDED
@@ -0,0 +1,57 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Training_Name: ttH_CP_even_vs_odd_batch_size_4096
2
+ Training_Directory: trainings/stats_100K/ttH_CP_even_vs_odd_batch_size_4096
3
+ Model:
4
+ module: models.GCN
5
+ class: Edge_Network
6
+ args:
7
+ hid_size: 64
8
+ in_size: 7
9
+ out_size: 1
10
+ n_layers: 4
11
+ n_proc_steps: 4
12
+ dropout: 0
13
+ Training:
14
+ epochs: 500
15
+ batch_size: 1024
16
+ learning_rate: 0.0001
17
+ gamma: 0.99
18
+ Datasets:
19
+ ttH_CP_even: &dataset_defn
20
+ module: root_gnn_base.dataset
21
+ class: LazyDataset
22
+ shuffle_chunks: 3
23
+ batch_size: 4096
24
+ padding_mode: NONE #one of STEPS, FIXED, or NONE
25
+ args: &dataset_args
26
+ name: ttH_CP_even
27
+ label: 0
28
+ # weight_var: weight
29
+ chunks: 3
30
+ buffer_size: 2
31
+ file_names: ttH_NLO.root
32
+ tree_name: output
33
+ fold_var: Number
34
+ raw_dir: /global/cfs/projectdirs/trn007/lbl_atlas/data/stats_100K/
35
+ save_dir: /global/cfs/projectdirs/trn007/lbl_atlas/data/processed_graphs/stats_100K/ttH_CP_even_vs_odd_batch_size_4096/
36
+ node_branch_names:
37
+ - [jet_pt, ele_pt, mu_pt, ph_pt, MET_met]
38
+ - [jet_eta, ele_eta, mu_eta, ph_eta, 0]
39
+ - [jet_phi, ele_phi, mu_phi, ph_phi, MET_phi]
40
+ - CALC_E
41
+ - [jet_btag, 0, 0, 0, 0]
42
+ - [0, ele_charge, mu_charge, 0, 0]
43
+ - NODE_TYPE
44
+ node_branch_types: [vector, vector, vector, vector, single]
45
+ node_feature_scales: [1e-1, 1, 1, 1e-1, 1, 1, 1]
46
+ folding:
47
+ n_folds: 4
48
+ test: [0]
49
+ # validation: 1
50
+ train: [1, 2, 3]
51
+ ttH_CP_odd:
52
+ <<: *dataset_defn
53
+ args:
54
+ <<: *dataset_args
55
+ name: ttH_CP_odd
56
+ label: 1
57
+ file_names: ttH_CPodd.root
root_gnn_dgl/configs/stats_100K/ttH_CP_even_vs_odd_batch_size_8192.yaml ADDED
@@ -0,0 +1,57 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Training_Name: ttH_CP_even_vs_odd_batch_size_8192
2
+ Training_Directory: trainings/stats_100K/ttH_CP_even_vs_odd_batch_size_8192
3
+ Model:
4
+ module: models.GCN
5
+ class: Edge_Network
6
+ args:
7
+ hid_size: 64
8
+ in_size: 7
9
+ out_size: 1
10
+ n_layers: 4
11
+ n_proc_steps: 4
12
+ dropout: 0
13
+ Training:
14
+ epochs: 500
15
+ batch_size: 2048
16
+ learning_rate: 0.0001
17
+ gamma: 0.99
18
+ Datasets:
19
+ ttH_CP_even: &dataset_defn
20
+ module: root_gnn_base.dataset
21
+ class: LazyDataset
22
+ shuffle_chunks: 3
23
+ batch_size: 2048
24
+ padding_mode: NONE #one of STEPS, FIXED, or NONE
25
+ args: &dataset_args
26
+ name: ttH_CP_even
27
+ label: 0
28
+ # weight_var: weight
29
+ chunks: 3
30
+ buffer_size: 2
31
+ file_names: ttH_NLO.root
32
+ tree_name: output
33
+ fold_var: Number
34
+ raw_dir: /global/cfs/projectdirs/trn007/lbl_atlas/data/stats_100K/
35
+ save_dir: /global/cfs/projectdirs/trn007/lbl_atlas/data/processed_graphs/stats_100K/ttH_CP_even_vs_odd_batch_size_8192/
36
+ node_branch_names:
37
+ - [jet_pt, ele_pt, mu_pt, ph_pt, MET_met]
38
+ - [jet_eta, ele_eta, mu_eta, ph_eta, 0]
39
+ - [jet_phi, ele_phi, mu_phi, ph_phi, MET_phi]
40
+ - CALC_E
41
+ - [jet_btag, 0, 0, 0, 0]
42
+ - [0, ele_charge, mu_charge, 0, 0]
43
+ - NODE_TYPE
44
+ node_branch_types: [vector, vector, vector, vector, single]
45
+ node_feature_scales: [1e-1, 1, 1, 1e-1, 1, 1, 1]
46
+ folding:
47
+ n_folds: 4
48
+ test: [0]
49
+ # validation: 1
50
+ train: [1, 2, 3]
51
+ ttH_CP_odd:
52
+ <<: *dataset_defn
53
+ args:
54
+ <<: *dataset_args
55
+ name: ttH_CP_odd
56
+ label: 1
57
+ file_names: ttH_CPodd.root
root_gnn_dgl/profile.sh ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ nsys profile \
2
+ -o /pscratch/sd/j/joshuaho/my_profile_report_1_gpu_batch_size_1028 \
3
+ --capture-range=cudaProfilerApi \
4
+ --capture-range-end=stop-shutdown \
5
+ --force-overwrite true \
6
+ --trace=nvtx \
7
+ --cudabacktrace=all \
8
+ python scripts/training_script.py --config configs/stats_100K/ttH_CP_even_vs_odd.yaml --preshuffle --nocompile --lazy --restart --profile
9
+
10
+ nsys profile \
11
+ -o /pscratch/sd/j/joshuaho/my_profile_report_1_gpu_batch_size_2048 \
12
+ --capture-range=cudaProfilerApi \
13
+ --capture-range-end=stop-shutdown \
14
+ --force-overwrite true \
15
+ --trace=nvtx \
16
+ --cudabacktrace=all \
17
+ python scripts/training_script.py --config configs/stats_100K/ttH_CP_even_vs_odd_batch_size_2048.yaml --preshuffle --nocompile --lazy --restart --profile
18
+
19
+ nsys profile \
20
+ -o /pscratch/sd/j/joshuaho/my_profile_report_1_gpu_batch_size_4096 \
21
+ --capture-range=cudaProfilerApi \
22
+ --capture-range-end=stop-shutdown \
23
+ --force-overwrite true \
24
+ --trace=nvtx \
25
+ --cudabacktrace=all \
26
+ python scripts/training_script.py --config configs/stats_100K/ttH_CP_even_vs_odd_batch_size_4096.yaml --preshuffle --nocompile --lazy --restart --profile
27
+
28
+ nsys profile \
29
+ -o /pscratch/sd/j/joshuaho/my_profile_report_1_gpu_batch_size_8192 \
30
+ --capture-range=cudaProfilerApi \
31
+ --capture-range-end=stop-shutdown \
32
+ --force-overwrite true \
33
+ --trace=nvtx \
34
+ --cudabacktrace=all \
35
+ python scripts/training_script.py --config configs/stats_100K/ttH_CP_even_vs_odd_batch_size_8192.yaml --preshuffle --nocompile --lazy --restart --profile