arXiv:2412.10665
ho22joshua committed on
Commit
8c39cb0
·
1 Parent(s): 5ff9d14

restructured configs

Browse files
root_gnn_dgl/configs/pretraining/multiclass.yaml DELETED
File without changes
root_gnn_dgl/configs/{demo/finetuning_ttH_CP_Even_vs_Odd.yaml → stats_100K/finetuning_ttH_CP_even_vs_odd.yaml} RENAMED
@@ -1,10 +1,10 @@
1
- Training_Name: finetuning_ttH_CP_Even_vs_Odd
2
- Training_Directory: trainings/demo/finetuning_ttH_CP_Even_vs_Odd
3
  Model:
4
  module: models.GCN
5
  class: Transferred_Learning_Finetuning
6
  args:
7
- pretraining_path: trainings/demo/pretraining_multiclass/model_epoch_100.pt # update to the last epoch of the pretraining
8
  pretraining_model:
9
  module: models.GCN
10
  class: Edge_Network
@@ -23,26 +23,26 @@ Model:
23
  Training:
24
  epochs: 500
25
  batch_size: 1024
26
- learning_rate: 0.00001
27
  gamma: 0.99
28
  Datasets:
29
- ttH_CP_Even: &dataset_defn
30
  module: root_gnn_base.dataset
31
  class: LazyDataset
32
- shuffle_chunks: 3
33
  batch_size: 1024
34
  padding_mode: NONE #one of STEPS, FIXED, or NONE
35
  args: &dataset_args
36
- name: ttH_CP_Even
37
  label: 0
38
- weight_var: weight
39
- chunks: 3
40
- buffer_size: 1
41
  file_names: ttH_NLO.root
42
  tree_name: output
43
  fold_var: Number
44
- raw_dir: /global/cfs/projectdirs/atlas/joshua/root_gnn/root_gnn_dgl/data/ntuples/Hyy_pretraining/multilabel_10K/
45
- save_dir: /pscratch/sd/j/joshuaho/GNN4Colliders/root_gnn_dgl/data/demo/finetuning_ttH_CP_Even_vs_Odd/
46
  node_branch_names:
47
  - [jet_pt, ele_pt, mu_pt, ph_pt, MET_met]
48
  - [jet_eta, ele_eta, mu_eta, ph_eta, 0]
@@ -54,14 +54,14 @@ Datasets:
54
  node_branch_types: [vector, vector, vector, vector, single]
55
  node_feature_scales: [1e-1, 1, 1, 1e-1, 1, 1, 1]
56
  folding:
57
- n_folds: 3
58
  test: [0]
59
  # validation: 1
60
- train: [1, 2]
61
- ttH_CP_Odd:
62
  <<: *dataset_defn
63
  args:
64
  <<: *dataset_args
65
- name: ttH_CP_Odd
66
  label: 1
67
  file_names: ttH_CPodd.root
 
1
+ Training_Name: finetuning_ttH_CP_even_vs_odd
2
+ Training_Directory: trainings/stats_100K/finetuning_ttH_CP_even_vs_odd
3
  Model:
4
  module: models.GCN
5
  class: Transferred_Learning_Finetuning
6
  args:
7
+ pretraining_path: trainings/stats_100K/pretraining_multiclass/model_epoch_100.pt # update to the last epoch of the pretraining
8
  pretraining_model:
9
  module: models.GCN
10
  class: Edge_Network
 
23
  Training:
24
  epochs: 500
25
  batch_size: 1024
26
+ learning_rate: 0.0001
27
  gamma: 0.99
28
  Datasets:
29
+ ttH_CP_even: &dataset_defn
30
  module: root_gnn_base.dataset
31
  class: LazyDataset
32
+ shuffle_chunks: 1
33
  batch_size: 1024
34
  padding_mode: NONE #one of STEPS, FIXED, or NONE
35
  args: &dataset_args
36
+ name: ttH_CP_even
37
  label: 0
38
+ # weight_var: weight
39
+ chunks: 1
40
+ buffer_size: 0
41
  file_names: ttH_NLO.root
42
  tree_name: output
43
  fold_var: Number
44
+ raw_dir: /global/cfs/projectdirs/trn007/lbl_atlas/data/stats_100K/
45
+ save_dir: /global/cfs/projectdirs/trn007/lbl_atlas/data/processed_graphs/stats_100K/ttH_CP_even_vs_odd/
46
  node_branch_names:
47
  - [jet_pt, ele_pt, mu_pt, ph_pt, MET_met]
48
  - [jet_eta, ele_eta, mu_eta, ph_eta, 0]
 
54
  node_branch_types: [vector, vector, vector, vector, single]
55
  node_feature_scales: [1e-1, 1, 1, 1e-1, 1, 1, 1]
56
  folding:
57
+ n_folds: 4
58
  test: [0]
59
  # validation: 1
60
+ train: [1, 2, 3]
61
+ ttH_CP_odd:
62
  <<: *dataset_defn
63
  args:
64
  <<: *dataset_args
65
+ name: ttH_CP_odd
66
  label: 1
67
  file_names: ttH_CPodd.root
root_gnn_dgl/configs/{demo → stats_100K}/pretraining_multiclass.yaml RENAMED
@@ -1,5 +1,5 @@
1
  Training_Name: pretraining_multiclass
2
- Training_Directory: trainings/demo/pretraining_multiclass/
3
  Model:
4
  module: models.GCN
5
  class: Edge_Network
@@ -27,19 +27,19 @@ Datasets:
27
  ttH: &dataset_defn
28
  module: root_gnn_base.dataset
29
  class: LazyDataset
30
- shuffle_chunks: 3
31
  padding_mode: NONE #one of STEPS, FIXED, or NONE
32
  args: &dataset_args
33
  name: ttH
34
  label: 0
35
- weight_var: weight
36
- chunks: 3
37
- buffer_size: 1
38
  file_names: ttH_NLO_inc.root
39
  tree_name: output
40
  fold_var: Number
41
- raw_dir: /global/cfs/projectdirs/atlas/joshua/root_gnn/root_gnn_dgl/data/ntuples/Hyy_pretraining/multilabel_10K/
42
- save_dir: /pscratch/sd/j/joshuaho/GNN4Colliders/root_gnn_dgl/data/demo/pretraining_multiclass/
43
  node_branch_names:
44
  - [jet_pt, ele_pt, mu_pt, ph_pt, MET_met]
45
  - [jet_eta, ele_eta, mu_eta, ph_eta, 0]
@@ -51,10 +51,10 @@ Datasets:
51
  node_branch_types: [vector, vector, vector, vector, single]
52
  node_feature_scales: [1e-1, 1, 1, 1e-1, 1, 1, 1]
53
  folding:
54
- n_folds: 3
55
  test: [0]
56
- # validation: 1
57
- train: [1, 2]
58
  tHjb:
59
  <<: *dataset_defn
60
  args:
 
1
  Training_Name: pretraining_multiclass
2
+ Training_Directory: trainings/stats_100K/pretraining_multiclass/
3
  Model:
4
  module: models.GCN
5
  class: Edge_Network
 
27
  ttH: &dataset_defn
28
  module: root_gnn_base.dataset
29
  class: LazyDataset
30
+ shuffle_chunks: 1
31
  padding_mode: NONE #one of STEPS, FIXED, or NONE
32
  args: &dataset_args
33
  name: ttH
34
  label: 0
35
+ # weight_var: weight
36
+ chunks: 1
37
+ buffer_size: 0
38
  file_names: ttH_NLO_inc.root
39
  tree_name: output
40
  fold_var: Number
41
+ raw_dir: /global/cfs/projectdirs/trn007/lbl_atlas/data/stats_100K/
42
+ save_dir: /global/cfs/projectdirs/trn007/lbl_atlas/data/processed_graphs/stats_100K/pretraining_multiclass/
43
  node_branch_names:
44
  - [jet_pt, ele_pt, mu_pt, ph_pt, MET_met]
45
  - [jet_eta, ele_eta, mu_eta, ph_eta, 0]
 
51
  node_branch_types: [vector, vector, vector, vector, single]
52
  node_feature_scales: [1e-1, 1, 1, 1e-1, 1, 1, 1]
53
  folding:
54
+ n_folds: 4
55
  test: [0]
56
+ # validation: [1]
57
+ train: [1, 2, 3]
58
  tHjb:
59
  <<: *dataset_defn
60
  args:
root_gnn_dgl/configs/stats_100K/ttH_CP_even_vs_odd.yaml ADDED
@@ -0,0 +1,57 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Training_Name: ttH_CP_even_vs_odd
2
+ Training_Directory: trainings/stats_100K/ttH_CP_even_vs_odd
3
+ Model:
4
+ module: models.GCN
5
+ class: Edge_Network
6
+ args:
7
+ hid_size: 64
8
+ in_size: 7
9
+ out_size: 1
10
+ n_layers: 4
11
+ n_proc_steps: 4
12
+ dropout: 0
13
+ Training:
14
+ epochs: 500
15
+ batch_size: 1024
16
+ learning_rate: 0.0001
17
+ gamma: 0.99
18
+ Datasets:
19
+ ttH_CP_even: &dataset_defn
20
+ module: root_gnn_base.dataset
21
+ class: LazyDataset
22
+ shuffle_chunks: 1
23
+ batch_size: 1024
24
+ padding_mode: NONE #one of STEPS, FIXED, or NONE
25
+ args: &dataset_args
26
+ name: ttH_CP_even
27
+ label: 0
28
+ # weight_var: weight
29
+ chunks: 1
30
+ buffer_size: 0
31
+ file_names: ttH_NLO.root
32
+ tree_name: output
33
+ fold_var: Number
34
+ raw_dir: /global/cfs/projectdirs/trn007/lbl_atlas/data/stats_100K/
35
+ save_dir: /global/cfs/projectdirs/trn007/lbl_atlas/data/processed_graphs/stats_100K/ttH_CP_even_vs_odd/
36
+ node_branch_names:
37
+ - [jet_pt, ele_pt, mu_pt, ph_pt, MET_met]
38
+ - [jet_eta, ele_eta, mu_eta, ph_eta, 0]
39
+ - [jet_phi, ele_phi, mu_phi, ph_phi, MET_phi]
40
+ - CALC_E
41
+ - [jet_btag, 0, 0, 0, 0]
42
+ - [0, ele_charge, mu_charge, 0, 0]
43
+ - NODE_TYPE
44
+ node_branch_types: [vector, vector, vector, vector, single]
45
+ node_feature_scales: [1e-1, 1, 1, 1e-1, 1, 1, 1]
46
+ folding:
47
+ n_folds: 4
48
+ test: [0]
49
+ # validation: 1
50
+ train: [1, 2, 3]
51
+ ttH_CP_odd:
52
+ <<: *dataset_defn
53
+ args:
54
+ <<: *dataset_args
55
+ name: ttH_CP_odd
56
+ label: 1
57
+ file_names: ttH_CPodd.root
root_gnn_dgl/configs/stats_all/finetuning_ttH_CP_even_vs_odd.yaml ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Training_Name: finetuning_ttH_CP_even_vs_odd
2
+ Training_Directory: trainings/stats_all/finetuning_ttH_CP_even_vs_odd
3
+ Model:
4
+ module: models.GCN
5
+ class: Transferred_Learning_Finetuning
6
+ args:
7
+ pretraining_path: trainings/stats_100K/pretraining_multiclass/model_epoch_100.pt # update to the last epoch of the pretraining
8
+ pretraining_model:
9
+ module: models.GCN
10
+ class: Edge_Network
11
+ args:
12
+ hid_size: 64
13
+ in_size: 7
14
+ out_size: 12
15
+ n_layers: 4
16
+ n_proc_steps: 4
17
+ hid_size: 64
18
+ in_size: 7
19
+ out_size: 1
20
+ n_layers: 4
21
+ n_proc_steps: 4
22
+ dropout: 0
23
+ Datasets:
24
+ ttH_CP_even: &dataset_defn
25
+ module: root_gnn_base.dataset
26
+ class: LazyDataset
27
+ shuffle_chunks: 10
28
+ batch_size: 1024
29
+ padding_mode: NONE #one of STEPS, FIXED, or NONE
30
+ args: &dataset_args
31
+ name: ttH_CP_even
32
+ label: 0
33
+ # weight_var: weight
34
+ chunks: 10
35
+ buffer_size: 3
36
+ file_names: ttH_NLO.root
37
+ tree_name: output
38
+ fold_var: Number
39
+ raw_dir: /global/cfs/projectdirs/trn007/lbl_atlas/data/stats_all/
40
+ save_dir: /global/cfs/projectdirs/trn007/lbl_atlas/data/processed_graphs/stats_all/ttH_CP_even_vs_odd/
41
+ node_branch_names:
42
+ - [jet_pt, ele_pt, mu_pt, ph_pt, MET_met]
43
+ - [jet_eta, ele_eta, mu_eta, ph_eta, 0]
44
+ - [jet_phi, ele_phi, mu_phi, ph_phi, MET_phi]
45
+ - CALC_E
46
+ - [jet_btag, 0, 0, 0, 0]
47
+ - [0, ele_charge, mu_charge, 0, 0]
48
+ - NODE_TYPE
49
+ node_branch_types: [vector, vector, vector, vector, single]
50
+ node_feature_scales: [1e-1, 1, 1, 1e-1, 1, 1, 1]
51
+ folding:
52
+ n_folds: 4
53
+ test: [0]
54
+ # validation: 1
55
+ train: [1, 2, 3]
56
+ ttH_CP_odd:
57
+ <<: *dataset_defn
58
+ args:
59
+ <<: *dataset_args
60
+ name: ttH_CP_odd
61
+ label: 1
62
+ file_names: ttH_CPodd.root
root_gnn_dgl/configs/stats_all/pretraining_multiclass.yaml ADDED
@@ -0,0 +1,134 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Training_Name: pretraining_multiclass
2
+ Training_Directory: trainings/stats_all/pretraining_multiclass/
3
+ Model:
4
+ module: models.GCN
5
+ class: Edge_Network
6
+ args:
7
+ hid_size: 64
8
+ in_size: 7
9
+ out_size: 12
10
+ n_layers: 4
11
+ n_proc_steps: 4
12
+ dropout: 0
13
+ Loss:
14
+ module: torch.nn
15
+ class: CrossEntropyLoss
16
+ args: {}
17
+ finish:
18
+ module: torch.nn
19
+ class: Softmax
20
+ args: {dim: 1}
21
+ Training:
22
+ epochs: 500
23
+ batch_size: 1024
24
+ learning_rate: 0.0001
25
+ gamma: 0.99
26
+ Datasets:
27
+ ttH: &dataset_defn
28
+ module: root_gnn_base.dataset
29
+ class: LazyDataset
30
+ shuffle_chunks: 10
31
+ padding_mode: NONE #one of STEPS, FIXED, or NONE
32
+ args: &dataset_args
33
+ name: ttH
34
+ label: 0
35
+ # weight_var: weight
36
+ chunks: 10
37
+ buffer_size: 3
38
+ file_names: ttH_NLO_inc.root
39
+ tree_name: output
40
+ fold_var: Number
41
+ raw_dir: /global/cfs/projectdirs/trn007/lbl_atlas/data/stats_all/
42
+ save_dir: /global/cfs/projectdirs/trn007/lbl_atlas/data/processed_graphs/stats_all/pretraining_multiclass/
43
+ node_branch_names:
44
+ - [jet_pt, ele_pt, mu_pt, ph_pt, MET_met]
45
+ - [jet_eta, ele_eta, mu_eta, ph_eta, 0]
46
+ - [jet_phi, ele_phi, mu_phi, ph_phi, MET_phi]
47
+ - CALC_E
48
+ - [jet_btag, 0, 0, 0, 0]
49
+ - [0, ele_charge, mu_charge, 0, 0]
50
+ - NODE_TYPE
51
+ node_branch_types: [vector, vector, vector, vector, single]
52
+ node_feature_scales: [1e-1, 1, 1, 1e-1, 1, 1, 1]
53
+ folding:
54
+ n_folds: 4
55
+ test: [0]
56
+ # validation: [1]
57
+ train: [1, 2, 3]
58
+ tHjb:
59
+ <<: *dataset_defn
60
+ args:
61
+ <<: *dataset_args
62
+ name: tHjb
63
+ label: 1
64
+ file_names: tHjb_NLO_inc.root
65
+ ggF:
66
+ <<: *dataset_defn
67
+ args:
68
+ <<: *dataset_args
69
+ name: ggF
70
+ label: 2
71
+ file_names: ggF_NLO_inc.root
72
+ VBF:
73
+ <<: *dataset_defn
74
+ args:
75
+ <<: *dataset_args
76
+ name: VBF
77
+ label: 3
78
+ file_names: VBF_NLO_inc.root
79
+ WH:
80
+ <<: *dataset_defn
81
+ args:
82
+ <<: *dataset_args
83
+ name: WH
84
+ label: 4
85
+ file_names: WH_NLO_inc.root
86
+ ZH:
87
+ <<: *dataset_defn
88
+ args:
89
+ <<: *dataset_args
90
+ name: ZH
91
+ label: 5
92
+ file_names: ZH_NLO_inc.root
93
+ ttyy:
94
+ <<: *dataset_defn
95
+ args:
96
+ <<: *dataset_args
97
+ name: ttyy_ch
98
+ label: 6
99
+ file_names: 'ttyy.root'
100
+ tttt:
101
+ <<: *dataset_defn
102
+ args:
103
+ <<: *dataset_args
104
+ name: tttt
105
+ label: 7
106
+ file_names: 'tttt.root'
107
+ SingleT_schan:
108
+ <<: *dataset_defn
109
+ args:
110
+ <<: *dataset_args
111
+ name: SingleT_schan
112
+ label: 8
113
+ file_names: 'SingleT_schan.root'
114
+ ttbar:
115
+ <<: *dataset_defn
116
+ args:
117
+ <<: *dataset_args
118
+ name: ttbar
119
+ label: 9
120
+ file_names: 'ttbar.root'
121
+ ttW:
122
+ <<: *dataset_defn
123
+ args:
124
+ <<: *dataset_args
125
+ name: ttW
126
+ label: 10
127
+ file_names: 'ttW.root'
128
+ ttt:
129
+ <<: *dataset_defn
130
+ args:
131
+ <<: *dataset_args
132
+ name: ttt
133
+ label: 11
134
+ file_names: 'ttt.root'
root_gnn_dgl/configs/stats_all/ttH_CP_even_vs_odd.yaml ADDED
@@ -0,0 +1,57 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Training_Name: ttH_CP_even_vs_odd
2
+ Training_Directory: trainings/stats_all/ttH_CP_even_vs_odd
3
+ Model:
4
+ module: models.GCN
5
+ class: Edge_Network
6
+ args:
7
+ hid_size: 64
8
+ in_size: 7
9
+ out_size: 1
10
+ n_layers: 4
11
+ n_proc_steps: 4
12
+ dropout: 0
13
+ Training:
14
+ epochs: 500
15
+ batch_size: 1024
16
+ learning_rate: 0.0001
17
+ gamma: 0.99
18
+ Datasets:
19
+ ttH_CP_even: &dataset_defn
20
+ module: root_gnn_base.dataset
21
+ class: LazyDataset
22
+ shuffle_chunks: 10
23
+ batch_size: 1024
24
+ padding_mode: NONE #one of STEPS, FIXED, or NONE
25
+ args: &dataset_args
26
+ name: ttH_CP_even
27
+ label: 0
28
+ # weight_var: weight
29
+ chunks: 10
30
+ buffer_size: 3
31
+ file_names: ttH_NLO.root
32
+ tree_name: output
33
+ fold_var: Number
34
+ raw_dir: /global/cfs/projectdirs/trn007/lbl_atlas/data/stats_all/
35
+ save_dir: /global/cfs/projectdirs/trn007/lbl_atlas/data/processed_graphs/stats_all/ttH_CP_even_vs_odd/
36
+ node_branch_names:
37
+ - [jet_pt, ele_pt, mu_pt, ph_pt, MET_met]
38
+ - [jet_eta, ele_eta, mu_eta, ph_eta, 0]
39
+ - [jet_phi, ele_phi, mu_phi, ph_phi, MET_phi]
40
+ - CALC_E
41
+ - [jet_btag, 0, 0, 0, 0]
42
+ - [0, ele_charge, mu_charge, 0, 0]
43
+ - NODE_TYPE
44
+ node_branch_types: [vector, vector, vector, vector, single]
45
+ node_feature_scales: [1e-1, 1, 1, 1e-1, 1, 1, 1]
46
+ folding:
47
+ n_folds: 4
48
+ test: [0]
49
+ # validation: 1
50
+ train: [1, 2, 3]
51
+ ttH_CP_odd:
52
+ <<: *dataset_defn
53
+ args:
54
+ <<: *dataset_args
55
+ name: ttH_CP_odd
56
+ label: 1
57
+ file_names: ttH_CPodd.root