valentinsingularity commited on
Commit
75529b1
·
verified ·
1 Parent(s): 8d12415

Upload 82 files

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
configs/mc-o1.yaml ADDED
@@ -0,0 +1,102 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc-o1
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 20.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 20.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: VariableQ
28
+ kwargs:
29
+ q_min_range: [0.01, 0.05]
30
+ q_max_range: [0.15, 0.4]
31
+ n_q_range: [128, 256]
32
+ device: 'cuda'
33
+
34
+ intensity_noise:
35
+ cls: BasicExpIntensityNoise
36
+ kwargs:
37
+ relative_errors: [0.0, 0.2]
38
+ abs_errors: 0.0
39
+ consistent_rel_err: true
40
+ logdist: false
41
+ apply_shift: false
42
+ shift_range: [-0.3, 0.3]
43
+ apply_scaling: false
44
+ scale_range: [-0.02, 0.02]
45
+
46
+ q_noise:
47
+ cls: BasicQNoiseGenerator
48
+ kwargs:
49
+ shift_std: 1.0e-3
50
+ noise_std: [0., 1.0e-3]
51
+
52
+ curves_scaler:
53
+ cls: LogAffineCurvesScaler
54
+ kwargs:
55
+ weight: 0.2
56
+ bias: 1.0
57
+ eps: 1.0e-10
58
+
59
+ model:
60
+ network:
61
+ cls: NetworkWithPriorsFnoEmb
62
+ pretrained_name: null
63
+ device: 'cuda'
64
+ kwargs:
65
+ in_channels: 2
66
+ dim_embedding: 256
67
+ width_fno: 128
68
+ n_fno_blocks : 6
69
+ modes: 16
70
+ embedding_net_activation: 'gelu'
71
+ use_batch_norm: True
72
+ dim_out: 8
73
+ layer_width: 1024
74
+ num_blocks: 6
75
+ repeats_per_block: 2
76
+ mlp_activation: 'gelu'
77
+ dropout_rate: 0.0
78
+
79
+ training:
80
+ num_iterations: 50000
81
+ batch_size: 1024
82
+ lr: 1.0e-4
83
+ grad_accumulation_steps: 1
84
+ clip_grad_norm_max: 1.0
85
+ train_with_q_input: True
86
+ update_tqdm_freq: 1
87
+ optimizer: AdamW
88
+ trainer_kwargs:
89
+ optim_kwargs:
90
+ betas: [0.9, 0.999]
91
+ weight_decay: 0.0005
92
+ callbacks:
93
+ save_best_model:
94
+ enable: true
95
+ freq: 500
96
+ lr_scheduler:
97
+ cls: StepLR
98
+ kwargs:
99
+ step_size: 2000
100
+ gamma: 0.9
101
+ logger:
102
+ use_neptune: false
configs/mc-o10.yaml ADDED
@@ -0,0 +1,102 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc-o10
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 20.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 20.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: VariableQ
28
+ kwargs:
29
+ q_min_range: [0.01, 0.05]
30
+ q_max_range: [0.15, 0.4]
31
+ n_q_range: [128, 256]
32
+ device: 'cuda'
33
+
34
+ intensity_noise:
35
+ cls: BasicExpIntensityNoise
36
+ kwargs:
37
+ relative_errors: [0.0, 0.2]
38
+ abs_errors: 0.0
39
+ consistent_rel_err: true
40
+ logdist: false
41
+ apply_shift: false
42
+ shift_range: [-0.3, 0.3]
43
+ apply_scaling: false
44
+ scale_range: [-0.02, 0.02]
45
+
46
+ q_noise:
47
+ cls: BasicQNoiseGenerator
48
+ kwargs:
49
+ shift_std: 1.0e-3
50
+ noise_std: [0., 1.0e-3]
51
+
52
+ curves_scaler:
53
+ cls: LogAffineCurvesScaler
54
+ kwargs:
55
+ weight: 0.2
56
+ bias: 1.0
57
+ eps: 1.0e-10
58
+
59
+ model:
60
+ network:
61
+ cls: NetworkWithPriorsFnoEmb
62
+ pretrained_name: null
63
+ device: 'cuda'
64
+ kwargs:
65
+ in_channels: 2
66
+ dim_embedding: 1024
67
+ width_fno: 128
68
+ n_fno_blocks : 6
69
+ modes: 16
70
+ embedding_net_activation: 'gelu'
71
+ use_batch_norm: True
72
+ dim_out: 8
73
+ layer_width: 1024
74
+ num_blocks: 6
75
+ repeats_per_block: 2
76
+ mlp_activation: 'gelu'
77
+ dropout_rate: 0.0
78
+
79
+ training:
80
+ num_iterations: 50000
81
+ batch_size: 1024
82
+ lr: 1.0e-4
83
+ grad_accumulation_steps: 1
84
+ clip_grad_norm_max: 1.0
85
+ train_with_q_input: True
86
+ update_tqdm_freq: 1
87
+ optimizer: AdamW
88
+ trainer_kwargs:
89
+ optim_kwargs:
90
+ betas: [0.9, 0.999]
91
+ weight_decay: 0.0005
92
+ callbacks:
93
+ save_best_model:
94
+ enable: true
95
+ freq: 500
96
+ lr_scheduler:
97
+ cls: StepLR
98
+ kwargs:
99
+ step_size: 2000
100
+ gamma: 0.9
101
+ logger:
102
+ use_neptune: false
configs/mc-o11.yaml ADDED
@@ -0,0 +1,102 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc-o11
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 20.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 20.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: VariableQ
28
+ kwargs:
29
+ q_min_range: [0.01, 0.05]
30
+ q_max_range: [0.15, 0.4]
31
+ n_q_range: [128, 256]
32
+ device: 'cuda'
33
+
34
+ intensity_noise:
35
+ cls: BasicExpIntensityNoise
36
+ kwargs:
37
+ relative_errors: [0.0, 0.2]
38
+ abs_errors: 0.0
39
+ consistent_rel_err: true
40
+ logdist: false
41
+ apply_shift: false
42
+ shift_range: [-0.3, 0.3]
43
+ apply_scaling: false
44
+ scale_range: [-0.02, 0.02]
45
+
46
+ q_noise:
47
+ cls: BasicQNoiseGenerator
48
+ kwargs:
49
+ shift_std: 1.0e-3
50
+ noise_std: [0., 1.0e-3]
51
+
52
+ curves_scaler:
53
+ cls: LogAffineCurvesScaler
54
+ kwargs:
55
+ weight: 0.2
56
+ bias: 1.0
57
+ eps: 1.0e-10
58
+
59
+ model:
60
+ network:
61
+ cls: NetworkWithPriorsFnoEmb
62
+ pretrained_name: null
63
+ device: 'cuda'
64
+ kwargs:
65
+ in_channels: 2
66
+ dim_embedding: 256
67
+ width_fno: 256
68
+ n_fno_blocks : 6
69
+ modes: 16
70
+ embedding_net_activation: 'gelu'
71
+ use_batch_norm: True
72
+ dim_out: 8
73
+ layer_width: 1024
74
+ num_blocks: 6
75
+ repeats_per_block: 2
76
+ mlp_activation: 'gelu'
77
+ dropout_rate: 0.0
78
+
79
+ training:
80
+ num_iterations: 50000
81
+ batch_size: 1024
82
+ lr: 1.0e-4
83
+ grad_accumulation_steps: 1
84
+ clip_grad_norm_max: 1.0
85
+ train_with_q_input: True
86
+ update_tqdm_freq: 1
87
+ optimizer: AdamW
88
+ trainer_kwargs:
89
+ optim_kwargs:
90
+ betas: [0.9, 0.999]
91
+ weight_decay: 0.0005
92
+ callbacks:
93
+ save_best_model:
94
+ enable: true
95
+ freq: 500
96
+ lr_scheduler:
97
+ cls: StepLR
98
+ kwargs:
99
+ step_size: 2000
100
+ gamma: 0.9
101
+ logger:
102
+ use_neptune: false
configs/mc-o12.yaml ADDED
@@ -0,0 +1,102 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc-o12
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 60.]
12
+ slds: [-20., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 60.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: VariableQ
28
+ kwargs:
29
+ q_min_range: [0.01, 0.05]
30
+ q_max_range: [0.15, 0.4]
31
+ n_q_range: [128, 256]
32
+ device: 'cuda'
33
+
34
+ intensity_noise:
35
+ cls: BasicExpIntensityNoise
36
+ kwargs:
37
+ relative_errors: [0.0, 0.2]
38
+ abs_errors: 0.0
39
+ consistent_rel_err: true
40
+ logdist: false
41
+ apply_shift: false
42
+ shift_range: [-0.3, 0.3]
43
+ apply_scaling: false
44
+ scale_range: [-0.02, 0.02]
45
+
46
+ q_noise:
47
+ cls: BasicQNoiseGenerator
48
+ kwargs:
49
+ shift_std: 1.0e-3
50
+ noise_std: [0., 1.0e-3]
51
+
52
+ curves_scaler:
53
+ cls: LogAffineCurvesScaler
54
+ kwargs:
55
+ weight: 0.2
56
+ bias: 1.0
57
+ eps: 1.0e-10
58
+
59
+ model:
60
+ network:
61
+ cls: NetworkWithPriorsFnoEmb
62
+ pretrained_name: null
63
+ device: 'cuda'
64
+ kwargs:
65
+ in_channels: 2
66
+ dim_embedding: 256
67
+ width_fno: 128
68
+ n_fno_blocks : 6
69
+ modes: 16
70
+ embedding_net_activation: 'gelu'
71
+ use_batch_norm: True
72
+ dim_out: 8
73
+ layer_width: 1024
74
+ num_blocks: 6
75
+ repeats_per_block: 2
76
+ mlp_activation: 'gelu'
77
+ dropout_rate: 0.0
78
+
79
+ training:
80
+ num_iterations: 50000
81
+ batch_size: 1024
82
+ lr: 1.0e-4
83
+ grad_accumulation_steps: 1
84
+ clip_grad_norm_max: 1.0
85
+ train_with_q_input: True
86
+ update_tqdm_freq: 1
87
+ optimizer: AdamW
88
+ trainer_kwargs:
89
+ optim_kwargs:
90
+ betas: [0.9, 0.999]
91
+ weight_decay: 0.0005
92
+ callbacks:
93
+ save_best_model:
94
+ enable: true
95
+ freq: 500
96
+ lr_scheduler:
97
+ cls: StepLR
98
+ kwargs:
99
+ step_size: 2000
100
+ gamma: 0.9
101
+ logger:
102
+ use_neptune: false
configs/mc-o13.yaml ADDED
@@ -0,0 +1,102 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc-o13
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 200.]
11
+ roughnesses: [0., 20.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 200.]
15
+ roughnesses: [1.0e-2, 20.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 5
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: VariableQ
28
+ kwargs:
29
+ q_min_range: [0.01, 0.05]
30
+ q_max_range: [0.15, 0.4]
31
+ n_q_range: [128, 256]
32
+ device: 'cuda'
33
+
34
+ intensity_noise:
35
+ cls: BasicExpIntensityNoise
36
+ kwargs:
37
+ relative_errors: [0.0, 0.2]
38
+ abs_errors: 0.0
39
+ consistent_rel_err: true
40
+ logdist: false
41
+ apply_shift: false
42
+ shift_range: [-0.3, 0.3]
43
+ apply_scaling: false
44
+ scale_range: [-0.02, 0.02]
45
+
46
+ q_noise:
47
+ cls: BasicQNoiseGenerator
48
+ kwargs:
49
+ shift_std: 1.0e-3
50
+ noise_std: [0., 1.0e-3]
51
+
52
+ curves_scaler:
53
+ cls: LogAffineCurvesScaler
54
+ kwargs:
55
+ weight: 0.2
56
+ bias: 1.0
57
+ eps: 1.0e-10
58
+
59
+ model:
60
+ network:
61
+ cls: NetworkWithPriorsFnoEmb
62
+ pretrained_name: null
63
+ device: 'cuda'
64
+ kwargs:
65
+ in_channels: 2
66
+ dim_embedding: 256
67
+ width_fno: 128
68
+ n_fno_blocks : 6
69
+ modes: 16
70
+ embedding_net_activation: 'gelu'
71
+ use_batch_norm: True
72
+ dim_out: 17
73
+ layer_width: 1024
74
+ num_blocks: 6
75
+ repeats_per_block: 2
76
+ mlp_activation: 'gelu'
77
+ dropout_rate: 0.0
78
+
79
+ training:
80
+ num_iterations: 50000
81
+ batch_size: 1024
82
+ lr: 1.0e-4
83
+ grad_accumulation_steps: 1
84
+ clip_grad_norm_max: 1.0
85
+ train_with_q_input: True
86
+ update_tqdm_freq: 1
87
+ optimizer: AdamW
88
+ trainer_kwargs:
89
+ optim_kwargs:
90
+ betas: [0.9, 0.999]
91
+ weight_decay: 0.0005
92
+ callbacks:
93
+ save_best_model:
94
+ enable: true
95
+ freq: 500
96
+ lr_scheduler:
97
+ cls: StepLR
98
+ kwargs:
99
+ step_size: 2000
100
+ gamma: 0.9
101
+ logger:
102
+ use_neptune: false
configs/mc-o14.yaml ADDED
@@ -0,0 +1,102 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc-o14
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 200.]
11
+ roughnesses: [0., 20.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 200.]
15
+ roughnesses: [1.0e-2, 20.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 5
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: VariableQ
28
+ kwargs:
29
+ q_min_range: [0.01, 0.05]
30
+ q_max_range: [0.15, 0.4]
31
+ n_q_range: [128, 256]
32
+ device: 'cuda'
33
+
34
+ intensity_noise:
35
+ cls: BasicExpIntensityNoise
36
+ kwargs:
37
+ relative_errors: [0.0, 0.2]
38
+ abs_errors: 0.0
39
+ consistent_rel_err: true
40
+ logdist: false
41
+ apply_shift: false
42
+ shift_range: [-0.3, 0.3]
43
+ apply_scaling: false
44
+ scale_range: [-0.02, 0.02]
45
+
46
+ q_noise:
47
+ cls: BasicQNoiseGenerator
48
+ kwargs:
49
+ shift_std: 1.0e-3
50
+ noise_std: [0., 1.0e-3]
51
+
52
+ curves_scaler:
53
+ cls: LogAffineCurvesScaler
54
+ kwargs:
55
+ weight: 0.2
56
+ bias: 1.0
57
+ eps: 1.0e-10
58
+
59
+ model:
60
+ network:
61
+ cls: NetworkWithPriorsFnoEmb
62
+ pretrained_name: null
63
+ device: 'cuda'
64
+ kwargs:
65
+ in_channels: 2
66
+ dim_embedding: 256
67
+ width_fno: 128
68
+ n_fno_blocks : 6
69
+ modes: 32
70
+ embedding_net_activation: 'gelu'
71
+ use_batch_norm: True
72
+ dim_out: 17
73
+ layer_width: 1024
74
+ num_blocks: 6
75
+ repeats_per_block: 2
76
+ mlp_activation: 'gelu'
77
+ dropout_rate: 0.0
78
+
79
+ training:
80
+ num_iterations: 50000
81
+ batch_size: 1024
82
+ lr: 1.0e-4
83
+ grad_accumulation_steps: 1
84
+ clip_grad_norm_max: 1.0
85
+ train_with_q_input: True
86
+ update_tqdm_freq: 1
87
+ optimizer: AdamW
88
+ trainer_kwargs:
89
+ optim_kwargs:
90
+ betas: [0.9, 0.999]
91
+ weight_decay: 0.0005
92
+ callbacks:
93
+ save_best_model:
94
+ enable: true
95
+ freq: 500
96
+ lr_scheduler:
97
+ cls: StepLR
98
+ kwargs:
99
+ step_size: 2000
100
+ gamma: 0.9
101
+ logger:
102
+ use_neptune: false
configs/mc-o15.yaml ADDED
@@ -0,0 +1,102 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc-o15
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 200.]
11
+ roughnesses: [0., 20.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 200.]
15
+ roughnesses: [1.0e-2, 20.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 5
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: VariableQ
28
+ kwargs:
29
+ q_min_range: [0.01, 0.05]
30
+ q_max_range: [0.15, 0.4]
31
+ n_q_range: [128, 256]
32
+ device: 'cuda'
33
+
34
+ intensity_noise:
35
+ cls: BasicExpIntensityNoise
36
+ kwargs:
37
+ relative_errors: [0.0, 0.2]
38
+ abs_errors: 0.0
39
+ consistent_rel_err: true
40
+ logdist: false
41
+ apply_shift: false
42
+ shift_range: [-0.3, 0.3]
43
+ apply_scaling: false
44
+ scale_range: [-0.02, 0.02]
45
+
46
+ q_noise:
47
+ cls: BasicQNoiseGenerator
48
+ kwargs:
49
+ shift_std: 1.0e-3
50
+ noise_std: [0., 1.0e-3]
51
+
52
+ curves_scaler:
53
+ cls: LogAffineCurvesScaler
54
+ kwargs:
55
+ weight: 0.2
56
+ bias: 1.0
57
+ eps: 1.0e-10
58
+
59
+ model:
60
+ network:
61
+ cls: NetworkWithPriorsFnoEmb
62
+ pretrained_name: null
63
+ device: 'cuda'
64
+ kwargs:
65
+ in_channels: 2
66
+ dim_embedding: 256
67
+ width_fno: 128
68
+ n_fno_blocks : 6
69
+ modes: 16
70
+ embedding_net_activation: 'gelu'
71
+ use_batch_norm: True
72
+ dim_out: 17
73
+ layer_width: 1024
74
+ num_blocks: 6
75
+ repeats_per_block: 2
76
+ mlp_activation: 'gelu'
77
+ dropout_rate: 0.0
78
+
79
+ training:
80
+ num_iterations: 50000
81
+ batch_size: 512
82
+ lr: 1.0e-4
83
+ grad_accumulation_steps: 10
84
+ clip_grad_norm_max: 1.0
85
+ train_with_q_input: True
86
+ update_tqdm_freq: 1
87
+ optimizer: AdamW
88
+ trainer_kwargs:
89
+ optim_kwargs:
90
+ betas: [0.9, 0.999]
91
+ weight_decay: 0.0005
92
+ callbacks:
93
+ save_best_model:
94
+ enable: true
95
+ freq: 500
96
+ lr_scheduler:
97
+ cls: StepLR
98
+ kwargs:
99
+ step_size: 2000
100
+ gamma: 0.9
101
+ logger:
102
+ use_neptune: false
configs/mc-o16.yaml ADDED
@@ -0,0 +1,102 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc-o16
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 200.]
11
+ roughnesses: [0., 20.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 200.]
15
+ roughnesses: [1.0e-2, 20.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 5
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: VariableQ
28
+ kwargs:
29
+ q_min_range: [0.01, 0.05]
30
+ q_max_range: [0.15, 0.4]
31
+ n_q_range: [128, 256]
32
+ device: 'cuda'
33
+
34
+ intensity_noise:
35
+ cls: BasicExpIntensityNoise
36
+ kwargs:
37
+ relative_errors: [0.0, 0.2]
38
+ abs_errors: 0.0
39
+ consistent_rel_err: true
40
+ logdist: false
41
+ apply_shift: false
42
+ shift_range: [-0.3, 0.3]
43
+ apply_scaling: false
44
+ scale_range: [-0.02, 0.02]
45
+
46
+ q_noise:
47
+ cls: BasicQNoiseGenerator
48
+ kwargs:
49
+ shift_std: 1.0e-3
50
+ noise_std: [0., 1.0e-3]
51
+
52
+ curves_scaler:
53
+ cls: LogAffineCurvesScaler
54
+ kwargs:
55
+ weight: 0.2
56
+ bias: 1.0
57
+ eps: 1.0e-10
58
+
59
+ model:
60
+ network:
61
+ cls: NetworkWithPriorsFnoEmb
62
+ pretrained_name: null
63
+ device: 'cuda'
64
+ kwargs:
65
+ in_channels: 2
66
+ dim_embedding: 256
67
+ width_fno: 128
68
+ n_fno_blocks : 6
69
+ modes: 16
70
+ embedding_net_activation: 'gelu'
71
+ use_batch_norm: True
72
+ dim_out: 17
73
+ layer_width: 1024
74
+ num_blocks: 6
75
+ repeats_per_block: 2
76
+ mlp_activation: 'gelu'
77
+ dropout_rate: 0.0
78
+
79
+ training:
80
+ num_iterations: 50000
81
+ batch_size: 1024
82
+ lr: 1.0e-4
83
+ grad_accumulation_steps: 20
84
+ clip_grad_norm_max: 1.0
85
+ train_with_q_input: True
86
+ update_tqdm_freq: 1
87
+ optimizer: AdamW
88
+ trainer_kwargs:
89
+ optim_kwargs:
90
+ betas: [0.9, 0.999]
91
+ weight_decay: 0.0005
92
+ callbacks:
93
+ save_best_model:
94
+ enable: true
95
+ freq: 500
96
+ lr_scheduler:
97
+ cls: StepLR
98
+ kwargs:
99
+ step_size: 2000
100
+ gamma: 0.9
101
+ logger:
102
+ use_neptune: false
configs/mc-o2.yaml ADDED
@@ -0,0 +1,102 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc-o2
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 20.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 20.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: VariableQ
28
+ kwargs:
29
+ q_min_range: [0.01, 0.05]
30
+ q_max_range: [0.15, 0.4]
31
+ n_q_range: [128, 256]
32
+ device: 'cuda'
33
+
34
+ intensity_noise:
35
+ cls: BasicExpIntensityNoise
36
+ kwargs:
37
+ relative_errors: [0.0, 0.2]
38
+ abs_errors: 0.0
39
+ consistent_rel_err: true
40
+ logdist: false
41
+ apply_shift: false
42
+ shift_range: [-0.3, 0.3]
43
+ apply_scaling: false
44
+ scale_range: [-0.02, 0.02]
45
+
46
+ q_noise:
47
+ cls: BasicQNoiseGenerator
48
+ kwargs:
49
+ shift_std: 1.0e-3
50
+ noise_std: [0., 1.0e-3]
51
+
52
+ curves_scaler:
53
+ cls: LogAffineCurvesScaler
54
+ kwargs:
55
+ weight: 0.2
56
+ bias: 1.0
57
+ eps: 1.0e-10
58
+
59
+ model:
60
+ network:
61
+ cls: NetworkWithPriorsFnoEmb
62
+ pretrained_name: null
63
+ device: 'cuda'
64
+ kwargs:
65
+ in_channels: 2
66
+ dim_embedding: 256
67
+ width_fno: 128
68
+ n_fno_blocks : 6
69
+ modes: 16
70
+ embedding_net_activation: 'gelu'
71
+ use_batch_norm: True
72
+ dim_out: 8
73
+ layer_width: 1024
74
+ num_blocks: 6
75
+ repeats_per_block: 2
76
+ mlp_activation: 'gelu'
77
+ dropout_rate: 0.0
78
+
79
+ training:
80
+ num_iterations: 50000
81
+ batch_size: 1024
82
+ lr: 1.0e-4
83
+ grad_accumulation_steps: 10
84
+ clip_grad_norm_max: 1.0
85
+ train_with_q_input: True
86
+ update_tqdm_freq: 1
87
+ optimizer: AdamW
88
+ trainer_kwargs:
89
+ optim_kwargs:
90
+ betas: [0.9, 0.999]
91
+ weight_decay: 0.0005
92
+ callbacks:
93
+ save_best_model:
94
+ enable: true
95
+ freq: 500
96
+ lr_scheduler:
97
+ cls: StepLR
98
+ kwargs:
99
+ step_size: 2000
100
+ gamma: 0.9
101
+ logger:
102
+ use_neptune: false
configs/mc-o3.yaml ADDED
@@ -0,0 +1,102 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc-o3
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 20.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 20.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: VariableQ
28
+ kwargs:
29
+ q_min_range: [0.01, 0.05]
30
+ q_max_range: [0.15, 0.4]
31
+ n_q_range: [128, 256]
32
+ device: 'cuda'
33
+
34
+ intensity_noise:
35
+ cls: BasicExpIntensityNoise
36
+ kwargs:
37
+ relative_errors: [0.0, 0.2]
38
+ abs_errors: 0.0
39
+ consistent_rel_err: true
40
+ logdist: false
41
+ apply_shift: false
42
+ shift_range: [-0.3, 0.3]
43
+ apply_scaling: false
44
+ scale_range: [-0.02, 0.02]
45
+
46
+ q_noise:
47
+ cls: BasicQNoiseGenerator
48
+ kwargs:
49
+ shift_std: 1.0e-3
50
+ noise_std: [0., 1.0e-3]
51
+
52
+ curves_scaler:
53
+ cls: LogAffineCurvesScaler
54
+ kwargs:
55
+ weight: 0.2
56
+ bias: 1.0
57
+ eps: 1.0e-10
58
+
59
+ model:
60
+ network:
61
+ cls: NetworkWithPriorsFnoEmb
62
+ pretrained_name: null
63
+ device: 'cuda'
64
+ kwargs:
65
+ in_channels: 2
66
+ dim_embedding: 256
67
+ width_fno: 128
68
+ n_fno_blocks : 6
69
+ modes: 16
70
+ embedding_net_activation: 'gelu'
71
+ use_batch_norm: True
72
+ dim_out: 8
73
+ layer_width: 1024
74
+ num_blocks: 6
75
+ repeats_per_block: 2
76
+ mlp_activation: 'gelu'
77
+ dropout_rate: 0.0
78
+
79
+ training:
80
+ num_iterations: 50000
81
+ batch_size: 1024
82
+ lr: 1.0e-4
83
+ grad_accumulation_steps: 50
84
+ clip_grad_norm_max: 1.0
85
+ train_with_q_input: True
86
+ update_tqdm_freq: 1
87
+ optimizer: AdamW
88
+ trainer_kwargs:
89
+ optim_kwargs:
90
+ betas: [0.9, 0.999]
91
+ weight_decay: 0.0005
92
+ callbacks:
93
+ save_best_model:
94
+ enable: true
95
+ freq: 500
96
+ lr_scheduler:
97
+ cls: StepLR
98
+ kwargs:
99
+ step_size: 2000
100
+ gamma: 0.9
101
+ logger:
102
+ use_neptune: false
configs/mc-o4.yaml ADDED
@@ -0,0 +1,102 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc-o4
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 20.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 20.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: VariableQ
28
+ kwargs:
29
+ q_min_range: [0.01, 0.05]
30
+ q_max_range: [0.15, 0.4]
31
+ n_q_range: [128, 256]
32
+ device: 'cuda'
33
+
34
+ intensity_noise:
35
+ cls: BasicExpIntensityNoise
36
+ kwargs:
37
+ relative_errors: [0.0, 0.2]
38
+ abs_errors: 0.0
39
+ consistent_rel_err: true
40
+ logdist: false
41
+ apply_shift: false
42
+ shift_range: [-0.3, 0.3]
43
+ apply_scaling: false
44
+ scale_range: [-0.02, 0.02]
45
+
46
+ q_noise:
47
+ cls: BasicQNoiseGenerator
48
+ kwargs:
49
+ shift_std: 1.0e-3
50
+ noise_std: [0., 1.0e-3]
51
+
52
+ curves_scaler:
53
+ cls: LogAffineCurvesScaler
54
+ kwargs:
55
+ weight: 0.2
56
+ bias: 1.0
57
+ eps: 1.0e-10
58
+
59
+ model:
60
+ network:
61
+ cls: NetworkWithPriorsFnoEmb
62
+ pretrained_name: null
63
+ device: 'cuda'
64
+ kwargs:
65
+ in_channels: 2
66
+ dim_embedding: 256
67
+ width_fno: 128
68
+ n_fno_blocks : 6
69
+ modes: 16
70
+ embedding_net_activation: 'gelu'
71
+ use_batch_norm: True
72
+ dim_out: 8
73
+ layer_width: 1024
74
+ num_blocks: 6
75
+ repeats_per_block: 2
76
+ mlp_activation: 'gelu'
77
+ dropout_rate: 0.0
78
+
79
+ training:
80
+ num_iterations: 50000
81
+ batch_size: 1024
82
+ lr: 1.0e-3
83
+ grad_accumulation_steps: 1
84
+ clip_grad_norm_max: 1.0
85
+ train_with_q_input: True
86
+ update_tqdm_freq: 1
87
+ optimizer: AdamW
88
+ trainer_kwargs:
89
+ optim_kwargs:
90
+ betas: [0.9, 0.999]
91
+ weight_decay: 0.0005
92
+ callbacks:
93
+ save_best_model:
94
+ enable: true
95
+ freq: 500
96
+ lr_scheduler:
97
+ cls: StepLR
98
+ kwargs:
99
+ step_size: 2000
100
+ gamma: 0.9
101
+ logger:
102
+ use_neptune: false
configs/mc-o5.yaml ADDED
@@ -0,0 +1,102 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc-o5
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 20.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 20.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: VariableQ
28
+ kwargs:
29
+ q_min_range: [0.01, 0.05]
30
+ q_max_range: [0.15, 0.4]
31
+ n_q_range: [128, 256]
32
+ device: 'cuda'
33
+
34
+ intensity_noise:
35
+ cls: BasicExpIntensityNoise
36
+ kwargs:
37
+ relative_errors: [0.0, 0.2]
38
+ abs_errors: 0.0
39
+ consistent_rel_err: true
40
+ logdist: false
41
+ apply_shift: false
42
+ shift_range: [-0.3, 0.3]
43
+ apply_scaling: false
44
+ scale_range: [-0.02, 0.02]
45
+
46
+ q_noise:
47
+ cls: BasicQNoiseGenerator
48
+ kwargs:
49
+ shift_std: 1.0e-3
50
+ noise_std: [0., 1.0e-3]
51
+
52
+ curves_scaler:
53
+ cls: LogAffineCurvesScaler
54
+ kwargs:
55
+ weight: 0.2
56
+ bias: 1.0
57
+ eps: 1.0e-10
58
+
59
+ model:
60
+ network:
61
+ cls: NetworkWithPriorsFnoEmb
62
+ pretrained_name: null
63
+ device: 'cuda'
64
+ kwargs:
65
+ in_channels: 2
66
+ dim_embedding: 256
67
+ width_fno: 128
68
+ n_fno_blocks : 6
69
+ modes: 16
70
+ embedding_net_activation: 'gelu'
71
+ use_batch_norm: True
72
+ dim_out: 8
73
+ layer_width: 1024
74
+ num_blocks: 6
75
+ repeats_per_block: 2
76
+ mlp_activation: 'gelu'
77
+ dropout_rate: 0.0
78
+
79
+ training:
80
+ num_iterations: 50000
81
+ batch_size: 512
82
+ lr: 1.0e-4
83
+ grad_accumulation_steps: 1
84
+ clip_grad_norm_max: 1.0
85
+ train_with_q_input: True
86
+ update_tqdm_freq: 1
87
+ optimizer: AdamW
88
+ trainer_kwargs:
89
+ optim_kwargs:
90
+ betas: [0.9, 0.999]
91
+ weight_decay: 0.0005
92
+ callbacks:
93
+ save_best_model:
94
+ enable: true
95
+ freq: 500
96
+ lr_scheduler:
97
+ cls: StepLR
98
+ kwargs:
99
+ step_size: 2000
100
+ gamma: 0.9
101
+ logger:
102
+ use_neptune: false
configs/mc-o7.yaml ADDED
@@ -0,0 +1,102 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc-o7
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 20.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 20.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: VariableQ
28
+ kwargs:
29
+ q_min_range: [0.01, 0.05]
30
+ q_max_range: [0.15, 0.4]
31
+ n_q_range: [128, 256]
32
+ device: 'cuda'
33
+
34
+ intensity_noise:
35
+ cls: BasicExpIntensityNoise
36
+ kwargs:
37
+ relative_errors: [0.0, 0.2]
38
+ abs_errors: 0.0
39
+ consistent_rel_err: true
40
+ logdist: false
41
+ apply_shift: false
42
+ shift_range: [-0.3, 0.3]
43
+ apply_scaling: false
44
+ scale_range: [-0.02, 0.02]
45
+
46
+ q_noise:
47
+ cls: BasicQNoiseGenerator
48
+ kwargs:
49
+ shift_std: 1.0e-3
50
+ noise_std: [0., 1.0e-3]
51
+
52
+ curves_scaler:
53
+ cls: LogAffineCurvesScaler
54
+ kwargs:
55
+ weight: 0.2
56
+ bias: 1.0
57
+ eps: 1.0e-10
58
+
59
+ model:
60
+ network:
61
+ cls: NetworkWithPriorsFnoEmb
62
+ pretrained_name: null
63
+ device: 'cuda'
64
+ kwargs:
65
+ in_channels: 2
66
+ dim_embedding: 256
67
+ width_fno: 128
68
+ n_fno_blocks : 6
69
+ modes: 8
70
+ embedding_net_activation: 'gelu'
71
+ use_batch_norm: True
72
+ dim_out: 8
73
+ layer_width: 1024
74
+ num_blocks: 6
75
+ repeats_per_block: 2
76
+ mlp_activation: 'gelu'
77
+ dropout_rate: 0.0
78
+
79
+ training:
80
+ num_iterations: 50000
81
+ batch_size: 1024
82
+ lr: 1.0e-4
83
+ grad_accumulation_steps: 1
84
+ clip_grad_norm_max: 1.0
85
+ train_with_q_input: True
86
+ update_tqdm_freq: 1
87
+ optimizer: AdamW
88
+ trainer_kwargs:
89
+ optim_kwargs:
90
+ betas: [0.9, 0.999]
91
+ weight_decay: 0.0005
92
+ callbacks:
93
+ save_best_model:
94
+ enable: true
95
+ freq: 500
96
+ lr_scheduler:
97
+ cls: StepLR
98
+ kwargs:
99
+ step_size: 2000
100
+ gamma: 0.9
101
+ logger:
102
+ use_neptune: false
configs/mc-o8.yaml ADDED
@@ -0,0 +1,102 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc-o8
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 20.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 20.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: VariableQ
28
+ kwargs:
29
+ q_min_range: [0.01, 0.05]
30
+ q_max_range: [0.15, 0.4]
31
+ n_q_range: [128, 256]
32
+ device: 'cuda'
33
+
34
+ intensity_noise:
35
+ cls: BasicExpIntensityNoise
36
+ kwargs:
37
+ relative_errors: [0.0, 0.2]
38
+ abs_errors: 0.0
39
+ consistent_rel_err: true
40
+ logdist: false
41
+ apply_shift: false
42
+ shift_range: [-0.3, 0.3]
43
+ apply_scaling: false
44
+ scale_range: [-0.02, 0.02]
45
+
46
+ q_noise:
47
+ cls: BasicQNoiseGenerator
48
+ kwargs:
49
+ shift_std: 1.0e-3
50
+ noise_std: [0., 1.0e-3]
51
+
52
+ curves_scaler:
53
+ cls: LogAffineCurvesScaler
54
+ kwargs:
55
+ weight: 0.2
56
+ bias: 1.0
57
+ eps: 1.0e-10
58
+
59
+ model:
60
+ network:
61
+ cls: NetworkWithPriorsFnoEmb
62
+ pretrained_name: null
63
+ device: 'cuda'
64
+ kwargs:
65
+ in_channels: 2
66
+ dim_embedding: 256
67
+ width_fno: 128
68
+ n_fno_blocks : 6
69
+ modes: 32
70
+ embedding_net_activation: 'gelu'
71
+ use_batch_norm: True
72
+ dim_out: 8
73
+ layer_width: 1024
74
+ num_blocks: 6
75
+ repeats_per_block: 2
76
+ mlp_activation: 'gelu'
77
+ dropout_rate: 0.0
78
+
79
+ training:
80
+ num_iterations: 50000
81
+ batch_size: 1024
82
+ lr: 1.0e-4
83
+ grad_accumulation_steps: 1
84
+ clip_grad_norm_max: 1.0
85
+ train_with_q_input: True
86
+ update_tqdm_freq: 1
87
+ optimizer: AdamW
88
+ trainer_kwargs:
89
+ optim_kwargs:
90
+ betas: [0.9, 0.999]
91
+ weight_decay: 0.0005
92
+ callbacks:
93
+ save_best_model:
94
+ enable: true
95
+ freq: 500
96
+ lr_scheduler:
97
+ cls: StepLR
98
+ kwargs:
99
+ step_size: 2000
100
+ gamma: 0.9
101
+ logger:
102
+ use_neptune: false
configs/mc-o9.yaml ADDED
@@ -0,0 +1,102 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc-o9
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 20.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 20.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: VariableQ
28
+ kwargs:
29
+ q_min_range: [0.01, 0.05]
30
+ q_max_range: [0.15, 0.4]
31
+ n_q_range: [128, 256]
32
+ device: 'cuda'
33
+
34
+ intensity_noise:
35
+ cls: BasicExpIntensityNoise
36
+ kwargs:
37
+ relative_errors: [0.0, 0.2]
38
+ abs_errors: 0.0
39
+ consistent_rel_err: true
40
+ logdist: false
41
+ apply_shift: false
42
+ shift_range: [-0.3, 0.3]
43
+ apply_scaling: false
44
+ scale_range: [-0.02, 0.02]
45
+
46
+ q_noise:
47
+ cls: BasicQNoiseGenerator
48
+ kwargs:
49
+ shift_std: 1.0e-3
50
+ noise_std: [0., 1.0e-3]
51
+
52
+ curves_scaler:
53
+ cls: LogAffineCurvesScaler
54
+ kwargs:
55
+ weight: 0.2
56
+ bias: 1.0
57
+ eps: 1.0e-10
58
+
59
+ model:
60
+ network:
61
+ cls: NetworkWithPriorsFnoEmb
62
+ pretrained_name: null
63
+ device: 'cuda'
64
+ kwargs:
65
+ in_channels: 2
66
+ dim_embedding: 512
67
+ width_fno: 128
68
+ n_fno_blocks : 1
69
+ modes: 16
70
+ embedding_net_activation: 'gelu'
71
+ use_batch_norm: True
72
+ dim_out: 8
73
+ layer_width: 1024
74
+ num_blocks: 6
75
+ repeats_per_block: 2
76
+ mlp_activation: 'gelu'
77
+ dropout_rate: 0.0
78
+
79
+ training:
80
+ num_iterations: 50000
81
+ batch_size: 1024
82
+ lr: 1.0e-4
83
+ grad_accumulation_steps: 1
84
+ clip_grad_norm_max: 1.0
85
+ train_with_q_input: True
86
+ update_tqdm_freq: 1
87
+ optimizer: AdamW
88
+ trainer_kwargs:
89
+ optim_kwargs:
90
+ betas: [0.9, 0.999]
91
+ weight_decay: 0.0005
92
+ callbacks:
93
+ save_best_model:
94
+ enable: true
95
+ freq: 500
96
+ lr_scheduler:
97
+ cls: StepLR
98
+ kwargs:
99
+ step_size: 2000
100
+ gamma: 0.9
101
+ logger:
102
+ use_neptune: false
configs/mc1.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc1
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 60.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 60.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.15, 128]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: false
38
+ logdist: false
39
+ apply_shift: false
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: false
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 8
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani
configs/mc10.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc10
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 60.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 60.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: true
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.15, 256]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: false
38
+ logdist: false
39
+ apply_shift: false
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: false
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 8
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani
configs/mc11.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc11
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 60.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 60.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: true
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.2, 256]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: false
38
+ logdist: false
39
+ apply_shift: false
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: false
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 8
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani
configs/mc12.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc12
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 60.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 60.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: true
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.3, 256]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: false
38
+ logdist: false
39
+ apply_shift: false
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: false
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 8
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani
configs/mc13.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc13
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 60.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 60.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.15, 128]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: false
38
+ logdist: false
39
+ apply_shift: true
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: true
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 8
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani
configs/mc14.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc14
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 60.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 60.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.2, 128]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: false
38
+ logdist: false
39
+ apply_shift: true
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: true
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 8
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani
configs/mc15.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc15
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 60.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 60.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.3, 128]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: false
38
+ logdist: false
39
+ apply_shift: true
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: true
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 8
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani
configs/mc16.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc16
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 60.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 60.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.15, 256]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: false
38
+ logdist: false
39
+ apply_shift: true
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: true
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 8
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani
configs/mc17.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc17
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 60.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 60.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.2, 256]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: false
38
+ logdist: false
39
+ apply_shift: true
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: true
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 8
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani
configs/mc18.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc18
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 60.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 60.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.3, 256]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: false
38
+ logdist: false
39
+ apply_shift: true
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: true
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 8
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani
configs/mc19.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc19
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 60.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 60.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.15, 128]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: true
38
+ logdist: false
39
+ apply_shift: false
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: false
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 8
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani
configs/mc2.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc2
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 60.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 60.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.2, 128]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: false
38
+ logdist: false
39
+ apply_shift: false
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: false
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 8
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani
configs/mc20.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc20
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 60.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 60.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.2, 128]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: true
38
+ logdist: false
39
+ apply_shift: false
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: false
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 8
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani
configs/mc21.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc21
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 60.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 60.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.3, 128]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: true
38
+ logdist: false
39
+ apply_shift: false
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: false
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 8
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani
configs/mc22.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc22
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 60.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 60.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.15, 256]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: true
38
+ logdist: false
39
+ apply_shift: false
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: false
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 8
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani
configs/mc23.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc23
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 60.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 60.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.2, 256]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: true
38
+ logdist: false
39
+ apply_shift: false
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: false
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 8
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani
configs/mc24.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc24
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 60.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 60.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.3, 256]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: true
38
+ logdist: false
39
+ apply_shift: false
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: false
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 8
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani
configs/mc25.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc25
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 20.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 20.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.15, 128]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: true
38
+ logdist: false
39
+ apply_shift: false
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: false
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 8
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani
configs/mc26.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc26
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 60.]
12
+ slds: [0., 150.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 60.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.15, 128]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: true
38
+ logdist: false
39
+ apply_shift: false
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: false
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 8
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani
configs/mc27.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc27
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 20.]
12
+ slds: [0., 150.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 20.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.15, 128]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: true
38
+ logdist: false
39
+ apply_shift: false
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: false
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 8
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani
configs/mc28.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc28
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 20.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 20.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.3, 256]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: true
38
+ logdist: false
39
+ apply_shift: false
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: false
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 8
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani
configs/mc29.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc29
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 60.]
12
+ slds: [0., 150.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 60.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.3, 256]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: true
38
+ logdist: false
39
+ apply_shift: false
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: false
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 8
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani
configs/mc3.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc3
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 60.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 60.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.3, 128]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: false
38
+ logdist: false
39
+ apply_shift: false
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: false
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 8
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani
configs/mc30.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc30
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 20.]
12
+ slds: [0., 150.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 20.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.3, 256]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: true
38
+ logdist: false
39
+ apply_shift: false
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: false
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 8
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani
configs/mc31.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc31
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 60.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 60.]
16
+ slds: [ 1.0e-2, 10.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.3, 256]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: true
38
+ logdist: false
39
+ apply_shift: false
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: false
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 8
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani
configs/mc32.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc32
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 60.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 60.]
16
+ slds: [ 1.0e-2, 1.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.3, 256]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: true
38
+ logdist: false
39
+ apply_shift: false
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: false
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 8
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani
configs/mc33.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc33
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 60.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 60.]
16
+ slds: [ 1.0e-2, 50.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.3, 256]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: true
38
+ logdist: false
39
+ apply_shift: false
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: false
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 8
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani
configs/mc34.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc34
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 60.]
12
+ slds: [-20., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 60.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.15, 128]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: true
38
+ logdist: false
39
+ apply_shift: false
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: false
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 8
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani
configs/mc35.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc35
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 60.]
12
+ slds: [-20., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 60.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.3, 256]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: true
38
+ logdist: false
39
+ apply_shift: false
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: false
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 8
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani
configs/mc36.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc36
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 20.]
12
+ slds: [-20., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 20.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.15, 128]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: true
38
+ logdist: false
39
+ apply_shift: false
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: false
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 8
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani
configs/mc37.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc37
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 20.]
12
+ slds: [-20., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 20.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.3, 256]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: true
38
+ logdist: false
39
+ apply_shift: false
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: false
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 8
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani
configs/mc38.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc38
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 300.]
11
+ roughnesses: [0., 20.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 300.]
15
+ roughnesses: [1.0e-2, 20.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 3
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.15, 256]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: true
38
+ logdist: false
39
+ apply_shift: false
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: false
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 11
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani
configs/mc39.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc39
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 300.]
11
+ roughnesses: [0., 20.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 300.]
15
+ roughnesses: [1.0e-2, 20.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 3
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.3, 256]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: true
38
+ logdist: false
39
+ apply_shift: false
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: false
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 11
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani
configs/mc4.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc4
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 500.]
11
+ roughnesses: [0., 60.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 500.]
15
+ roughnesses: [1.0e-2, 60.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 2
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.15, 256]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: false
38
+ logdist: false
39
+ apply_shift: false
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: false
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 8
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani
configs/mc40.yaml ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: mc40
3
+ root_dir: null
4
+
5
+ dset:
6
+ prior_sampler:
7
+ cls: SubpriorParametricSampler
8
+ kwargs:
9
+ param_ranges:
10
+ thicknesses: [0., 300.]
11
+ roughnesses: [0., 60.]
12
+ slds: [0., 50.]
13
+ bound_width_ranges:
14
+ thicknesses: [1.0e-2, 300.]
15
+ roughnesses: [1.0e-2, 60.]
16
+ slds: [ 1.0e-2, 5.]
17
+ model_name: standard_model
18
+ max_num_layers: 3
19
+ constrained_roughness: true
20
+ max_thickness_share: 0.5
21
+ logdist: false
22
+ scale_params_by_ranges: false
23
+ scaled_range: [-1., 1.]
24
+ device: 'cuda'
25
+
26
+ q_generator:
27
+ cls: ConstantQ
28
+ kwargs:
29
+ q: [0.02, 0.15, 256]
30
+ device: 'cuda'
31
+
32
+ intensity_noise:
33
+ cls: BasicExpIntensityNoise
34
+ kwargs:
35
+ relative_errors: [0.0, 0.2]
36
+ abs_errors: 0.0
37
+ consistent_rel_err: true
38
+ logdist: false
39
+ apply_shift: false
40
+ shift_range: [-0.3, 0.3]
41
+ apply_scaling: false
42
+ scale_range: [-0.02, 0.02]
43
+
44
+ # q_noise:
45
+ # cls: BasicQNoiseGenerator
46
+ # kwargs:
47
+ # shift_std: 1.0e-3
48
+ # noise_std: [0., 1.0e-3]
49
+
50
+ curves_scaler:
51
+ cls: LogAffineCurvesScaler
52
+ kwargs:
53
+ weight: 0.2
54
+ bias: 1.0
55
+ eps: 1.0e-10
56
+
57
+ model:
58
+ network:
59
+ cls: NetworkWithPriorsConvEmb
60
+ pretrained_name: null
61
+ device: 'cuda'
62
+ kwargs:
63
+ in_channels: 1
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ dim_embedding: 128
66
+ dim_avpool: 1
67
+ embedding_net_activation: 'gelu'
68
+ use_batch_norm: true
69
+ dim_out: 11
70
+ layer_width: 1024
71
+ num_blocks: 6
72
+ repeats_per_block: 2
73
+ mlp_activation: 'gelu'
74
+ dropout_rate: 0.0
75
+ pretrained_embedding_net: null
76
+
77
+ training:
78
+ num_iterations: 50000
79
+ batch_size: 4096
80
+ lr: 1.0e-4
81
+ grad_accumulation_steps: 1
82
+ clip_grad_norm_max: null
83
+ train_with_q_input: False
84
+ update_tqdm_freq: 1
85
+ optimizer: AdamW
86
+ trainer_kwargs:
87
+ optim_kwargs:
88
+ betas: [0.9, 0.999]
89
+ weight_decay: 0.0005
90
+ callbacks:
91
+ save_best_model:
92
+ enable: true
93
+ freq: 100
94
+ lr_scheduler:
95
+ cls: StepLR
96
+ kwargs:
97
+ step_size: 2000
98
+ gamma: 0.9
99
+ logger:
100
+ use_neptune: false
101
+
102
+ slurm:
103
+ cluster: 'tuebingen'
104
+ time: 0-05:00 #D-HH:MM
105
+ partition: 2080-galvani