valentinsingularity commited on
Commit
fe20c1e
·
verified ·
1 Parent(s): 2d8737c

Upload 6 files

Browse files
configs/b_mc_point_xray_conv_absorption_L1_InputQ.yaml ADDED
@@ -0,0 +1,114 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: b_mc_point_xray_conv_absorption_L1_InputQ
3
+ root_dir: null
4
+
5
+ dset:
6
+ cls: ReflectivityDataLoader
7
+ prior_sampler:
8
+ cls: SubpriorParametricSampler
9
+ kwargs:
10
+ param_ranges:
11
+ thicknesses: [1., 1000.]
12
+ roughnesses: [0., 60.]
13
+ slds: [0., 150.]
14
+ islds: [0., 30.]
15
+ bound_width_ranges:
16
+ thicknesses: [1.0e-2, 1000.]
17
+ roughnesses: [1.0e-2, 60.]
18
+ slds: [ 1.0e-2, 5.]
19
+ islds: [1.0e-2, 5.]
20
+ model_name: model_with_absorption
21
+ max_num_layers: 1
22
+ constrained_roughness: true
23
+ constrained_isld: true
24
+ max_thickness_share: 0.5
25
+ max_sld_share: 0.2
26
+ logdist: false
27
+ scale_params_by_ranges: false
28
+ scaled_range: [-1., 1.]
29
+ device: 'cuda'
30
+
31
+ q_generator:
32
+ cls: VariableQ
33
+ kwargs:
34
+ q_min_range: [0.001, 0.03]
35
+ q_max_range: [0.1, 0.4]
36
+ n_q_range: [128, 128]
37
+ device: 'cuda'
38
+
39
+ intensity_noise:
40
+ cls: GaussianExpIntensityNoise
41
+ kwargs:
42
+ relative_errors: [0.01, 0.3]
43
+ consistent_rel_err: false
44
+ apply_shift: true
45
+ shift_range: [-0.3, 0.3]
46
+ add_to_context: true
47
+
48
+ curves_scaler:
49
+ cls: LogAffineCurvesScaler
50
+ kwargs:
51
+ weight: 0.2
52
+ bias: 1.0
53
+ eps: 1.0e-10
54
+
55
+ model:
56
+ network:
57
+ cls: NetworkWithPriors
58
+ pretrained_name: null
59
+ device: 'cuda'
60
+ kwargs:
61
+ embedding_net_type: 'conv'
62
+ embedding_net_kwargs:
63
+ in_channels: 2
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ kernel_size: 3
66
+ dim_embedding: 128
67
+ dim_avpool: 1
68
+ use_batch_norm: true
69
+ use_se: false
70
+ activation: 'gelu'
71
+ pretrained_embedding_net: null
72
+ dim_out: 7 #4n_l+3
73
+ dim_conditioning_params: 0
74
+ layer_width: 512
75
+ num_blocks: 8
76
+ repeats_per_block: 2
77
+ residual: true
78
+ use_batch_norm: true
79
+ use_layer_norm: false
80
+ mlp_activation: 'gelu'
81
+ dropout_rate: 0.0
82
+ tanh_output: false
83
+ conditioning: 'film'
84
+ concat_condition_first_layer: false
85
+
86
+ training:
87
+ trainer_cls: PointEstimatorTrainer
88
+ num_iterations: 100000
89
+ batch_size: 4096
90
+ lr: 1.0e-3
91
+ grad_accumulation_steps: 1
92
+ clip_grad_norm_max: null
93
+ update_tqdm_freq: 1
94
+ optimizer: AdamW
95
+ trainer_kwargs:
96
+ train_with_q_input: true
97
+ train_with_sigmas: false
98
+ condition_on_q_resolutions: false
99
+ use_curve_reconstruction_loss: false
100
+ rescale_loss_interval_width: true
101
+ use_l1_loss: true
102
+ optim_kwargs:
103
+ betas: [0.9, 0.999]
104
+ weight_decay: 0.0005
105
+ callbacks:
106
+ save_best_model:
107
+ enable: true
108
+ freq: 500
109
+ lr_scheduler:
110
+ cls: CosineAnnealingWithWarmup
111
+ kwargs:
112
+ min_lr: 1.0e-6
113
+ warmup_iters: 500
114
+ total_iters: 100000
configs/b_mc_point_xray_conv_absorption_L2_InputQ.yaml ADDED
@@ -0,0 +1,114 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: b_mc_point_xray_conv_absorption_L2_InputQ
3
+ root_dir: null
4
+
5
+ dset:
6
+ cls: ReflectivityDataLoader
7
+ prior_sampler:
8
+ cls: SubpriorParametricSampler
9
+ kwargs:
10
+ param_ranges:
11
+ thicknesses: [1., 500.]
12
+ roughnesses: [0., 60.]
13
+ slds: [0., 150.]
14
+ islds: [0., 30.]
15
+ bound_width_ranges:
16
+ thicknesses: [1.0e-2, 500.]
17
+ roughnesses: [1.0e-2, 60.]
18
+ slds: [ 1.0e-2, 5.]
19
+ islds: [1.0e-2, 5.]
20
+ model_name: model_with_absorption
21
+ max_num_layers: 2
22
+ constrained_roughness: true
23
+ constrained_isld: true
24
+ max_thickness_share: 0.5
25
+ max_sld_share: 0.2
26
+ logdist: false
27
+ scale_params_by_ranges: false
28
+ scaled_range: [-1., 1.]
29
+ device: 'cuda'
30
+
31
+ q_generator:
32
+ cls: VariableQ
33
+ kwargs:
34
+ q_min_range: [0.001, 0.03]
35
+ q_max_range: [0.1, 0.4]
36
+ n_q_range: [128, 128]
37
+ device: 'cuda'
38
+
39
+ intensity_noise:
40
+ cls: GaussianExpIntensityNoise
41
+ kwargs:
42
+ relative_errors: [0.01, 0.3]
43
+ consistent_rel_err: false
44
+ apply_shift: true
45
+ shift_range: [-0.3, 0.3]
46
+ add_to_context: true
47
+
48
+ curves_scaler:
49
+ cls: LogAffineCurvesScaler
50
+ kwargs:
51
+ weight: 0.2
52
+ bias: 1.0
53
+ eps: 1.0e-10
54
+
55
+ model:
56
+ network:
57
+ cls: NetworkWithPriors
58
+ pretrained_name: null
59
+ device: 'cuda'
60
+ kwargs:
61
+ embedding_net_type: 'conv'
62
+ embedding_net_kwargs:
63
+ in_channels: 2
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ kernel_size: 3
66
+ dim_embedding: 128
67
+ dim_avpool: 1
68
+ use_batch_norm: true
69
+ use_se: false
70
+ activation: 'gelu'
71
+ pretrained_embedding_net: null
72
+ dim_out: 11 #4n_l+3
73
+ dim_conditioning_params: 0
74
+ layer_width: 512
75
+ num_blocks: 8
76
+ repeats_per_block: 2
77
+ residual: true
78
+ use_batch_norm: true
79
+ use_layer_norm: false
80
+ mlp_activation: 'gelu'
81
+ dropout_rate: 0.0
82
+ tanh_output: false
83
+ conditioning: 'film'
84
+ concat_condition_first_layer: false
85
+
86
+ training:
87
+ trainer_cls: PointEstimatorTrainer
88
+ num_iterations: 100000
89
+ batch_size: 4096
90
+ lr: 1.0e-3
91
+ grad_accumulation_steps: 1
92
+ clip_grad_norm_max: null
93
+ update_tqdm_freq: 1
94
+ optimizer: AdamW
95
+ trainer_kwargs:
96
+ train_with_q_input: true
97
+ train_with_sigmas: false
98
+ condition_on_q_resolutions: false
99
+ use_curve_reconstruction_loss: false
100
+ rescale_loss_interval_width: true
101
+ use_l1_loss: true
102
+ optim_kwargs:
103
+ betas: [0.9, 0.999]
104
+ weight_decay: 0.0005
105
+ callbacks:
106
+ save_best_model:
107
+ enable: true
108
+ freq: 500
109
+ lr_scheduler:
110
+ cls: CosineAnnealingWithWarmup
111
+ kwargs:
112
+ min_lr: 1.0e-6
113
+ warmup_iters: 500
114
+ total_iters: 100000
configs/b_mc_point_xray_conv_absorption_L3_InputQ.yaml ADDED
@@ -0,0 +1,114 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: b_mc_point_xray_conv_absorption_L3_InputQ
3
+ root_dir: null
4
+
5
+ dset:
6
+ cls: ReflectivityDataLoader
7
+ prior_sampler:
8
+ cls: SubpriorParametricSampler
9
+ kwargs:
10
+ param_ranges:
11
+ thicknesses: [1., 500.]
12
+ roughnesses: [0., 60.]
13
+ slds: [0., 150.]
14
+ islds: [0., 30.]
15
+ bound_width_ranges:
16
+ thicknesses: [1.0e-2, 500.]
17
+ roughnesses: [1.0e-2, 60.]
18
+ slds: [ 1.0e-2, 5.]
19
+ islds: [1.0e-2, 5.]
20
+ model_name: model_with_absorption
21
+ max_num_layers: 3
22
+ constrained_roughness: true
23
+ constrained_isld: true
24
+ max_thickness_share: 0.5
25
+ max_sld_share: 0.2
26
+ logdist: false
27
+ scale_params_by_ranges: false
28
+ scaled_range: [-1., 1.]
29
+ device: 'cuda'
30
+
31
+ q_generator:
32
+ cls: VariableQ
33
+ kwargs:
34
+ q_min_range: [0.001, 0.03]
35
+ q_max_range: [0.1, 0.4]
36
+ n_q_range: [128, 128]
37
+ device: 'cuda'
38
+
39
+ intensity_noise:
40
+ cls: GaussianExpIntensityNoise
41
+ kwargs:
42
+ relative_errors: [0.01, 0.3]
43
+ consistent_rel_err: false
44
+ apply_shift: true
45
+ shift_range: [-0.3, 0.3]
46
+ add_to_context: true
47
+
48
+ curves_scaler:
49
+ cls: LogAffineCurvesScaler
50
+ kwargs:
51
+ weight: 0.2
52
+ bias: 1.0
53
+ eps: 1.0e-10
54
+
55
+ model:
56
+ network:
57
+ cls: NetworkWithPriors
58
+ pretrained_name: null
59
+ device: 'cuda'
60
+ kwargs:
61
+ embedding_net_type: 'conv'
62
+ embedding_net_kwargs:
63
+ in_channels: 2
64
+ hidden_channels: [32, 64, 128, 256, 512]
65
+ kernel_size: 3
66
+ dim_embedding: 128
67
+ dim_avpool: 1
68
+ use_batch_norm: true
69
+ use_se: false
70
+ activation: 'gelu'
71
+ pretrained_embedding_net: null
72
+ dim_out: 15 #4n_l+3
73
+ dim_conditioning_params: 0
74
+ layer_width: 512
75
+ num_blocks: 8
76
+ repeats_per_block: 2
77
+ residual: true
78
+ use_batch_norm: true
79
+ use_layer_norm: false
80
+ mlp_activation: 'gelu'
81
+ dropout_rate: 0.0
82
+ tanh_output: false
83
+ conditioning: 'film'
84
+ concat_condition_first_layer: false
85
+
86
+ training:
87
+ trainer_cls: PointEstimatorTrainer
88
+ num_iterations: 100000
89
+ batch_size: 4096
90
+ lr: 1.0e-3
91
+ grad_accumulation_steps: 1
92
+ clip_grad_norm_max: null
93
+ update_tqdm_freq: 1
94
+ optimizer: AdamW
95
+ trainer_kwargs:
96
+ train_with_q_input: true
97
+ train_with_sigmas: false
98
+ condition_on_q_resolutions: false
99
+ use_curve_reconstruction_loss: false
100
+ rescale_loss_interval_width: true
101
+ use_l1_loss: true
102
+ optim_kwargs:
103
+ betas: [0.9, 0.999]
104
+ weight_decay: 0.0005
105
+ callbacks:
106
+ save_best_model:
107
+ enable: true
108
+ freq: 500
109
+ lr_scheduler:
110
+ cls: CosineAnnealingWithWarmup
111
+ kwargs:
112
+ min_lr: 1.0e-6
113
+ warmup_iters: 500
114
+ total_iters: 100000
configs/b_mc_point_xray_conv_standard_L1_InputQ.yaml ADDED
@@ -0,0 +1,110 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: b_mc_point_xray_conv_standard_L1_InputQ
3
+ root_dir: null
4
+
5
+ dset:
6
+ cls: ReflectivityDataLoader
7
+ prior_sampler:
8
+ cls: SubpriorParametricSampler
9
+ kwargs:
10
+ param_ranges:
11
+ thicknesses: [1., 1000.]
12
+ roughnesses: [0., 60.]
13
+ slds: [0., 50.]
14
+ bound_width_ranges:
15
+ thicknesses: [1.0e-2, 1000.]
16
+ roughnesses: [1.0e-2, 60.]
17
+ slds: [1.0e-2, 5.]
18
+ model_name: standard_model
19
+ max_num_layers: 1
20
+ constrained_roughness: true
21
+ max_thickness_share: 0.5
22
+ logdist: false
23
+ scale_params_by_ranges: false
24
+ scaled_range: [-1., 1.]
25
+ device: 'cuda'
26
+
27
+ q_generator:
28
+ cls: VariableQ
29
+ kwargs:
30
+ q_min_range: [0.001, 0.03]
31
+ q_max_range: [0.1, 0.4]
32
+ n_q_range: [128, 128]
33
+ device: 'cuda'
34
+
35
+ intensity_noise:
36
+ cls: GaussianExpIntensityNoise
37
+ kwargs:
38
+ relative_errors: [0.01, 0.3]
39
+ consistent_rel_err: false
40
+ apply_shift: true
41
+ shift_range: [-0.3, 0.3]
42
+ add_to_context: true
43
+
44
+ curves_scaler:
45
+ cls: LogAffineCurvesScaler
46
+ kwargs:
47
+ weight: 0.2
48
+ bias: 1.0
49
+ eps: 1.0e-10
50
+
51
+ model:
52
+ network:
53
+ cls: NetworkWithPriors
54
+ pretrained_name: null
55
+ device: 'cuda'
56
+ kwargs:
57
+ embedding_net_type: 'conv'
58
+ embedding_net_kwargs:
59
+ in_channels: 2
60
+ hidden_channels: [32, 64, 128, 256, 512]
61
+ kernel_size: 3
62
+ dim_embedding: 128
63
+ dim_avpool: 1
64
+ use_batch_norm: true
65
+ use_se: false
66
+ activation: 'gelu'
67
+ pretrained_embedding_net: null
68
+ dim_out: 5
69
+ dim_conditioning_params: 0
70
+ layer_width: 512
71
+ num_blocks: 8
72
+ repeats_per_block: 2
73
+ residual: true
74
+ use_batch_norm: true
75
+ use_layer_norm: false
76
+ mlp_activation: 'gelu'
77
+ dropout_rate: 0.0
78
+ tanh_output: false
79
+ conditioning: 'film'
80
+ concat_condition_first_layer: false
81
+
82
+ training:
83
+ trainer_cls: PointEstimatorTrainer
84
+ num_iterations: 100000
85
+ batch_size: 4096
86
+ lr: 1.0e-3
87
+ grad_accumulation_steps: 1
88
+ clip_grad_norm_max: null
89
+ update_tqdm_freq: 1
90
+ optimizer: AdamW
91
+ trainer_kwargs:
92
+ train_with_q_input: true
93
+ train_with_sigmas: false
94
+ condition_on_q_resolutions: false
95
+ use_curve_reconstruction_loss: false
96
+ rescale_loss_interval_width: true
97
+ use_l1_loss: true
98
+ optim_kwargs:
99
+ betas: [0.9, 0.999]
100
+ weight_decay: 0.0005
101
+ callbacks:
102
+ save_best_model:
103
+ enable: true
104
+ freq: 500
105
+ lr_scheduler:
106
+ cls: CosineAnnealingWithWarmup
107
+ kwargs:
108
+ min_lr: 1.0e-6
109
+ warmup_iters: 500
110
+ total_iters: 100000
configs/b_mc_point_xray_conv_standard_L2_InputQ.yaml ADDED
@@ -0,0 +1,110 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: b_mc_point_xray_conv_standard_L2_InputQ
3
+ root_dir: null
4
+
5
+ dset:
6
+ cls: ReflectivityDataLoader
7
+ prior_sampler:
8
+ cls: SubpriorParametricSampler
9
+ kwargs:
10
+ param_ranges:
11
+ thicknesses: [1., 500.]
12
+ roughnesses: [0., 60.]
13
+ slds: [0., 50.]
14
+ bound_width_ranges:
15
+ thicknesses: [1.0e-2, 500.]
16
+ roughnesses: [1.0e-2, 60.]
17
+ slds: [1.0e-2, 5.]
18
+ model_name: standard_model
19
+ max_num_layers: 2
20
+ constrained_roughness: true
21
+ max_thickness_share: 0.5
22
+ logdist: false
23
+ scale_params_by_ranges: false
24
+ scaled_range: [-1., 1.]
25
+ device: 'cuda'
26
+
27
+ q_generator:
28
+ cls: VariableQ
29
+ kwargs:
30
+ q_min_range: [0.001, 0.03]
31
+ q_max_range: [0.1, 0.4]
32
+ n_q_range: [128, 128]
33
+ device: 'cuda'
34
+
35
+ intensity_noise:
36
+ cls: GaussianExpIntensityNoise
37
+ kwargs:
38
+ relative_errors: [0.01, 0.3]
39
+ consistent_rel_err: false
40
+ apply_shift: true
41
+ shift_range: [-0.3, 0.3]
42
+ add_to_context: true
43
+
44
+ curves_scaler:
45
+ cls: LogAffineCurvesScaler
46
+ kwargs:
47
+ weight: 0.2
48
+ bias: 1.0
49
+ eps: 1.0e-10
50
+
51
+ model:
52
+ network:
53
+ cls: NetworkWithPriors
54
+ pretrained_name: null
55
+ device: 'cuda'
56
+ kwargs:
57
+ embedding_net_type: 'conv'
58
+ embedding_net_kwargs:
59
+ in_channels: 2
60
+ hidden_channels: [32, 64, 128, 256, 512]
61
+ kernel_size: 3
62
+ dim_embedding: 128
63
+ dim_avpool: 1
64
+ use_batch_norm: true
65
+ use_se: false
66
+ activation: 'gelu'
67
+ pretrained_embedding_net: null
68
+ dim_out: 8
69
+ dim_conditioning_params: 0
70
+ layer_width: 512
71
+ num_blocks: 8
72
+ repeats_per_block: 2
73
+ residual: true
74
+ use_batch_norm: true
75
+ use_layer_norm: false
76
+ mlp_activation: 'gelu'
77
+ dropout_rate: 0.0
78
+ tanh_output: false
79
+ conditioning: 'film'
80
+ concat_condition_first_layer: false
81
+
82
+ training:
83
+ trainer_cls: PointEstimatorTrainer
84
+ num_iterations: 100000
85
+ batch_size: 4096
86
+ lr: 1.0e-3
87
+ grad_accumulation_steps: 1
88
+ clip_grad_norm_max: null
89
+ update_tqdm_freq: 1
90
+ optimizer: AdamW
91
+ trainer_kwargs:
92
+ train_with_q_input: true
93
+ train_with_sigmas: false
94
+ condition_on_q_resolutions: false
95
+ use_curve_reconstruction_loss: false
96
+ rescale_loss_interval_width: true
97
+ use_l1_loss: true
98
+ optim_kwargs:
99
+ betas: [0.9, 0.999]
100
+ weight_decay: 0.0005
101
+ callbacks:
102
+ save_best_model:
103
+ enable: true
104
+ freq: 500
105
+ lr_scheduler:
106
+ cls: CosineAnnealingWithWarmup
107
+ kwargs:
108
+ min_lr: 1.0e-6
109
+ warmup_iters: 500
110
+ total_iters: 100000
configs/b_mc_point_xray_conv_standard_L3_InputQ.yaml ADDED
@@ -0,0 +1,110 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: b_mc_point_xray_conv_standard_L3_InputQ
3
+ root_dir: null
4
+
5
+ dset:
6
+ cls: ReflectivityDataLoader
7
+ prior_sampler:
8
+ cls: SubpriorParametricSampler
9
+ kwargs:
10
+ param_ranges:
11
+ thicknesses: [1., 500.]
12
+ roughnesses: [0., 60.]
13
+ slds: [0., 50.]
14
+ bound_width_ranges:
15
+ thicknesses: [1.0e-2, 500.]
16
+ roughnesses: [1.0e-2, 60.]
17
+ slds: [1.0e-2, 5.]
18
+ model_name: standard_model
19
+ max_num_layers: 3
20
+ constrained_roughness: true
21
+ max_thickness_share: 0.5
22
+ logdist: false
23
+ scale_params_by_ranges: false
24
+ scaled_range: [-1., 1.]
25
+ device: 'cuda'
26
+
27
+ q_generator:
28
+ cls: VariableQ
29
+ kwargs:
30
+ q_min_range: [0.001, 0.03]
31
+ q_max_range: [0.1, 0.4]
32
+ n_q_range: [128, 128]
33
+ device: 'cuda'
34
+
35
+ intensity_noise:
36
+ cls: GaussianExpIntensityNoise
37
+ kwargs:
38
+ relative_errors: [0.01, 0.3]
39
+ consistent_rel_err: false
40
+ apply_shift: true
41
+ shift_range: [-0.3, 0.3]
42
+ add_to_context: true
43
+
44
+ curves_scaler:
45
+ cls: LogAffineCurvesScaler
46
+ kwargs:
47
+ weight: 0.2
48
+ bias: 1.0
49
+ eps: 1.0e-10
50
+
51
+ model:
52
+ network:
53
+ cls: NetworkWithPriors
54
+ pretrained_name: null
55
+ device: 'cuda'
56
+ kwargs:
57
+ embedding_net_type: 'conv'
58
+ embedding_net_kwargs:
59
+ in_channels: 2
60
+ hidden_channels: [32, 64, 128, 256, 512]
61
+ kernel_size: 3
62
+ dim_embedding: 128
63
+ dim_avpool: 1
64
+ use_batch_norm: true
65
+ use_se: false
66
+ activation: 'gelu'
67
+ pretrained_embedding_net: null
68
+ dim_out: 11
69
+ dim_conditioning_params: 0
70
+ layer_width: 512
71
+ num_blocks: 8
72
+ repeats_per_block: 2
73
+ residual: true
74
+ use_batch_norm: true
75
+ use_layer_norm: false
76
+ mlp_activation: 'gelu'
77
+ dropout_rate: 0.0
78
+ tanh_output: false
79
+ conditioning: 'film'
80
+ concat_condition_first_layer: false
81
+
82
+ training:
83
+ trainer_cls: PointEstimatorTrainer
84
+ num_iterations: 100000
85
+ batch_size: 4096
86
+ lr: 1.0e-3
87
+ grad_accumulation_steps: 1
88
+ clip_grad_norm_max: null
89
+ update_tqdm_freq: 1
90
+ optimizer: AdamW
91
+ trainer_kwargs:
92
+ train_with_q_input: true
93
+ train_with_sigmas: false
94
+ condition_on_q_resolutions: false
95
+ use_curve_reconstruction_loss: false
96
+ rescale_loss_interval_width: true
97
+ use_l1_loss: true
98
+ optim_kwargs:
99
+ betas: [0.9, 0.999]
100
+ weight_decay: 0.0005
101
+ callbacks:
102
+ save_best_model:
103
+ enable: true
104
+ freq: 500
105
+ lr_scheduler:
106
+ cls: CosineAnnealingWithWarmup
107
+ kwargs:
108
+ min_lr: 1.0e-6
109
+ warmup_iters: 500
110
+ total_iters: 100000