AnneLena committed on
Commit
6f8c7f7
·
verified ·
1 Parent(s): da8025a

Upload configs/hysteresis_in_phase_volumes_point_neutron_conv_standard_L3_InputQDq_n256_Sept9_logspace.yaml with huggingface_hub

Browse files
configs/hysteresis_in_phase_volumes_point_neutron_conv_standard_L3_InputQDq_n256_Sept9_logspace.yaml ADDED
@@ -0,0 +1,121 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ general:
2
+ name: hysteresis_in_phase_volumes_point_neutron_conv_standard_L3_InputQDq_n256_Sept9_logspace
3
+ root_dir: /mnt/lustre/work/schreiber/szb249
4
+
5
+ dset:
6
+ cls: ReflectivityDataLoader
7
+ prior_sampler:
8
+ cls: SubpriorParametricSampler
9
+ kwargs:
10
+ param_ranges:
11
+ thicknesses: [1., 950.]
12
+ roughnesses: [0., 55.]
13
+ slds: [-3., 4.5]
14
+ r_scale: [0.9, 1.1]
15
+ log10_background: [-8.0, -6.0]
16
+ bound_width_ranges:
17
+ thicknesses: [1.0e-2, 950.]
18
+ roughnesses: [1.0e-2, 55.]
19
+ slds: [1.0e-2, 5.]
20
+ r_scale: [1.0e-3, 0.2]
21
+ log10_background: [1.0e-2, 2.0]
22
+ shift_param_config:
23
+ r_scale: true
24
+ log10_background: true
25
+ model_name: standard_model
26
+ max_num_layers: 3
27
+ max_total_thickness: 950
28
+ constrained_roughness: true
29
+ max_thickness_share: 0.5
30
+ logdist: false
31
+ scale_params_by_ranges: false
32
+ scaled_range: [-1., 1.]
33
+ device: 'cuda'
34
+
35
+ q_generator:
36
+ cls: VariableQ
37
+ kwargs:
38
+ mode: 'logspace'
39
+ q_min_range: [0.001, 0.006]
40
+ q_max_range: [0.03, 0.35]
41
+ n_q_range: [256, 256]
42
+ device: 'cuda'
43
+
44
+ intensity_noise:
45
+ cls: GaussianExpIntensityNoise
46
+ kwargs:
47
+ relative_errors: [0.01, 0.3]
48
+ add_to_context: true
49
+
50
+ smearing:
51
+ cls: Smearing
52
+ kwargs:
53
+ sigma_range: [0.01, 0.12]
54
+ gauss_num: 17
55
+ share_smeared: 1.0
56
+
57
+ curves_scaler:
58
+ cls: LogAffineCurvesScaler
59
+ kwargs:
60
+ weight: 0.2
61
+ bias: 1.0
62
+ eps: 1.0e-10
63
+
64
+ model:
65
+ network:
66
+ cls: NetworkWithPriors
67
+ pretrained_name: null
68
+ device: 'cuda'
69
+ kwargs:
70
+ embedding_net_type: 'conv'
71
+ embedding_net_kwargs:
72
+ in_channels: 2
73
+ hidden_channels: [32, 64, 128, 256, 512]
74
+ kernel_size: 3
75
+ dim_embedding: 512
76
+ dim_avpool: 4
77
+ use_batch_norm: true
78
+ use_se: false
79
+ activation: 'gelu'
80
+ pretrained_embedding_net: null
81
+ dim_out: 13
82
+ dim_conditioning_params: 1
83
+ layer_width: 1024
84
+ num_blocks: 8
85
+ repeats_per_block: 2
86
+ residual: true
87
+ use_batch_norm: true
88
+ use_layer_norm: false
89
+ mlp_activation: 'gelu'
90
+ dropout_rate: 0.0
91
+ tanh_output: false
92
+ conditioning: 'film'
93
+ concat_condition_first_layer: false
94
+
95
+ training:
96
+ trainer_cls: PointEstimatorTrainer
97
+ num_iterations: 300000
98
+ batch_size: 2048
99
+ lr: 1.0e-3
100
+ grad_accumulation_steps: 1
101
+ clip_grad_norm_max: null
102
+ update_tqdm_freq: 1
103
+ optimizer: AdamW
104
+ trainer_kwargs:
105
+ train_with_q_input: true
106
+ condition_on_q_resolutions: true
107
+ rescale_loss_interval_width: true
108
+ use_l1_loss: true
109
+ optim_kwargs:
110
+ betas: [0.9, 0.999]
111
+ weight_decay: 0.0005
112
+ callbacks:
113
+ save_best_model:
114
+ enable: true
115
+ freq: 50
116
+ lr_scheduler:
117
+ cls: CosineAnnealingWithWarmup
118
+ kwargs:
119
+ min_lr: 1.0e-6
120
+ warmup_iters: 500
121
+ total_iters: 300000