Upload b_mc_point_neutron_conv_standard_L4_InputQDq.yaml
Browse files
configs/b_mc_point_neutron_conv_standard_L4_InputQDq.yaml
ADDED
|
@@ -0,0 +1,120 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: b_mc_point_neutron_conv_standard_L4_InputQDq
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
cls: ReflectivityDataLoader
|
| 7 |
+
prior_sampler:
|
| 8 |
+
cls: SubpriorParametricSampler
|
| 9 |
+
kwargs:
|
| 10 |
+
param_ranges:
|
| 11 |
+
thicknesses: [1., 400.]
|
| 12 |
+
roughnesses: [0., 60.]
|
| 13 |
+
slds: [-8., 16.]
|
| 14 |
+
bound_width_ranges:
|
| 15 |
+
thicknesses: [1.0e-2, 400.]
|
| 16 |
+
roughnesses: [1.0e-2, 60.]
|
| 17 |
+
slds: [1.0e-2, 5.]
|
| 18 |
+
model_name: standard_model
|
| 19 |
+
max_num_layers: 4
|
| 20 |
+
constrained_roughness: true
|
| 21 |
+
max_thickness_share: 0.5
|
| 22 |
+
logdist: false
|
| 23 |
+
scale_params_by_ranges: false
|
| 24 |
+
scaled_range: [-1., 1.]
|
| 25 |
+
device: 'cuda'
|
| 26 |
+
|
| 27 |
+
q_generator:
|
| 28 |
+
cls: VariableQ
|
| 29 |
+
kwargs:
|
| 30 |
+
q_min_range: [0.001, 0.03]
|
| 31 |
+
q_max_range: [0.1, 0.4]
|
| 32 |
+
n_q_range: [128, 128]
|
| 33 |
+
device: 'cuda'
|
| 34 |
+
|
| 35 |
+
intensity_noise:
|
| 36 |
+
cls: GaussianExpIntensityNoise
|
| 37 |
+
kwargs:
|
| 38 |
+
relative_errors: [0.01, 0.3]
|
| 39 |
+
consistent_rel_err: false
|
| 40 |
+
apply_shift: true
|
| 41 |
+
shift_range: [-0.3, 0.3]
|
| 42 |
+
apply_background: true
|
| 43 |
+
background_range: [1.0e-10, 1.0e-4]
|
| 44 |
+
add_to_context: true
|
| 45 |
+
|
| 46 |
+
smearing:
|
| 47 |
+
cls: Smearing
|
| 48 |
+
kwargs:
|
| 49 |
+
sigma_range: [0.01, 0.10]
|
| 50 |
+
constant_dq: False
|
| 51 |
+
gauss_num: 17
|
| 52 |
+
share_smeared: 0.8
|
| 53 |
+
|
| 54 |
+
curves_scaler:
|
| 55 |
+
cls: LogAffineCurvesScaler
|
| 56 |
+
kwargs:
|
| 57 |
+
weight: 0.2
|
| 58 |
+
bias: 1.0
|
| 59 |
+
eps: 1.0e-10
|
| 60 |
+
|
| 61 |
+
model:
|
| 62 |
+
network:
|
| 63 |
+
cls: NetworkWithPriors
|
| 64 |
+
pretrained_name: null
|
| 65 |
+
device: 'cuda'
|
| 66 |
+
kwargs:
|
| 67 |
+
embedding_net_type: 'conv'
|
| 68 |
+
embedding_net_kwargs:
|
| 69 |
+
in_channels: 2
|
| 70 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 71 |
+
kernel_size: 3
|
| 72 |
+
dim_embedding: 128
|
| 73 |
+
dim_avpool: 1
|
| 74 |
+
use_batch_norm: true
|
| 75 |
+
use_se: false
|
| 76 |
+
activation: 'gelu'
|
| 77 |
+
pretrained_embedding_net: null
|
| 78 |
+
dim_out: 14
|
| 79 |
+
dim_conditioning_params: 1
|
| 80 |
+
layer_width: 512
|
| 81 |
+
num_blocks: 8
|
| 82 |
+
repeats_per_block: 2
|
| 83 |
+
residual: true
|
| 84 |
+
use_batch_norm: true
|
| 85 |
+
use_layer_norm: false
|
| 86 |
+
mlp_activation: 'gelu'
|
| 87 |
+
dropout_rate: 0.0
|
| 88 |
+
tanh_output: false
|
| 89 |
+
conditioning: 'film'
|
| 90 |
+
concat_condition_first_layer: true  # kept for backward compatibility
|
| 91 |
+
|
| 92 |
+
training:
|
| 93 |
+
trainer_cls: PointEstimatorTrainer
|
| 94 |
+
num_iterations: 100000
|
| 95 |
+
batch_size: 2048  # reduced batch size
|
| 96 |
+
lr: 1.0e-3
|
| 97 |
+
grad_accumulation_steps: 1
|
| 98 |
+
clip_grad_norm_max: null
|
| 99 |
+
update_tqdm_freq: 1
|
| 100 |
+
optimizer: AdamW
|
| 101 |
+
trainer_kwargs:
|
| 102 |
+
train_with_q_input: true
|
| 103 |
+
train_with_sigmas: false
|
| 104 |
+
condition_on_q_resolutions: true
|
| 105 |
+
use_curve_reconstruction_loss: false
|
| 106 |
+
rescale_loss_interval_width: true
|
| 107 |
+
use_l1_loss: true
|
| 108 |
+
optim_kwargs:
|
| 109 |
+
betas: [0.9, 0.999]
|
| 110 |
+
weight_decay: 0.0005
|
| 111 |
+
callbacks:
|
| 112 |
+
save_best_model:
|
| 113 |
+
enable: true
|
| 114 |
+
freq: 500
|
| 115 |
+
lr_scheduler:
|
| 116 |
+
cls: CosineAnnealingWithWarmup
|
| 117 |
+
kwargs:
|
| 118 |
+
min_lr: 1.0e-6
|
| 119 |
+
warmup_iters: 500
|
| 120 |
+
total_iters: 100000
|