Upload 82 files
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- configs/mc-o1.yaml +102 -0
- configs/mc-o10.yaml +102 -0
- configs/mc-o11.yaml +102 -0
- configs/mc-o12.yaml +102 -0
- configs/mc-o13.yaml +102 -0
- configs/mc-o14.yaml +102 -0
- configs/mc-o15.yaml +102 -0
- configs/mc-o16.yaml +102 -0
- configs/mc-o2.yaml +102 -0
- configs/mc-o3.yaml +102 -0
- configs/mc-o4.yaml +102 -0
- configs/mc-o5.yaml +102 -0
- configs/mc-o7.yaml +102 -0
- configs/mc-o8.yaml +102 -0
- configs/mc-o9.yaml +102 -0
- configs/mc1.yaml +105 -0
- configs/mc10.yaml +105 -0
- configs/mc11.yaml +105 -0
- configs/mc12.yaml +105 -0
- configs/mc13.yaml +105 -0
- configs/mc14.yaml +105 -0
- configs/mc15.yaml +105 -0
- configs/mc16.yaml +105 -0
- configs/mc17.yaml +105 -0
- configs/mc18.yaml +105 -0
- configs/mc19.yaml +105 -0
- configs/mc2.yaml +105 -0
- configs/mc20.yaml +105 -0
- configs/mc21.yaml +105 -0
- configs/mc22.yaml +105 -0
- configs/mc23.yaml +105 -0
- configs/mc24.yaml +105 -0
- configs/mc25.yaml +105 -0
- configs/mc26.yaml +105 -0
- configs/mc27.yaml +105 -0
- configs/mc28.yaml +105 -0
- configs/mc29.yaml +105 -0
- configs/mc3.yaml +105 -0
- configs/mc30.yaml +105 -0
- configs/mc31.yaml +105 -0
- configs/mc32.yaml +105 -0
- configs/mc33.yaml +105 -0
- configs/mc34.yaml +105 -0
- configs/mc35.yaml +105 -0
- configs/mc36.yaml +105 -0
- configs/mc37.yaml +105 -0
- configs/mc38.yaml +105 -0
- configs/mc39.yaml +105 -0
- configs/mc4.yaml +105 -0
- configs/mc40.yaml +105 -0
configs/mc-o1.yaml
ADDED
|
@@ -0,0 +1,102 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc-o1
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 20.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 20.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: VariableQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q_min_range: [0.01, 0.05]
|
| 30 |
+
q_max_range: [0.15, 0.4]
|
| 31 |
+
n_q_range: [128, 256]
|
| 32 |
+
device: 'cuda'
|
| 33 |
+
|
| 34 |
+
intensity_noise:
|
| 35 |
+
cls: BasicExpIntensityNoise
|
| 36 |
+
kwargs:
|
| 37 |
+
relative_errors: [0.0, 0.2]
|
| 38 |
+
abs_errors: 0.0
|
| 39 |
+
consistent_rel_err: true
|
| 40 |
+
logdist: false
|
| 41 |
+
apply_shift: false
|
| 42 |
+
shift_range: [-0.3, 0.3]
|
| 43 |
+
apply_scaling: false
|
| 44 |
+
scale_range: [-0.02, 0.02]
|
| 45 |
+
|
| 46 |
+
q_noise:
|
| 47 |
+
cls: BasicQNoiseGenerator
|
| 48 |
+
kwargs:
|
| 49 |
+
shift_std: 1.0e-3
|
| 50 |
+
noise_std: [0., 1.0e-3]
|
| 51 |
+
|
| 52 |
+
curves_scaler:
|
| 53 |
+
cls: LogAffineCurvesScaler
|
| 54 |
+
kwargs:
|
| 55 |
+
weight: 0.2
|
| 56 |
+
bias: 1.0
|
| 57 |
+
eps: 1.0e-10
|
| 58 |
+
|
| 59 |
+
model:
|
| 60 |
+
network:
|
| 61 |
+
cls: NetworkWithPriorsFnoEmb
|
| 62 |
+
pretrained_name: null
|
| 63 |
+
device: 'cuda'
|
| 64 |
+
kwargs:
|
| 65 |
+
in_channels: 2
|
| 66 |
+
dim_embedding: 256
|
| 67 |
+
width_fno: 128
|
| 68 |
+
n_fno_blocks : 6
|
| 69 |
+
modes: 16
|
| 70 |
+
embedding_net_activation: 'gelu'
|
| 71 |
+
use_batch_norm: True
|
| 72 |
+
dim_out: 8
|
| 73 |
+
layer_width: 1024
|
| 74 |
+
num_blocks: 6
|
| 75 |
+
repeats_per_block: 2
|
| 76 |
+
mlp_activation: 'gelu'
|
| 77 |
+
dropout_rate: 0.0
|
| 78 |
+
|
| 79 |
+
training:
|
| 80 |
+
num_iterations: 50000
|
| 81 |
+
batch_size: 1024
|
| 82 |
+
lr: 1.0e-4
|
| 83 |
+
grad_accumulation_steps: 1
|
| 84 |
+
clip_grad_norm_max: 1.0
|
| 85 |
+
train_with_q_input: True
|
| 86 |
+
update_tqdm_freq: 1
|
| 87 |
+
optimizer: AdamW
|
| 88 |
+
trainer_kwargs:
|
| 89 |
+
optim_kwargs:
|
| 90 |
+
betas: [0.9, 0.999]
|
| 91 |
+
weight_decay: 0.0005
|
| 92 |
+
callbacks:
|
| 93 |
+
save_best_model:
|
| 94 |
+
enable: true
|
| 95 |
+
freq: 500
|
| 96 |
+
lr_scheduler:
|
| 97 |
+
cls: StepLR
|
| 98 |
+
kwargs:
|
| 99 |
+
step_size: 2000
|
| 100 |
+
gamma: 0.9
|
| 101 |
+
logger:
|
| 102 |
+
use_neptune: false
|
configs/mc-o10.yaml
ADDED
|
@@ -0,0 +1,102 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc-o10
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 20.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 20.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: VariableQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q_min_range: [0.01, 0.05]
|
| 30 |
+
q_max_range: [0.15, 0.4]
|
| 31 |
+
n_q_range: [128, 256]
|
| 32 |
+
device: 'cuda'
|
| 33 |
+
|
| 34 |
+
intensity_noise:
|
| 35 |
+
cls: BasicExpIntensityNoise
|
| 36 |
+
kwargs:
|
| 37 |
+
relative_errors: [0.0, 0.2]
|
| 38 |
+
abs_errors: 0.0
|
| 39 |
+
consistent_rel_err: true
|
| 40 |
+
logdist: false
|
| 41 |
+
apply_shift: false
|
| 42 |
+
shift_range: [-0.3, 0.3]
|
| 43 |
+
apply_scaling: false
|
| 44 |
+
scale_range: [-0.02, 0.02]
|
| 45 |
+
|
| 46 |
+
q_noise:
|
| 47 |
+
cls: BasicQNoiseGenerator
|
| 48 |
+
kwargs:
|
| 49 |
+
shift_std: 1.0e-3
|
| 50 |
+
noise_std: [0., 1.0e-3]
|
| 51 |
+
|
| 52 |
+
curves_scaler:
|
| 53 |
+
cls: LogAffineCurvesScaler
|
| 54 |
+
kwargs:
|
| 55 |
+
weight: 0.2
|
| 56 |
+
bias: 1.0
|
| 57 |
+
eps: 1.0e-10
|
| 58 |
+
|
| 59 |
+
model:
|
| 60 |
+
network:
|
| 61 |
+
cls: NetworkWithPriorsFnoEmb
|
| 62 |
+
pretrained_name: null
|
| 63 |
+
device: 'cuda'
|
| 64 |
+
kwargs:
|
| 65 |
+
in_channels: 2
|
| 66 |
+
dim_embedding: 1024
|
| 67 |
+
width_fno: 128
|
| 68 |
+
n_fno_blocks : 6
|
| 69 |
+
modes: 16
|
| 70 |
+
embedding_net_activation: 'gelu'
|
| 71 |
+
use_batch_norm: True
|
| 72 |
+
dim_out: 8
|
| 73 |
+
layer_width: 1024
|
| 74 |
+
num_blocks: 6
|
| 75 |
+
repeats_per_block: 2
|
| 76 |
+
mlp_activation: 'gelu'
|
| 77 |
+
dropout_rate: 0.0
|
| 78 |
+
|
| 79 |
+
training:
|
| 80 |
+
num_iterations: 50000
|
| 81 |
+
batch_size: 1024
|
| 82 |
+
lr: 1.0e-4
|
| 83 |
+
grad_accumulation_steps: 1
|
| 84 |
+
clip_grad_norm_max: 1.0
|
| 85 |
+
train_with_q_input: True
|
| 86 |
+
update_tqdm_freq: 1
|
| 87 |
+
optimizer: AdamW
|
| 88 |
+
trainer_kwargs:
|
| 89 |
+
optim_kwargs:
|
| 90 |
+
betas: [0.9, 0.999]
|
| 91 |
+
weight_decay: 0.0005
|
| 92 |
+
callbacks:
|
| 93 |
+
save_best_model:
|
| 94 |
+
enable: true
|
| 95 |
+
freq: 500
|
| 96 |
+
lr_scheduler:
|
| 97 |
+
cls: StepLR
|
| 98 |
+
kwargs:
|
| 99 |
+
step_size: 2000
|
| 100 |
+
gamma: 0.9
|
| 101 |
+
logger:
|
| 102 |
+
use_neptune: false
|
configs/mc-o11.yaml
ADDED
|
@@ -0,0 +1,102 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc-o11
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 20.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 20.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: VariableQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q_min_range: [0.01, 0.05]
|
| 30 |
+
q_max_range: [0.15, 0.4]
|
| 31 |
+
n_q_range: [128, 256]
|
| 32 |
+
device: 'cuda'
|
| 33 |
+
|
| 34 |
+
intensity_noise:
|
| 35 |
+
cls: BasicExpIntensityNoise
|
| 36 |
+
kwargs:
|
| 37 |
+
relative_errors: [0.0, 0.2]
|
| 38 |
+
abs_errors: 0.0
|
| 39 |
+
consistent_rel_err: true
|
| 40 |
+
logdist: false
|
| 41 |
+
apply_shift: false
|
| 42 |
+
shift_range: [-0.3, 0.3]
|
| 43 |
+
apply_scaling: false
|
| 44 |
+
scale_range: [-0.02, 0.02]
|
| 45 |
+
|
| 46 |
+
q_noise:
|
| 47 |
+
cls: BasicQNoiseGenerator
|
| 48 |
+
kwargs:
|
| 49 |
+
shift_std: 1.0e-3
|
| 50 |
+
noise_std: [0., 1.0e-3]
|
| 51 |
+
|
| 52 |
+
curves_scaler:
|
| 53 |
+
cls: LogAffineCurvesScaler
|
| 54 |
+
kwargs:
|
| 55 |
+
weight: 0.2
|
| 56 |
+
bias: 1.0
|
| 57 |
+
eps: 1.0e-10
|
| 58 |
+
|
| 59 |
+
model:
|
| 60 |
+
network:
|
| 61 |
+
cls: NetworkWithPriorsFnoEmb
|
| 62 |
+
pretrained_name: null
|
| 63 |
+
device: 'cuda'
|
| 64 |
+
kwargs:
|
| 65 |
+
in_channels: 2
|
| 66 |
+
dim_embedding: 256
|
| 67 |
+
width_fno: 256
|
| 68 |
+
n_fno_blocks : 6
|
| 69 |
+
modes: 16
|
| 70 |
+
embedding_net_activation: 'gelu'
|
| 71 |
+
use_batch_norm: True
|
| 72 |
+
dim_out: 8
|
| 73 |
+
layer_width: 1024
|
| 74 |
+
num_blocks: 6
|
| 75 |
+
repeats_per_block: 2
|
| 76 |
+
mlp_activation: 'gelu'
|
| 77 |
+
dropout_rate: 0.0
|
| 78 |
+
|
| 79 |
+
training:
|
| 80 |
+
num_iterations: 50000
|
| 81 |
+
batch_size: 1024
|
| 82 |
+
lr: 1.0e-4
|
| 83 |
+
grad_accumulation_steps: 1
|
| 84 |
+
clip_grad_norm_max: 1.0
|
| 85 |
+
train_with_q_input: True
|
| 86 |
+
update_tqdm_freq: 1
|
| 87 |
+
optimizer: AdamW
|
| 88 |
+
trainer_kwargs:
|
| 89 |
+
optim_kwargs:
|
| 90 |
+
betas: [0.9, 0.999]
|
| 91 |
+
weight_decay: 0.0005
|
| 92 |
+
callbacks:
|
| 93 |
+
save_best_model:
|
| 94 |
+
enable: true
|
| 95 |
+
freq: 500
|
| 96 |
+
lr_scheduler:
|
| 97 |
+
cls: StepLR
|
| 98 |
+
kwargs:
|
| 99 |
+
step_size: 2000
|
| 100 |
+
gamma: 0.9
|
| 101 |
+
logger:
|
| 102 |
+
use_neptune: false
|
configs/mc-o12.yaml
ADDED
|
@@ -0,0 +1,102 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc-o12
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 60.]
|
| 12 |
+
slds: [-20., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 60.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: VariableQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q_min_range: [0.01, 0.05]
|
| 30 |
+
q_max_range: [0.15, 0.4]
|
| 31 |
+
n_q_range: [128, 256]
|
| 32 |
+
device: 'cuda'
|
| 33 |
+
|
| 34 |
+
intensity_noise:
|
| 35 |
+
cls: BasicExpIntensityNoise
|
| 36 |
+
kwargs:
|
| 37 |
+
relative_errors: [0.0, 0.2]
|
| 38 |
+
abs_errors: 0.0
|
| 39 |
+
consistent_rel_err: true
|
| 40 |
+
logdist: false
|
| 41 |
+
apply_shift: false
|
| 42 |
+
shift_range: [-0.3, 0.3]
|
| 43 |
+
apply_scaling: false
|
| 44 |
+
scale_range: [-0.02, 0.02]
|
| 45 |
+
|
| 46 |
+
q_noise:
|
| 47 |
+
cls: BasicQNoiseGenerator
|
| 48 |
+
kwargs:
|
| 49 |
+
shift_std: 1.0e-3
|
| 50 |
+
noise_std: [0., 1.0e-3]
|
| 51 |
+
|
| 52 |
+
curves_scaler:
|
| 53 |
+
cls: LogAffineCurvesScaler
|
| 54 |
+
kwargs:
|
| 55 |
+
weight: 0.2
|
| 56 |
+
bias: 1.0
|
| 57 |
+
eps: 1.0e-10
|
| 58 |
+
|
| 59 |
+
model:
|
| 60 |
+
network:
|
| 61 |
+
cls: NetworkWithPriorsFnoEmb
|
| 62 |
+
pretrained_name: null
|
| 63 |
+
device: 'cuda'
|
| 64 |
+
kwargs:
|
| 65 |
+
in_channels: 2
|
| 66 |
+
dim_embedding: 256
|
| 67 |
+
width_fno: 128
|
| 68 |
+
n_fno_blocks : 6
|
| 69 |
+
modes: 16
|
| 70 |
+
embedding_net_activation: 'gelu'
|
| 71 |
+
use_batch_norm: True
|
| 72 |
+
dim_out: 8
|
| 73 |
+
layer_width: 1024
|
| 74 |
+
num_blocks: 6
|
| 75 |
+
repeats_per_block: 2
|
| 76 |
+
mlp_activation: 'gelu'
|
| 77 |
+
dropout_rate: 0.0
|
| 78 |
+
|
| 79 |
+
training:
|
| 80 |
+
num_iterations: 50000
|
| 81 |
+
batch_size: 1024
|
| 82 |
+
lr: 1.0e-4
|
| 83 |
+
grad_accumulation_steps: 1
|
| 84 |
+
clip_grad_norm_max: 1.0
|
| 85 |
+
train_with_q_input: True
|
| 86 |
+
update_tqdm_freq: 1
|
| 87 |
+
optimizer: AdamW
|
| 88 |
+
trainer_kwargs:
|
| 89 |
+
optim_kwargs:
|
| 90 |
+
betas: [0.9, 0.999]
|
| 91 |
+
weight_decay: 0.0005
|
| 92 |
+
callbacks:
|
| 93 |
+
save_best_model:
|
| 94 |
+
enable: true
|
| 95 |
+
freq: 500
|
| 96 |
+
lr_scheduler:
|
| 97 |
+
cls: StepLR
|
| 98 |
+
kwargs:
|
| 99 |
+
step_size: 2000
|
| 100 |
+
gamma: 0.9
|
| 101 |
+
logger:
|
| 102 |
+
use_neptune: false
|
configs/mc-o13.yaml
ADDED
|
@@ -0,0 +1,102 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc-o13
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 200.]
|
| 11 |
+
roughnesses: [0., 20.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 200.]
|
| 15 |
+
roughnesses: [1.0e-2, 20.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 5
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: VariableQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q_min_range: [0.01, 0.05]
|
| 30 |
+
q_max_range: [0.15, 0.4]
|
| 31 |
+
n_q_range: [128, 256]
|
| 32 |
+
device: 'cuda'
|
| 33 |
+
|
| 34 |
+
intensity_noise:
|
| 35 |
+
cls: BasicExpIntensityNoise
|
| 36 |
+
kwargs:
|
| 37 |
+
relative_errors: [0.0, 0.2]
|
| 38 |
+
abs_errors: 0.0
|
| 39 |
+
consistent_rel_err: true
|
| 40 |
+
logdist: false
|
| 41 |
+
apply_shift: false
|
| 42 |
+
shift_range: [-0.3, 0.3]
|
| 43 |
+
apply_scaling: false
|
| 44 |
+
scale_range: [-0.02, 0.02]
|
| 45 |
+
|
| 46 |
+
q_noise:
|
| 47 |
+
cls: BasicQNoiseGenerator
|
| 48 |
+
kwargs:
|
| 49 |
+
shift_std: 1.0e-3
|
| 50 |
+
noise_std: [0., 1.0e-3]
|
| 51 |
+
|
| 52 |
+
curves_scaler:
|
| 53 |
+
cls: LogAffineCurvesScaler
|
| 54 |
+
kwargs:
|
| 55 |
+
weight: 0.2
|
| 56 |
+
bias: 1.0
|
| 57 |
+
eps: 1.0e-10
|
| 58 |
+
|
| 59 |
+
model:
|
| 60 |
+
network:
|
| 61 |
+
cls: NetworkWithPriorsFnoEmb
|
| 62 |
+
pretrained_name: null
|
| 63 |
+
device: 'cuda'
|
| 64 |
+
kwargs:
|
| 65 |
+
in_channels: 2
|
| 66 |
+
dim_embedding: 256
|
| 67 |
+
width_fno: 128
|
| 68 |
+
n_fno_blocks : 6
|
| 69 |
+
modes: 16
|
| 70 |
+
embedding_net_activation: 'gelu'
|
| 71 |
+
use_batch_norm: True
|
| 72 |
+
dim_out: 17
|
| 73 |
+
layer_width: 1024
|
| 74 |
+
num_blocks: 6
|
| 75 |
+
repeats_per_block: 2
|
| 76 |
+
mlp_activation: 'gelu'
|
| 77 |
+
dropout_rate: 0.0
|
| 78 |
+
|
| 79 |
+
training:
|
| 80 |
+
num_iterations: 50000
|
| 81 |
+
batch_size: 1024
|
| 82 |
+
lr: 1.0e-4
|
| 83 |
+
grad_accumulation_steps: 1
|
| 84 |
+
clip_grad_norm_max: 1.0
|
| 85 |
+
train_with_q_input: True
|
| 86 |
+
update_tqdm_freq: 1
|
| 87 |
+
optimizer: AdamW
|
| 88 |
+
trainer_kwargs:
|
| 89 |
+
optim_kwargs:
|
| 90 |
+
betas: [0.9, 0.999]
|
| 91 |
+
weight_decay: 0.0005
|
| 92 |
+
callbacks:
|
| 93 |
+
save_best_model:
|
| 94 |
+
enable: true
|
| 95 |
+
freq: 500
|
| 96 |
+
lr_scheduler:
|
| 97 |
+
cls: StepLR
|
| 98 |
+
kwargs:
|
| 99 |
+
step_size: 2000
|
| 100 |
+
gamma: 0.9
|
| 101 |
+
logger:
|
| 102 |
+
use_neptune: false
|
configs/mc-o14.yaml
ADDED
|
@@ -0,0 +1,102 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc-o14
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 200.]
|
| 11 |
+
roughnesses: [0., 20.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 200.]
|
| 15 |
+
roughnesses: [1.0e-2, 20.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 5
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: VariableQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q_min_range: [0.01, 0.05]
|
| 30 |
+
q_max_range: [0.15, 0.4]
|
| 31 |
+
n_q_range: [128, 256]
|
| 32 |
+
device: 'cuda'
|
| 33 |
+
|
| 34 |
+
intensity_noise:
|
| 35 |
+
cls: BasicExpIntensityNoise
|
| 36 |
+
kwargs:
|
| 37 |
+
relative_errors: [0.0, 0.2]
|
| 38 |
+
abs_errors: 0.0
|
| 39 |
+
consistent_rel_err: true
|
| 40 |
+
logdist: false
|
| 41 |
+
apply_shift: false
|
| 42 |
+
shift_range: [-0.3, 0.3]
|
| 43 |
+
apply_scaling: false
|
| 44 |
+
scale_range: [-0.02, 0.02]
|
| 45 |
+
|
| 46 |
+
q_noise:
|
| 47 |
+
cls: BasicQNoiseGenerator
|
| 48 |
+
kwargs:
|
| 49 |
+
shift_std: 1.0e-3
|
| 50 |
+
noise_std: [0., 1.0e-3]
|
| 51 |
+
|
| 52 |
+
curves_scaler:
|
| 53 |
+
cls: LogAffineCurvesScaler
|
| 54 |
+
kwargs:
|
| 55 |
+
weight: 0.2
|
| 56 |
+
bias: 1.0
|
| 57 |
+
eps: 1.0e-10
|
| 58 |
+
|
| 59 |
+
model:
|
| 60 |
+
network:
|
| 61 |
+
cls: NetworkWithPriorsFnoEmb
|
| 62 |
+
pretrained_name: null
|
| 63 |
+
device: 'cuda'
|
| 64 |
+
kwargs:
|
| 65 |
+
in_channels: 2
|
| 66 |
+
dim_embedding: 256
|
| 67 |
+
width_fno: 128
|
| 68 |
+
n_fno_blocks : 6
|
| 69 |
+
modes: 32
|
| 70 |
+
embedding_net_activation: 'gelu'
|
| 71 |
+
use_batch_norm: True
|
| 72 |
+
dim_out: 17
|
| 73 |
+
layer_width: 1024
|
| 74 |
+
num_blocks: 6
|
| 75 |
+
repeats_per_block: 2
|
| 76 |
+
mlp_activation: 'gelu'
|
| 77 |
+
dropout_rate: 0.0
|
| 78 |
+
|
| 79 |
+
training:
|
| 80 |
+
num_iterations: 50000
|
| 81 |
+
batch_size: 1024
|
| 82 |
+
lr: 1.0e-4
|
| 83 |
+
grad_accumulation_steps: 1
|
| 84 |
+
clip_grad_norm_max: 1.0
|
| 85 |
+
train_with_q_input: True
|
| 86 |
+
update_tqdm_freq: 1
|
| 87 |
+
optimizer: AdamW
|
| 88 |
+
trainer_kwargs:
|
| 89 |
+
optim_kwargs:
|
| 90 |
+
betas: [0.9, 0.999]
|
| 91 |
+
weight_decay: 0.0005
|
| 92 |
+
callbacks:
|
| 93 |
+
save_best_model:
|
| 94 |
+
enable: true
|
| 95 |
+
freq: 500
|
| 96 |
+
lr_scheduler:
|
| 97 |
+
cls: StepLR
|
| 98 |
+
kwargs:
|
| 99 |
+
step_size: 2000
|
| 100 |
+
gamma: 0.9
|
| 101 |
+
logger:
|
| 102 |
+
use_neptune: false
|
configs/mc-o15.yaml
ADDED
|
@@ -0,0 +1,102 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc-o15
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 200.]
|
| 11 |
+
roughnesses: [0., 20.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 200.]
|
| 15 |
+
roughnesses: [1.0e-2, 20.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 5
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: VariableQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q_min_range: [0.01, 0.05]
|
| 30 |
+
q_max_range: [0.15, 0.4]
|
| 31 |
+
n_q_range: [128, 256]
|
| 32 |
+
device: 'cuda'
|
| 33 |
+
|
| 34 |
+
intensity_noise:
|
| 35 |
+
cls: BasicExpIntensityNoise
|
| 36 |
+
kwargs:
|
| 37 |
+
relative_errors: [0.0, 0.2]
|
| 38 |
+
abs_errors: 0.0
|
| 39 |
+
consistent_rel_err: true
|
| 40 |
+
logdist: false
|
| 41 |
+
apply_shift: false
|
| 42 |
+
shift_range: [-0.3, 0.3]
|
| 43 |
+
apply_scaling: false
|
| 44 |
+
scale_range: [-0.02, 0.02]
|
| 45 |
+
|
| 46 |
+
q_noise:
|
| 47 |
+
cls: BasicQNoiseGenerator
|
| 48 |
+
kwargs:
|
| 49 |
+
shift_std: 1.0e-3
|
| 50 |
+
noise_std: [0., 1.0e-3]
|
| 51 |
+
|
| 52 |
+
curves_scaler:
|
| 53 |
+
cls: LogAffineCurvesScaler
|
| 54 |
+
kwargs:
|
| 55 |
+
weight: 0.2
|
| 56 |
+
bias: 1.0
|
| 57 |
+
eps: 1.0e-10
|
| 58 |
+
|
| 59 |
+
model:
|
| 60 |
+
network:
|
| 61 |
+
cls: NetworkWithPriorsFnoEmb
|
| 62 |
+
pretrained_name: null
|
| 63 |
+
device: 'cuda'
|
| 64 |
+
kwargs:
|
| 65 |
+
in_channels: 2
|
| 66 |
+
dim_embedding: 256
|
| 67 |
+
width_fno: 128
|
| 68 |
+
n_fno_blocks : 6
|
| 69 |
+
modes: 16
|
| 70 |
+
embedding_net_activation: 'gelu'
|
| 71 |
+
use_batch_norm: True
|
| 72 |
+
dim_out: 17
|
| 73 |
+
layer_width: 1024
|
| 74 |
+
num_blocks: 6
|
| 75 |
+
repeats_per_block: 2
|
| 76 |
+
mlp_activation: 'gelu'
|
| 77 |
+
dropout_rate: 0.0
|
| 78 |
+
|
| 79 |
+
training:
|
| 80 |
+
num_iterations: 50000
|
| 81 |
+
batch_size: 512
|
| 82 |
+
lr: 1.0e-4
|
| 83 |
+
grad_accumulation_steps: 10
|
| 84 |
+
clip_grad_norm_max: 1.0
|
| 85 |
+
train_with_q_input: True
|
| 86 |
+
update_tqdm_freq: 1
|
| 87 |
+
optimizer: AdamW
|
| 88 |
+
trainer_kwargs:
|
| 89 |
+
optim_kwargs:
|
| 90 |
+
betas: [0.9, 0.999]
|
| 91 |
+
weight_decay: 0.0005
|
| 92 |
+
callbacks:
|
| 93 |
+
save_best_model:
|
| 94 |
+
enable: true
|
| 95 |
+
freq: 500
|
| 96 |
+
lr_scheduler:
|
| 97 |
+
cls: StepLR
|
| 98 |
+
kwargs:
|
| 99 |
+
step_size: 2000
|
| 100 |
+
gamma: 0.9
|
| 101 |
+
logger:
|
| 102 |
+
use_neptune: false
|
configs/mc-o16.yaml
ADDED
|
@@ -0,0 +1,102 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc-o16
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 200.]
|
| 11 |
+
roughnesses: [0., 20.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 200.]
|
| 15 |
+
roughnesses: [1.0e-2, 20.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 5
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: VariableQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q_min_range: [0.01, 0.05]
|
| 30 |
+
q_max_range: [0.15, 0.4]
|
| 31 |
+
n_q_range: [128, 256]
|
| 32 |
+
device: 'cuda'
|
| 33 |
+
|
| 34 |
+
intensity_noise:
|
| 35 |
+
cls: BasicExpIntensityNoise
|
| 36 |
+
kwargs:
|
| 37 |
+
relative_errors: [0.0, 0.2]
|
| 38 |
+
abs_errors: 0.0
|
| 39 |
+
consistent_rel_err: true
|
| 40 |
+
logdist: false
|
| 41 |
+
apply_shift: false
|
| 42 |
+
shift_range: [-0.3, 0.3]
|
| 43 |
+
apply_scaling: false
|
| 44 |
+
scale_range: [-0.02, 0.02]
|
| 45 |
+
|
| 46 |
+
q_noise:
|
| 47 |
+
cls: BasicQNoiseGenerator
|
| 48 |
+
kwargs:
|
| 49 |
+
shift_std: 1.0e-3
|
| 50 |
+
noise_std: [0., 1.0e-3]
|
| 51 |
+
|
| 52 |
+
curves_scaler:
|
| 53 |
+
cls: LogAffineCurvesScaler
|
| 54 |
+
kwargs:
|
| 55 |
+
weight: 0.2
|
| 56 |
+
bias: 1.0
|
| 57 |
+
eps: 1.0e-10
|
| 58 |
+
|
| 59 |
+
model:
|
| 60 |
+
network:
|
| 61 |
+
cls: NetworkWithPriorsFnoEmb
|
| 62 |
+
pretrained_name: null
|
| 63 |
+
device: 'cuda'
|
| 64 |
+
kwargs:
|
| 65 |
+
in_channels: 2
|
| 66 |
+
dim_embedding: 256
|
| 67 |
+
width_fno: 128
|
| 68 |
+
n_fno_blocks : 6
|
| 69 |
+
modes: 16
|
| 70 |
+
embedding_net_activation: 'gelu'
|
| 71 |
+
use_batch_norm: True
|
| 72 |
+
dim_out: 17
|
| 73 |
+
layer_width: 1024
|
| 74 |
+
num_blocks: 6
|
| 75 |
+
repeats_per_block: 2
|
| 76 |
+
mlp_activation: 'gelu'
|
| 77 |
+
dropout_rate: 0.0
|
| 78 |
+
|
| 79 |
+
training:
|
| 80 |
+
num_iterations: 50000
|
| 81 |
+
batch_size: 1024
|
| 82 |
+
lr: 1.0e-4
|
| 83 |
+
grad_accumulation_steps: 20
|
| 84 |
+
clip_grad_norm_max: 1.0
|
| 85 |
+
train_with_q_input: True
|
| 86 |
+
update_tqdm_freq: 1
|
| 87 |
+
optimizer: AdamW
|
| 88 |
+
trainer_kwargs:
|
| 89 |
+
optim_kwargs:
|
| 90 |
+
betas: [0.9, 0.999]
|
| 91 |
+
weight_decay: 0.0005
|
| 92 |
+
callbacks:
|
| 93 |
+
save_best_model:
|
| 94 |
+
enable: true
|
| 95 |
+
freq: 500
|
| 96 |
+
lr_scheduler:
|
| 97 |
+
cls: StepLR
|
| 98 |
+
kwargs:
|
| 99 |
+
step_size: 2000
|
| 100 |
+
gamma: 0.9
|
| 101 |
+
logger:
|
| 102 |
+
use_neptune: false
|
configs/mc-o2.yaml
ADDED
|
@@ -0,0 +1,102 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc-o2
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 20.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 20.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: VariableQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q_min_range: [0.01, 0.05]
|
| 30 |
+
q_max_range: [0.15, 0.4]
|
| 31 |
+
n_q_range: [128, 256]
|
| 32 |
+
device: 'cuda'
|
| 33 |
+
|
| 34 |
+
intensity_noise:
|
| 35 |
+
cls: BasicExpIntensityNoise
|
| 36 |
+
kwargs:
|
| 37 |
+
relative_errors: [0.0, 0.2]
|
| 38 |
+
abs_errors: 0.0
|
| 39 |
+
consistent_rel_err: true
|
| 40 |
+
logdist: false
|
| 41 |
+
apply_shift: false
|
| 42 |
+
shift_range: [-0.3, 0.3]
|
| 43 |
+
apply_scaling: false
|
| 44 |
+
scale_range: [-0.02, 0.02]
|
| 45 |
+
|
| 46 |
+
q_noise:
|
| 47 |
+
cls: BasicQNoiseGenerator
|
| 48 |
+
kwargs:
|
| 49 |
+
shift_std: 1.0e-3
|
| 50 |
+
noise_std: [0., 1.0e-3]
|
| 51 |
+
|
| 52 |
+
curves_scaler:
|
| 53 |
+
cls: LogAffineCurvesScaler
|
| 54 |
+
kwargs:
|
| 55 |
+
weight: 0.2
|
| 56 |
+
bias: 1.0
|
| 57 |
+
eps: 1.0e-10
|
| 58 |
+
|
| 59 |
+
model:
|
| 60 |
+
network:
|
| 61 |
+
cls: NetworkWithPriorsFnoEmb
|
| 62 |
+
pretrained_name: null
|
| 63 |
+
device: 'cuda'
|
| 64 |
+
kwargs:
|
| 65 |
+
in_channels: 2
|
| 66 |
+
dim_embedding: 256
|
| 67 |
+
width_fno: 128
|
| 68 |
+
n_fno_blocks : 6
|
| 69 |
+
modes: 16
|
| 70 |
+
embedding_net_activation: 'gelu'
|
| 71 |
+
use_batch_norm: True
|
| 72 |
+
dim_out: 8
|
| 73 |
+
layer_width: 1024
|
| 74 |
+
num_blocks: 6
|
| 75 |
+
repeats_per_block: 2
|
| 76 |
+
mlp_activation: 'gelu'
|
| 77 |
+
dropout_rate: 0.0
|
| 78 |
+
|
| 79 |
+
training:
|
| 80 |
+
num_iterations: 50000
|
| 81 |
+
batch_size: 1024
|
| 82 |
+
lr: 1.0e-4
|
| 83 |
+
grad_accumulation_steps: 10
|
| 84 |
+
clip_grad_norm_max: 1.0
|
| 85 |
+
train_with_q_input: True
|
| 86 |
+
update_tqdm_freq: 1
|
| 87 |
+
optimizer: AdamW
|
| 88 |
+
trainer_kwargs:
|
| 89 |
+
optim_kwargs:
|
| 90 |
+
betas: [0.9, 0.999]
|
| 91 |
+
weight_decay: 0.0005
|
| 92 |
+
callbacks:
|
| 93 |
+
save_best_model:
|
| 94 |
+
enable: true
|
| 95 |
+
freq: 500
|
| 96 |
+
lr_scheduler:
|
| 97 |
+
cls: StepLR
|
| 98 |
+
kwargs:
|
| 99 |
+
step_size: 2000
|
| 100 |
+
gamma: 0.9
|
| 101 |
+
logger:
|
| 102 |
+
use_neptune: false
|
configs/mc-o3.yaml
ADDED
|
@@ -0,0 +1,102 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc-o3
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 20.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 20.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: VariableQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q_min_range: [0.01, 0.05]
|
| 30 |
+
q_max_range: [0.15, 0.4]
|
| 31 |
+
n_q_range: [128, 256]
|
| 32 |
+
device: 'cuda'
|
| 33 |
+
|
| 34 |
+
intensity_noise:
|
| 35 |
+
cls: BasicExpIntensityNoise
|
| 36 |
+
kwargs:
|
| 37 |
+
relative_errors: [0.0, 0.2]
|
| 38 |
+
abs_errors: 0.0
|
| 39 |
+
consistent_rel_err: true
|
| 40 |
+
logdist: false
|
| 41 |
+
apply_shift: false
|
| 42 |
+
shift_range: [-0.3, 0.3]
|
| 43 |
+
apply_scaling: false
|
| 44 |
+
scale_range: [-0.02, 0.02]
|
| 45 |
+
|
| 46 |
+
q_noise:
|
| 47 |
+
cls: BasicQNoiseGenerator
|
| 48 |
+
kwargs:
|
| 49 |
+
shift_std: 1.0e-3
|
| 50 |
+
noise_std: [0., 1.0e-3]
|
| 51 |
+
|
| 52 |
+
curves_scaler:
|
| 53 |
+
cls: LogAffineCurvesScaler
|
| 54 |
+
kwargs:
|
| 55 |
+
weight: 0.2
|
| 56 |
+
bias: 1.0
|
| 57 |
+
eps: 1.0e-10
|
| 58 |
+
|
| 59 |
+
model:
|
| 60 |
+
network:
|
| 61 |
+
cls: NetworkWithPriorsFnoEmb
|
| 62 |
+
pretrained_name: null
|
| 63 |
+
device: 'cuda'
|
| 64 |
+
kwargs:
|
| 65 |
+
in_channels: 2
|
| 66 |
+
dim_embedding: 256
|
| 67 |
+
width_fno: 128
|
| 68 |
+
n_fno_blocks : 6
|
| 69 |
+
modes: 16
|
| 70 |
+
embedding_net_activation: 'gelu'
|
| 71 |
+
use_batch_norm: True
|
| 72 |
+
dim_out: 8
|
| 73 |
+
layer_width: 1024
|
| 74 |
+
num_blocks: 6
|
| 75 |
+
repeats_per_block: 2
|
| 76 |
+
mlp_activation: 'gelu'
|
| 77 |
+
dropout_rate: 0.0
|
| 78 |
+
|
| 79 |
+
training:
|
| 80 |
+
num_iterations: 50000
|
| 81 |
+
batch_size: 1024
|
| 82 |
+
lr: 1.0e-4
|
| 83 |
+
grad_accumulation_steps: 50
|
| 84 |
+
clip_grad_norm_max: 1.0
|
| 85 |
+
train_with_q_input: True
|
| 86 |
+
update_tqdm_freq: 1
|
| 87 |
+
optimizer: AdamW
|
| 88 |
+
trainer_kwargs:
|
| 89 |
+
optim_kwargs:
|
| 90 |
+
betas: [0.9, 0.999]
|
| 91 |
+
weight_decay: 0.0005
|
| 92 |
+
callbacks:
|
| 93 |
+
save_best_model:
|
| 94 |
+
enable: true
|
| 95 |
+
freq: 500
|
| 96 |
+
lr_scheduler:
|
| 97 |
+
cls: StepLR
|
| 98 |
+
kwargs:
|
| 99 |
+
step_size: 2000
|
| 100 |
+
gamma: 0.9
|
| 101 |
+
logger:
|
| 102 |
+
use_neptune: false
|
configs/mc-o4.yaml
ADDED
|
@@ -0,0 +1,102 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc-o4
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 20.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 20.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: VariableQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q_min_range: [0.01, 0.05]
|
| 30 |
+
q_max_range: [0.15, 0.4]
|
| 31 |
+
n_q_range: [128, 256]
|
| 32 |
+
device: 'cuda'
|
| 33 |
+
|
| 34 |
+
intensity_noise:
|
| 35 |
+
cls: BasicExpIntensityNoise
|
| 36 |
+
kwargs:
|
| 37 |
+
relative_errors: [0.0, 0.2]
|
| 38 |
+
abs_errors: 0.0
|
| 39 |
+
consistent_rel_err: true
|
| 40 |
+
logdist: false
|
| 41 |
+
apply_shift: false
|
| 42 |
+
shift_range: [-0.3, 0.3]
|
| 43 |
+
apply_scaling: false
|
| 44 |
+
scale_range: [-0.02, 0.02]
|
| 45 |
+
|
| 46 |
+
q_noise:
|
| 47 |
+
cls: BasicQNoiseGenerator
|
| 48 |
+
kwargs:
|
| 49 |
+
shift_std: 1.0e-3
|
| 50 |
+
noise_std: [0., 1.0e-3]
|
| 51 |
+
|
| 52 |
+
curves_scaler:
|
| 53 |
+
cls: LogAffineCurvesScaler
|
| 54 |
+
kwargs:
|
| 55 |
+
weight: 0.2
|
| 56 |
+
bias: 1.0
|
| 57 |
+
eps: 1.0e-10
|
| 58 |
+
|
| 59 |
+
model:
|
| 60 |
+
network:
|
| 61 |
+
cls: NetworkWithPriorsFnoEmb
|
| 62 |
+
pretrained_name: null
|
| 63 |
+
device: 'cuda'
|
| 64 |
+
kwargs:
|
| 65 |
+
in_channels: 2
|
| 66 |
+
dim_embedding: 256
|
| 67 |
+
width_fno: 128
|
| 68 |
+
n_fno_blocks : 6
|
| 69 |
+
modes: 16
|
| 70 |
+
embedding_net_activation: 'gelu'
|
| 71 |
+
use_batch_norm: True
|
| 72 |
+
dim_out: 8
|
| 73 |
+
layer_width: 1024
|
| 74 |
+
num_blocks: 6
|
| 75 |
+
repeats_per_block: 2
|
| 76 |
+
mlp_activation: 'gelu'
|
| 77 |
+
dropout_rate: 0.0
|
| 78 |
+
|
| 79 |
+
training:
|
| 80 |
+
num_iterations: 50000
|
| 81 |
+
batch_size: 1024
|
| 82 |
+
lr: 1.0e-3
|
| 83 |
+
grad_accumulation_steps: 1
|
| 84 |
+
clip_grad_norm_max: 1.0
|
| 85 |
+
train_with_q_input: True
|
| 86 |
+
update_tqdm_freq: 1
|
| 87 |
+
optimizer: AdamW
|
| 88 |
+
trainer_kwargs:
|
| 89 |
+
optim_kwargs:
|
| 90 |
+
betas: [0.9, 0.999]
|
| 91 |
+
weight_decay: 0.0005
|
| 92 |
+
callbacks:
|
| 93 |
+
save_best_model:
|
| 94 |
+
enable: true
|
| 95 |
+
freq: 500
|
| 96 |
+
lr_scheduler:
|
| 97 |
+
cls: StepLR
|
| 98 |
+
kwargs:
|
| 99 |
+
step_size: 2000
|
| 100 |
+
gamma: 0.9
|
| 101 |
+
logger:
|
| 102 |
+
use_neptune: false
|
configs/mc-o5.yaml
ADDED
|
@@ -0,0 +1,102 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc-o5
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 20.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 20.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: VariableQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q_min_range: [0.01, 0.05]
|
| 30 |
+
q_max_range: [0.15, 0.4]
|
| 31 |
+
n_q_range: [128, 256]
|
| 32 |
+
device: 'cuda'
|
| 33 |
+
|
| 34 |
+
intensity_noise:
|
| 35 |
+
cls: BasicExpIntensityNoise
|
| 36 |
+
kwargs:
|
| 37 |
+
relative_errors: [0.0, 0.2]
|
| 38 |
+
abs_errors: 0.0
|
| 39 |
+
consistent_rel_err: true
|
| 40 |
+
logdist: false
|
| 41 |
+
apply_shift: false
|
| 42 |
+
shift_range: [-0.3, 0.3]
|
| 43 |
+
apply_scaling: false
|
| 44 |
+
scale_range: [-0.02, 0.02]
|
| 45 |
+
|
| 46 |
+
q_noise:
|
| 47 |
+
cls: BasicQNoiseGenerator
|
| 48 |
+
kwargs:
|
| 49 |
+
shift_std: 1.0e-3
|
| 50 |
+
noise_std: [0., 1.0e-3]
|
| 51 |
+
|
| 52 |
+
curves_scaler:
|
| 53 |
+
cls: LogAffineCurvesScaler
|
| 54 |
+
kwargs:
|
| 55 |
+
weight: 0.2
|
| 56 |
+
bias: 1.0
|
| 57 |
+
eps: 1.0e-10
|
| 58 |
+
|
| 59 |
+
model:
|
| 60 |
+
network:
|
| 61 |
+
cls: NetworkWithPriorsFnoEmb
|
| 62 |
+
pretrained_name: null
|
| 63 |
+
device: 'cuda'
|
| 64 |
+
kwargs:
|
| 65 |
+
in_channels: 2
|
| 66 |
+
dim_embedding: 256
|
| 67 |
+
width_fno: 128
|
| 68 |
+
n_fno_blocks : 6
|
| 69 |
+
modes: 16
|
| 70 |
+
embedding_net_activation: 'gelu'
|
| 71 |
+
use_batch_norm: True
|
| 72 |
+
dim_out: 8
|
| 73 |
+
layer_width: 1024
|
| 74 |
+
num_blocks: 6
|
| 75 |
+
repeats_per_block: 2
|
| 76 |
+
mlp_activation: 'gelu'
|
| 77 |
+
dropout_rate: 0.0
|
| 78 |
+
|
| 79 |
+
training:
|
| 80 |
+
num_iterations: 50000
|
| 81 |
+
batch_size: 512
|
| 82 |
+
lr: 1.0e-4
|
| 83 |
+
grad_accumulation_steps: 1
|
| 84 |
+
clip_grad_norm_max: 1.0
|
| 85 |
+
train_with_q_input: True
|
| 86 |
+
update_tqdm_freq: 1
|
| 87 |
+
optimizer: AdamW
|
| 88 |
+
trainer_kwargs:
|
| 89 |
+
optim_kwargs:
|
| 90 |
+
betas: [0.9, 0.999]
|
| 91 |
+
weight_decay: 0.0005
|
| 92 |
+
callbacks:
|
| 93 |
+
save_best_model:
|
| 94 |
+
enable: true
|
| 95 |
+
freq: 500
|
| 96 |
+
lr_scheduler:
|
| 97 |
+
cls: StepLR
|
| 98 |
+
kwargs:
|
| 99 |
+
step_size: 2000
|
| 100 |
+
gamma: 0.9
|
| 101 |
+
logger:
|
| 102 |
+
use_neptune: false
|
configs/mc-o7.yaml
ADDED
|
@@ -0,0 +1,102 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc-o7
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 20.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 20.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: VariableQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q_min_range: [0.01, 0.05]
|
| 30 |
+
q_max_range: [0.15, 0.4]
|
| 31 |
+
n_q_range: [128, 256]
|
| 32 |
+
device: 'cuda'
|
| 33 |
+
|
| 34 |
+
intensity_noise:
|
| 35 |
+
cls: BasicExpIntensityNoise
|
| 36 |
+
kwargs:
|
| 37 |
+
relative_errors: [0.0, 0.2]
|
| 38 |
+
abs_errors: 0.0
|
| 39 |
+
consistent_rel_err: true
|
| 40 |
+
logdist: false
|
| 41 |
+
apply_shift: false
|
| 42 |
+
shift_range: [-0.3, 0.3]
|
| 43 |
+
apply_scaling: false
|
| 44 |
+
scale_range: [-0.02, 0.02]
|
| 45 |
+
|
| 46 |
+
q_noise:
|
| 47 |
+
cls: BasicQNoiseGenerator
|
| 48 |
+
kwargs:
|
| 49 |
+
shift_std: 1.0e-3
|
| 50 |
+
noise_std: [0., 1.0e-3]
|
| 51 |
+
|
| 52 |
+
curves_scaler:
|
| 53 |
+
cls: LogAffineCurvesScaler
|
| 54 |
+
kwargs:
|
| 55 |
+
weight: 0.2
|
| 56 |
+
bias: 1.0
|
| 57 |
+
eps: 1.0e-10
|
| 58 |
+
|
| 59 |
+
model:
|
| 60 |
+
network:
|
| 61 |
+
cls: NetworkWithPriorsFnoEmb
|
| 62 |
+
pretrained_name: null
|
| 63 |
+
device: 'cuda'
|
| 64 |
+
kwargs:
|
| 65 |
+
in_channels: 2
|
| 66 |
+
dim_embedding: 256
|
| 67 |
+
width_fno: 128
|
| 68 |
+
n_fno_blocks : 6
|
| 69 |
+
modes: 8
|
| 70 |
+
embedding_net_activation: 'gelu'
|
| 71 |
+
use_batch_norm: True
|
| 72 |
+
dim_out: 8
|
| 73 |
+
layer_width: 1024
|
| 74 |
+
num_blocks: 6
|
| 75 |
+
repeats_per_block: 2
|
| 76 |
+
mlp_activation: 'gelu'
|
| 77 |
+
dropout_rate: 0.0
|
| 78 |
+
|
| 79 |
+
training:
|
| 80 |
+
num_iterations: 50000
|
| 81 |
+
batch_size: 1024
|
| 82 |
+
lr: 1.0e-4
|
| 83 |
+
grad_accumulation_steps: 1
|
| 84 |
+
clip_grad_norm_max: 1.0
|
| 85 |
+
train_with_q_input: True
|
| 86 |
+
update_tqdm_freq: 1
|
| 87 |
+
optimizer: AdamW
|
| 88 |
+
trainer_kwargs:
|
| 89 |
+
optim_kwargs:
|
| 90 |
+
betas: [0.9, 0.999]
|
| 91 |
+
weight_decay: 0.0005
|
| 92 |
+
callbacks:
|
| 93 |
+
save_best_model:
|
| 94 |
+
enable: true
|
| 95 |
+
freq: 500
|
| 96 |
+
lr_scheduler:
|
| 97 |
+
cls: StepLR
|
| 98 |
+
kwargs:
|
| 99 |
+
step_size: 2000
|
| 100 |
+
gamma: 0.9
|
| 101 |
+
logger:
|
| 102 |
+
use_neptune: false
|
configs/mc-o8.yaml
ADDED
|
@@ -0,0 +1,102 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc-o8
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 20.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 20.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: VariableQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q_min_range: [0.01, 0.05]
|
| 30 |
+
q_max_range: [0.15, 0.4]
|
| 31 |
+
n_q_range: [128, 256]
|
| 32 |
+
device: 'cuda'
|
| 33 |
+
|
| 34 |
+
intensity_noise:
|
| 35 |
+
cls: BasicExpIntensityNoise
|
| 36 |
+
kwargs:
|
| 37 |
+
relative_errors: [0.0, 0.2]
|
| 38 |
+
abs_errors: 0.0
|
| 39 |
+
consistent_rel_err: true
|
| 40 |
+
logdist: false
|
| 41 |
+
apply_shift: false
|
| 42 |
+
shift_range: [-0.3, 0.3]
|
| 43 |
+
apply_scaling: false
|
| 44 |
+
scale_range: [-0.02, 0.02]
|
| 45 |
+
|
| 46 |
+
q_noise:
|
| 47 |
+
cls: BasicQNoiseGenerator
|
| 48 |
+
kwargs:
|
| 49 |
+
shift_std: 1.0e-3
|
| 50 |
+
noise_std: [0., 1.0e-3]
|
| 51 |
+
|
| 52 |
+
curves_scaler:
|
| 53 |
+
cls: LogAffineCurvesScaler
|
| 54 |
+
kwargs:
|
| 55 |
+
weight: 0.2
|
| 56 |
+
bias: 1.0
|
| 57 |
+
eps: 1.0e-10
|
| 58 |
+
|
| 59 |
+
model:
|
| 60 |
+
network:
|
| 61 |
+
cls: NetworkWithPriorsFnoEmb
|
| 62 |
+
pretrained_name: null
|
| 63 |
+
device: 'cuda'
|
| 64 |
+
kwargs:
|
| 65 |
+
in_channels: 2
|
| 66 |
+
dim_embedding: 256
|
| 67 |
+
width_fno: 128
|
| 68 |
+
n_fno_blocks : 6
|
| 69 |
+
modes: 32
|
| 70 |
+
embedding_net_activation: 'gelu'
|
| 71 |
+
use_batch_norm: True
|
| 72 |
+
dim_out: 8
|
| 73 |
+
layer_width: 1024
|
| 74 |
+
num_blocks: 6
|
| 75 |
+
repeats_per_block: 2
|
| 76 |
+
mlp_activation: 'gelu'
|
| 77 |
+
dropout_rate: 0.0
|
| 78 |
+
|
| 79 |
+
training:
|
| 80 |
+
num_iterations: 50000
|
| 81 |
+
batch_size: 1024
|
| 82 |
+
lr: 1.0e-4
|
| 83 |
+
grad_accumulation_steps: 1
|
| 84 |
+
clip_grad_norm_max: 1.0
|
| 85 |
+
train_with_q_input: True
|
| 86 |
+
update_tqdm_freq: 1
|
| 87 |
+
optimizer: AdamW
|
| 88 |
+
trainer_kwargs:
|
| 89 |
+
optim_kwargs:
|
| 90 |
+
betas: [0.9, 0.999]
|
| 91 |
+
weight_decay: 0.0005
|
| 92 |
+
callbacks:
|
| 93 |
+
save_best_model:
|
| 94 |
+
enable: true
|
| 95 |
+
freq: 500
|
| 96 |
+
lr_scheduler:
|
| 97 |
+
cls: StepLR
|
| 98 |
+
kwargs:
|
| 99 |
+
step_size: 2000
|
| 100 |
+
gamma: 0.9
|
| 101 |
+
logger:
|
| 102 |
+
use_neptune: false
|
configs/mc-o9.yaml
ADDED
|
@@ -0,0 +1,102 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc-o9
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 20.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 20.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: VariableQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q_min_range: [0.01, 0.05]
|
| 30 |
+
q_max_range: [0.15, 0.4]
|
| 31 |
+
n_q_range: [128, 256]
|
| 32 |
+
device: 'cuda'
|
| 33 |
+
|
| 34 |
+
intensity_noise:
|
| 35 |
+
cls: BasicExpIntensityNoise
|
| 36 |
+
kwargs:
|
| 37 |
+
relative_errors: [0.0, 0.2]
|
| 38 |
+
abs_errors: 0.0
|
| 39 |
+
consistent_rel_err: true
|
| 40 |
+
logdist: false
|
| 41 |
+
apply_shift: false
|
| 42 |
+
shift_range: [-0.3, 0.3]
|
| 43 |
+
apply_scaling: false
|
| 44 |
+
scale_range: [-0.02, 0.02]
|
| 45 |
+
|
| 46 |
+
q_noise:
|
| 47 |
+
cls: BasicQNoiseGenerator
|
| 48 |
+
kwargs:
|
| 49 |
+
shift_std: 1.0e-3
|
| 50 |
+
noise_std: [0., 1.0e-3]
|
| 51 |
+
|
| 52 |
+
curves_scaler:
|
| 53 |
+
cls: LogAffineCurvesScaler
|
| 54 |
+
kwargs:
|
| 55 |
+
weight: 0.2
|
| 56 |
+
bias: 1.0
|
| 57 |
+
eps: 1.0e-10
|
| 58 |
+
|
| 59 |
+
model:
|
| 60 |
+
network:
|
| 61 |
+
cls: NetworkWithPriorsFnoEmb
|
| 62 |
+
pretrained_name: null
|
| 63 |
+
device: 'cuda'
|
| 64 |
+
kwargs:
|
| 65 |
+
in_channels: 2
|
| 66 |
+
dim_embedding: 512
|
| 67 |
+
width_fno: 128
|
| 68 |
+
n_fno_blocks : 1
|
| 69 |
+
modes: 16
|
| 70 |
+
embedding_net_activation: 'gelu'
|
| 71 |
+
use_batch_norm: True
|
| 72 |
+
dim_out: 8
|
| 73 |
+
layer_width: 1024
|
| 74 |
+
num_blocks: 6
|
| 75 |
+
repeats_per_block: 2
|
| 76 |
+
mlp_activation: 'gelu'
|
| 77 |
+
dropout_rate: 0.0
|
| 78 |
+
|
| 79 |
+
training:
|
| 80 |
+
num_iterations: 50000
|
| 81 |
+
batch_size: 1024
|
| 82 |
+
lr: 1.0e-4
|
| 83 |
+
grad_accumulation_steps: 1
|
| 84 |
+
clip_grad_norm_max: 1.0
|
| 85 |
+
train_with_q_input: True
|
| 86 |
+
update_tqdm_freq: 1
|
| 87 |
+
optimizer: AdamW
|
| 88 |
+
trainer_kwargs:
|
| 89 |
+
optim_kwargs:
|
| 90 |
+
betas: [0.9, 0.999]
|
| 91 |
+
weight_decay: 0.0005
|
| 92 |
+
callbacks:
|
| 93 |
+
save_best_model:
|
| 94 |
+
enable: true
|
| 95 |
+
freq: 500
|
| 96 |
+
lr_scheduler:
|
| 97 |
+
cls: StepLR
|
| 98 |
+
kwargs:
|
| 99 |
+
step_size: 2000
|
| 100 |
+
gamma: 0.9
|
| 101 |
+
logger:
|
| 102 |
+
use_neptune: false
|
configs/mc1.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc1
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 60.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 60.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.15, 128]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: false
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: false
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: false
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 8
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|
configs/mc10.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc10
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 60.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 60.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: true
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.15, 256]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: false
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: false
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: false
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 8
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|
configs/mc11.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc11
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 60.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 60.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: true
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.2, 256]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: false
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: false
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: false
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 8
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|
configs/mc12.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc12
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 60.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 60.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: true
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.3, 256]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: false
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: false
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: false
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 8
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|
configs/mc13.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc13
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 60.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 60.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.15, 128]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: false
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: true
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: true
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 8
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|
configs/mc14.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc14
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 60.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 60.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.2, 128]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: false
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: true
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: true
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 8
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|
configs/mc15.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc15
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 60.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 60.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.3, 128]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: false
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: true
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: true
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 8
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|
configs/mc16.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc16
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 60.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 60.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.15, 256]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: false
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: true
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: true
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 8
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|
configs/mc17.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc17
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 60.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 60.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.2, 256]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: false
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: true
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: true
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 8
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|
configs/mc18.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc18
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 60.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 60.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.3, 256]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: false
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: true
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: true
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 8
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|
configs/mc19.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc19
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 60.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 60.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.15, 128]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: true
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: false
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: false
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 8
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|
configs/mc2.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc2
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 60.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 60.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.2, 128]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: false
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: false
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: false
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 8
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|
configs/mc20.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc20
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 60.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 60.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.2, 128]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: true
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: false
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: false
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 8
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|
configs/mc21.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc21
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 60.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 60.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.3, 128]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: true
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: false
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: false
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 8
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|
configs/mc22.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc22
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 60.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 60.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.15, 256]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: true
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: false
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: false
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 8
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|
configs/mc23.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc23
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 60.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 60.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.2, 256]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: true
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: false
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: false
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 8
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|
configs/mc24.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc24
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 60.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 60.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.3, 256]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: true
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: false
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: false
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 8
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|
configs/mc25.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc25
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 20.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 20.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.15, 128]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: true
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: false
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: false
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 8
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|
configs/mc26.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc26
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 60.]
|
| 12 |
+
slds: [0., 150.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 60.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.15, 128]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: true
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: false
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: false
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 8
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|
configs/mc27.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc27
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 20.]
|
| 12 |
+
slds: [0., 150.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 20.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.15, 128]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: true
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: false
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: false
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 8
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|
configs/mc28.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc28
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 20.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 20.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.3, 256]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: true
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: false
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: false
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 8
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|
configs/mc29.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc29
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 60.]
|
| 12 |
+
slds: [0., 150.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 60.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.3, 256]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: true
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: false
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: false
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 8
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|
configs/mc3.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc3
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 60.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 60.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.3, 128]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: false
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: false
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: false
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 8
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|
configs/mc30.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc30
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 20.]
|
| 12 |
+
slds: [0., 150.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 20.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.3, 256]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: true
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: false
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: false
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 8
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|
configs/mc31.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc31
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 60.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 60.]
|
| 16 |
+
slds: [ 1.0e-2, 10.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.3, 256]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: true
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: false
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: false
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 8
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|
configs/mc32.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc32
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 60.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 60.]
|
| 16 |
+
slds: [ 1.0e-2, 1.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.3, 256]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: true
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: false
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: false
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 8
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|
configs/mc33.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc33
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 60.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 60.]
|
| 16 |
+
slds: [ 1.0e-2, 50.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.3, 256]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: true
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: false
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: false
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 8
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|
configs/mc34.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc34
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 60.]
|
| 12 |
+
slds: [-20., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 60.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.15, 128]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: true
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: false
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: false
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 8
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|
configs/mc35.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc35
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 60.]
|
| 12 |
+
slds: [-20., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 60.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.3, 256]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: true
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: false
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: false
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 8
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|
configs/mc36.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc36
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 20.]
|
| 12 |
+
slds: [-20., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 20.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.15, 128]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: true
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: false
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: false
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 8
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|
configs/mc37.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc37
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 20.]
|
| 12 |
+
slds: [-20., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 20.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.3, 256]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: true
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: false
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: false
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 8
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|
configs/mc38.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc38
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 300.]
|
| 11 |
+
roughnesses: [0., 20.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 300.]
|
| 15 |
+
roughnesses: [1.0e-2, 20.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 3
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.15, 256]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: true
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: false
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: false
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 11
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|
configs/mc39.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc39
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 300.]
|
| 11 |
+
roughnesses: [0., 20.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 300.]
|
| 15 |
+
roughnesses: [1.0e-2, 20.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 3
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.3, 256]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: true
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: false
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: false
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 11
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|
configs/mc4.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc4
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 500.]
|
| 11 |
+
roughnesses: [0., 60.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 500.]
|
| 15 |
+
roughnesses: [1.0e-2, 60.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 2
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.15, 256]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: false
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: false
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: false
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 8
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|
configs/mc40.yaml
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
general:
|
| 2 |
+
name: mc40
|
| 3 |
+
root_dir: null
|
| 4 |
+
|
| 5 |
+
dset:
|
| 6 |
+
prior_sampler:
|
| 7 |
+
cls: SubpriorParametricSampler
|
| 8 |
+
kwargs:
|
| 9 |
+
param_ranges:
|
| 10 |
+
thicknesses: [0., 300.]
|
| 11 |
+
roughnesses: [0., 60.]
|
| 12 |
+
slds: [0., 50.]
|
| 13 |
+
bound_width_ranges:
|
| 14 |
+
thicknesses: [1.0e-2, 300.]
|
| 15 |
+
roughnesses: [1.0e-2, 60.]
|
| 16 |
+
slds: [ 1.0e-2, 5.]
|
| 17 |
+
model_name: standard_model
|
| 18 |
+
max_num_layers: 3
|
| 19 |
+
constrained_roughness: true
|
| 20 |
+
max_thickness_share: 0.5
|
| 21 |
+
logdist: false
|
| 22 |
+
scale_params_by_ranges: false
|
| 23 |
+
scaled_range: [-1., 1.]
|
| 24 |
+
device: 'cuda'
|
| 25 |
+
|
| 26 |
+
q_generator:
|
| 27 |
+
cls: ConstantQ
|
| 28 |
+
kwargs:
|
| 29 |
+
q: [0.02, 0.15, 256]
|
| 30 |
+
device: 'cuda'
|
| 31 |
+
|
| 32 |
+
intensity_noise:
|
| 33 |
+
cls: BasicExpIntensityNoise
|
| 34 |
+
kwargs:
|
| 35 |
+
relative_errors: [0.0, 0.2]
|
| 36 |
+
abs_errors: 0.0
|
| 37 |
+
consistent_rel_err: true
|
| 38 |
+
logdist: false
|
| 39 |
+
apply_shift: false
|
| 40 |
+
shift_range: [-0.3, 0.3]
|
| 41 |
+
apply_scaling: false
|
| 42 |
+
scale_range: [-0.02, 0.02]
|
| 43 |
+
|
| 44 |
+
# q_noise:
|
| 45 |
+
# cls: BasicQNoiseGenerator
|
| 46 |
+
# kwargs:
|
| 47 |
+
# shift_std: 1.0e-3
|
| 48 |
+
# noise_std: [0., 1.0e-3]
|
| 49 |
+
|
| 50 |
+
curves_scaler:
|
| 51 |
+
cls: LogAffineCurvesScaler
|
| 52 |
+
kwargs:
|
| 53 |
+
weight: 0.2
|
| 54 |
+
bias: 1.0
|
| 55 |
+
eps: 1.0e-10
|
| 56 |
+
|
| 57 |
+
model:
|
| 58 |
+
network:
|
| 59 |
+
cls: NetworkWithPriorsConvEmb
|
| 60 |
+
pretrained_name: null
|
| 61 |
+
device: 'cuda'
|
| 62 |
+
kwargs:
|
| 63 |
+
in_channels: 1
|
| 64 |
+
hidden_channels: [32, 64, 128, 256, 512]
|
| 65 |
+
dim_embedding: 128
|
| 66 |
+
dim_avpool: 1
|
| 67 |
+
embedding_net_activation: 'gelu'
|
| 68 |
+
use_batch_norm: true
|
| 69 |
+
dim_out: 11
|
| 70 |
+
layer_width: 1024
|
| 71 |
+
num_blocks: 6
|
| 72 |
+
repeats_per_block: 2
|
| 73 |
+
mlp_activation: 'gelu'
|
| 74 |
+
dropout_rate: 0.0
|
| 75 |
+
pretrained_embedding_net: null
|
| 76 |
+
|
| 77 |
+
training:
|
| 78 |
+
num_iterations: 50000
|
| 79 |
+
batch_size: 4096
|
| 80 |
+
lr: 1.0e-4
|
| 81 |
+
grad_accumulation_steps: 1
|
| 82 |
+
clip_grad_norm_max: null
|
| 83 |
+
train_with_q_input: False
|
| 84 |
+
update_tqdm_freq: 1
|
| 85 |
+
optimizer: AdamW
|
| 86 |
+
trainer_kwargs:
|
| 87 |
+
optim_kwargs:
|
| 88 |
+
betas: [0.9, 0.999]
|
| 89 |
+
weight_decay: 0.0005
|
| 90 |
+
callbacks:
|
| 91 |
+
save_best_model:
|
| 92 |
+
enable: true
|
| 93 |
+
freq: 100
|
| 94 |
+
lr_scheduler:
|
| 95 |
+
cls: StepLR
|
| 96 |
+
kwargs:
|
| 97 |
+
step_size: 2000
|
| 98 |
+
gamma: 0.9
|
| 99 |
+
logger:
|
| 100 |
+
use_neptune: false
|
| 101 |
+
|
| 102 |
+
slurm:
|
| 103 |
+
cluster: 'tuebingen'
|
| 104 |
+
time: 0-05:00 #D-HH:MM
|
| 105 |
+
partition: 2080-galvani
|