Upload 15 files
Browse files- pretrained_linear/dinov2_reg_retrain_d3/args.yaml +271 -0
- pretrained_linear/dinov2_reg_retrain_d3/model_best.pth.tar +3 -0
- pretrained_linear/dinov2_reg_retrain_d3/summary.csv +15 -0
- pretrained_linear/dinov2_retrain_d3/args.yaml +271 -0
- pretrained_linear/dinov2_retrain_d3/model_best.pth.tar +3 -0
- pretrained_linear/dinov2_retrain_d3/summary.csv +14 -0
- pretrained_linear/siglip_retrain_d3/args.yaml +271 -0
- pretrained_linear/siglip_retrain_d3/model_best.pth.tar +3 -0
- pretrained_linear/siglip_retrain_d3/summary.csv +15 -0
- pretrained_linear/vit_tiny_code_retrain_d3/args.yaml +271 -0
- pretrained_linear/vit_tiny_code_retrain_d3/model_best.pth.tar +3 -0
- pretrained_linear/vit_tiny_code_retrain_d3/summary.csv +20 -0
- pretrained_linear/vit_tiny_retrain_d3/args.yaml +271 -0
- pretrained_linear/vit_tiny_retrain_d3/model_best.pth.tar +3 -0
- pretrained_linear/vit_tiny_retrain_d3/summary.csv +16 -0
pretrained_linear/dinov2_reg_retrain_d3/args.yaml
ADDED
|
@@ -0,0 +1,271 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
aa: null
|
| 2 |
+
amp: true
|
| 3 |
+
amp_dtype: float16
|
| 4 |
+
amp_impl: native
|
| 5 |
+
aug_repeats: 0
|
| 6 |
+
aug_splits: 0
|
| 7 |
+
batch_size: 64
|
| 8 |
+
bce_loss: true
|
| 9 |
+
bce_target_thresh: null
|
| 10 |
+
benchmark: false
|
| 11 |
+
blur_max: 2
|
| 12 |
+
blur_min: 0.1
|
| 13 |
+
blur_prob: 0.5
|
| 14 |
+
blur_sig:
|
| 15 |
+
- 0
|
| 16 |
+
- 3.0
|
| 17 |
+
bn_eps: null
|
| 18 |
+
bn_momentum: null
|
| 19 |
+
brightness_max: 2
|
| 20 |
+
brightness_min: 0.5
|
| 21 |
+
channels_last: false
|
| 22 |
+
checkpoint_hist: 10
|
| 23 |
+
cineca: true
|
| 24 |
+
class_map: ''
|
| 25 |
+
classifier:
|
| 26 |
+
- linear
|
| 27 |
+
- knn
|
| 28 |
+
- svm
|
| 29 |
+
clip_grad: null
|
| 30 |
+
clip_mode: norm
|
| 31 |
+
color_jitter: 0.4
|
| 32 |
+
contrast_max: 1.5
|
| 33 |
+
contrast_min: 0.5
|
| 34 |
+
contrastive_loss: false
|
| 35 |
+
cooldown_epochs: 0
|
| 36 |
+
corvi_resnet: false
|
| 37 |
+
crop_max: 512
|
| 38 |
+
crop_min: 64
|
| 39 |
+
crop_pct: null
|
| 40 |
+
cutmix: 0.0
|
| 41 |
+
cutmix_minmax: null
|
| 42 |
+
data: null
|
| 43 |
+
data_dir: /leonardo_scratch/large/userexternal/fcocchi0/deepfake/dataset/webdatasets_elsa_v2
|
| 44 |
+
data_dir_eval_augm: /leonardo_scratch/large/userexternal/fcocchi0/deepfake/dataset/Elsa_datasetv2_test_fix/wds_test_small/transf
|
| 45 |
+
data_dir_eval_no_augm: /leonardo_scratch/large/userexternal/fcocchi0/deepfake/dataset/Elsa_datasetv2_test_fix/wds_test_small/no_transf
|
| 46 |
+
data_generator: null
|
| 47 |
+
data_len_eval: 4800
|
| 48 |
+
data_len_linear: 9600
|
| 49 |
+
data_len_train: null
|
| 50 |
+
dataset: elsa_v2_binarycrossentropy
|
| 51 |
+
dataset_download: false
|
| 52 |
+
dataset_eval: elsa_v2_binarycrossentropy_all_gen
|
| 53 |
+
decay_epochs: 90
|
| 54 |
+
decay_milestones:
|
| 55 |
+
- 90
|
| 56 |
+
- 180
|
| 57 |
+
- 270
|
| 58 |
+
decay_rate: 0.1
|
| 59 |
+
defake: false
|
| 60 |
+
deterministic: true
|
| 61 |
+
dino_crop: false
|
| 62 |
+
dino_head: false
|
| 63 |
+
dino_loss: false
|
| 64 |
+
dino_loss_weight: 0.5
|
| 65 |
+
dino_temp: 0.1
|
| 66 |
+
dist_bn: reduce
|
| 67 |
+
distance: cosine
|
| 68 |
+
double_contrastive: false
|
| 69 |
+
drop: 0.0
|
| 70 |
+
drop_block: null
|
| 71 |
+
drop_connect: null
|
| 72 |
+
drop_path: null
|
| 73 |
+
early_stopping: false
|
| 74 |
+
epoch_repeats: 0.0
|
| 75 |
+
epochs: 150
|
| 76 |
+
epochs_classifier: 1500
|
| 77 |
+
eval_metric: accuracy
|
| 78 |
+
experiment: dinov2reg-linear_d3-augm_prob_0.5-vit_large_patch14_reg4_dinov2.lvd142m_w8_transform_lr-5e-5-batch_size-256_epochs-150_loss-bce_optimizer-adam_fcocchi
|
| 79 |
+
external_transform: true
|
| 80 |
+
fast_norm: false
|
| 81 |
+
fuser: ''
|
| 82 |
+
global_crops_scale:
|
| 83 |
+
- 0.4
|
| 84 |
+
- 1.0
|
| 85 |
+
gp: null
|
| 86 |
+
grad_accum_steps: 1
|
| 87 |
+
grad_checkpointing: false
|
| 88 |
+
head_bottlenck: 256
|
| 89 |
+
head_hidden_dim: 384
|
| 90 |
+
head_init_bias: null
|
| 91 |
+
head_init_scale: null
|
| 92 |
+
head_out: 192
|
| 93 |
+
hflip: 0.5
|
| 94 |
+
img_size: null
|
| 95 |
+
in_chans: null
|
| 96 |
+
infonce_loss_temperature: 0.1
|
| 97 |
+
initial_checkpoint: ''
|
| 98 |
+
input_size:
|
| 99 |
+
- 3
|
| 100 |
+
- 518
|
| 101 |
+
- 518
|
| 102 |
+
interpolation: ''
|
| 103 |
+
jitter_max: 1.5
|
| 104 |
+
jitter_min: 0.5
|
| 105 |
+
job_id: 0
|
| 106 |
+
jpeg_max: 100
|
| 107 |
+
jpeg_min: 30
|
| 108 |
+
jpeg_prob: 0.5
|
| 109 |
+
jsd_loss: false
|
| 110 |
+
ladeda: false
|
| 111 |
+
lambda_loss: 10
|
| 112 |
+
last_crop: false
|
| 113 |
+
layer_decay: null
|
| 114 |
+
linear_pretrained: null
|
| 115 |
+
linear_train_shards: dataset/shards/elsa_v2_train_transf.shards
|
| 116 |
+
load_code: false
|
| 117 |
+
local_crops_scale:
|
| 118 |
+
- 0.05
|
| 119 |
+
- 0.4
|
| 120 |
+
local_rank: 0
|
| 121 |
+
log_interval: 5
|
| 122 |
+
log_wandb: true
|
| 123 |
+
lr: 5.0e-05
|
| 124 |
+
lr_base: 0.1
|
| 125 |
+
lr_base_scale: ''
|
| 126 |
+
lr_base_size: 256
|
| 127 |
+
lr_cycle_decay: 0.5
|
| 128 |
+
lr_cycle_limit: 1
|
| 129 |
+
lr_cycle_mul: 1.0
|
| 130 |
+
lr_k_decay: 1.0
|
| 131 |
+
lr_noise: null
|
| 132 |
+
lr_noise_pct: 0.67
|
| 133 |
+
lr_noise_std: 1.0
|
| 134 |
+
margin: 1
|
| 135 |
+
mean:
|
| 136 |
+
- 0.485
|
| 137 |
+
- 0.456
|
| 138 |
+
- 0.406
|
| 139 |
+
min_lr: 0.0
|
| 140 |
+
mixup: 0.0
|
| 141 |
+
mixup_mode: batch
|
| 142 |
+
mixup_off_epoch: 0
|
| 143 |
+
mixup_prob: 1.0
|
| 144 |
+
mixup_switch_prob: 0.5
|
| 145 |
+
model: vit_large_patch14_reg4_dinov2.lvd142m
|
| 146 |
+
model_ema: false
|
| 147 |
+
model_ema_decay: 0.9998
|
| 148 |
+
model_ema_force_cpu: false
|
| 149 |
+
model_kwargs: {}
|
| 150 |
+
momentum: 0.9
|
| 151 |
+
multiple_evaluations: true
|
| 152 |
+
n_crops: 1
|
| 153 |
+
no_aug: false
|
| 154 |
+
no_ddp_bb: false
|
| 155 |
+
no_prefetcher: true
|
| 156 |
+
no_resume_opt: false
|
| 157 |
+
not_load_input_size: false
|
| 158 |
+
num_classes: null
|
| 159 |
+
num_jobs: 1
|
| 160 |
+
num_step: 6800
|
| 161 |
+
num_transform: 2
|
| 162 |
+
ojha_d3: false
|
| 163 |
+
only_linear_training: true
|
| 164 |
+
only_validate: false
|
| 165 |
+
opacity_max: 1.0
|
| 166 |
+
opacity_min: 0.2
|
| 167 |
+
opt: adam
|
| 168 |
+
opt_betas: null
|
| 169 |
+
opt_eps: null
|
| 170 |
+
opt_kwargs: {}
|
| 171 |
+
output: /leonardo_scratch/large/userexternal/fcocchi0/deepfake/runs
|
| 172 |
+
overlay_max: 0.35
|
| 173 |
+
overlay_min: 0.05
|
| 174 |
+
pad_max: 0.25
|
| 175 |
+
pad_min: 0.01
|
| 176 |
+
patience_counter: 0
|
| 177 |
+
patience_epochs: 5
|
| 178 |
+
permutation_fake: false
|
| 179 |
+
permutation_real: false
|
| 180 |
+
pin_mem: false
|
| 181 |
+
pix_max: 1
|
| 182 |
+
pix_min: 0.3
|
| 183 |
+
plot_freq: 5
|
| 184 |
+
pretrained: true
|
| 185 |
+
random_crop: false
|
| 186 |
+
random_grayscale_prob: 0.01
|
| 187 |
+
ratio:
|
| 188 |
+
- 0.75
|
| 189 |
+
- 1.3333333333333333
|
| 190 |
+
ratio_max: 2
|
| 191 |
+
ratio_min: 0.75
|
| 192 |
+
real_centering_loss: false
|
| 193 |
+
recount: 1
|
| 194 |
+
recovery_interval: 0
|
| 195 |
+
remode: pixel
|
| 196 |
+
reprob: 0.0
|
| 197 |
+
resize_max: 512
|
| 198 |
+
resize_min: 64
|
| 199 |
+
resplit: false
|
| 200 |
+
resume: ''
|
| 201 |
+
rotatio_max: 270
|
| 202 |
+
rotatio_min: 90
|
| 203 |
+
saturation_max: 1.5
|
| 204 |
+
saturation_min: 0.5
|
| 205 |
+
save_images: false
|
| 206 |
+
save_model_linear: false
|
| 207 |
+
scale:
|
| 208 |
+
- 0.08
|
| 209 |
+
- 1.0
|
| 210 |
+
scale_max: 1.5
|
| 211 |
+
scale_min: 0.5
|
| 212 |
+
sched: plateau
|
| 213 |
+
sched_on_updates: false
|
| 214 |
+
seed: 42
|
| 215 |
+
sharp_max: 2.0
|
| 216 |
+
sharp_min: 1.2
|
| 217 |
+
shuffle_max: 0.35
|
| 218 |
+
shuffle_min: 0.0
|
| 219 |
+
skew_max: 1.0
|
| 220 |
+
skew_min: -1.0
|
| 221 |
+
smoothing: 0.0
|
| 222 |
+
split_bn: false
|
| 223 |
+
start_epoch: null
|
| 224 |
+
std:
|
| 225 |
+
- 0.229
|
| 226 |
+
- 0.224
|
| 227 |
+
- 0.225
|
| 228 |
+
step: 5
|
| 229 |
+
sup_contrastive_loss: false
|
| 230 |
+
suppl: false
|
| 231 |
+
sync_bn: true
|
| 232 |
+
synchronize_step: false
|
| 233 |
+
teacher_temp: 0.07
|
| 234 |
+
teacher_temp_fix: false
|
| 235 |
+
test_augm: false
|
| 236 |
+
test_shards_augm: dataset/shards/coco-test-dict.shards
|
| 237 |
+
test_shards_no_augm: dataset/shards/coco-test-dict.shards
|
| 238 |
+
threshold_plateau: 0.001
|
| 239 |
+
torchcompile: null
|
| 240 |
+
torchscript: false
|
| 241 |
+
train_interpolation: random
|
| 242 |
+
train_shards: dataset/shards/elsav2-training.shards
|
| 243 |
+
train_split: train
|
| 244 |
+
triplet_loss: false
|
| 245 |
+
tta: 0
|
| 246 |
+
use_multi_epochs_loader: false
|
| 247 |
+
val: false
|
| 248 |
+
val_shards_augm: dataset/shards/validation_set-transf-elsav2.shards
|
| 249 |
+
val_shards_no_augm: dataset/shards/validation_set-no_transf-elsav2.shards
|
| 250 |
+
val_split: validation
|
| 251 |
+
validation_batch_size: 50
|
| 252 |
+
vflip: 0.0
|
| 253 |
+
wandb_entity: lorenzo_b_master_thesis
|
| 254 |
+
wandb_group: null
|
| 255 |
+
wandb_id: null
|
| 256 |
+
wandb_logging: false
|
| 257 |
+
wandb_name: null
|
| 258 |
+
wandb_notes: null
|
| 259 |
+
wandb_project_name: contrastive-fake
|
| 260 |
+
wandb_resume: allow
|
| 261 |
+
warmup_epochs: 0
|
| 262 |
+
warmup_lr: 1.0e-06
|
| 263 |
+
warmup_prefix: false
|
| 264 |
+
warmup_teacher_temp: 0.04
|
| 265 |
+
warmup_teacher_temp_epochs: 30
|
| 266 |
+
watermark_prob: 0.2
|
| 267 |
+
weight_decay: 2.0e-05
|
| 268 |
+
weight_decay_end: null
|
| 269 |
+
worker_seeding: all
|
| 270 |
+
workers: 8
|
| 271 |
+
workers_validate: 3
|
pretrained_linear/dinov2_reg_retrain_d3/model_best.pth.tar
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2f200a9647877efd001ee47dfb0cb7c181038a5b19a44c2833049c0207950bfb
|
| 3 |
+
size 1217633268
|
pretrained_linear/dinov2_reg_retrain_d3/summary.csv
ADDED
|
@@ -0,0 +1,15 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epoch,train_loss,train_loss_contrastive_1,train_loss_contrastive_2,train_loss_dino,train_loss_mse,eval_loss,eval_loss_contrastive_1,eval_loss_contrastive_2,eval_loss_dino,eval_top1_tot,eval_top1_real,eval_top1_f0,eval_top1_f1,eval_top1_f2,eval_top1_f3,eval_accuracy,lr
|
| 2 |
+
0,0.4270891603301553,0.4270891603301553,0.0,0.0,0.0,0.3398622473080953,0.3398622473080953,0.0,0.0,0.8586249972383181,0.7591666628917059,0.7466666673620542,0.8956249952316284,0.9114583258827528,0.9802083522081375,0.8586249972383181,5e-05
|
| 3 |
+
1,0.3588951288777239,0.3588951288777239,0.0,0.0,0.0,0.32810890922943753,0.32810890922943753,0.0,0.0,0.8607916757464409,0.7891666616002718,0.7345833306511244,0.8906249925494194,0.909791665772597,0.9797916834553083,0.8607916757464409,5e-05
|
| 4 |
+
2,0.3471918925204698,0.3471918925204698,0.0,0.0,0.0,0.3279983016351859,0.3279983016351859,0.0,0.0,0.8601250027616819,0.8041666646798452,0.7343749925494194,0.8827083284656206,0.9014583205183347,0.9779166852434477,0.8601250027616819,5e-05
|
| 5 |
+
3,0.3418740119127666,0.3418740119127666,0.0,0.0,0.0,0.32968178018927574,0.32968178018927574,0.0,0.0,0.8573749909798304,0.8102083280682564,0.7258333265781403,0.876666655143102,0.8958333159486452,0.97833335151275,0.8573749909798304,5e-05
|
| 6 |
+
4,0.3402972218635328,0.3402972218635328,0.0,0.0,0.0,0.33015526706973713,0.33015526706973713,0.0,0.0,0.8566249931852022,0.812291661898295,0.7249999965230624,0.8731249844034513,0.8952083165446917,0.9775000189741453,0.8566249931852022,5e-05
|
| 7 |
+
5,0.3397858255816733,0.3397858255816733,0.0,0.0,0.0,0.3304978149632613,0.3304978149632613,0.0,0.0,0.8560416723291079,0.8133333226044973,0.7247916584213575,0.8722916568319002,0.8929166495800018,0.9768750220537186,0.8560416723291079,5e-05
|
| 8 |
+
6,0.33837131336331366,0.33837131336331366,0.0,0.0,0.0,0.3342321266730626,0.3342321266730626,0.0,0.0,0.8535000036160151,0.8174999877810478,0.716249999900659,0.8677083253860474,0.8899999856948853,0.9760416895151138,0.8535000036160151,5e-05
|
| 9 |
+
7,0.3367009612457717,0.3367009612457717,0.0,0.0,0.0,0.3338993216554324,0.3338993216554324,0.0,0.0,0.8542916675408682,0.8179166540503502,0.719374991953373,0.86749999721845,0.8912499845027924,0.9754166901111603,0.8542916675408682,5e-05
|
| 10 |
+
8,0.3396024629035417,0.3396024629035417,0.0,0.0,0.0,0.3347433991730213,0.3347433991730213,0.0,0.0,0.8532916679978371,0.8187499865889549,0.7172916606068611,0.8656249965230624,0.8895833169420561,0.9752083569765091,0.8532916679978371,5e-06
|
| 11 |
+
9,0.33822163167026115,0.33822163167026115,0.0,0.0,0.0,0.3339970335364342,0.3339970335364342,0.0,0.0,0.8541666691501936,0.8185416534543037,0.719583327571551,0.8662499934434891,0.8904166519641876,0.9760416895151138,0.8541666691501936,5e-06
|
| 12 |
+
10,0.33892199272180307,0.33892199272180307,0.0,0.0,0.0,0.33424188445011777,0.33424188445011777,0.0,0.0,0.8541666641831398,0.8187499865889549,0.7189583281675974,0.8664583265781403,0.8904166494806608,0.976250022649765,0.8541666641831398,5e-06
|
| 13 |
+
11,0.33800992470453767,0.33800992470453767,0.0,0.0,0.0,0.33405251676837605,0.33405251676837605,0.0,0.0,0.8543333311875662,0.8185416534543037,0.719583327571551,0.8664583265781403,0.8906249850988388,0.9764583557844162,0.8543333311875662,5e-06
|
| 14 |
+
12,0.33754491546355625,0.33754491546355625,0.0,0.0,0.0,0.33390598247448605,0.33390598247448605,0.0,0.0,0.8538333252072334,0.8179166515668234,0.719583327571551,0.8654166609048843,0.8902083188295364,0.9760416895151138,0.8538333252072334,5e-06
|
| 15 |
+
13,0.3365888311253751,0.3365888311253751,0.0,0.0,0.0,0.33463675901293755,0.33463675901293755,0.0,0.0,0.8533749878406525,0.8185416509707769,0.7181249931454659,0.864999994635582,0.8891666531562805,0.9760416895151138,0.8533749878406525,5e-06
|
pretrained_linear/dinov2_retrain_d3/args.yaml
ADDED
|
@@ -0,0 +1,271 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
aa: null
|
| 2 |
+
amp: true
|
| 3 |
+
amp_dtype: float16
|
| 4 |
+
amp_impl: native
|
| 5 |
+
aug_repeats: 0
|
| 6 |
+
aug_splits: 0
|
| 7 |
+
batch_size: 64
|
| 8 |
+
bce_loss: true
|
| 9 |
+
bce_target_thresh: null
|
| 10 |
+
benchmark: false
|
| 11 |
+
blur_max: 2
|
| 12 |
+
blur_min: 0.1
|
| 13 |
+
blur_prob: 0.5
|
| 14 |
+
blur_sig:
|
| 15 |
+
- 0
|
| 16 |
+
- 3.0
|
| 17 |
+
bn_eps: null
|
| 18 |
+
bn_momentum: null
|
| 19 |
+
brightness_max: 2
|
| 20 |
+
brightness_min: 0.5
|
| 21 |
+
channels_last: false
|
| 22 |
+
checkpoint_hist: 10
|
| 23 |
+
cineca: true
|
| 24 |
+
class_map: ''
|
| 25 |
+
classifier:
|
| 26 |
+
- linear
|
| 27 |
+
- knn
|
| 28 |
+
- svm
|
| 29 |
+
clip_grad: null
|
| 30 |
+
clip_mode: norm
|
| 31 |
+
color_jitter: 0.4
|
| 32 |
+
contrast_max: 1.5
|
| 33 |
+
contrast_min: 0.5
|
| 34 |
+
contrastive_loss: false
|
| 35 |
+
cooldown_epochs: 0
|
| 36 |
+
corvi_resnet: false
|
| 37 |
+
crop_max: 512
|
| 38 |
+
crop_min: 64
|
| 39 |
+
crop_pct: null
|
| 40 |
+
cutmix: 0.0
|
| 41 |
+
cutmix_minmax: null
|
| 42 |
+
data: null
|
| 43 |
+
data_dir: /leonardo_scratch/large/userexternal/fcocchi0/deepfake/dataset/webdatasets_elsa_v2
|
| 44 |
+
data_dir_eval_augm: /leonardo_scratch/large/userexternal/fcocchi0/deepfake/dataset/Elsa_datasetv2_test_fix/wds_test_small/transf
|
| 45 |
+
data_dir_eval_no_augm: /leonardo_scratch/large/userexternal/fcocchi0/deepfake/dataset/Elsa_datasetv2_test_fix/wds_test_small/no_transf
|
| 46 |
+
data_generator: null
|
| 47 |
+
data_len_eval: 4800
|
| 48 |
+
data_len_linear: 9600
|
| 49 |
+
data_len_train: null
|
| 50 |
+
dataset: elsa_v2_binarycrossentropy
|
| 51 |
+
dataset_download: false
|
| 52 |
+
dataset_eval: elsa_v2_binarycrossentropy_all_gen
|
| 53 |
+
decay_epochs: 90
|
| 54 |
+
decay_milestones:
|
| 55 |
+
- 90
|
| 56 |
+
- 180
|
| 57 |
+
- 270
|
| 58 |
+
decay_rate: 0.1
|
| 59 |
+
defake: false
|
| 60 |
+
deterministic: true
|
| 61 |
+
dino_crop: false
|
| 62 |
+
dino_head: false
|
| 63 |
+
dino_loss: false
|
| 64 |
+
dino_loss_weight: 0.5
|
| 65 |
+
dino_temp: 0.1
|
| 66 |
+
dist_bn: reduce
|
| 67 |
+
distance: cosine
|
| 68 |
+
double_contrastive: false
|
| 69 |
+
drop: 0.0
|
| 70 |
+
drop_block: null
|
| 71 |
+
drop_connect: null
|
| 72 |
+
drop_path: null
|
| 73 |
+
early_stopping: false
|
| 74 |
+
epoch_repeats: 0.0
|
| 75 |
+
epochs: 150
|
| 76 |
+
epochs_classifier: 1500
|
| 77 |
+
eval_metric: accuracy
|
| 78 |
+
experiment: dinov2-linear_d3-augm_prob_0.5-vit_large_patch14_dinov2.lvd142m_w8_transform_lr-5e-5-batch_size-256_epochs-150_loss-bce_optimizer-adam_fcocchi
|
| 79 |
+
external_transform: true
|
| 80 |
+
fast_norm: false
|
| 81 |
+
fuser: ''
|
| 82 |
+
global_crops_scale:
|
| 83 |
+
- 0.4
|
| 84 |
+
- 1.0
|
| 85 |
+
gp: null
|
| 86 |
+
grad_accum_steps: 1
|
| 87 |
+
grad_checkpointing: false
|
| 88 |
+
head_bottlenck: 256
|
| 89 |
+
head_hidden_dim: 384
|
| 90 |
+
head_init_bias: null
|
| 91 |
+
head_init_scale: null
|
| 92 |
+
head_out: 192
|
| 93 |
+
hflip: 0.5
|
| 94 |
+
img_size: null
|
| 95 |
+
in_chans: null
|
| 96 |
+
infonce_loss_temperature: 0.1
|
| 97 |
+
initial_checkpoint: ''
|
| 98 |
+
input_size:
|
| 99 |
+
- 3
|
| 100 |
+
- 518
|
| 101 |
+
- 518
|
| 102 |
+
interpolation: ''
|
| 103 |
+
jitter_max: 1.5
|
| 104 |
+
jitter_min: 0.5
|
| 105 |
+
job_id: 0
|
| 106 |
+
jpeg_max: 100
|
| 107 |
+
jpeg_min: 30
|
| 108 |
+
jpeg_prob: 0.5
|
| 109 |
+
jsd_loss: false
|
| 110 |
+
ladeda: false
|
| 111 |
+
lambda_loss: 10
|
| 112 |
+
last_crop: false
|
| 113 |
+
layer_decay: null
|
| 114 |
+
linear_pretrained: null
|
| 115 |
+
linear_train_shards: dataset/shards/elsa_v2_train_transf.shards
|
| 116 |
+
load_code: false
|
| 117 |
+
local_crops_scale:
|
| 118 |
+
- 0.05
|
| 119 |
+
- 0.4
|
| 120 |
+
local_rank: 0
|
| 121 |
+
log_interval: 5
|
| 122 |
+
log_wandb: true
|
| 123 |
+
lr: 5.0e-05
|
| 124 |
+
lr_base: 0.1
|
| 125 |
+
lr_base_scale: ''
|
| 126 |
+
lr_base_size: 256
|
| 127 |
+
lr_cycle_decay: 0.5
|
| 128 |
+
lr_cycle_limit: 1
|
| 129 |
+
lr_cycle_mul: 1.0
|
| 130 |
+
lr_k_decay: 1.0
|
| 131 |
+
lr_noise: null
|
| 132 |
+
lr_noise_pct: 0.67
|
| 133 |
+
lr_noise_std: 1.0
|
| 134 |
+
margin: 1
|
| 135 |
+
mean:
|
| 136 |
+
- 0.485
|
| 137 |
+
- 0.456
|
| 138 |
+
- 0.406
|
| 139 |
+
min_lr: 0.0
|
| 140 |
+
mixup: 0.0
|
| 141 |
+
mixup_mode: batch
|
| 142 |
+
mixup_off_epoch: 0
|
| 143 |
+
mixup_prob: 1.0
|
| 144 |
+
mixup_switch_prob: 0.5
|
| 145 |
+
model: vit_large_patch14_dinov2.lvd142m
|
| 146 |
+
model_ema: false
|
| 147 |
+
model_ema_decay: 0.9998
|
| 148 |
+
model_ema_force_cpu: false
|
| 149 |
+
model_kwargs: {}
|
| 150 |
+
momentum: 0.9
|
| 151 |
+
multiple_evaluations: true
|
| 152 |
+
n_crops: 1
|
| 153 |
+
no_aug: false
|
| 154 |
+
no_ddp_bb: false
|
| 155 |
+
no_prefetcher: true
|
| 156 |
+
no_resume_opt: false
|
| 157 |
+
not_load_input_size: false
|
| 158 |
+
num_classes: null
|
| 159 |
+
num_jobs: 1
|
| 160 |
+
num_step: 6800
|
| 161 |
+
num_transform: 2
|
| 162 |
+
ojha_d3: false
|
| 163 |
+
only_linear_training: true
|
| 164 |
+
only_validate: false
|
| 165 |
+
opacity_max: 1.0
|
| 166 |
+
opacity_min: 0.2
|
| 167 |
+
opt: adam
|
| 168 |
+
opt_betas: null
|
| 169 |
+
opt_eps: null
|
| 170 |
+
opt_kwargs: {}
|
| 171 |
+
output: /leonardo_scratch/large/userexternal/fcocchi0/deepfake/runs
|
| 172 |
+
overlay_max: 0.35
|
| 173 |
+
overlay_min: 0.05
|
| 174 |
+
pad_max: 0.25
|
| 175 |
+
pad_min: 0.01
|
| 176 |
+
patience_counter: 0
|
| 177 |
+
patience_epochs: 5
|
| 178 |
+
permutation_fake: false
|
| 179 |
+
permutation_real: false
|
| 180 |
+
pin_mem: false
|
| 181 |
+
pix_max: 1
|
| 182 |
+
pix_min: 0.3
|
| 183 |
+
plot_freq: 5
|
| 184 |
+
pretrained: true
|
| 185 |
+
random_crop: false
|
| 186 |
+
random_grayscale_prob: 0.01
|
| 187 |
+
ratio:
|
| 188 |
+
- 0.75
|
| 189 |
+
- 1.3333333333333333
|
| 190 |
+
ratio_max: 2
|
| 191 |
+
ratio_min: 0.75
|
| 192 |
+
real_centering_loss: false
|
| 193 |
+
recount: 1
|
| 194 |
+
recovery_interval: 0
|
| 195 |
+
remode: pixel
|
| 196 |
+
reprob: 0.0
|
| 197 |
+
resize_max: 512
|
| 198 |
+
resize_min: 64
|
| 199 |
+
resplit: false
|
| 200 |
+
resume: ''
|
| 201 |
+
rotatio_max: 270
|
| 202 |
+
rotatio_min: 90
|
| 203 |
+
saturation_max: 1.5
|
| 204 |
+
saturation_min: 0.5
|
| 205 |
+
save_images: false
|
| 206 |
+
save_model_linear: false
|
| 207 |
+
scale:
|
| 208 |
+
- 0.08
|
| 209 |
+
- 1.0
|
| 210 |
+
scale_max: 1.5
|
| 211 |
+
scale_min: 0.5
|
| 212 |
+
sched: plateau
|
| 213 |
+
sched_on_updates: false
|
| 214 |
+
seed: 42
|
| 215 |
+
sharp_max: 2.0
|
| 216 |
+
sharp_min: 1.2
|
| 217 |
+
shuffle_max: 0.35
|
| 218 |
+
shuffle_min: 0.0
|
| 219 |
+
skew_max: 1.0
|
| 220 |
+
skew_min: -1.0
|
| 221 |
+
smoothing: 0.0
|
| 222 |
+
split_bn: false
|
| 223 |
+
start_epoch: null
|
| 224 |
+
std:
|
| 225 |
+
- 0.229
|
| 226 |
+
- 0.224
|
| 227 |
+
- 0.225
|
| 228 |
+
step: 5
|
| 229 |
+
sup_contrastive_loss: false
|
| 230 |
+
suppl: false
|
| 231 |
+
sync_bn: true
|
| 232 |
+
synchronize_step: false
|
| 233 |
+
teacher_temp: 0.07
|
| 234 |
+
teacher_temp_fix: false
|
| 235 |
+
test_augm: false
|
| 236 |
+
test_shards_augm: dataset/shards/coco-test-dict.shards
|
| 237 |
+
test_shards_no_augm: dataset/shards/coco-test-dict.shards
|
| 238 |
+
threshold_plateau: 0.001
|
| 239 |
+
torchcompile: null
|
| 240 |
+
torchscript: false
|
| 241 |
+
train_interpolation: random
|
| 242 |
+
train_shards: dataset/shards/elsav2-training.shards
|
| 243 |
+
train_split: train
|
| 244 |
+
triplet_loss: false
|
| 245 |
+
tta: 0
|
| 246 |
+
use_multi_epochs_loader: false
|
| 247 |
+
val: false
|
| 248 |
+
val_shards_augm: dataset/shards/validation_set-transf-elsav2.shards
|
| 249 |
+
val_shards_no_augm: dataset/shards/validation_set-no_transf-elsav2.shards
|
| 250 |
+
val_split: validation
|
| 251 |
+
validation_batch_size: 50
|
| 252 |
+
vflip: 0.0
|
| 253 |
+
wandb_entity: lorenzo_b_master_thesis
|
| 254 |
+
wandb_group: null
|
| 255 |
+
wandb_id: null
|
| 256 |
+
wandb_logging: false
|
| 257 |
+
wandb_name: null
|
| 258 |
+
wandb_notes: null
|
| 259 |
+
wandb_project_name: contrastive-fake
|
| 260 |
+
wandb_resume: allow
|
| 261 |
+
warmup_epochs: 0
|
| 262 |
+
warmup_lr: 1.0e-06
|
| 263 |
+
warmup_prefix: false
|
| 264 |
+
warmup_teacher_temp: 0.04
|
| 265 |
+
warmup_teacher_temp_epochs: 30
|
| 266 |
+
watermark_prob: 0.2
|
| 267 |
+
weight_decay: 2.0e-05
|
| 268 |
+
weight_decay_end: null
|
| 269 |
+
worker_seeding: all
|
| 270 |
+
workers: 8
|
| 271 |
+
workers_validate: 3
|
pretrained_linear/dinov2_retrain_d3/model_best.pth.tar
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2ce63ed647d40b3b5d71653d5b9b5e7a83a7fbf1af8581dcc2b1cf6415dc5b99
|
| 3 |
+
size 1217620662
|
pretrained_linear/dinov2_retrain_d3/summary.csv
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epoch,train_loss,train_loss_contrastive_1,train_loss_contrastive_2,train_loss_dino,train_loss_mse,eval_loss,eval_loss_contrastive_1,eval_loss_contrastive_2,eval_loss_dino,eval_top1_tot,eval_top1_real,eval_top1_f0,eval_top1_f1,eval_top1_f2,eval_top1_f3,eval_accuracy,lr
|
| 2 |
+
0,0.40779598109862386,0.40779598109862386,0.0,0.0,0.0,0.32200923189520836,0.32200923189520836,0.0,0.0,0.8652499988675117,0.766041673719883,0.7824999913573265,0.8802083333333334,0.916666661699613,0.9808333516120911,0.8652499988675117,5e-05
|
| 3 |
+
1,0.35053964555263517,0.35053964555263517,0.0,0.0,0.0,0.3143559818466504,0.3143559818466504,0.0,0.0,0.8659166743357977,0.7720833246906599,0.7914583285649618,0.8731249968210856,0.9108333314458529,0.9820833504199982,0.8659166743357977,5e-05
|
| 4 |
+
2,0.34292491872740144,0.34292491872740144,0.0,0.0,0.0,0.31599651897946995,0.31599651897946995,0.0,0.0,0.8627916673819224,0.7710416689515114,0.7904166604081789,0.8681249966224035,0.9043749868869781,0.9800000190734863,0.8627916673819224,5e-05
|
| 5 |
+
3,0.3417624373755911,0.3417624373755911,0.0,0.0,0.0,0.31639740616083145,0.31639740616083145,0.0,0.0,0.8628749921917915,0.7706249927481016,0.793958326180776,0.8668749953309695,0.9027083242932955,0.9802083522081375,0.8628749921917915,5e-05
|
| 6 |
+
4,0.3424564203356995,0.3424564203356995,0.0,0.0,0.0,0.31380850573380786,0.31380850573380786,0.0,0.0,0.8637500007947286,0.7687499995032946,0.7987499932448069,0.8658333296577135,0.9047916556398073,0.9806250184774399,0.8637500007947286,5e-05
|
| 7 |
+
5,0.34277600281159665,0.34277600281159665,0.0,0.0,0.0,0.3148735302189986,0.3148735302189986,0.0,0.0,0.8623333250482877,0.7685416638851166,0.7960416600108147,0.863958328962326,0.9020833224058151,0.9810416847467422,0.8623333250482877,5e-05
|
| 8 |
+
6,0.3431625930044581,0.3431625930044581,0.0,0.0,0.0,0.31514046092828113,0.31514046092828113,0.0,0.0,0.8631666675209999,0.7745833347241083,0.7968749950329462,0.8608333294590315,0.9037499899665514,0.9797916859388351,0.8631666675209999,5e-05
|
| 9 |
+
7,0.34295197775697006,0.34295197775697006,0.0,0.0,0.0,0.3158290758728981,0.3158290758728981,0.0,0.0,0.8624999945362409,0.7737499997019768,0.7937499930461248,0.8620833307504654,0.903333326180776,0.979583352804184,0.8624999945362409,5e-06
|
| 10 |
+
8,0.3403211101780043,0.3403211101780043,0.0,0.0,0.0,0.31419028465946514,0.31419028465946514,0.0,0.0,0.8633333245913187,0.7704166620969772,0.796458326280117,0.8649999996026357,0.9052083243926367,0.979583352804184,0.8633333245913187,5e-06
|
| 11 |
+
9,0.34168748154359707,0.34168748154359707,0.0,0.0,0.0,0.3151494575043519,0.3151494575043519,0.0,0.0,0.8635416626930237,0.77374999721845,0.7956249937415123,0.8643750001986822,0.9041666562358538,0.9797916859388351,0.8635416626930237,5e-06
|
| 12 |
+
10,0.34067836066379265,0.34067836066379265,0.0,0.0,0.0,0.31461643303434056,0.31461643303434056,0.0,0.0,0.8639166603485743,0.7716666658719381,0.7991666570305824,0.8643749952316284,0.9047916581233343,0.979583352804184,0.8639166603485743,5e-06
|
| 13 |
+
11,0.3410450046772466,0.3410450046772466,0.0,0.0,0.0,0.31480051080385846,0.31480051080385846,0.0,0.0,0.8635833313067754,0.7720833321412405,0.7972916563351949,0.8627083326379458,0.9052083243926367,0.9806250184774399,0.8635833313067754,5e-06
|
| 14 |
+
12,0.3398179399178309,0.3398179399178309,0.0,0.0,0.0,0.3150838501751423,0.3150838501751423,0.0,0.0,0.8636249924699465,0.7735416616002718,0.7972916563351949,0.862916665772597,0.9047916556398073,0.979583352804184,0.8636249924699465,5e-06
|
pretrained_linear/siglip_retrain_d3/args.yaml
ADDED
|
@@ -0,0 +1,271 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
aa: null
|
| 2 |
+
amp: true
|
| 3 |
+
amp_dtype: float16
|
| 4 |
+
amp_impl: native
|
| 5 |
+
aug_repeats: 0
|
| 6 |
+
aug_splits: 0
|
| 7 |
+
batch_size: 64
|
| 8 |
+
bce_loss: true
|
| 9 |
+
bce_target_thresh: null
|
| 10 |
+
benchmark: false
|
| 11 |
+
blur_max: 2
|
| 12 |
+
blur_min: 0.1
|
| 13 |
+
blur_prob: 0.5
|
| 14 |
+
blur_sig:
|
| 15 |
+
- 0
|
| 16 |
+
- 3.0
|
| 17 |
+
bn_eps: null
|
| 18 |
+
bn_momentum: null
|
| 19 |
+
brightness_max: 2
|
| 20 |
+
brightness_min: 0.5
|
| 21 |
+
channels_last: false
|
| 22 |
+
checkpoint_hist: 10
|
| 23 |
+
cineca: true
|
| 24 |
+
class_map: ''
|
| 25 |
+
classifier:
|
| 26 |
+
- linear
|
| 27 |
+
- knn
|
| 28 |
+
- svm
|
| 29 |
+
clip_grad: null
|
| 30 |
+
clip_mode: norm
|
| 31 |
+
color_jitter: 0.4
|
| 32 |
+
contrast_max: 1.5
|
| 33 |
+
contrast_min: 0.5
|
| 34 |
+
contrastive_loss: false
|
| 35 |
+
cooldown_epochs: 0
|
| 36 |
+
corvi_resnet: false
|
| 37 |
+
crop_max: 512
|
| 38 |
+
crop_min: 64
|
| 39 |
+
crop_pct: null
|
| 40 |
+
cutmix: 0.0
|
| 41 |
+
cutmix_minmax: null
|
| 42 |
+
data: null
|
| 43 |
+
data_dir: /leonardo_scratch/large/userexternal/fcocchi0/deepfake/dataset/webdatasets_elsa_v2
|
| 44 |
+
data_dir_eval_augm: /leonardo_scratch/large/userexternal/fcocchi0/deepfake/dataset/Elsa_datasetv2_test_fix/wds_test_small/transf
|
| 45 |
+
data_dir_eval_no_augm: /leonardo_scratch/large/userexternal/fcocchi0/deepfake/dataset/Elsa_datasetv2_test_fix/wds_test_small/no_transf
|
| 46 |
+
data_generator: null
|
| 47 |
+
data_len_eval: 4800
|
| 48 |
+
data_len_linear: 9600
|
| 49 |
+
data_len_train: null
|
| 50 |
+
dataset: elsa_v2_binarycrossentropy
|
| 51 |
+
dataset_download: false
|
| 52 |
+
dataset_eval: elsa_v2_binarycrossentropy_all_gen
|
| 53 |
+
decay_epochs: 90
|
| 54 |
+
decay_milestones:
|
| 55 |
+
- 90
|
| 56 |
+
- 180
|
| 57 |
+
- 270
|
| 58 |
+
decay_rate: 0.1
|
| 59 |
+
defake: false
|
| 60 |
+
deterministic: true
|
| 61 |
+
dino_crop: false
|
| 62 |
+
dino_head: false
|
| 63 |
+
dino_loss: false
|
| 64 |
+
dino_loss_weight: 0.5
|
| 65 |
+
dino_temp: 0.1
|
| 66 |
+
dist_bn: reduce
|
| 67 |
+
distance: cosine
|
| 68 |
+
double_contrastive: false
|
| 69 |
+
drop: 0.0
|
| 70 |
+
drop_block: null
|
| 71 |
+
drop_connect: null
|
| 72 |
+
drop_path: null
|
| 73 |
+
early_stopping: false
|
| 74 |
+
epoch_repeats: 0.0
|
| 75 |
+
epochs: 150
|
| 76 |
+
epochs_classifier: 1500
|
| 77 |
+
eval_metric: accuracy
|
| 78 |
+
experiment: siglip-linear_d3-augm_prob_0.5-vit_large_patch16_siglip_384_w8_transform_lr-5e-5-batch_size-256_epochs-150_loss-bce_optimizer-adam_fcocchi
|
| 79 |
+
external_transform: true
|
| 80 |
+
fast_norm: false
|
| 81 |
+
fuser: ''
|
| 82 |
+
global_crops_scale:
|
| 83 |
+
- 0.4
|
| 84 |
+
- 1.0
|
| 85 |
+
gp: null
|
| 86 |
+
grad_accum_steps: 1
|
| 87 |
+
grad_checkpointing: false
|
| 88 |
+
head_bottlenck: 256
|
| 89 |
+
head_hidden_dim: 384
|
| 90 |
+
head_init_bias: null
|
| 91 |
+
head_init_scale: null
|
| 92 |
+
head_out: 192
|
| 93 |
+
hflip: 0.5
|
| 94 |
+
img_size: null
|
| 95 |
+
in_chans: null
|
| 96 |
+
infonce_loss_temperature: 0.1
|
| 97 |
+
initial_checkpoint: ''
|
| 98 |
+
input_size:
|
| 99 |
+
- 3
|
| 100 |
+
- 384
|
| 101 |
+
- 384
|
| 102 |
+
interpolation: ''
|
| 103 |
+
jitter_max: 1.5
|
| 104 |
+
jitter_min: 0.5
|
| 105 |
+
job_id: 0
|
| 106 |
+
jpeg_max: 100
|
| 107 |
+
jpeg_min: 30
|
| 108 |
+
jpeg_prob: 0.5
|
| 109 |
+
jsd_loss: false
|
| 110 |
+
ladeda: false
|
| 111 |
+
lambda_loss: 10
|
| 112 |
+
last_crop: false
|
| 113 |
+
layer_decay: null
|
| 114 |
+
linear_pretrained: null
|
| 115 |
+
linear_train_shards: dataset/shards/elsa_v2_train_transf.shards
|
| 116 |
+
load_code: false
|
| 117 |
+
local_crops_scale:
|
| 118 |
+
- 0.05
|
| 119 |
+
- 0.4
|
| 120 |
+
local_rank: 0
|
| 121 |
+
log_interval: 5
|
| 122 |
+
log_wandb: true
|
| 123 |
+
lr: 5.0e-05
|
| 124 |
+
lr_base: 0.1
|
| 125 |
+
lr_base_scale: ''
|
| 126 |
+
lr_base_size: 256
|
| 127 |
+
lr_cycle_decay: 0.5
|
| 128 |
+
lr_cycle_limit: 1
|
| 129 |
+
lr_cycle_mul: 1.0
|
| 130 |
+
lr_k_decay: 1.0
|
| 131 |
+
lr_noise: null
|
| 132 |
+
lr_noise_pct: 0.67
|
| 133 |
+
lr_noise_std: 1.0
|
| 134 |
+
margin: 1
|
| 135 |
+
mean:
|
| 136 |
+
- 0.485
|
| 137 |
+
- 0.456
|
| 138 |
+
- 0.406
|
| 139 |
+
min_lr: 0.0
|
| 140 |
+
mixup: 0.0
|
| 141 |
+
mixup_mode: batch
|
| 142 |
+
mixup_off_epoch: 0
|
| 143 |
+
mixup_prob: 1.0
|
| 144 |
+
mixup_switch_prob: 0.5
|
| 145 |
+
model: vit_large_patch16_siglip_384
|
| 146 |
+
model_ema: false
|
| 147 |
+
model_ema_decay: 0.9998
|
| 148 |
+
model_ema_force_cpu: false
|
| 149 |
+
model_kwargs: {}
|
| 150 |
+
momentum: 0.9
|
| 151 |
+
multiple_evaluations: true
|
| 152 |
+
n_crops: 1
|
| 153 |
+
no_aug: false
|
| 154 |
+
no_ddp_bb: false
|
| 155 |
+
no_prefetcher: true
|
| 156 |
+
no_resume_opt: false
|
| 157 |
+
not_load_input_size: false
|
| 158 |
+
num_classes: null
|
| 159 |
+
num_jobs: 1
|
| 160 |
+
num_step: 6800
|
| 161 |
+
num_transform: 2
|
| 162 |
+
ojha_d3: false
|
| 163 |
+
only_linear_training: true
|
| 164 |
+
only_validate: false
|
| 165 |
+
opacity_max: 1.0
|
| 166 |
+
opacity_min: 0.2
|
| 167 |
+
opt: adam
|
| 168 |
+
opt_betas: null
|
| 169 |
+
opt_eps: null
|
| 170 |
+
opt_kwargs: {}
|
| 171 |
+
output: /leonardo_scratch/large/userexternal/fcocchi0/deepfake/runs
|
| 172 |
+
overlay_max: 0.35
|
| 173 |
+
overlay_min: 0.05
|
| 174 |
+
pad_max: 0.25
|
| 175 |
+
pad_min: 0.01
|
| 176 |
+
patience_counter: 0
|
| 177 |
+
patience_epochs: 5
|
| 178 |
+
permutation_fake: false
|
| 179 |
+
permutation_real: false
|
| 180 |
+
pin_mem: false
|
| 181 |
+
pix_max: 1
|
| 182 |
+
pix_min: 0.3
|
| 183 |
+
plot_freq: 5
|
| 184 |
+
pretrained: true
|
| 185 |
+
random_crop: false
|
| 186 |
+
random_grayscale_prob: 0.01
|
| 187 |
+
ratio:
|
| 188 |
+
- 0.75
|
| 189 |
+
- 1.3333333333333333
|
| 190 |
+
ratio_max: 2
|
| 191 |
+
ratio_min: 0.75
|
| 192 |
+
real_centering_loss: false
|
| 193 |
+
recount: 1
|
| 194 |
+
recovery_interval: 0
|
| 195 |
+
remode: pixel
|
| 196 |
+
reprob: 0.0
|
| 197 |
+
resize_max: 512
|
| 198 |
+
resize_min: 64
|
| 199 |
+
resplit: false
|
| 200 |
+
resume: ''
|
| 201 |
+
rotatio_max: 270
|
| 202 |
+
rotatio_min: 90
|
| 203 |
+
saturation_max: 1.5
|
| 204 |
+
saturation_min: 0.5
|
| 205 |
+
save_images: false
|
| 206 |
+
save_model_linear: false
|
| 207 |
+
scale:
|
| 208 |
+
- 0.08
|
| 209 |
+
- 1.0
|
| 210 |
+
scale_max: 1.5
|
| 211 |
+
scale_min: 0.5
|
| 212 |
+
sched: plateau
|
| 213 |
+
sched_on_updates: false
|
| 214 |
+
seed: 42
|
| 215 |
+
sharp_max: 2.0
|
| 216 |
+
sharp_min: 1.2
|
| 217 |
+
shuffle_max: 0.35
|
| 218 |
+
shuffle_min: 0.0
|
| 219 |
+
skew_max: 1.0
|
| 220 |
+
skew_min: -1.0
|
| 221 |
+
smoothing: 0.0
|
| 222 |
+
split_bn: false
|
| 223 |
+
start_epoch: null
|
| 224 |
+
std:
|
| 225 |
+
- 0.229
|
| 226 |
+
- 0.224
|
| 227 |
+
- 0.225
|
| 228 |
+
step: 5
|
| 229 |
+
sup_contrastive_loss: false
|
| 230 |
+
suppl: false
|
| 231 |
+
sync_bn: true
|
| 232 |
+
synchronize_step: false
|
| 233 |
+
teacher_temp: 0.07
|
| 234 |
+
teacher_temp_fix: false
|
| 235 |
+
test_augm: false
|
| 236 |
+
test_shards_augm: dataset/shards/coco-test-dict.shards
|
| 237 |
+
test_shards_no_augm: dataset/shards/coco-test-dict.shards
|
| 238 |
+
threshold_plateau: 0.001
|
| 239 |
+
torchcompile: null
|
| 240 |
+
torchscript: false
|
| 241 |
+
train_interpolation: random
|
| 242 |
+
train_shards: dataset/shards/elsav2-training.shards
|
| 243 |
+
train_split: train
|
| 244 |
+
triplet_loss: false
|
| 245 |
+
tta: 0
|
| 246 |
+
use_multi_epochs_loader: false
|
| 247 |
+
val: false
|
| 248 |
+
val_shards_augm: dataset/shards/validation_set-transf-elsav2.shards
|
| 249 |
+
val_shards_no_augm: dataset/shards/validation_set-no_transf-elsav2.shards
|
| 250 |
+
val_split: validation
|
| 251 |
+
validation_batch_size: 50
|
| 252 |
+
vflip: 0.0
|
| 253 |
+
wandb_entity: lorenzo_b_master_thesis
|
| 254 |
+
wandb_group: null
|
| 255 |
+
wandb_id: null
|
| 256 |
+
wandb_logging: false
|
| 257 |
+
wandb_name: null
|
| 258 |
+
wandb_notes: null
|
| 259 |
+
wandb_project_name: contrastive-fake
|
| 260 |
+
wandb_resume: allow
|
| 261 |
+
warmup_epochs: 0
|
| 262 |
+
warmup_lr: 1.0e-06
|
| 263 |
+
warmup_prefix: false
|
| 264 |
+
warmup_teacher_temp: 0.04
|
| 265 |
+
warmup_teacher_temp_epochs: 30
|
| 266 |
+
watermark_prob: 0.2
|
| 267 |
+
weight_decay: 2.0e-05
|
| 268 |
+
weight_decay_end: null
|
| 269 |
+
worker_seeding: all
|
| 270 |
+
workers: 8
|
| 271 |
+
workers_validate: 3
|
pretrained_linear/siglip_retrain_d3/model_best.pth.tar
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:69f3624335a5fff6f0b548344460f01a68b0f8fc50c7ccbdef32639fe9ca93a3
|
| 3 |
+
size 1265275454
|
pretrained_linear/siglip_retrain_d3/summary.csv
ADDED
|
@@ -0,0 +1,15 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epoch,train_loss,train_loss_contrastive_1,train_loss_contrastive_2,train_loss_dino,train_loss_mse,eval_loss,eval_loss_contrastive_1,eval_loss_contrastive_2,eval_loss_dino,eval_top1_tot,eval_top1_real,eval_top1_f0,eval_top1_f1,eval_top1_f2,eval_top1_f3,eval_accuracy,lr
|
| 2 |
+
0,0.3344188324340126,0.3344188324340126,0.0,0.0,0.0,0.1751169382284085,0.1751169382284085,0.0,0.0,0.939750000834465,0.8743749981125196,0.8862499793370565,0.9695833524068197,0.9762500201662382,0.9922916740179062,0.939750000834465,5e-05
|
| 3 |
+
1,0.2314104215844589,0.2314104215844589,0.0,0.0,0.0,0.1584866630534331,0.1584866630534331,0.0,0.0,0.9415833403666815,0.8947916626930237,0.8864583174387614,0.963750017186006,0.9725000212589899,0.9904166758060455,0.9415833403666815,5e-05
|
| 4 |
+
2,0.21575307705823113,0.21575307705823113,0.0,0.0,0.0,0.153275314408044,0.153275314408044,0.0,0.0,0.9418333396315575,0.9018749942382177,0.888333318134149,0.960416687031587,0.9700000211596489,0.988541675110658,0.9418333396315575,5e-05
|
| 5 |
+
3,0.20837736009236643,0.20837736009236643,0.0,0.0,0.0,0.15168093983083963,0.15168093983083963,0.0,0.0,0.9409583335121473,0.9062499950329462,0.8847916523615519,0.9589583526055018,0.96666669100523,0.9881250088413557,0.9409583335121473,5e-05
|
| 6 |
+
4,0.20403576982481514,0.20403576982481514,0.0,0.0,0.0,0.1500517725944519,0.1500517725944519,0.0,0.0,0.9416250015298525,0.9087499976158142,0.8868749812245369,0.9585416863361994,0.9668750241398811,0.9870833431680998,0.9416250015298525,5e-05
|
| 7 |
+
5,0.20182003947522711,0.20182003947522711,0.0,0.0,0.0,0.15012356142203012,0.15012356142203012,0.0,0.0,0.940833330154419,0.9127083321412405,0.883333312968413,0.9566666881243387,0.9650000259280205,0.9864583437641462,0.940833330154419,5e-05
|
| 8 |
+
6,0.20062986188294257,0.20062986188294257,0.0,0.0,0.0,0.14709053157518306,0.14709053157518306,0.0,0.0,0.9422916695475578,0.9081249982118607,0.8891666457056999,0.9595833544929823,0.96666669100523,0.9879166757067045,0.9422916695475578,5e-05
|
| 9 |
+
7,0.19959692339796353,0.19959692339796353,0.0,0.0,0.0,0.14905244639764229,0.14905244639764229,0.0,0.0,0.9413749923308691,0.9141666665673256,0.8835416461030642,0.9570833543936411,0.9650000259280205,0.9870833431680998,0.9413749923308691,5e-05
|
| 10 |
+
8,0.1990351523491828,0.1990351523491828,0.0,0.0,0.0,0.14873001724481583,0.14873001724481583,0.0,0.0,0.9413333286841711,0.9125000014901161,0.8847916473944982,0.9572916875282923,0.9650000259280205,0.9870833431680998,0.9413333286841711,5e-06
|
| 11 |
+
9,0.19868248202016248,0.19868248202016248,0.0,0.0,0.0,0.14857638534158468,0.14857638534158468,0.0,0.0,0.9416249891122183,0.9133333340287209,0.8849999805291494,0.9577083537975947,0.9650000259280205,0.9870833431680998,0.9416249891122183,5e-06
|
| 12 |
+
10,0.19878224588601906,0.19878224588601906,0.0,0.0,0.0,0.1486006344979008,0.1486006344979008,0.0,0.0,0.9413750047485033,0.9127083346247673,0.885624979933103,0.9564583549896876,0.9650000259280205,0.9870833431680998,0.9413750047485033,5e-06
|
| 13 |
+
11,0.1976470441173981,0.1976470441173981,0.0,0.0,0.0,0.14826239521304765,0.14826239521304765,0.0,0.0,0.9415416618188223,0.9116666664679846,0.8870833118756613,0.9566666881243387,0.9650000259280205,0.9872916787862778,0.9415416618188223,5e-06
|
| 14 |
+
12,0.19841566756367685,0.19841566756367685,0.0,0.0,0.0,0.14800164755433798,0.14800164755433798,0.0,0.0,0.9415833254655203,0.911041667064031,0.887916644414266,0.9566666881243387,0.9652083590626717,0.9870833456516266,0.9415833254655203,5e-06
|
| 15 |
+
13,0.19977029511595473,0.19977029511595473,0.0,0.0,0.0,0.14848711838324866,0.14848711838324866,0.0,0.0,0.9411666616797447,0.9116666664679846,0.8866666456063589,0.9564583549896876,0.9643750265240669,0.9866666793823242,0.9411666616797447,5e-06
|
pretrained_linear/vit_tiny_code_retrain_d3/args.yaml
ADDED
|
@@ -0,0 +1,271 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
aa: null
|
| 2 |
+
amp: true
|
| 3 |
+
amp_dtype: float16
|
| 4 |
+
amp_impl: native
|
| 5 |
+
aug_repeats: 0
|
| 6 |
+
aug_splits: 0
|
| 7 |
+
batch_size: 64
|
| 8 |
+
bce_loss: true
|
| 9 |
+
bce_target_thresh: null
|
| 10 |
+
benchmark: false
|
| 11 |
+
blur_max: 2
|
| 12 |
+
blur_min: 0.1
|
| 13 |
+
blur_prob: 0.5
|
| 14 |
+
blur_sig:
|
| 15 |
+
- 0
|
| 16 |
+
- 3.0
|
| 17 |
+
bn_eps: null
|
| 18 |
+
bn_momentum: null
|
| 19 |
+
brightness_max: 2
|
| 20 |
+
brightness_min: 0.5
|
| 21 |
+
channels_last: false
|
| 22 |
+
checkpoint_hist: 10
|
| 23 |
+
cineca: true
|
| 24 |
+
class_map: ''
|
| 25 |
+
classifier:
|
| 26 |
+
- linear
|
| 27 |
+
- knn
|
| 28 |
+
- svm
|
| 29 |
+
clip_grad: null
|
| 30 |
+
clip_mode: norm
|
| 31 |
+
color_jitter: 0.4
|
| 32 |
+
contrast_max: 1.5
|
| 33 |
+
contrast_min: 0.5
|
| 34 |
+
contrastive_loss: false
|
| 35 |
+
cooldown_epochs: 0
|
| 36 |
+
corvi_resnet: false
|
| 37 |
+
crop_max: 512
|
| 38 |
+
crop_min: 64
|
| 39 |
+
crop_pct: null
|
| 40 |
+
cutmix: 0.0
|
| 41 |
+
cutmix_minmax: null
|
| 42 |
+
data: null
|
| 43 |
+
data_dir: /leonardo_scratch/large/userexternal/fcocchi0/deepfake/dataset/webdatasets_elsa_v2
|
| 44 |
+
data_dir_eval_augm: /leonardo_scratch/large/userexternal/fcocchi0/deepfake/dataset/Elsa_datasetv2_test_fix/wds_test_small/transf
|
| 45 |
+
data_dir_eval_no_augm: /leonardo_scratch/large/userexternal/fcocchi0/deepfake/dataset/Elsa_datasetv2_test_fix/wds_test_small/no_transf
|
| 46 |
+
data_generator: null
|
| 47 |
+
data_len_eval: 4800
|
| 48 |
+
data_len_linear: 9600
|
| 49 |
+
data_len_train: null
|
| 50 |
+
dataset: elsa_v2_binarycrossentropy
|
| 51 |
+
dataset_download: false
|
| 52 |
+
dataset_eval: elsa_v2_binarycrossentropy_all_gen
|
| 53 |
+
decay_epochs: 90
|
| 54 |
+
decay_milestones:
|
| 55 |
+
- 90
|
| 56 |
+
- 180
|
| 57 |
+
- 270
|
| 58 |
+
decay_rate: 0.1
|
| 59 |
+
defake: false
|
| 60 |
+
deterministic: true
|
| 61 |
+
dino_crop: false
|
| 62 |
+
dino_head: false
|
| 63 |
+
dino_loss: false
|
| 64 |
+
dino_loss_weight: 0.5
|
| 65 |
+
dino_temp: 0.1
|
| 66 |
+
dist_bn: reduce
|
| 67 |
+
distance: cosine
|
| 68 |
+
double_contrastive: false
|
| 69 |
+
drop: 0.0
|
| 70 |
+
drop_block: null
|
| 71 |
+
drop_connect: null
|
| 72 |
+
drop_path: null
|
| 73 |
+
early_stopping: false
|
| 74 |
+
epoch_repeats: 0.0
|
| 75 |
+
epochs: 150
|
| 76 |
+
epochs_classifier: 1500
|
| 77 |
+
eval_metric: accuracy
|
| 78 |
+
experiment: code-pro-linear_d3-augm_prob_0.5-vit_tiny_patch16_224.augreg_in21k_w8_transform_lr-5e-5-batch_size-256_epochs-150_loss-bce_optimizer-adam_fcocchi
|
| 79 |
+
external_transform: false
|
| 80 |
+
fast_norm: false
|
| 81 |
+
fuser: ''
|
| 82 |
+
global_crops_scale:
|
| 83 |
+
- 0.4
|
| 84 |
+
- 1.0
|
| 85 |
+
gp: null
|
| 86 |
+
grad_accum_steps: 1
|
| 87 |
+
grad_checkpointing: false
|
| 88 |
+
head_bottlenck: 256
|
| 89 |
+
head_hidden_dim: 384
|
| 90 |
+
head_init_bias: null
|
| 91 |
+
head_init_scale: null
|
| 92 |
+
head_out: 192
|
| 93 |
+
hflip: 0.5
|
| 94 |
+
img_size: null
|
| 95 |
+
in_chans: null
|
| 96 |
+
infonce_loss_temperature: 0.1
|
| 97 |
+
initial_checkpoint: ''
|
| 98 |
+
input_size:
|
| 99 |
+
- 3
|
| 100 |
+
- 224
|
| 101 |
+
- 224
|
| 102 |
+
interpolation: ''
|
| 103 |
+
jitter_max: 1.5
|
| 104 |
+
jitter_min: 0.5
|
| 105 |
+
job_id: 0
|
| 106 |
+
jpeg_max: 100
|
| 107 |
+
jpeg_min: 30
|
| 108 |
+
jpeg_prob: 0.5
|
| 109 |
+
jsd_loss: false
|
| 110 |
+
ladeda: false
|
| 111 |
+
lambda_loss: 10
|
| 112 |
+
last_crop: false
|
| 113 |
+
layer_decay: null
|
| 114 |
+
linear_pretrained: null
|
| 115 |
+
linear_train_shards: dataset/shards/elsa_v2_train_transf.shards
|
| 116 |
+
load_code: true
|
| 117 |
+
local_crops_scale:
|
| 118 |
+
- 0.05
|
| 119 |
+
- 0.4
|
| 120 |
+
local_rank: 0
|
| 121 |
+
log_interval: 5
|
| 122 |
+
log_wandb: true
|
| 123 |
+
lr: 5.0e-05
|
| 124 |
+
lr_base: 0.1
|
| 125 |
+
lr_base_scale: ''
|
| 126 |
+
lr_base_size: 256
|
| 127 |
+
lr_cycle_decay: 0.5
|
| 128 |
+
lr_cycle_limit: 1
|
| 129 |
+
lr_cycle_mul: 1.0
|
| 130 |
+
lr_k_decay: 1.0
|
| 131 |
+
lr_noise: null
|
| 132 |
+
lr_noise_pct: 0.67
|
| 133 |
+
lr_noise_std: 1.0
|
| 134 |
+
margin: 1
|
| 135 |
+
mean:
|
| 136 |
+
- 0.485
|
| 137 |
+
- 0.456
|
| 138 |
+
- 0.406
|
| 139 |
+
min_lr: 0.0
|
| 140 |
+
mixup: 0.0
|
| 141 |
+
mixup_mode: batch
|
| 142 |
+
mixup_off_epoch: 0
|
| 143 |
+
mixup_prob: 1.0
|
| 144 |
+
mixup_switch_prob: 0.5
|
| 145 |
+
model: vit_tiny_patch16_224.augreg_in21k
|
| 146 |
+
model_ema: false
|
| 147 |
+
model_ema_decay: 0.9998
|
| 148 |
+
model_ema_force_cpu: false
|
| 149 |
+
model_kwargs: {}
|
| 150 |
+
momentum: 0.9
|
| 151 |
+
multiple_evaluations: true
|
| 152 |
+
n_crops: 1
|
| 153 |
+
no_aug: false
|
| 154 |
+
no_ddp_bb: false
|
| 155 |
+
no_prefetcher: true
|
| 156 |
+
no_resume_opt: false
|
| 157 |
+
not_load_input_size: false
|
| 158 |
+
num_classes: null
|
| 159 |
+
num_jobs: 1
|
| 160 |
+
num_step: 6800
|
| 161 |
+
num_transform: 2
|
| 162 |
+
ojha_d3: false
|
| 163 |
+
only_linear_training: true
|
| 164 |
+
only_validate: false
|
| 165 |
+
opacity_max: 1.0
|
| 166 |
+
opacity_min: 0.2
|
| 167 |
+
opt: adam
|
| 168 |
+
opt_betas: null
|
| 169 |
+
opt_eps: null
|
| 170 |
+
opt_kwargs: {}
|
| 171 |
+
output: /leonardo_scratch/large/userexternal/fcocchi0/deepfake/runs
|
| 172 |
+
overlay_max: 0.35
|
| 173 |
+
overlay_min: 0.05
|
| 174 |
+
pad_max: 0.25
|
| 175 |
+
pad_min: 0.01
|
| 176 |
+
patience_counter: 0
|
| 177 |
+
patience_epochs: 5
|
| 178 |
+
permutation_fake: false
|
| 179 |
+
permutation_real: false
|
| 180 |
+
pin_mem: false
|
| 181 |
+
pix_max: 1
|
| 182 |
+
pix_min: 0.3
|
| 183 |
+
plot_freq: 5
|
| 184 |
+
pretrained: true
|
| 185 |
+
random_crop: false
|
| 186 |
+
random_grayscale_prob: 0.01
|
| 187 |
+
ratio:
|
| 188 |
+
- 0.75
|
| 189 |
+
- 1.3333333333333333
|
| 190 |
+
ratio_max: 2
|
| 191 |
+
ratio_min: 0.75
|
| 192 |
+
real_centering_loss: false
|
| 193 |
+
recount: 1
|
| 194 |
+
recovery_interval: 0
|
| 195 |
+
remode: pixel
|
| 196 |
+
reprob: 0.0
|
| 197 |
+
resize_max: 512
|
| 198 |
+
resize_min: 64
|
| 199 |
+
resplit: false
|
| 200 |
+
resume: ''
|
| 201 |
+
rotatio_max: 270
|
| 202 |
+
rotatio_min: 90
|
| 203 |
+
saturation_max: 1.5
|
| 204 |
+
saturation_min: 0.5
|
| 205 |
+
save_images: false
|
| 206 |
+
save_model_linear: false
|
| 207 |
+
scale:
|
| 208 |
+
- 0.08
|
| 209 |
+
- 1.0
|
| 210 |
+
scale_max: 1.5
|
| 211 |
+
scale_min: 0.5
|
| 212 |
+
sched: plateau
|
| 213 |
+
sched_on_updates: false
|
| 214 |
+
seed: 42
|
| 215 |
+
sharp_max: 2.0
|
| 216 |
+
sharp_min: 1.2
|
| 217 |
+
shuffle_max: 0.35
|
| 218 |
+
shuffle_min: 0.0
|
| 219 |
+
skew_max: 1.0
|
| 220 |
+
skew_min: -1.0
|
| 221 |
+
smoothing: 0.0
|
| 222 |
+
split_bn: false
|
| 223 |
+
start_epoch: null
|
| 224 |
+
std:
|
| 225 |
+
- 0.229
|
| 226 |
+
- 0.224
|
| 227 |
+
- 0.225
|
| 228 |
+
step: 5
|
| 229 |
+
sup_contrastive_loss: false
|
| 230 |
+
suppl: false
|
| 231 |
+
sync_bn: true
|
| 232 |
+
synchronize_step: false
|
| 233 |
+
teacher_temp: 0.07
|
| 234 |
+
teacher_temp_fix: false
|
| 235 |
+
test_augm: false
|
| 236 |
+
test_shards_augm: dataset/shards/coco-test-dict.shards
|
| 237 |
+
test_shards_no_augm: dataset/shards/coco-test-dict.shards
|
| 238 |
+
threshold_plateau: 0.001
|
| 239 |
+
torchcompile: null
|
| 240 |
+
torchscript: false
|
| 241 |
+
train_interpolation: random
|
| 242 |
+
train_shards: dataset/shards/elsav2-training.shards
|
| 243 |
+
train_split: train
|
| 244 |
+
triplet_loss: false
|
| 245 |
+
tta: 0
|
| 246 |
+
use_multi_epochs_loader: false
|
| 247 |
+
val: false
|
| 248 |
+
val_shards_augm: dataset/shards/validation_set-transf-elsav2.shards
|
| 249 |
+
val_shards_no_augm: dataset/shards/validation_set-no_transf-elsav2.shards
|
| 250 |
+
val_split: validation
|
| 251 |
+
validation_batch_size: 50
|
| 252 |
+
vflip: 0.0
|
| 253 |
+
wandb_entity: lorenzo_b_master_thesis
|
| 254 |
+
wandb_group: null
|
| 255 |
+
wandb_id: null
|
| 256 |
+
wandb_logging: false
|
| 257 |
+
wandb_name: null
|
| 258 |
+
wandb_notes: null
|
| 259 |
+
wandb_project_name: contrastive-fake
|
| 260 |
+
wandb_resume: allow
|
| 261 |
+
warmup_epochs: 0
|
| 262 |
+
warmup_lr: 1.0e-06
|
| 263 |
+
warmup_prefix: false
|
| 264 |
+
warmup_teacher_temp: 0.04
|
| 265 |
+
warmup_teacher_temp_epochs: 30
|
| 266 |
+
watermark_prob: 0.2
|
| 267 |
+
weight_decay: 2.0e-05
|
| 268 |
+
weight_decay_end: null
|
| 269 |
+
worker_seeding: all
|
| 270 |
+
workers: 8
|
| 271 |
+
workers_validate: 3
|
pretrained_linear/vit_tiny_code_retrain_d3/model_best.pth.tar
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8ea70970987cee595217a0fe6985b6e58dc8fb3159ed615b6713f1044a785c24
|
| 3 |
+
size 22167286
|
pretrained_linear/vit_tiny_code_retrain_d3/summary.csv
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epoch,train_loss,train_loss_contrastive_1,train_loss_contrastive_2,train_loss_dino,train_loss_mse,eval_loss,eval_loss_contrastive_1,eval_loss_contrastive_2,eval_loss_dino,eval_top1_tot,eval_top1_real,eval_top1_f0,eval_top1_f1,eval_top1_f2,eval_top1_f3,eval_accuracy,lr
|
| 2 |
+
0,0.3720096955294995,0.3720096955294995,0.0,0.0,0.0,0.21224851720035076,0.21224851720035076,0.0,0.0,0.9212083294987679,0.8770833214124044,0.8737499912579855,0.9412500138084093,0.9335416754086813,0.9804166803757349,0.9212083294987679,5e-05
|
| 3 |
+
1,0.28748565185815095,0.28748565185815095,0.0,0.0,0.0,0.19553815387189388,0.19553815387189388,0.0,0.0,0.9261249899864197,0.8793749908606211,0.8802083159486452,0.948333352804184,0.9395833412806193,0.9831250160932541,0.9261249899864197,5e-05
|
| 4 |
+
2,0.2787261040990843,0.2787261040990843,0.0,0.0,0.0,0.19202234223484993,0.19202234223484993,0.0,0.0,0.9257916584610939,0.8822916522622108,0.8789583196242651,0.9472916821638743,0.9372916718324026,0.9831250160932541,0.9257916584610939,5e-05
|
| 5 |
+
3,0.2742302328457727,0.2742302328457727,0.0,0.0,0.0,0.18989873118698597,0.18989873118698597,0.0,0.0,0.9252916673819224,0.8835416610042254,0.8766666526595751,0.9477083583672842,0.9364583368102709,0.9820833504199982,0.9252916673819224,5e-05
|
| 6 |
+
4,0.27157400547362426,0.27157400547362426,0.0,0.0,0.0,0.1877975029249986,0.1877975029249986,0.0,0.0,0.9263749991854032,0.8841666628917059,0.8791666527589163,0.9481250221530596,0.9381250018874804,0.9822916835546494,0.9263749991854032,5e-05
|
| 7 |
+
5,0.27049131704603924,0.27049131704603924,0.0,0.0,0.0,0.18657336570322514,0.18657336570322514,0.0,0.0,0.9269166688124338,0.8854166666666666,0.8799999877810478,0.9481250196695328,0.9391666700442632,0.981875017285347,0.9269166688124338,5e-05
|
| 8 |
+
6,0.26871031153508845,0.26871031153508845,0.0,0.0,0.0,0.1843882550795873,0.1843882550795873,0.0,0.0,0.9276666740576426,0.8839583322405815,0.8808333228031794,0.9500000203649203,0.9410416682561239,0.9825000166893005,0.9276666740576426,5e-05
|
| 9 |
+
7,0.26732318908633557,0.26732318908633557,0.0,0.0,0.0,0.18572811347742876,0.18572811347742876,0.0,0.0,0.9270416647195816,0.8864583273728689,0.8799999952316284,0.9477083534002304,0.9391666700442632,0.981875017285347,0.9270416647195816,5e-05
|
| 10 |
+
8,0.2672765173456248,0.2672765173456248,0.0,0.0,0.0,0.18469930378099284,0.18469930378099284,0.0,0.0,0.9273333251476288,0.885416661699613,0.8797916546463966,0.9493750209609667,0.9400000050663948,0.9820833504199982,0.9273333251476288,5e-05
|
| 11 |
+
9,0.2665476277908858,0.2665476277908858,0.0,0.0,0.0,0.18387764257689318,0.18387764257689318,0.0,0.0,0.9275833244125048,0.8839583297570547,0.8818749909599622,0.9495833516120911,0.940208338201046,0.9822916835546494,0.9275833244125048,5e-05
|
| 12 |
+
10,0.2652019637691624,0.2652019637691624,0.0,0.0,0.0,0.18286102078855038,0.18286102078855038,0.0,0.0,0.9282499998807907,0.8822916646798452,0.8835416560371717,0.9514583523074785,0.9418750032782555,0.9820833504199982,0.9282499998807907,5e-05
|
| 13 |
+
11,0.267613924634369,0.267613924634369,0.0,0.0,0.0,0.18203754536807537,0.18203754536807537,0.0,0.0,0.9282916585604349,0.8818749984105428,0.8837499891718229,0.9514583547910055,0.9418750032782555,0.9825000166893005,0.9282916585604349,5e-05
|
| 14 |
+
12,0.26410333232625444,0.26410333232625444,0.0,0.0,0.0,0.18234017367164293,0.18234017367164293,0.0,0.0,0.9278333236773809,0.8833333303531011,0.8833333229025205,0.9500000153978666,0.9406250019868215,0.981875017285347,0.9278333236773809,5e-05
|
| 15 |
+
13,0.2662334675407585,0.2662334675407585,0.0,0.0,0.0,0.1823637199898561,0.1823637199898561,0.0,0.0,0.9277499963839849,0.8833333303531011,0.8833333229025205,0.9497916822632154,0.9406250019868215,0.9816666841506958,0.9277499963839849,5e-06
|
| 16 |
+
14,0.2647036242463133,0.2647036242463133,0.0,0.0,0.0,0.18274893797934055,0.18274893797934055,0.0,0.0,0.9274166648586591,0.8833333303531011,0.8829166566332182,0.9495833491285642,0.9395833363135656,0.9816666841506958,0.9274166648586591,5e-06
|
| 17 |
+
15,0.2651700408581425,0.2651700408581425,0.0,0.0,0.0,0.1824071699132522,0.1824071699132522,0.0,0.0,0.9277916625142097,0.8833333303531011,0.8835416560371717,0.9502083510160446,0.940208338201046,0.9816666841506958,0.9277916625142097,5e-06
|
| 18 |
+
16,0.2642313089550418,0.2642313089550418,0.0,0.0,0.0,0.18203218219180903,0.18203218219180903,0.0,0.0,0.9279166609048843,0.88312499721845,0.8839583223064741,0.9500000178813934,0.9408333376049995,0.9816666841506958,0.9279166609048843,5e-06
|
| 19 |
+
17,0.26631898574311946,0.26631898574311946,0.0,0.0,0.0,0.18247221782803535,0.18247221782803535,0.0,0.0,0.9275416682163874,0.8833333303531011,0.8831249897678694,0.9500000178813934,0.9397916719317436,0.9814583510160446,0.9275416682163874,5e-06
|
| 20 |
+
18,0.2645486582070589,0.2645486582070589,0.0,0.0,0.0,0.18188781787951788,0.18188781787951788,0.0,0.0,0.9280416543285052,0.8829166640837988,0.8843749885757765,0.9502083510160446,0.9410416707396507,0.9816666841506958,0.9280416543285052,5e-06
|
pretrained_linear/vit_tiny_retrain_d3/args.yaml
ADDED
|
@@ -0,0 +1,271 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
aa: null
|
| 2 |
+
amp: true
|
| 3 |
+
amp_dtype: float16
|
| 4 |
+
amp_impl: native
|
| 5 |
+
aug_repeats: 0
|
| 6 |
+
aug_splits: 0
|
| 7 |
+
batch_size: 64
|
| 8 |
+
bce_loss: true
|
| 9 |
+
bce_target_thresh: null
|
| 10 |
+
benchmark: false
|
| 11 |
+
blur_max: 2
|
| 12 |
+
blur_min: 0.1
|
| 13 |
+
blur_prob: 0.5
|
| 14 |
+
blur_sig:
|
| 15 |
+
- 0
|
| 16 |
+
- 3.0
|
| 17 |
+
bn_eps: null
|
| 18 |
+
bn_momentum: null
|
| 19 |
+
brightness_max: 2
|
| 20 |
+
brightness_min: 0.5
|
| 21 |
+
channels_last: false
|
| 22 |
+
checkpoint_hist: 10
|
| 23 |
+
cineca: true
|
| 24 |
+
class_map: ''
|
| 25 |
+
classifier:
|
| 26 |
+
- linear
|
| 27 |
+
- knn
|
| 28 |
+
- svm
|
| 29 |
+
clip_grad: null
|
| 30 |
+
clip_mode: norm
|
| 31 |
+
color_jitter: 0.4
|
| 32 |
+
contrast_max: 1.5
|
| 33 |
+
contrast_min: 0.5
|
| 34 |
+
contrastive_loss: false
|
| 35 |
+
cooldown_epochs: 0
|
| 36 |
+
corvi_resnet: false
|
| 37 |
+
crop_max: 512
|
| 38 |
+
crop_min: 64
|
| 39 |
+
crop_pct: null
|
| 40 |
+
cutmix: 0.0
|
| 41 |
+
cutmix_minmax: null
|
| 42 |
+
data: null
|
| 43 |
+
data_dir: /leonardo_scratch/large/userexternal/fcocchi0/deepfake/dataset/webdatasets_elsa_v2
|
| 44 |
+
data_dir_eval_augm: /leonardo_scratch/large/userexternal/fcocchi0/deepfake/dataset/Elsa_datasetv2_test_fix/wds_test_small/transf
|
| 45 |
+
data_dir_eval_no_augm: /leonardo_scratch/large/userexternal/fcocchi0/deepfake/dataset/Elsa_datasetv2_test_fix/wds_test_small/no_transf
|
| 46 |
+
data_generator: null
|
| 47 |
+
data_len_eval: 4800
|
| 48 |
+
data_len_linear: 9600
|
| 49 |
+
data_len_train: null
|
| 50 |
+
dataset: elsa_v2_binarycrossentropy
|
| 51 |
+
dataset_download: false
|
| 52 |
+
dataset_eval: elsa_v2_binarycrossentropy_all_gen
|
| 53 |
+
decay_epochs: 90
|
| 54 |
+
decay_milestones:
|
| 55 |
+
- 90
|
| 56 |
+
- 180
|
| 57 |
+
- 270
|
| 58 |
+
decay_rate: 0.1
|
| 59 |
+
defake: false
|
| 60 |
+
deterministic: true
|
| 61 |
+
dino_crop: false
|
| 62 |
+
dino_head: false
|
| 63 |
+
dino_loss: false
|
| 64 |
+
dino_loss_weight: 0.5
|
| 65 |
+
dino_temp: 0.1
|
| 66 |
+
dist_bn: reduce
|
| 67 |
+
distance: cosine
|
| 68 |
+
double_contrastive: false
|
| 69 |
+
drop: 0.0
|
| 70 |
+
drop_block: null
|
| 71 |
+
drop_connect: null
|
| 72 |
+
drop_path: null
|
| 73 |
+
early_stopping: false
|
| 74 |
+
epoch_repeats: 0.0
|
| 75 |
+
epochs: 150
|
| 76 |
+
epochs_classifier: 1500
|
| 77 |
+
eval_metric: accuracy
|
| 78 |
+
experiment: vit_tiny-linear_d3-augm_prob_0.5-vit_tiny_patch16_224.augreg_in21k_w8_transform_lr-5e-5-batch_size-256_epochs-150_loss-bce_optimizer-adam_fcocchi
|
| 79 |
+
external_transform: true
|
| 80 |
+
fast_norm: false
|
| 81 |
+
fuser: ''
|
| 82 |
+
global_crops_scale:
|
| 83 |
+
- 0.4
|
| 84 |
+
- 1.0
|
| 85 |
+
gp: null
|
| 86 |
+
grad_accum_steps: 1
|
| 87 |
+
grad_checkpointing: false
|
| 88 |
+
head_bottlenck: 256
|
| 89 |
+
head_hidden_dim: 384
|
| 90 |
+
head_init_bias: null
|
| 91 |
+
head_init_scale: null
|
| 92 |
+
head_out: 192
|
| 93 |
+
hflip: 0.5
|
| 94 |
+
img_size: null
|
| 95 |
+
in_chans: null
|
| 96 |
+
infonce_loss_temperature: 0.1
|
| 97 |
+
initial_checkpoint: ''
|
| 98 |
+
input_size:
|
| 99 |
+
- 3
|
| 100 |
+
- 224
|
| 101 |
+
- 224
|
| 102 |
+
interpolation: ''
|
| 103 |
+
jitter_max: 1.5
|
| 104 |
+
jitter_min: 0.5
|
| 105 |
+
job_id: 0
|
| 106 |
+
jpeg_max: 100
|
| 107 |
+
jpeg_min: 30
|
| 108 |
+
jpeg_prob: 0.5
|
| 109 |
+
jsd_loss: false
|
| 110 |
+
ladeda: false
|
| 111 |
+
lambda_loss: 10
|
| 112 |
+
last_crop: false
|
| 113 |
+
layer_decay: null
|
| 114 |
+
linear_pretrained: null
|
| 115 |
+
linear_train_shards: dataset/shards/elsa_v2_train_transf.shards
|
| 116 |
+
load_code: false
|
| 117 |
+
local_crops_scale:
|
| 118 |
+
- 0.05
|
| 119 |
+
- 0.4
|
| 120 |
+
local_rank: 0
|
| 121 |
+
log_interval: 5
|
| 122 |
+
log_wandb: true
|
| 123 |
+
lr: 5.0e-05
|
| 124 |
+
lr_base: 0.1
|
| 125 |
+
lr_base_scale: ''
|
| 126 |
+
lr_base_size: 256
|
| 127 |
+
lr_cycle_decay: 0.5
|
| 128 |
+
lr_cycle_limit: 1
|
| 129 |
+
lr_cycle_mul: 1.0
|
| 130 |
+
lr_k_decay: 1.0
|
| 131 |
+
lr_noise: null
|
| 132 |
+
lr_noise_pct: 0.67
|
| 133 |
+
lr_noise_std: 1.0
|
| 134 |
+
margin: 1
|
| 135 |
+
mean:
|
| 136 |
+
- 0.485
|
| 137 |
+
- 0.456
|
| 138 |
+
- 0.406
|
| 139 |
+
min_lr: 0.0
|
| 140 |
+
mixup: 0.0
|
| 141 |
+
mixup_mode: batch
|
| 142 |
+
mixup_off_epoch: 0
|
| 143 |
+
mixup_prob: 1.0
|
| 144 |
+
mixup_switch_prob: 0.5
|
| 145 |
+
model: vit_tiny_patch16_224.augreg_in21k
|
| 146 |
+
model_ema: false
|
| 147 |
+
model_ema_decay: 0.9998
|
| 148 |
+
model_ema_force_cpu: false
|
| 149 |
+
model_kwargs: {}
|
| 150 |
+
momentum: 0.9
|
| 151 |
+
multiple_evaluations: true
|
| 152 |
+
n_crops: 1
|
| 153 |
+
no_aug: false
|
| 154 |
+
no_ddp_bb: false
|
| 155 |
+
no_prefetcher: true
|
| 156 |
+
no_resume_opt: false
|
| 157 |
+
not_load_input_size: false
|
| 158 |
+
num_classes: null
|
| 159 |
+
num_jobs: 1
|
| 160 |
+
num_step: 6800
|
| 161 |
+
num_transform: 2
|
| 162 |
+
ojha_d3: false
|
| 163 |
+
only_linear_training: true
|
| 164 |
+
only_validate: false
|
| 165 |
+
opacity_max: 1.0
|
| 166 |
+
opacity_min: 0.2
|
| 167 |
+
opt: adam
|
| 168 |
+
opt_betas: null
|
| 169 |
+
opt_eps: null
|
| 170 |
+
opt_kwargs: {}
|
| 171 |
+
output: /leonardo_scratch/large/userexternal/fcocchi0/deepfake/runs
|
| 172 |
+
overlay_max: 0.35
|
| 173 |
+
overlay_min: 0.05
|
| 174 |
+
pad_max: 0.25
|
| 175 |
+
pad_min: 0.01
|
| 176 |
+
patience_counter: 0
|
| 177 |
+
patience_epochs: 5
|
| 178 |
+
permutation_fake: false
|
| 179 |
+
permutation_real: false
|
| 180 |
+
pin_mem: false
|
| 181 |
+
pix_max: 1
|
| 182 |
+
pix_min: 0.3
|
| 183 |
+
plot_freq: 5
|
| 184 |
+
pretrained: true
|
| 185 |
+
random_crop: false
|
| 186 |
+
random_grayscale_prob: 0.01
|
| 187 |
+
ratio:
|
| 188 |
+
- 0.75
|
| 189 |
+
- 1.3333333333333333
|
| 190 |
+
ratio_max: 2
|
| 191 |
+
ratio_min: 0.75
|
| 192 |
+
real_centering_loss: false
|
| 193 |
+
recount: 1
|
| 194 |
+
recovery_interval: 0
|
| 195 |
+
remode: pixel
|
| 196 |
+
reprob: 0.0
|
| 197 |
+
resize_max: 512
|
| 198 |
+
resize_min: 64
|
| 199 |
+
resplit: false
|
| 200 |
+
resume: ''
|
| 201 |
+
rotatio_max: 270
|
| 202 |
+
rotatio_min: 90
|
| 203 |
+
saturation_max: 1.5
|
| 204 |
+
saturation_min: 0.5
|
| 205 |
+
save_images: false
|
| 206 |
+
save_model_linear: false
|
| 207 |
+
scale:
|
| 208 |
+
- 0.08
|
| 209 |
+
- 1.0
|
| 210 |
+
scale_max: 1.5
|
| 211 |
+
scale_min: 0.5
|
| 212 |
+
sched: plateau
|
| 213 |
+
sched_on_updates: false
|
| 214 |
+
seed: 42
|
| 215 |
+
sharp_max: 2.0
|
| 216 |
+
sharp_min: 1.2
|
| 217 |
+
shuffle_max: 0.35
|
| 218 |
+
shuffle_min: 0.0
|
| 219 |
+
skew_max: 1.0
|
| 220 |
+
skew_min: -1.0
|
| 221 |
+
smoothing: 0.0
|
| 222 |
+
split_bn: false
|
| 223 |
+
start_epoch: null
|
| 224 |
+
std:
|
| 225 |
+
- 0.229
|
| 226 |
+
- 0.224
|
| 227 |
+
- 0.225
|
| 228 |
+
step: 5
|
| 229 |
+
sup_contrastive_loss: false
|
| 230 |
+
suppl: false
|
| 231 |
+
sync_bn: true
|
| 232 |
+
synchronize_step: false
|
| 233 |
+
teacher_temp: 0.07
|
| 234 |
+
teacher_temp_fix: false
|
| 235 |
+
test_augm: false
|
| 236 |
+
test_shards_augm: dataset/shards/coco-test-dict.shards
|
| 237 |
+
test_shards_no_augm: dataset/shards/coco-test-dict.shards
|
| 238 |
+
threshold_plateau: 0.001
|
| 239 |
+
torchcompile: null
|
| 240 |
+
torchscript: false
|
| 241 |
+
train_interpolation: random
|
| 242 |
+
train_shards: dataset/shards/elsav2-training.shards
|
| 243 |
+
train_split: train
|
| 244 |
+
triplet_loss: false
|
| 245 |
+
tta: 0
|
| 246 |
+
use_multi_epochs_loader: false
|
| 247 |
+
val: false
|
| 248 |
+
val_shards_augm: dataset/shards/validation_set-transf-elsav2.shards
|
| 249 |
+
val_shards_no_augm: dataset/shards/validation_set-no_transf-elsav2.shards
|
| 250 |
+
val_split: validation
|
| 251 |
+
validation_batch_size: 50
|
| 252 |
+
vflip: 0.0
|
| 253 |
+
wandb_entity: lorenzo_b_master_thesis
|
| 254 |
+
wandb_group: null
|
| 255 |
+
wandb_id: null
|
| 256 |
+
wandb_logging: false
|
| 257 |
+
wandb_name: null
|
| 258 |
+
wandb_notes: null
|
| 259 |
+
wandb_project_name: contrastive-fake
|
| 260 |
+
wandb_resume: allow
|
| 261 |
+
warmup_epochs: 0
|
| 262 |
+
warmup_lr: 1.0e-06
|
| 263 |
+
warmup_prefix: false
|
| 264 |
+
warmup_teacher_temp: 0.04
|
| 265 |
+
warmup_teacher_temp_epochs: 30
|
| 266 |
+
watermark_prob: 0.2
|
| 267 |
+
weight_decay: 2.0e-05
|
| 268 |
+
weight_decay_end: null
|
| 269 |
+
worker_seeding: all
|
| 270 |
+
workers: 8
|
| 271 |
+
workers_validate: 3
|
pretrained_linear/vit_tiny_retrain_d3/model_best.pth.tar
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4d5a1566c1f9652a9056522148f029492267a539393529c78abc2450b810133b
|
| 3 |
+
size 22167286
|
pretrained_linear/vit_tiny_retrain_d3/summary.csv
ADDED
|
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
epoch,train_loss,train_loss_contrastive_1,train_loss_contrastive_2,train_loss_dino,train_loss_mse,eval_loss,eval_loss_contrastive_1,eval_loss_contrastive_2,eval_loss_dino,eval_top1_tot,eval_top1_real,eval_top1_f0,eval_top1_f1,eval_top1_f2,eval_top1_f3,eval_accuracy,lr
|
| 2 |
+
0,0.4226443461197264,0.4226443461197264,0.0,0.0,0.0,0.394023089359204,0.394023089359204,0.0,0.0,0.8237499892711639,0.7552083233992258,0.7816666662693024,0.813333327571551,0.8435416569312414,0.9250000019868215,0.8237499892711639,5e-05
|
| 3 |
+
1,0.37773030104444305,0.37773030104444305,0.0,0.0,0.0,0.3889458974202474,0.3889458974202474,0.0,0.0,0.826124998430411,0.7514583269755045,0.7839583357175192,0.8187499990065893,0.8508333265781403,0.9256250013907751,0.826124998430411,5e-05
|
| 4 |
+
2,0.37595023874412564,0.37595023874412564,0.0,0.0,0.0,0.38465610270698863,0.38465610270698863,0.0,0.0,0.8281666686137518,0.7462499961256981,0.789791668454806,0.8247916648785273,0.8552083273728689,0.9247916638851166,0.8281666686137518,5e-05
|
| 5 |
+
3,0.3758119907011004,0.3758119907011004,0.0,0.0,0.0,0.3924189681808154,0.3924189681808154,0.0,0.0,0.8240416670838991,0.7554166615009308,0.7772916704416275,0.815833330154419,0.8489583233992258,0.9227083325386047,0.8240416670838991,5e-05
|
| 6 |
+
4,0.377113087343819,0.377113087343819,0.0,0.0,0.0,0.38882261887192726,0.38882261887192726,0.0,0.0,0.8261250009139379,0.7537499964237213,0.7825000012914339,0.8185416609048843,0.8508333240946134,0.9249999970197678,0.8261250009139379,5e-05
|
| 7 |
+
5,0.37594584377811235,0.37594584377811235,0.0,0.0,0.0,0.38932491714755696,0.38932491714755696,0.0,0.0,0.825874999165535,0.7516666675607363,0.7829166700442632,0.8183333327372869,0.8512499953309695,0.925208330154419,0.825874999165535,5e-05
|
| 8 |
+
6,0.3774271651664201,0.3774271651664201,0.0,0.0,0.0,0.3860248898466428,0.3860248898466428,0.0,0.0,0.8281666661302248,0.7493749981125196,0.7868749996026357,0.8229166691501936,0.8552083273728689,0.9264583339293798,0.8281666661302248,5e-05
|
| 9 |
+
7,0.37668778762659605,0.37668778762659605,0.0,0.0,0.0,0.39383075137933093,0.39383075137933093,0.0,0.0,0.8236666545271873,0.7568749984105428,0.7779166648785273,0.8131249944368998,0.8470833276708921,0.9233333319425583,0.8236666545271873,5e-05
|
| 10 |
+
8,0.37466930692248485,0.37466930692248485,0.0,0.0,0.0,0.3852132285634677,0.3852132285634677,0.0,0.0,0.8275833403070768,0.7458333298563957,0.7860416645805041,0.8239583298563957,0.8549999967217445,0.9270833358168602,0.8275833403070768,5e-05
|
| 11 |
+
9,0.37873199676327846,0.37873199676327846,0.0,0.0,0.0,0.3904148191213608,0.3904148191213608,0.0,0.0,0.8247083351016045,0.7539583320418993,0.7791666686534882,0.8170833364129066,0.8497916609048843,0.9235416650772095,0.8247083351016045,5e-06
|
| 12 |
+
10,0.3742280271123437,0.3742280271123437,0.0,0.0,0.0,0.387875451395909,0.387875451395909,0.0,0.0,0.826500008503596,0.7499999975164732,0.783750000099341,0.821041668454806,0.8535416622956594,0.924166664481163,0.826500008503596,5e-06
|
| 13 |
+
11,0.375747038424015,0.375747038424015,0.0,0.0,0.0,0.3900589806338151,0.3900589806338151,0.0,0.0,0.8249166682362556,0.752500000099341,0.7806250030795733,0.8168749983112017,0.8502083271741867,0.9243749976158142,0.8249166682362556,5e-06
|
| 14 |
+
12,0.3783050603945466,0.3783050603945466,0.0,0.0,0.0,0.3886970865229766,0.3886970865229766,0.0,0.0,0.8257499958078066,0.749791664381822,0.7829166675607363,0.8202083359162012,0.8518749922513962,0.9239583313465118,0.8257499958078066,5e-06
|
| 15 |
+
13,0.3758939314633608,0.3758939314633608,0.0,0.0,0.0,0.3884111742178599,0.3884111742178599,0.0,0.0,0.8260833298166593,0.7504166637857755,0.7839583332339922,0.82000000278155,0.8518749922513962,0.9241666669646899,0.8260833298166593,5e-06
|
| 16 |
+
14,0.3757469490827883,0.3757469490827883,0.0,0.0,0.0,0.38723477472861606,0.38723477472861606,0.0,0.0,0.8269166573882103,0.749791664381822,0.7858333314458529,0.8208333378036817,0.8529166604081789,0.9252083351214727,0.8269166573882103,5e-06
|