PheniX-Lab committed on Aug 19, 2025

Commit

b6ced23

verified ·

1 Parent(s): 4ae3a83

Upload 308 files

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

FoMo4Wheat/__init__.py +6 -0
FoMo4Wheat/__pycache__/__init__.cpython-310.pyc +0 -0
FoMo4Wheat/__pycache__/__init__.cpython-311.pyc +0 -0
FoMo4Wheat/__pycache__/__init__.cpython-312.pyc +0 -0
FoMo4Wheat/__pycache__/__init__.cpython-38.pyc +0 -0
FoMo4Wheat/__pycache__/__init__.cpython-39.pyc +0 -0
FoMo4Wheat/configs/__init__.py +22 -0
FoMo4Wheat/configs/__pycache__/__init__.cpython-310.pyc +0 -0
FoMo4Wheat/configs/__pycache__/__init__.cpython-311.pyc +0 -0
FoMo4Wheat/configs/__pycache__/__init__.cpython-39.pyc +0 -0
FoMo4Wheat/configs/distill/vitg2vitb_14_224.yaml +132 -0
FoMo4Wheat/configs/distill/vitg2vitb_14_518.yaml +132 -0
FoMo4Wheat/configs/distill/vitg2vitl_14_224.yaml +132 -0
FoMo4Wheat/configs/distill/vitg2vitl_14_518.yaml +132 -0
FoMo4Wheat/configs/distill_default_config.yaml +132 -0
FoMo4Wheat/configs/distill_default_config_large.yaml +132 -0
FoMo4Wheat/configs/eval/vitb14_pretrain.yaml +6 -0
FoMo4Wheat/configs/eval/vitb14_reg4_pretrain.yaml +9 -0
FoMo4Wheat/configs/eval/vitg14_pretrain.yaml +7 -0
FoMo4Wheat/configs/eval/vitg14_reg4_pretrain.yaml +10 -0
FoMo4Wheat/configs/eval/vitl14_pretrain.yaml +6 -0
FoMo4Wheat/configs/eval/vitl14_reg4_pretrain.yaml +9 -0
FoMo4Wheat/configs/eval/vits14_pretrain.yaml +6 -0
FoMo4Wheat/configs/eval/vits14_reg4_pretrain.yaml +9 -0
FoMo4Wheat/configs/ssl_default_config.yaml +119 -0
FoMo4Wheat/configs/train/vitg_14_224.yaml +30 -0
FoMo4Wheat/configs/train/vitg_14_518.yaml +32 -0
FoMo4Wheat/configs/y_distill_default_config.yaml +132 -0
FoMo4Wheat/data/__init__.py +10 -0
FoMo4Wheat/data/__pycache__/__init__.cpython-310.pyc +0 -0
FoMo4Wheat/data/__pycache__/__init__.cpython-311.pyc +0 -0
FoMo4Wheat/data/__pycache__/__init__.cpython-39.pyc +0 -0
FoMo4Wheat/data/__pycache__/adapters.cpython-310.pyc +0 -0
FoMo4Wheat/data/__pycache__/adapters.cpython-311.pyc +0 -0
FoMo4Wheat/data/__pycache__/adapters.cpython-39.pyc +0 -0
FoMo4Wheat/data/__pycache__/augmentations.cpython-310.pyc +0 -0
FoMo4Wheat/data/__pycache__/augmentations.cpython-311.pyc +0 -0
FoMo4Wheat/data/__pycache__/augmentations.cpython-39.pyc +0 -0
FoMo4Wheat/data/__pycache__/collate.cpython-310.pyc +0 -0
FoMo4Wheat/data/__pycache__/collate.cpython-311.pyc +0 -0
FoMo4Wheat/data/__pycache__/collate.cpython-39.pyc +0 -0
FoMo4Wheat/data/__pycache__/loaders.cpython-310.pyc +0 -0
FoMo4Wheat/data/__pycache__/loaders.cpython-311.pyc +0 -0
FoMo4Wheat/data/__pycache__/loaders.cpython-39.pyc +0 -0
FoMo4Wheat/data/__pycache__/masking.cpython-310.pyc +0 -0
FoMo4Wheat/data/__pycache__/masking.cpython-311.pyc +0 -0
FoMo4Wheat/data/__pycache__/masking.cpython-39.pyc +0 -0
FoMo4Wheat/data/__pycache__/samplers.cpython-310.pyc +0 -0
FoMo4Wheat/data/__pycache__/samplers.cpython-311.pyc +0 -0
FoMo4Wheat/data/__pycache__/samplers.cpython-39.pyc +0 -0

FoMo4Wheat/__init__.py ADDED Viewed

	@@ -0,0 +1,6 @@

+# Copyright (c) Meta Platforms, Inc. and affiliates.
+#
+# This source code is licensed under the Apache License, Version 2.0
+# found in the LICENSE file in the root directory of this source tree.
+__version__ = "0.0.1"  # version string of the FoMo4Wheat package

FoMo4Wheat/__pycache__/__init__.cpython-310.pyc ADDED Viewed

Binary file (183 Bytes). View file

FoMo4Wheat/__pycache__/__init__.cpython-311.pyc ADDED Viewed

Binary file (200 Bytes). View file

FoMo4Wheat/__pycache__/__init__.cpython-312.pyc ADDED Viewed

Binary file (194 Bytes). View file

FoMo4Wheat/__pycache__/__init__.cpython-38.pyc ADDED Viewed

Binary file (152 Bytes). View file

FoMo4Wheat/__pycache__/__init__.cpython-39.pyc ADDED Viewed

Binary file (181 Bytes). View file

FoMo4Wheat/configs/__init__.py ADDED Viewed

	@@ -0,0 +1,22 @@

+# Copyright (c) Meta Platforms, Inc. and affiliates.
+#
+# This source code is licensed under the Apache License, Version 2.0
+# found in the LICENSE file in the root directory of this source tree.
+import pathlib
+from omegaconf import OmegaConf
+def load_config(config_name: str):
+    config_filename = config_name + ".yaml"
+    return OmegaConf.load(pathlib.Path(__file__).parent.resolve() / config_filename)
+dinov2_default_config = load_config("ssl_default_config")  # loaded at import time; base config used by load_and_merge_config
+def load_and_merge_config(config_name: str):
+    default_config = OmegaConf.create(dinov2_default_config)
+    loaded_config = load_config(config_name)
+    return OmegaConf.merge(default_config, loaded_config)

FoMo4Wheat/configs/__pycache__/__init__.cpython-310.pyc ADDED Viewed

Binary file (731 Bytes). View file

FoMo4Wheat/configs/__pycache__/__init__.cpython-311.pyc ADDED Viewed

Binary file (1.16 kB). View file

FoMo4Wheat/configs/__pycache__/__init__.cpython-39.pyc ADDED Viewed

Binary file (731 Bytes). View file

FoMo4Wheat/configs/distill/vitg2vitb_14_224.yaml ADDED Viewed

	@@ -0,0 +1,132 @@

+MODEL:
+  WEIGHTS: ''
+compute_precision:
+  grad_scaler: true
+  teacher:
+    backbone:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: fp16
+        reduce_dtype: fp16
+        buffer_dtype: fp32
+    dino_head:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: fp16
+        reduce_dtype: fp16
+        buffer_dtype: fp32
+    ibot_head:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: fp16
+        reduce_dtype: fp16
+        buffer_dtype: fp32
+  student:
+    backbone:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: fp16
+        reduce_dtype: fp16
+        buffer_dtype: fp32
+    dino_head:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: fp16
+        reduce_dtype: fp32
+        buffer_dtype: fp32
+    ibot_head:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: fp16
+        reduce_dtype: fp32
+        buffer_dtype: fp32
+dino:
+  loss_weight: 1.0
+  head_n_prototypes: 131072
+  head_bottleneck_dim: 384
+  head_nlayers: 3
+  head_hidden_dim: 2048
+  koleo_loss_weight: 0.1
+ibot:
+  loss_weight: 1.0
+  mask_sample_probability: 0.5
+  mask_ratio_min_max:
+  - 0.1
+  - 0.5
+  separate_head: True
+  head_n_prototypes: 131072
+  head_bottleneck_dim: 256
+  head_nlayers: 3
+  head_hidden_dim: 2048
+train:
+  batch_size_per_gpu: 64
+  dataset_path: ImageNet:split=TRAIN
+  output_dir: .
+  saveckp_freq: 20
+  seed: 0
+  num_workers: 16
+  OFFICIAL_EPOCH_LENGTH: 781
+  cache_dataset: true
+  centering: sinkhorn_knopp
+student:
+  arch: vit_base
+  patch_size: 14
+  drop_path_rate: 0.0
+  layerscale: 1.0e-05
+  drop_path_uniform: true
+  pretrained_weights: ''
+  ffn_layer: "mlp"
+  block_chunks: 4
+  qkv_bias: true
+  proj_bias: true
+  ffn_bias: true
+  num_register_tokens: 4
+  interpolate_offset: 0.1
+  interpolate_antialias : false
+teacher:
+  arch: vit_giant2
+  patch_size: 14
+  drop_path_rate: 0.0
+  layerscale: 1.0e-05
+  drop_path_uniform: true
+  pretrained_weights: ''
+  ffn_layer: "swiglufused"
+  block_chunks: 4
+  qkv_bias: true
+  proj_bias: true
+  ffn_bias: true
+  momentum_teacher: 0.994
+  final_momentum_teacher: 1
+  warmup_teacher_temp: 0.04
+  teacher_temp: 0.07
+  warmup_teacher_temp_epochs: 15
+  num_register_tokens: 4
+  interpolate_offset: 0.1
+  interpolate_antialias : false
+optim:
+  epochs: 25
+  weight_decay: 0.04
+  weight_decay_end: 0.2
+  base_lr: 1e-04 # learning rate for a batch size of 1024
+  lr: 0.  # will be set after applying scaling rule
+  warmup_epochs: 0
+  min_lr: 1.0e-06
+  clip_grad: 3.0
+  freeze_last_layer_epochs: 0
+  scaling_rule: sqrt_wrt_1024
+  patch_embed_lr_mult: 0.2
+  layerwise_decay: 0.9
+  adamw_beta1: 0.9
+  adamw_beta2: 0.999
+crops:
+  global_crops_scale:
+  - 0.32
+  - 1.0
+  local_crops_number: 8
+  local_crops_scale:
+  - 0.05
+  - 0.32
+  global_crops_size: 224
+  local_crops_size: 98
+evaluation:
+  eval_period_iterations: 2500

FoMo4Wheat/configs/distill/vitg2vitb_14_518.yaml ADDED Viewed

	@@ -0,0 +1,132 @@

+MODEL:
+  WEIGHTS: ''
+compute_precision:
+  grad_scaler: true
+  teacher:
+    backbone:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: fp16
+        reduce_dtype: fp16
+        buffer_dtype: fp32
+    dino_head:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: fp16
+        reduce_dtype: fp16
+        buffer_dtype: fp32
+    ibot_head:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: fp16
+        reduce_dtype: fp16
+        buffer_dtype: fp32
+  student:
+    backbone:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: bf16
+        reduce_dtype: bf16
+        buffer_dtype: fp32
+    dino_head:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: bf16
+        reduce_dtype: fp32
+        buffer_dtype: fp32
+    ibot_head:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: bf16
+        reduce_dtype: fp32
+        buffer_dtype: fp32
+dino:
+  loss_weight: 1.0
+  head_n_prototypes: 131072
+  head_bottleneck_dim: 384
+  head_nlayers: 3
+  head_hidden_dim: 2048
+  koleo_loss_weight: 0.1
+ibot:
+  loss_weight: 1.0
+  mask_sample_probability: 0.5
+  mask_ratio_min_max:
+  - 0.1
+  - 0.5
+  separate_head: True
+  head_n_prototypes: 131072
+  head_bottleneck_dim: 256
+  head_nlayers: 3
+  head_hidden_dim: 2048
+train:
+  batch_size_per_gpu: 16
+  dataset_path: ImageNet:split=TRAIN
+  output_dir: .
+  saveckp_freq: 20
+  seed: 0
+  num_workers: 16
+  OFFICIAL_EPOCH_LENGTH: 1250
+  cache_dataset: true
+  centering: sinkhorn_knopp
+student:
+  arch: vit_base
+  patch_size: 14
+  drop_path_rate: 0.0
+  layerscale: 1.0e-05
+  drop_path_uniform: true
+  pretrained_weights: ''
+  ffn_layer: "mlp"
+  block_chunks: 4
+  qkv_bias: true
+  proj_bias: true
+  ffn_bias: true
+  num_register_tokens: 4
+  interpolate_offset: 0.1
+  interpolate_antialias : false
+teacher:
+  arch: vit_giant2
+  patch_size: 14
+  drop_path_rate: 0.4
+  layerscale: 1.0e-05
+  drop_path_uniform: true
+  pretrained_weights: ''
+  ffn_layer: "swiglufused"
+  block_chunks: 4
+  qkv_bias: true
+  proj_bias: true
+  ffn_bias: true
+  momentum_teacher: 0.994
+  final_momentum_teacher: 1
+  warmup_teacher_temp: 0.04
+  teacher_temp: 0.07
+  warmup_teacher_temp_epochs: 30
+  num_register_tokens: 4
+  interpolate_offset: 0.1
+  interpolate_antialias : false
+optim:
+  epochs: 100
+  weight_decay: 0.04
+  weight_decay_end: 0.2
+  base_lr: 5e-05 # learning rate for a batch size of 1024
+  lr: 0.  # will be set after applying scaling rule
+  warmup_epochs: 10
+  min_lr: 1.0e-06
+  clip_grad: 3.0
+  freeze_last_layer_epochs: 0
+  scaling_rule: sqrt_wrt_1024
+  patch_embed_lr_mult: 0.2
+  layerwise_decay: 0.9
+  adamw_beta1: 0.9
+  adamw_beta2: 0.999
+crops:
+  global_crops_scale:
+  - 0.32
+  - 1.0
+  local_crops_number: 8
+  local_crops_scale:
+  - 0.05
+  - 0.32
+  global_crops_size: 518
+  local_crops_size: 98
+evaluation:
+  eval_period_iterations: 1250

FoMo4Wheat/configs/distill/vitg2vitl_14_224.yaml ADDED Viewed

	@@ -0,0 +1,132 @@

+MODEL:
+  WEIGHTS: ''
+compute_precision:
+  grad_scaler: true
+  teacher:
+    backbone:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: fp16
+        reduce_dtype: fp16
+        buffer_dtype: fp32
+    dino_head:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: fp16
+        reduce_dtype: fp16
+        buffer_dtype: fp32
+    ibot_head:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: fp16
+        reduce_dtype: fp16
+        buffer_dtype: fp32
+  student:
+    backbone:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: fp16
+        reduce_dtype: fp16
+        buffer_dtype: fp32
+    dino_head:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: fp16
+        reduce_dtype: fp32
+        buffer_dtype: fp32
+    ibot_head:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: fp16
+        reduce_dtype: fp32
+        buffer_dtype: fp32
+dino:
+  loss_weight: 1.0
+  head_n_prototypes: 131072
+  head_bottleneck_dim: 384
+  head_nlayers: 3
+  head_hidden_dim: 2048
+  koleo_loss_weight: 0.1
+ibot:
+  loss_weight: 1.0
+  mask_sample_probability: 0.5
+  mask_ratio_min_max:
+  - 0.1
+  - 0.5
+  separate_head: True
+  head_n_prototypes: 131072
+  head_bottleneck_dim: 256
+  head_nlayers: 3
+  head_hidden_dim: 2048
+train:
+  batch_size_per_gpu: 64
+  dataset_path: ImageNet:split=TRAIN
+  output_dir: .
+  saveckp_freq: 20
+  seed: 0
+  num_workers: 16
+  OFFICIAL_EPOCH_LENGTH: 781
+  cache_dataset: true
+  centering: sinkhorn_knopp
+student:
+  arch: vit_large
+  patch_size: 14
+  drop_path_rate: 0.0
+  layerscale: 1.0e-05
+  drop_path_uniform: true
+  pretrained_weights: 'dinov2_vitl14_reg4_pretrain.pth'
+  ffn_layer: "mlp"
+  block_chunks: 4
+  qkv_bias: true
+  proj_bias: true
+  ffn_bias: true
+  num_register_tokens: 4
+  interpolate_offset: 0.1
+  interpolate_antialias : false
+teacher:
+  arch: vit_giant2
+  patch_size: 14
+  drop_path_rate: 0.0
+  layerscale: 1.0e-05
+  drop_path_uniform: true
+  pretrained_weights: ''
+  ffn_layer: "swiglufused"
+  block_chunks: 4
+  qkv_bias: true
+  proj_bias: true
+  ffn_bias: true
+  momentum_teacher: 0.994
+  final_momentum_teacher: 1
+  warmup_teacher_temp: 0.04
+  teacher_temp: 0.07
+  warmup_teacher_temp_epochs: 15
+  num_register_tokens: 4
+  interpolate_offset: 0.1
+  interpolate_antialias : false
+optim:
+  epochs: 25
+  weight_decay: 0.04
+  weight_decay_end: 0.2
+  base_lr: 1e-04 # learning rate for a batch size of 1024
+  lr: 0.  # will be set after applying scaling rule
+  warmup_epochs: 0
+  min_lr: 1.0e-06
+  clip_grad: 3.0
+  freeze_last_layer_epochs: 0
+  scaling_rule: sqrt_wrt_1024
+  patch_embed_lr_mult: 0.2
+  layerwise_decay: 0.9
+  adamw_beta1: 0.9
+  adamw_beta2: 0.999
+crops:
+  global_crops_scale:
+  - 0.32
+  - 1.0
+  local_crops_number: 8
+  local_crops_scale:
+  - 0.05
+  - 0.32
+  global_crops_size: 224
+  local_crops_size: 98
+evaluation:
+  eval_period_iterations: 2500

FoMo4Wheat/configs/distill/vitg2vitl_14_518.yaml ADDED Viewed

	@@ -0,0 +1,132 @@

+MODEL:
+  WEIGHTS: ''
+compute_precision:
+  grad_scaler: true
+  teacher:
+    backbone:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: fp16
+        reduce_dtype: fp16
+        buffer_dtype: fp32
+    dino_head:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: fp16
+        reduce_dtype: fp16
+        buffer_dtype: fp32
+    ibot_head:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: fp16
+        reduce_dtype: fp16
+        buffer_dtype: fp32
+  student:
+    backbone:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: bf16
+        reduce_dtype: bf16
+        buffer_dtype: fp32
+    dino_head:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: bf16
+        reduce_dtype: fp32
+        buffer_dtype: fp32
+    ibot_head:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: bf16
+        reduce_dtype: fp32
+        buffer_dtype: fp32
+dino:
+  loss_weight: 1.0
+  head_n_prototypes: 131072
+  head_bottleneck_dim: 384
+  head_nlayers: 3
+  head_hidden_dim: 2048
+  koleo_loss_weight: 0.1
+ibot:
+  loss_weight: 1.0
+  mask_sample_probability: 0.5
+  mask_ratio_min_max:
+  - 0.1
+  - 0.5
+  separate_head: True
+  head_n_prototypes: 131072
+  head_bottleneck_dim: 256
+  head_nlayers: 3
+  head_hidden_dim: 2048
+train:
+  batch_size_per_gpu: 16
+  dataset_path: ImageNet:split=TRAIN
+  output_dir: .
+  saveckp_freq: 20
+  seed: 0
+  num_workers: 16
+  OFFICIAL_EPOCH_LENGTH: 1250
+  cache_dataset: true
+  centering: sinkhorn_knopp
+student:
+  arch: vit_large
+  patch_size: 14
+  drop_path_rate: 0.0
+  layerscale: 1.0e-05
+  drop_path_uniform: true
+  pretrained_weights: ''
+  ffn_layer: "mlp"
+  block_chunks: 4
+  qkv_bias: true
+  proj_bias: true
+  ffn_bias: true
+  num_register_tokens: 4
+  interpolate_offset: 0.1
+  interpolate_antialias : false
+teacher:
+  arch: vit_giant2
+  patch_size: 14
+  drop_path_rate: 0.4
+  layerscale: 1.0e-05
+  drop_path_uniform: true
+  pretrained_weights: ''
+  ffn_layer: "swiglufused"
+  block_chunks: 4
+  qkv_bias: true
+  proj_bias: true
+  ffn_bias: true
+  momentum_teacher: 0.994
+  final_momentum_teacher: 1
+  warmup_teacher_temp: 0.04
+  teacher_temp: 0.07
+  warmup_teacher_temp_epochs: 30
+  num_register_tokens: 4
+  interpolate_offset: 0.1
+  interpolate_antialias : false
+optim:
+  epochs: 100
+  weight_decay: 0.04
+  weight_decay_end: 0.2
+  base_lr: 5e-05 # learning rate for a batch size of 1024
+  lr: 0.  # will be set after applying scaling rule
+  warmup_epochs: 10
+  min_lr: 1.0e-06
+  clip_grad: 3.0
+  freeze_last_layer_epochs: 0
+  scaling_rule: sqrt_wrt_1024
+  patch_embed_lr_mult: 0.2
+  layerwise_decay: 0.9
+  adamw_beta1: 0.9
+  adamw_beta2: 0.999
+crops:
+  global_crops_scale:
+  - 0.32
+  - 1.0
+  local_crops_number: 8
+  local_crops_scale:
+  - 0.05
+  - 0.32
+  global_crops_size: 518
+  local_crops_size: 98
+evaluation:
+  eval_period_iterations: 1250

FoMo4Wheat/configs/distill_default_config.yaml ADDED Viewed

	@@ -0,0 +1,132 @@

+MODEL:
+  WEIGHTS: ''
+compute_precision:
+  grad_scaler: true
+  teacher:
+    backbone:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: fp16
+        reduce_dtype: fp16
+        buffer_dtype: fp32
+    dino_head:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: fp16
+        reduce_dtype: fp16
+        buffer_dtype: fp32
+    ibot_head:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: fp16
+        reduce_dtype: fp16
+        buffer_dtype: fp32
+  student:
+    backbone:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: bf16
+        reduce_dtype: bf16
+        buffer_dtype: fp32
+    dino_head:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: bf16
+        reduce_dtype: fp32
+        buffer_dtype: fp32
+    ibot_head:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: bf16
+        reduce_dtype: fp32
+        buffer_dtype: fp32
+dino:
+  loss_weight: 1.0
+  head_n_prototypes: 131072
+  head_bottleneck_dim: 384
+  head_nlayers: 3
+  head_hidden_dim: 2048
+  koleo_loss_weight: -1
+ibot:
+  loss_weight: 1.0
+  mask_sample_probability: 0.5
+  mask_ratio_min_max:
+  - 0.1
+  - 0.5
+  separate_head: True
+  head_n_prototypes: 131072
+  head_bottleneck_dim: 256
+  head_nlayers: 3
+  head_hidden_dim: 2048
+train:
+  batch_size_per_gpu: 16
+  dataset_path: ImageNet:split=TRAIN
+  output_dir: .
+  saveckp_freq: 20
+  seed: 0
+  num_workers: 16
+  OFFICIAL_EPOCH_LENGTH: 1250
+  cache_dataset: true
+  centering: sinkhorn_knopp
+student:
+  arch: vit_base
+  patch_size: 14
+  drop_path_rate: 0.0
+  layerscale: 1.0e-05
+  drop_path_uniform: true
+  pretrained_weights: ''
+  ffn_layer: "mlp"
+  block_chunks: 4
+  qkv_bias: true
+  proj_bias: true
+  ffn_bias: true
+  num_register_tokens: 4
+  interpolate_offset: 0.1
+  interpolate_antialias : false
+teacher:
+  arch: vit_giant2
+  patch_size: 14
+  drop_path_rate: 0.4
+  layerscale: 1.0e-05
+  drop_path_uniform: true
+  pretrained_weights: '/hpc/home/2023222003/Phenix/wheat/foundation_model/distill_pretrain/518_vitg/teacher_checkpoint.pth'
+  ffn_layer: "swiglufused"
+  block_chunks: 4
+  qkv_bias: true
+  proj_bias: true
+  ffn_bias: true
+  momentum_teacher: 0.994
+  final_momentum_teacher: 1
+  warmup_teacher_temp: 0.04
+  teacher_temp: 0.07
+  warmup_teacher_temp_epochs: 30
+  num_register_tokens: 4
+  interpolate_offset: 0.1
+  interpolate_antialias : false
+optim:
+  epochs: 100
+  weight_decay: 0.04
+  weight_decay_end: 0.2
+  base_lr: 1e-04 # learning rate for a batch size of 1024
+  lr: 0.  # will be set after applying scaling rule
+  warmup_epochs: 10
+  min_lr: 1.0e-06
+  clip_grad: 3.0
+  freeze_last_layer_epochs: 0
+  scaling_rule: sqrt_wrt_1024
+  patch_embed_lr_mult: 0.2
+  layerwise_decay: 1
+  adamw_beta1: 0.9
+  adamw_beta2: 0.999
+crops:
+  global_crops_scale:
+  - 0.32
+  - 1.0
+  local_crops_number: 8
+  local_crops_scale:
+  - 0.05
+  - 0.32
+  global_crops_size: 518
+  local_crops_size: 98
+evaluation:
+  eval_period_iterations: 2500

FoMo4Wheat/configs/distill_default_config_large.yaml ADDED Viewed

	@@ -0,0 +1,132 @@

+MODEL:
+  WEIGHTS: ''
+compute_precision:
+  grad_scaler: true
+  teacher:
+    backbone:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: fp16
+        reduce_dtype: fp16
+        buffer_dtype: fp32
+    dino_head:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: fp16
+        reduce_dtype: fp16
+        buffer_dtype: fp32
+    ibot_head:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: fp16
+        reduce_dtype: fp16
+        buffer_dtype: fp32
+  student:
+    backbone:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: bf16
+        reduce_dtype: bf16
+        buffer_dtype: fp32
+    dino_head:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: bf16
+        reduce_dtype: fp32
+        buffer_dtype: fp32
+    ibot_head:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: bf16
+        reduce_dtype: fp32
+        buffer_dtype: fp32
+dino:
+  loss_weight: 1.0
+  head_n_prototypes: 131072
+  head_bottleneck_dim: 384
+  head_nlayers: 3
+  head_hidden_dim: 2048
+  koleo_loss_weight: -1
+ibot:
+  loss_weight: 1.0
+  mask_sample_probability: 0.5
+  mask_ratio_min_max:
+  - 0.1
+  - 0.5
+  separate_head: True
+  head_n_prototypes: 131072
+  head_bottleneck_dim: 256
+  head_nlayers: 3
+  head_hidden_dim: 2048
+train:
+  batch_size_per_gpu: 16
+  dataset_path: ImageNet:split=TRAIN
+  output_dir: .
+  saveckp_freq: 20
+  seed: 0
+  num_workers: 16
+  OFFICIAL_EPOCH_LENGTH: 1250
+  cache_dataset: true
+  centering: sinkhorn_knopp
+student:
+  arch: vit_large
+  patch_size: 14
+  drop_path_rate: 0.0
+  layerscale: 1.0e-05
+  drop_path_uniform: true
+  pretrained_weights: ''
+  ffn_layer: "mlp"
+  block_chunks: 4
+  qkv_bias: true
+  proj_bias: true
+  ffn_bias: true
+  num_register_tokens: 4
+  interpolate_offset: 0.1
+  interpolate_antialias : false
+teacher:
+  arch: vit_giant2
+  patch_size: 14
+  drop_path_rate: 0.4
+  layerscale: 1.0e-05
+  drop_path_uniform: true
+  pretrained_weights: '/hpc/home/2023222003/Phenix/wheat/foundation_model/distill_pretrain/518_vitg/teacher_checkpoint.pth'
+  ffn_layer: "swiglufused"
+  block_chunks: 4
+  qkv_bias: true
+  proj_bias: true
+  ffn_bias: true
+  momentum_teacher: 0.994
+  final_momentum_teacher: 1
+  warmup_teacher_temp: 0.04
+  teacher_temp: 0.07
+  warmup_teacher_temp_epochs: 30
+  num_register_tokens: 4
+  interpolate_offset: 0.1
+  interpolate_antialias : false
+optim:
+  epochs: 100
+  weight_decay: 0.04
+  weight_decay_end: 0.2
+  base_lr: 1e-04 # learning rate for a batch size of 1024
+  lr: 0.  # will be set after applying scaling rule
+  warmup_epochs: 10
+  min_lr: 1.0e-06
+  clip_grad: 3.0
+  freeze_last_layer_epochs: 0
+  scaling_rule: sqrt_wrt_1024
+  patch_embed_lr_mult: 0.2
+  layerwise_decay: 1
+  adamw_beta1: 0.9
+  adamw_beta2: 0.999
+crops:
+  global_crops_scale:
+  - 0.32
+  - 1.0
+  local_crops_number: 8
+  local_crops_scale:
+  - 0.05
+  - 0.32
+  global_crops_size: 518
+  local_crops_size: 98
+evaluation:
+  eval_period_iterations: 2500

FoMo4Wheat/configs/eval/vitb14_pretrain.yaml ADDED Viewed

	@@ -0,0 +1,6 @@

+student:
+  arch: vit_base
+  patch_size: 14
+crops:
+  global_crops_size: 518  # this is to set up the position embeddings properly
+  local_crops_size: 98

FoMo4Wheat/configs/eval/vitb14_reg4_pretrain.yaml ADDED Viewed

	@@ -0,0 +1,9 @@

+student:
+  arch: vit_base
+  patch_size: 14
+  num_register_tokens: 4
+  interpolate_antialias: true
+  interpolate_offset: 0.0
+crops:
+  global_crops_size: 518  # this is to set up the position embeddings properly
+  local_crops_size: 98

FoMo4Wheat/configs/eval/vitg14_pretrain.yaml ADDED Viewed

	@@ -0,0 +1,7 @@

+student:
+  arch: vit_giant2
+  patch_size: 14
+  ffn_layer: swiglufused
+crops:
+  global_crops_size: 518  # this is to set up the position embeddings properly
+  local_crops_size: 98

FoMo4Wheat/configs/eval/vitg14_reg4_pretrain.yaml ADDED Viewed

	@@ -0,0 +1,10 @@

+student:
+  arch: vit_giant2
+  patch_size: 14
+  ffn_layer: swiglufused
+  num_register_tokens: 4
+  interpolate_antialias: true
+  interpolate_offset: 0.0
+crops:
+  global_crops_size: 518  # this is to set up the position embeddings properly
+  local_crops_size: 98

FoMo4Wheat/configs/eval/vitl14_pretrain.yaml ADDED Viewed

	@@ -0,0 +1,6 @@

+student:
+  arch: vit_large
+  patch_size: 14
+crops:
+  global_crops_size: 518  # this is to set up the position embeddings properly
+  local_crops_size: 98

FoMo4Wheat/configs/eval/vitl14_reg4_pretrain.yaml ADDED Viewed

	@@ -0,0 +1,9 @@

+student:
+  arch: vit_large
+  patch_size: 14
+  num_register_tokens: 4
+  interpolate_antialias: true
+  interpolate_offset: 0.0
+crops:
+  global_crops_size: 518  # this is to set up the position embeddings properly
+  local_crops_size: 98

FoMo4Wheat/configs/eval/vits14_pretrain.yaml ADDED Viewed

	@@ -0,0 +1,6 @@

+student:
+  arch: vit_small
+  patch_size: 14
+crops:
+  global_crops_size: 518  # this is to set up the position embeddings properly
+  local_crops_size: 98

FoMo4Wheat/configs/eval/vits14_reg4_pretrain.yaml ADDED Viewed

	@@ -0,0 +1,9 @@

+student:
+  arch: vit_small
+  patch_size: 14
+  num_register_tokens: 4
+  interpolate_antialias: true
+  interpolate_offset: 0.0
+crops:
+  global_crops_size: 518  # this is to set up the position embeddings properly
+  local_crops_size: 98

FoMo4Wheat/configs/ssl_default_config.yaml ADDED Viewed

	@@ -0,0 +1,119 @@

+MODEL:
+  WEIGHTS: ''
+compute_precision:
+  grad_scaler: true
+  teacher:
+    backbone:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: fp16
+        reduce_dtype: fp16
+        buffer_dtype: fp32
+    dino_head:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: fp16
+        reduce_dtype: fp16
+        buffer_dtype: fp32
+    ibot_head:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: fp16
+        reduce_dtype: fp16
+        buffer_dtype: fp32
+  student:
+    backbone:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: fp16
+        reduce_dtype: fp16
+        buffer_dtype: fp32
+    dino_head:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: fp16
+        reduce_dtype: fp32
+        buffer_dtype: fp32
+    ibot_head:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: fp16
+        reduce_dtype: fp32
+        buffer_dtype: fp32
+dino:
+  loss_weight: 1.0
+  head_n_prototypes: 65536
+  head_bottleneck_dim: 256
+  head_nlayers: 3
+  head_hidden_dim: 2048
+  koleo_loss_weight: 0.1
+ibot:
+  loss_weight: 1.0
+  mask_sample_probability: 0.5
+  mask_ratio_min_max:
+  - 0.1
+  - 0.5
+  separate_head: false
+  head_n_prototypes: 65536
+  head_bottleneck_dim: 256
+  head_nlayers: 3
+  head_hidden_dim: 2048
+train:
+  batch_size_per_gpu: 64
+  dataset_path: ImageNet:split=TRAIN
+  output_dir: .
+  saveckp_freq: 20
+  seed: 0
+  num_workers: 6
+  OFFICIAL_EPOCH_LENGTH: 1250
+  cache_dataset: true
+  centering: "centering" # or "sinkhorn_knopp"
+student:
+  arch: vit_large
+  patch_size: 16
+  drop_path_rate: 0.3
+  layerscale: 1.0e-05
+  drop_path_uniform: true
+  pretrained_weights: ''
+  ffn_layer: "mlp"
+  block_chunks: 0
+  qkv_bias: true
+  proj_bias: true
+  ffn_bias: true
+  num_register_tokens: 4
+  interpolate_antialias: false
+  interpolate_offset: 0.1
+teacher:
+  momentum_teacher: 0.992
+  final_momentum_teacher: 1
+  warmup_teacher_temp: 0.04
+  teacher_temp: 0.07
+  warmup_teacher_temp_epochs: 30
+optim:
+  epochs: 100
+  weight_decay: 0.04
+  weight_decay_end: 0.4
+  base_lr: 0.004  # learning rate for a batch size of 1024
+  lr: 0.  # will be set after applying scaling rule
+  warmup_epochs: 10
+  min_lr: 1.0e-06
+  clip_grad: 3.0
+  freeze_last_layer_epochs: 1
+  freeze_backbone_layer_epochs: 0
+  scaling_rule: sqrt_wrt_1024
+  patch_embed_lr_mult: 0.2
+  layerwise_decay: 0.9
+  adamw_beta1: 0.9
+  adamw_beta2: 0.999
+crops:
+  global_crops_scale:
+  - 0.32
+  - 1.0
+  local_crops_number: 8
+  local_crops_scale:
+  - 0.05
+  - 0.32
+  global_crops_size: 224
+  local_crops_size: 96
+evaluation:
+  eval_period_iterations: 12500

FoMo4Wheat/configs/train/vitg_14_224.yaml ADDED Viewed

	@@ -0,0 +1,30 @@

+dino:
+  head_n_prototypes: 131072
+  head_bottleneck_dim: 384
+ibot:
+  separate_head: true
+  head_n_prototypes: 131072
+train:
+  batch_size_per_gpu: 12
+  dataset_path: TestDataset
+  centering: sinkhorn_knopp
+student:
+  arch: vit_giant2
+  patch_size: 14
+  drop_path_rate: 0.4
+  ffn_layer: swiglufused
+  block_chunks: 4
+  pretrained_weights: ''
+teacher:
+  momentum_teacher: 0.994
+  pretrained_weights: ''
+optim:
+  epochs: 200
+  weight_decay_end: 0.2
+  base_lr: 6.25e-05  # learning rate for a batch size of 1024
+  warmup_epochs: 40
+  layerwise_decay: 1.0
+  freeze_last_layer_epochs: 0
+  freeze_backbone_layer_epochs: 20
+crops:
+  local_crops_size: 98

FoMo4Wheat/configs/train/vitg_14_518.yaml ADDED Viewed

	@@ -0,0 +1,32 @@

+dino:
+  head_n_prototypes: 131072
+  head_bottleneck_dim: 384
+ibot:
+  separate_head: true
+  head_n_prototypes: 131072
+train:
+  batch_size_per_gpu: 2
+  dataset_path: ImageNet22k
+  centering: sinkhorn_knopp
+student:
+  arch: vit_giant2
+  patch_size: 14
+  drop_path_rate: 0.4
+  ffn_layer: swiglufused
+  block_chunks: 4
+  pretrained_weights: ''
+teacher:
+  momentum_teacher: 0.994
+  pretrained_weights: ''
+optim:
+  epochs: 75
+  weight_decay_end: 0.2
+  base_lr: 1e-06  # learning rate for a batch size of 1024
+  min_lr: 1e-07
+  warmup_epochs: 0
+  layerwise_decay: 1.0
+  freeze_last_layer_epochs: 0
+  freeze_backbone_layer_epochs: 20
+crops:
+  local_crops_size: 98
+  global_crops_size: 518

FoMo4Wheat/configs/y_distill_default_config.yaml ADDED Viewed

	@@ -0,0 +1,132 @@

+MODEL:
+  WEIGHTS: ''
+compute_precision:
+  grad_scaler: true
+  teacher:
+    backbone:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: fp16
+        reduce_dtype: fp16
+        buffer_dtype: fp32
+    dino_head:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: fp16
+        reduce_dtype: fp16
+        buffer_dtype: fp32
+    ibot_head:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: fp16
+        reduce_dtype: fp16
+        buffer_dtype: fp32
+  student:
+    backbone:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: bf16
+        reduce_dtype: bf16
+        buffer_dtype: fp32
+    dino_head:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: bf16
+        reduce_dtype: fp32
+        buffer_dtype: fp32
+    ibot_head:
+      sharding_strategy: SHARD_GRAD_OP
+      mixed_precision:
+        param_dtype: bf16
+        reduce_dtype: fp32
+        buffer_dtype: fp32
+dino:
+  loss_weight: 1.0
+  head_n_prototypes: 131072
+  head_bottleneck_dim: 384
+  head_nlayers: 3
+  head_hidden_dim: 2048
+  koleo_loss_weight: -1
+ibot:
+  loss_weight: 1.0
+  mask_sample_probability: 0.5
+  mask_ratio_min_max:
+  - 0.1
+  - 0.5
+  separate_head: true
+  head_n_prototypes: 131072
+  head_bottleneck_dim: 256
+  head_nlayers: 3
+  head_hidden_dim: 2048
+train:
+  batch_size_per_gpu: 64
+  dataset_path: ImageNet:split=TRAIN
+  output_dir: .
+  saveckp_freq: 20
+  seed: 0
+  num_workers: 6
+  OFFICIAL_EPOCH_LENGTH: 1250
+  cache_dataset: true
+  centering: sinkhorn_knopp
+student:
+  arch: vit_base
+  patch_size: 14
+  drop_path_rate: 0.0
+  layerscale: 1.0e-05
+  drop_path_uniform: true
+  pretrained_weights: ''
+  ffn_layer: "mlp"
+  block_chunks: 4
+  qkv_bias: true
+  proj_bias: true
+  ffn_bias: true
+  num_register_tokens: 4
+  interpolate_offset: 0.1
+  interpolate_antialias: false
+teacher:
+  arch: vit_giant2
+  patch_size: 14
+  drop_path_rate: 0.4
+  layerscale: 1.0e-05
+  drop_path_uniform: true
+  pretrained_weights: '/hpc/home/2023222003/Phenix/wheat/foundation_model/distill_pretrain/518_vitg/downsampling_pos_embed_from_518_to_224__checkpoint.pth'
+  ffn_layer: "swiglufused"
+  block_chunks: 4
+  qkv_bias: true
+  proj_bias: true
+  ffn_bias: true
+  momentum_teacher: 0.994
+  final_momentum_teacher: 1
+  warmup_teacher_temp: 0.04
+  teacher_temp: 0.07
+  warmup_teacher_temp_epochs: 30
+  num_register_tokens: 4
+  interpolate_offset: 0.1
+  interpolate_antialias: false
+optim:
+  epochs: 100
+  weight_decay: 0.04
+  weight_decay_end: 0.2
+  base_lr: 1e-04 # learning rate for a batch size of 1024
+  lr: 0.  # will be set after applying scaling rule
+  warmup_epochs: 10
+  min_lr: 1.0e-06
+  clip_grad: 3.0
+  freeze_last_layer_epochs: 0
+  scaling_rule: sqrt_wrt_1024
+  patch_embed_lr_mult: 0.2
+  layerwise_decay: 1
+  adamw_beta1: 0.9
+  adamw_beta2: 0.999
+crops:
+  global_crops_scale:
+  - 0.32
+  - 1.0
+  local_crops_number: 8
+  local_crops_scale:
+  - 0.05
+  - 0.32
+  global_crops_size: 224
+  local_crops_size: 98
+evaluation:
+  eval_period_iterations: 2500

FoMo4Wheat/data/__init__.py ADDED Viewed

	@@ -0,0 +1,10 @@

+# Copyright (c) Meta Platforms, Inc. and affiliates.
+#
+# This source code is licensed under the Apache License, Version 2.0
+# found in the LICENSE file in the root directory of this source tree.
+from .adapters import DatasetWithEnumeratedTargets
+from .loaders import make_data_loader, make_dataset, SamplerType
+from .collate import collate_data_and_cast
+from .masking import MaskingGenerator
+from .augmentations import DataAugmentationDINO

FoMo4Wheat/data/__pycache__/__init__.cpython-310.pyc ADDED Viewed

Binary file (480 Bytes). View file

FoMo4Wheat/data/__pycache__/__init__.cpython-311.pyc ADDED Viewed

Binary file (588 Bytes). View file

FoMo4Wheat/data/__pycache__/__init__.cpython-39.pyc ADDED Viewed

Binary file (478 Bytes). View file

FoMo4Wheat/data/__pycache__/adapters.cpython-310.pyc ADDED Viewed

Binary file (1.41 kB). View file

FoMo4Wheat/data/__pycache__/adapters.cpython-311.pyc ADDED Viewed

Binary file (1.97 kB). View file

FoMo4Wheat/data/__pycache__/adapters.cpython-39.pyc ADDED Viewed

Binary file (1.41 kB). View file

FoMo4Wheat/data/__pycache__/augmentations.cpython-310.pyc ADDED Viewed

Binary file (2.62 kB). View file

FoMo4Wheat/data/__pycache__/augmentations.cpython-311.pyc ADDED Viewed

Binary file (5.11 kB). View file

FoMo4Wheat/data/__pycache__/augmentations.cpython-39.pyc ADDED Viewed

Binary file (2.61 kB). View file

FoMo4Wheat/data/__pycache__/collate.cpython-310.pyc ADDED Viewed

Binary file (1.62 kB). View file

FoMo4Wheat/data/__pycache__/collate.cpython-311.pyc ADDED Viewed

Binary file (3.61 kB). View file

FoMo4Wheat/data/__pycache__/collate.cpython-39.pyc ADDED Viewed

Binary file (1.65 kB). View file

FoMo4Wheat/data/__pycache__/loaders.cpython-310.pyc ADDED Viewed

Binary file (5.66 kB). View file

FoMo4Wheat/data/__pycache__/loaders.cpython-311.pyc ADDED Viewed

Binary file (8.86 kB). View file

FoMo4Wheat/data/__pycache__/loaders.cpython-39.pyc ADDED Viewed

Binary file (5.6 kB). View file

FoMo4Wheat/data/__pycache__/masking.cpython-310.pyc ADDED Viewed

Binary file (2.32 kB). View file

FoMo4Wheat/data/__pycache__/masking.cpython-311.pyc ADDED Viewed

Binary file (4.14 kB). View file

FoMo4Wheat/data/__pycache__/masking.cpython-39.pyc ADDED Viewed

Binary file (2.29 kB). View file

FoMo4Wheat/data/__pycache__/samplers.cpython-310.pyc ADDED Viewed

Binary file (6.53 kB). View file

FoMo4Wheat/data/__pycache__/samplers.cpython-311.pyc ADDED Viewed

Binary file (11.7 kB). View file

FoMo4Wheat/data/__pycache__/samplers.cpython-39.pyc ADDED Viewed

Binary file (6.46 kB). View file