File size: 1,257 Bytes
2b17178
19ecef7
2b17178
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
{
  "model_id": "google/siglip2-so400m-patch14-384",
  "dataset": "apartments",
  "apartments_jsonl": "data/apartments/question-image-dataset_labeled.jsonl",
  "apartments_images_dir": "data/apartments/images",
  "fmnist_root": "data",
  "output_root": "models",
  "run_name": null,
  "batch_size": 8,
  "stack_size": 1,
  "max_steps": 5000,
  "eval_interval": 10,
  "eval_batches": 2,
  "checkpoint_interval": 1000,
  "checkpoint_mode": "max_val_acc",
  "val_ratio": 0.1,
  "seed": 42,
  "num_workers_train": 4,
  "num_workers_val": 2,
  "lr_backbone": 2e-6,
  "lr_head": 0.0003,
  "weight_decay": 0.0,
  "freeze_backbone": false,
  "attention_heads": 2,
  "attention_dropout": 0.3,
  "image_self_attention_layers": 0,
  "head_hidden_dim": 512,
  "head_num_layers": 1,
  "head_dropout": 0.3,
  "head_activation": "swiglu",
  "label_smoothing": 0.05,
  "compile_model": false,
  "compile_fallback_to_eager": true,
  "resume_path": null,
  "min_free_space_gb": 1.0,
  "use_wandb": true,
  "wandb_project": "flash-judge",
  "wandb_entity": null,
  "wandb_run_name": null,
  "save_artifacts": true,
  "push_to_hub": true,
  "hub_org": "FuncAI",
  "hub_repo_name": "FlashJudge",
  "hub_private": false,
  "hub_token": null,
  "device": null,
  "use_amp": true
}