DornierDo17 committed on
Commit
a8d47f4
·
verified ·
1 Parent(s): c21621a

Upload folder using huggingface_hub

Browse files
Files changed (2) hide show
  1. config.toml +69 -0
  2. model.pt +3 -0
config.toml ADDED
@@ -0,0 +1,69 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed = 6
2
+ sampling_seed = 6
3
+ train_dataset_seed = 11
4
+ val_dataset_seed = 43
5
+ normalize_embeddings = true
6
+ mixed_precision = "bf16"
7
+ weight_init = "kaiming"
8
+ dataset = "nq"
9
+ max_seq_length = 32
10
+ unsup_emb = "stella"
11
+ sup_emb = "gte"
12
+ n_embs_per_batch = 1
13
+ finetune_mode = false
14
+ noise_level = 0.0
15
+ style = "res_mlp"
16
+ norm_style = "batch"
17
+ depth = 3
18
+ transform_depth = 4
19
+ d_adapter = 1024
20
+ d_hidden = 1024
21
+ d_transform = 1024
22
+ use_small_output_adapters = false
23
+ use_residual_adapters = true
24
+ gan_style = "least_squares"
25
+ disc_depth = 5
26
+ disc_dim = 1024
27
+ use_residual = true
28
+ bs = 256
29
+ gradient_accumulation_steps = 1
30
+ lr = 2e-5
31
+ no_scheduler = true
32
+ max_grad_norm = 1.0
33
+ loss_coefficient_reverse_rec = 0.0
34
+ loss_coefficient_rec = 1.0
35
+ loss_coefficient_vsp = 1.0
36
+ loss_coefficient_cc_trans = 10.0
37
+ loss_coefficient_cc_rec = 0.0
38
+ loss_coefficient_cc_vsp = 10.0
39
+ loss_coefficient_r1_penalty = 0.01
40
+ warmup_length = 2000
41
+ patience = 20
42
+ min_delta = 0.0
43
+ min_epochs = 80
44
+ disc_lr = 1e-5
45
+ eps = 6.25e-10
46
+ smooth = 0.9
47
+ loss_coefficient_disc = 1.0
48
+ loss_coefficient_gen = 1.0
49
+ loss_coefficient_latent_gen = 1.0
50
+ loss_coefficient_similarity_gen = 0.0
51
+ val_size = 4096
52
+ val_bs = 1024
53
+ top_k_size = 1024
54
+ top_k_batches = 4
55
+ k = 16
56
+ heatmap_size = 64
57
+ use_wandb = true
58
+ wandb_project = "unsupervised_disc"
59
+ wandb_name = "e:100,n:400000"
60
+ load_dir = "./finetuning_unsupervised/n:100000,e:10,s:n_double,d:4,d:4,d:64/"
61
+ save_dir = "./finetuning_unsupervised/{}/"
62
+ force_dump = true
63
+ epochs = 100
64
+ num_points = 400000
65
+ num_params = 21004800
66
+ num_disc_params = 3943425
67
+ num_sup_disc_params = 3943425
68
+ num_latent_disc_params = 4205569
69
+ num_similarity_disc_params = 3419137
model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:373a4a1b70e55a1c69f920f51d3365bd13fb78af8e50d88dea5f0256cb1c3414
3
+ size 84091695