DornierDo17 committed on
Commit
bc01282
·
verified ·
1 Parent(s): 179a358

Upload folder using huggingface_hub

Browse files
Files changed (2) hide show
  1. config.toml +66 -0
  2. model.pt +3 -0
config.toml ADDED
@@ -0,0 +1,66 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed = 5
2
+ sampling_seed = 5
3
+ train_dataset_seed = 10
4
+ val_dataset_seed = 42
5
+ normalize_embeddings = true
6
+ mixed_precision = "fp16"
7
+ weight_init = "kaiming"
8
+ dataset = "nq"
9
+ max_seq_length = 64
10
+ unsup_emb = "stella"
11
+ sup_emb = "gte"
12
+ n_embs_per_batch = 1
13
+ finetune_mode = false
14
+ noise_level = 0.0
15
+ style = "res_mlp"
16
+ norm_style = "batch"
17
+ depth = 3
18
+ transform_depth = 4
19
+ d_adapter = 1024
20
+ d_hidden = 1024
21
+ d_transform = 1024
22
+ use_small_output_adapters = false
23
+ use_residual_adapters = true
24
+ gan_style = "least_squares"
25
+ disc_depth = 5
26
+ disc_dim = 1024
27
+ use_residual = true
28
+ bs = 256
29
+ gradient_accumulation_steps = 1
30
+ lr = 2e-5
31
+ no_scheduler = true
32
+ max_grad_norm = 1000.0
33
+ loss_coefficient_reverse_rec = 0.0
34
+ loss_coefficient_rec = 1.0
35
+ loss_coefficient_vsp = 1.0
36
+ loss_coefficient_cc_trans = 10.0
37
+ loss_coefficient_cc_rec = 0.0
38
+ loss_coefficient_cc_vsp = 10.0
39
+ loss_coefficient_r1_penalty = 0.0
40
+ warmup_length = 2000
41
+ disc_lr = 1e-5
42
+ eps = 6.25e-10
43
+ smooth = 0.9
44
+ loss_coefficient_disc = 1.0
45
+ loss_coefficient_gen = 1.0
46
+ loss_coefficient_latent_gen = 1.0
47
+ loss_coefficient_similarity_gen = 0.0
48
+ val_size = 4096
49
+ val_bs = 1024
50
+ top_k_size = 1024
51
+ top_k_batches = 4
52
+ k = 16
53
+ heatmap_size = 64
54
+ use_wandb = true
55
+ wandb_project = "unsupervised"
56
+ wandb_name = "n:1000000,e:2000,u:stella,s:gte"
57
+ load_dir = "./finetuning_unsupervised/n:100000,e:10,s:n_double,d:4,d:4,d:64/"
58
+ save_dir = "./finetuning_unsupervised/{}/"
59
+ force_dump = true
60
+ num_points = 1000000
61
+ epochs = 2000
62
+ num_params = 21004800
63
+ num_disc_params = 3943425
64
+ num_sup_disc_params = 3943425
65
+ num_latent_disc_params = 4205569
66
+ num_similarity_disc_params = 3419137
model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3530043f988aeb25b1c9bb9de85ef708fd093827430242f31be3886769d1caa2
3
+ size 84090873