mond45 committed on
Commit
e86f9ce
·
verified ·
1 Parent(s): af68112

Upload folder using huggingface_hub

Browse files
checkpoints/epoch=3-step=11500-val_kendall=0.355.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48c9d53900313295a1da1d784e1fa825e818bafd16ac09cc5e7b9d34cc47b945
3
+ size 2260729956
events.out.tfevents.1747582192.19abeeb7bada.5173.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:edf128d598d7f308e4b87b6520b232f1fa685617ada92920d8b6b01eaafdd74f
3
+ size 3227541
hparams.yaml ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ nr_frozen_epochs: 0.3
2
+ keep_embeddings_frozen: true
3
+ optimizer: AdamW
4
+ warmup_steps: 0
5
+ encoder_learning_rate: 1.0e-06
6
+ learning_rate: 1.5e-05
7
+ layerwise_decay: 0.95
8
+ encoder_model: XLM-RoBERTa
9
+ pretrained_model: microsoft/infoxlm-large
10
+ pool: avg
11
+ layer: mix
12
+ layer_transformation: sparsemax
13
+ layer_norm: false
14
+ loss: mse
15
+ dropout: 0.1
16
+ batch_size: 1
17
+ train_data:
18
+ - /content/COMET/data/train.csv
19
+ validation_data:
20
+ - /content/COMET/data/val.csv
21
+ class_identifier: unified_metric
22
+ load_pretrained_weights: true
23
+ local_files_only: false
24
+ sent_layer: mix
25
+ word_layer: 24
26
+ hidden_sizes:
27
+ - 3072
28
+ - 1024
29
+ activations: Tanh
30
+ final_activation: null
31
+ input_segments:
32
+ - mt
33
+ - src
34
+ word_level_training: false
35
+ loss_lambda: 0.65
36
+ error_labels:
37
+ - minor
38
+ - major
39
+ cross_entropy_weights: null