Add finetuned model
Browse filesThis view is limited to 50 files because it contains too many changes. See raw diff
- .gitattributes +3 -0
- checkpoint-39/1_Pooling/config.json +10 -0
- checkpoint-39/README.md +1637 -0
- checkpoint-39/config.json +27 -0
- checkpoint-39/config_sentence_transformers.json +14 -0
- checkpoint-39/model.safetensors +3 -0
- checkpoint-39/modules.json +20 -0
- checkpoint-39/optimizer.pt +3 -0
- checkpoint-39/rng_state.pth +3 -0
- checkpoint-39/scheduler.pt +3 -0
- checkpoint-39/sentence_bert_config.json +4 -0
- checkpoint-39/sentencepiece.bpe.model +3 -0
- checkpoint-39/special_tokens_map.json +51 -0
- checkpoint-39/tokenizer.json +3 -0
- checkpoint-39/tokenizer_config.json +55 -0
- checkpoint-39/trainer_state.json +358 -0
- checkpoint-39/training_args.bin +3 -0
- checkpoint-52/1_Pooling/config.json +10 -0
- checkpoint-52/README.md +1640 -0
- checkpoint-52/config.json +27 -0
- checkpoint-52/config_sentence_transformers.json +14 -0
- checkpoint-52/model.safetensors +3 -0
- checkpoint-52/modules.json +20 -0
- checkpoint-52/optimizer.pt +3 -0
- checkpoint-52/rng_state.pth +3 -0
- checkpoint-52/scheduler.pt +3 -0
- checkpoint-52/sentence_bert_config.json +4 -0
- checkpoint-52/sentencepiece.bpe.model +3 -0
- checkpoint-52/special_tokens_map.json +51 -0
- checkpoint-52/tokenizer.json +3 -0
- checkpoint-52/tokenizer_config.json +55 -0
- checkpoint-52/trainer_state.json +470 -0
- checkpoint-52/training_args.bin +3 -0
- checkpoint-65/1_Pooling/config.json +10 -0
- checkpoint-65/README.md +1642 -0
- checkpoint-65/config.json +27 -0
- checkpoint-65/config_sentence_transformers.json +14 -0
- checkpoint-65/model.safetensors +3 -0
- checkpoint-65/modules.json +20 -0
- checkpoint-65/optimizer.pt +3 -0
- checkpoint-65/rng_state.pth +3 -0
- checkpoint-65/scheduler.pt +3 -0
- checkpoint-65/sentence_bert_config.json +4 -0
- checkpoint-65/sentencepiece.bpe.model +3 -0
- checkpoint-65/special_tokens_map.json +51 -0
- checkpoint-65/tokenizer.json +3 -0
- checkpoint-65/tokenizer_config.json +55 -0
- checkpoint-65/trainer_state.json +575 -0
- checkpoint-65/training_args.bin +3 -0
- eval/Information-Retrieval_evaluation_dim_1024_results.csv +5 -6
.gitattributes
CHANGED
|
@@ -37,3 +37,6 @@ checkpoint-196/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
|
| 37 |
checkpoint-294/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 38 |
checkpoint-98/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 39 |
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
| 37 |
checkpoint-294/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 38 |
checkpoint-98/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 39 |
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 40 |
+
checkpoint-39/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 41 |
+
checkpoint-52/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 42 |
+
checkpoint-65/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
checkpoint-39/1_Pooling/config.json
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"word_embedding_dimension": 1024,
|
| 3 |
+
"pooling_mode_cls_token": false,
|
| 4 |
+
"pooling_mode_mean_tokens": true,
|
| 5 |
+
"pooling_mode_max_tokens": false,
|
| 6 |
+
"pooling_mode_mean_sqrt_len_tokens": false,
|
| 7 |
+
"pooling_mode_weightedmean_tokens": false,
|
| 8 |
+
"pooling_mode_lasttoken": false,
|
| 9 |
+
"include_prompt": true
|
| 10 |
+
}
|
checkpoint-39/README.md
ADDED
|
@@ -0,0 +1,1637 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
language:
|
| 3 |
+
- en
|
| 4 |
+
license: apache-2.0
|
| 5 |
+
tags:
|
| 6 |
+
- sentence-transformers
|
| 7 |
+
- sentence-similarity
|
| 8 |
+
- feature-extraction
|
| 9 |
+
- dense
|
| 10 |
+
- generated_from_trainer
|
| 11 |
+
- dataset_size:391
|
| 12 |
+
- loss:MatryoshkaLoss
|
| 13 |
+
- loss:MultipleNegativesRankingLoss
|
| 14 |
+
base_model: intfloat/multilingual-e5-large
|
| 15 |
+
widget:
|
| 16 |
+
- source_sentence: What is the responsibility of assisting and advising the data subjects
|
| 17 |
+
in exercising their rights?
|
| 18 |
+
sentences:
|
| 19 |
+
- '1.Personal data shall be: (a) processed lawfully, fairly and in a transparent
|
| 20 |
+
manner in relation to the data subject (‘lawfulness, fairness and transparency’);
|
| 21 |
+
(b) collected for specified, explicit and legitimate purposes and not further
|
| 22 |
+
processed in a manner that is incompatible with those purposes; further processing
|
| 23 |
+
for archiving purposes in the public interest, scientific or historical research
|
| 24 |
+
purposes or statistical purposes shall, in accordance with Article 89(1), not
|
| 25 |
+
be considered to be incompatible with the initial purposes (‘purpose limitation’);
|
| 26 |
+
(c) adequate, relevant and limited to what is necessary in relation to the purposes
|
| 27 |
+
for which they are processed (‘data minimisation’); (d) accurate and, where necessary,
|
| 28 |
+
kept up to date; every reasonable step must be taken to ensure that personal data
|
| 29 |
+
that are inaccurate, having regard to the purposes for which they are processed,
|
| 30 |
+
are erased or rectified without delay (‘accuracy’); 4.5.2016 L 119/35 (1) Directive
|
| 31 |
+
(EU) 2015/1535 of the European Parliament and of the Council of 9 September 2015
|
| 32 |
+
laying down a procedure for the provision of information in the field of technical
|
| 33 |
+
regulations and of rules on Information Society services (OJ L 241, 17.9.2015,
|
| 34 |
+
p. 1). (e) kept in a form which permits identification of data subjects for no
|
| 35 |
+
longer than is necessary for the purposes for which the personal data are processed;
|
| 36 |
+
personal data may be stored for longer periods insofar as the personal data will
|
| 37 |
+
be processed solely for archiving purposes in the public interest, scientific
|
| 38 |
+
or historical research purposes or statistical purposes in accordance with Article
|
| 39 |
+
89(1) subject to implementation of the appropriate technical and organisational
|
| 40 |
+
measures required by this Regulation in order to safeguard the rights and freedoms
|
| 41 |
+
of the data subject (‘storage limitation’); (f) processed in a manner that ensures
|
| 42 |
+
appropriate security of the personal data, including protection against unauthorised
|
| 43 |
+
or unlawful processing and against accidental loss, destruction or damage, using
|
| 44 |
+
appropriate technical or organisational measures (‘integrity and confidentiality’).
|
| 45 |
+
|
| 46 |
+
2.The controller shall be responsible for, and be able to demonstrate compliance
|
| 47 |
+
with, paragraph 1 (‘accountability’).'
|
| 48 |
+
- '1.A transfer of personal data to a third country or an international organisation
|
| 49 |
+
may take place where the Commission has decided that the third country, a territory
|
| 50 |
+
or one or more specified sectors within that third country, or the international
|
| 51 |
+
organisation in question ensures an adequate level of protection. Such a transfer
|
| 52 |
+
shall not require any specific authorisation.
|
| 53 |
+
|
| 54 |
+
2.When assessing the adequacy of the level of protection, the Commission shall,
|
| 55 |
+
in particular, take account of the following elements: (a) the rule of law, respect
|
| 56 |
+
for human rights and fundamental freedoms, relevant legislation, both general
|
| 57 |
+
and sectoral, including concerning public security, defence, national security
|
| 58 |
+
and criminal law and the access of public authorities to personal data, as well
|
| 59 |
+
as the implementation of such legislation, data protection rules, professional
|
| 60 |
+
rules and security measures, including rules for the onward transfer of personal
|
| 61 |
+
data to another third country or international organisation which are complied
|
| 62 |
+
with in that country or international organisation, case-law, as well as effective
|
| 63 |
+
and enforceable data subject rights and effective administrative and judicial
|
| 64 |
+
redress for the data subjects whose personal data are being transferred; (b) the
|
| 65 |
+
existence and effective functioning of one or more independent supervisory authorities
|
| 66 |
+
in the third country or to which an international organisation is subject, with
|
| 67 |
+
responsibility for ensuring and enforcing compliance with the data protection
|
| 68 |
+
rules, including adequate enforcement powers, for assisting and advising the data
|
| 69 |
+
subjects in exercising their rights and for cooperation with the supervisory authorities
|
| 70 |
+
of the Member States; and (c) the international commitments the third country
|
| 71 |
+
or international organisation concerned has entered into, or other obligations
|
| 72 |
+
arising from legally binding conventions or instruments as well as from its participation
|
| 73 |
+
in multilateral or regional systems, in particular in relation to the protection
|
| 74 |
+
of personal data.
|
| 75 |
+
|
| 76 |
+
3.The Commission, after assessing the adequacy of the level of protection, may
|
| 77 |
+
decide, by means of implementing act, that a third country, a territory or one
|
| 78 |
+
or more specified sectors within a third country, or an international organisation
|
| 79 |
+
ensures an adequate level of protection within the meaning of paragraph 2 of this
|
| 80 |
+
Article. The implementing act shall provide for a mechanism for a periodic review,
|
| 81 |
+
at least every four years, which shall take into account all relevant developments
|
| 82 |
+
in the third country or international organisation. The implementing act shall
|
| 83 |
+
specify its territorial and sectoral application and, where applicable, identify
|
| 84 |
+
the supervisory authority or authorities referred to in point (b) of paragraph
|
| 85 |
+
2 of this Article. The implementing act shall be adopted in accordance with the
|
| 86 |
+
examination procedure referred to in Article 93(2).
|
| 87 |
+
|
| 88 |
+
4.The Commission shall, on an ongoing basis, monitor developments in third countries
|
| 89 |
+
and international organisations that could affect the functioning of decisions
|
| 90 |
+
adopted pursuant to paragraph 3 of this Article and decisions adopted on the basis
|
| 91 |
+
of Article 25(6) of Directive 95/46/EC.
|
| 92 |
+
|
| 93 |
+
5.The Commission shall, where available information reveals, in particular following
|
| 94 |
+
the review referred to in paragraph 3 of this Article, that a third country, a
|
| 95 |
+
territory or one or more specified sectors within a third country, or an international
|
| 96 |
+
organisation no longer ensures an adequate level of protection within the meaning
|
| 97 |
+
of paragraph 2 of this Article, to the extent necessary, repeal, amend or suspend
|
| 98 |
+
the decision referred to in paragraph 3 of this Article by means of implementing
|
| 99 |
+
acts without retro-active effect. Those implementing acts shall be adopted in
|
| 100 |
+
accordance with the examination procedure referred to in Article 93(2). On duly
|
| 101 |
+
justified imperative grounds of urgency, the Commission shall adopt immediately
|
| 102 |
+
applicable implementing acts in accordance with the procedure referred to in Article
|
| 103 |
+
93(3).
|
| 104 |
+
|
| 105 |
+
6.The Commission shall enter into consultations with the third country or international
|
| 106 |
+
organisation with a view to remedying the situation giving rise to the decision
|
| 107 |
+
made pursuant to paragraph 5
|
| 108 |
+
|
| 109 |
+
7.A decision pursuant to paragraph 5 of this Article is without prejudice to transfers
|
| 110 |
+
of personal data to the third country, a territory or one or more specified sectors
|
| 111 |
+
within that third country, or the international organisation in question pursuant
|
| 112 |
+
to Articles 46 to 49
|
| 113 |
+
|
| 114 |
+
8.The Commission shall publish in the Official Journal of the European Union and
|
| 115 |
+
on its website a list of the third countries, territories and specified sectors
|
| 116 |
+
within a third country and international organisations for which it has decided
|
| 117 |
+
that an adequate level of protection is or is no longer ensured.
|
| 118 |
+
|
| 119 |
+
9.Decisions adopted by the Commission on the basis of Article 25(6) of Directive
|
| 120 |
+
95/46/EC shall remain in force until amended, replaced or repealed by a Commission
|
| 121 |
+
Decision adopted in accordance with paragraph 3 or 5 of this Article.'
|
| 122 |
+
- The legal systems of Denmark and Estonia do not allow for administrative fines
|
| 123 |
+
as set out in this Regulation. The rules on administrative fines may be applied
|
| 124 |
+
in such a manner that in Denmark the fine is imposed by competent national courts
|
| 125 |
+
as a criminal penalty and in Estonia the fine is imposed by the supervisory authority
|
| 126 |
+
in the framework of a misdemeanour procedure, provided that such an application
|
| 127 |
+
of the rules in those Member States has an equivalent effect to administrative
|
| 128 |
+
fines imposed by supervisory authorities. Therefore the competent national courts
|
| 129 |
+
should take into account the recommendation by the supervisory authority initiating
|
| 130 |
+
the fine. In any event, the fines imposed should be effective, proportionate and
|
| 131 |
+
dissuasive.
|
| 132 |
+
- source_sentence: Is the fine mandatory for the described offense?
|
| 133 |
+
sentences:
|
| 134 |
+
- "1.Each supervisory authority shall ensure that the imposition of administrative\
|
| 135 |
+
\ fines pursuant to this Article in respect of infringements of this Regulation\
|
| 136 |
+
\ referred to in paragraphs 4, 5 and 6 shall in each individual case be effective,\
|
| 137 |
+
\ proportionate and dissuasive.\n2.Administrative fines shall, depending on the\
|
| 138 |
+
\ circumstances of each individual case, be imposed in addition to, or instead\
|
| 139 |
+
\ of, measures referred to in points (a) to (h) and (j) of Article 58(2). When\
|
| 140 |
+
\ deciding whether to impose an administrative fine and deciding on the amount\
|
| 141 |
+
\ of the administrative fine in each individual case due regard shall be given\
|
| 142 |
+
\ to the following: (a) the nature, gravity and duration of the infringement\
|
| 143 |
+
\ taking into account the nature scope or purpose of the processing concerned\
|
| 144 |
+
\ as well as the number of data subjects affected and the level of damage suffered\
|
| 145 |
+
\ by them; (b) the intentional or negligent character of the infringement; (c)\
|
| 146 |
+
\ any action taken by the controller or processor to mitigate the damage suffered\
|
| 147 |
+
\ by data subjects; (d) the degree of responsibility of the controller or processor\
|
| 148 |
+
\ taking into account technical and organisational measures implemented by them\
|
| 149 |
+
\ pursuant to Articles 25 and 32; (e) any relevant previous infringements by\
|
| 150 |
+
\ the controller or processor; (f) the degree of cooperation with the supervisory\
|
| 151 |
+
\ authority, in order to remedy the infringement and mitigate the possible adverse\
|
| 152 |
+
\ effects of the infringement; (g) the categories of personal data affected by\
|
| 153 |
+
\ the infringement; (h) the manner in which the infringement became known to\
|
| 154 |
+
\ the supervisory authority, in particular whether, and if so to what extent,\
|
| 155 |
+
\ the controller or processor notified the infringement; (i) where measures referred\
|
| 156 |
+
\ to in Article 58(2) have previously been ordered against the controller or processor\
|
| 157 |
+
\ concerned with regard to the same subject-matter, compliance with those measures;\
|
| 158 |
+
\ (j) adherence to approved codes of conduct pursuant to Article 40 or approved\
|
| 159 |
+
\ certification mechanisms pursuant to Article 42; and (k) any other aggravating\
|
| 160 |
+
\ or mitigating factor applicable to the circumstances of the case, such as financial\
|
| 161 |
+
\ benefits gained, or losses avoided, directly or indirectly, from the infringement.\n\
|
| 162 |
+
3.If a controller or processor intentionally or negligently, for the same or linked\
|
| 163 |
+
\ processing operations, infringes several provisions of this Regulation, the\
|
| 164 |
+
\ total amount of the administrative fine shall not exceed the amount specified\
|
| 165 |
+
\ for the gravest infringement.\n4.Infringements of the following provisions shall,\
|
| 166 |
+
\ in accordance with paragraph 2, be subject to administrative fines up to 10\
|
| 167 |
+
\ 000 000 EUR, or in the case of an undertaking, up to 2 % of the total worldwide\
|
| 168 |
+
\ annual turnover of the preceding financial year, whichever is higher: (a) the\
|
| 169 |
+
\ obligations of the controller and the processor pursuant to Articles 8, 11,\
|
| 170 |
+
\ 25 to 39 and 42 and 43; (b) the obligations of the certification body pursuant\
|
| 171 |
+
\ to Articles 42 and 43; (c) the obligations of the monitoring body pursuant\
|
| 172 |
+
\ to Article 41(4). 4.5.2016 L 119/82 \n5.Infringements of the following provisions\
|
| 173 |
+
\ shall, in accordance with paragraph 2, be subject to administrative fines up\
|
| 174 |
+
\ to 20 000 000 EUR, or in the case of an undertaking, up to 4 % of the total\
|
| 175 |
+
\ worldwide annual turnover of the preceding financial year, whichever is higher:\
|
| 176 |
+
\ (a) the basic principles for processing, including conditions for consent,\
|
| 177 |
+
\ pursuant to Articles 5, 6, 7 and 9; (b) the data subjects' rights pursuant\
|
| 178 |
+
\ to Articles 12 to 22; (c) the transfers of personal data to a recipient in\
|
| 179 |
+
\ a third country or an international organisation pursuant to Articles 44 to\
|
| 180 |
+
\ 49; (d) any obligations pursuant to Member State law adopted under Chapter\
|
| 181 |
+
\ IX; (e) non-compliance with an order or a temporary or definitive limitation\
|
| 182 |
+
\ on processing or the suspension of data flows by the supervisory authority pursuant\
|
| 183 |
+
\ to Article 58(2) or failure to provide access in violation of Article 58(1).\n\
|
| 184 |
+
6.Non-compliance with an order by the supervisory authority as referred to in\
|
| 185 |
+
\ Article 58(2) shall, in accordance with paragraph 2 of this Article, be subject\
|
| 186 |
+
\ to administrative fines up to 20 000 000 EUR, or in the case of an undertaking,\
|
| 187 |
+
\ up to 4 % of the total worldwide annual turnover of the preceding financial\
|
| 188 |
+
\ year, whichever is higher.\n7.Without prejudice to the corrective powers of\
|
| 189 |
+
\ supervisory authorities pursuant to Article 58(2), each Member State may lay\
|
| 190 |
+
\ down the rules on whether and to what extent administrative fines may be imposed\
|
| 191 |
+
\ on public authorities and bodies established in that Member State.\n8.The exercise\
|
| 192 |
+
\ by the supervisory authority of its powers under this Article shall be subject\
|
| 193 |
+
\ to appropriate procedural safeguards in accordance with Union and Member State\
|
| 194 |
+
\ law, including effective judicial remedy and due process.\n9.Where the legal\
|
| 195 |
+
\ system of the Member State does not provide for administrative fines, this Article\
|
| 196 |
+
\ may be applied in such a manner that the fine is initiated by the competent\
|
| 197 |
+
\ supervisory authority and imposed by competent national courts, while ensuring\
|
| 198 |
+
\ that those legal remedies are effective and have an equivalent effect to the\
|
| 199 |
+
\ administrative fines imposed by supervisory authorities. In any event, the fines\
|
| 200 |
+
\ imposed shall be effective, proportionate and dissuasive. Those Member States\
|
| 201 |
+
\ shall notify to the Commission the provisions of their laws which they adopt\
|
| 202 |
+
\ pursuant to this paragraph by 25 May 2018 and, without delay, any subsequent\
|
| 203 |
+
\ amendment law or amendment affecting them."
|
| 204 |
+
- "Court (Civil/Criminal): Criminal \nProvisions: Article 386 of the Penal Code\
|
| 205 |
+
\ \nTime of commission of the act: \nResult (innocent, guilty): \nReasoning:\
|
| 206 |
+
\ Conviction for computer fraud committed repeatedly and professionally with a\
|
| 207 |
+
\ total benefit and damage exceeding €30,000. According to the majority opinion,\
|
| 208 |
+
\ the charge is substantiated in both its objective and subjective aspects, and\
|
| 209 |
+
\ the defendant must be declared guilty of the aforementioned criminal acts of\
|
| 210 |
+
\ fraud by means of a computer, committed repeatedly by a perpetrator acting professionally,\
|
| 211 |
+
\ where the total financial benefit and corresponding damage exceed the amount\
|
| 212 |
+
\ of €30,000, as well as for repeated embezzlement.\n\nFacts: The defendant accessed\
|
| 213 |
+
\ a website using a computer, employing, without the knowledge and consent of\
|
| 214 |
+
\ the complainants, the access codes for the electronic management system of the\
|
| 215 |
+
\ bank accounts held by the complainants at a Bank, and transferred money through\
|
| 216 |
+
\ electronically transmitted orders from the complainants' accounts to her own\
|
| 217 |
+
\ account. Specifically, during the period from June 2007 to June 2008, after\
|
| 218 |
+
\ unlawfully acquiring the aforementioned STICK containing the access codes, she\
|
| 219 |
+
\ accessed a website maintained by ..., using, without the complainants' knowledge\
|
| 220 |
+
\ (without their consent or approval), the access codes for the electronic management\
|
| 221 |
+
\ system of the bank accounts held at the aforementioned Bank, transferring through\
|
| 222 |
+
\ electronically transmitted orders to the joint account number ... of the complainants\
|
| 223 |
+
\ from bank accounts numbered ..., ..., and ..., the total amount of €55,710,\
|
| 224 |
+
\ as detailed in the orders, and subsequently, using an ATM card, she gradually\
|
| 225 |
+
\ withdrew from the aforementioned account number ..., the total amount of €55,710,\
|
| 226 |
+
\ making 84 individual withdrawals from automatic teller machines. In addition,\
|
| 227 |
+
\ the defendant, during the period from June 2008 to November 2008, in the same\
|
| 228 |
+
\ exact manner (through the electronic management system of the bank accounts),\
|
| 229 |
+
\ transferred through electronically transmitted orders to account number ...,\
|
| 230 |
+
\ which she had opened at ..., from the complainants' bank accounts numbered ...,\
|
| 231 |
+
\ ..., ..., ..., and ..., the total amount of €73,942, as detailed in the orders\
|
| 232 |
+
\ regarding the transfers of these amounts. Furthermore, during the period from\
|
| 233 |
+
\ February 2008 to November 2008, through multiple acts constituting a continuation\
|
| 234 |
+
\ of the crime, although she had received from the first complainant ... the amounts\
|
| 235 |
+
\ of €695.04, €695.04, and €845.04, in order to pay his insurance contributions\
|
| 236 |
+
\ to O.A.E.E. for the periods of January-February 2008, May-June 2008, and September-October\
|
| 237 |
+
\ 2008, as well as the amounts of €250 and €280, in order to settle credit card\
|
| 238 |
+
\ bills for \"...\", respectively, and from the second complainant ... she received\
|
| 239 |
+
\ the amounts of €283.64, €419.26, and €385.38, to pay the latter's insurance\
|
| 240 |
+
\ contributions to O.A.E.E. for the periods of July-August 2007, May-June 2008,\
|
| 241 |
+
\ September-October 2008, and November-December 2008, as well as the amount of\
|
| 242 |
+
\ €1,888.03 for the settlement of VAT, she never paid the above amounts to settle\
|
| 243 |
+
\ the aforementioned obligations, nor did she return them to the complainants,\
|
| 244 |
+
\ despite being urged to do so, but incorporated them into her assets and wrongfully\
|
| 245 |
+
\ appropriated them. The defendant denies the charges against her and claims that\
|
| 246 |
+
\ the withdrawals were made by the second complainant and that all the amounts\
|
| 247 |
+
\ transferred to her account were transferred to cover the company's expenses\
|
| 248 |
+
\ and their personal expenses, due to her cohabitation with the second complainant\
|
| 249 |
+
\ and with his knowledge, with whom she intended to marry. However, this claim\
|
| 250 |
+
\ is not supported by any evidence; on the contrary, it emerged that she conducted\
|
| 251 |
+
\ the transfers of the money and withdrawals without the complainants' knowledge,\
|
| 252 |
+
\ and when she learned that they had been informed about the account movements\
|
| 253 |
+
\ and met at the Bank, her behavior and demeanor indicated guilt, according to\
|
| 254 |
+
\ the testimony of the prosecution witness ..., an employee of the Pangrati branch\
|
| 255 |
+
\ of ..., who saw her on the same day at the aforementioned Bank when she met\
|
| 256 |
+
\ with the complainants. The ongoing act of fraud using a computer was committed\
|
| 257 |
+
\ by the defendant professionally, as evidenced by her repeated commission of\
|
| 258 |
+
\ the act, as well as the infrastructure she had established with the intent of\
|
| 259 |
+
\ repeated commission, based on a specific plan and methodology (transferring\
|
| 260 |
+
\ smaller amounts to a joint account of the complainants from the remaining accounts\
|
| 261 |
+
\ of the latter, and then withdrawing the transferred amounts with an ATM card,\
|
| 262 |
+
\ as well as directly transferring smaller amounts from the complainants' accounts\
|
| 263 |
+
\ to her personal account she had opened at the same bank), indicating her purpose\
|
| 264 |
+
\ to generate income, with the financial benefit she gained, corresponding to\
|
| 265 |
+
\ the complainants' damage, exceeding a total of €30,000."
|
| 266 |
+
- 'Any person who intentionally, through the technology of information and communication,
|
| 267 |
+
suggests an encounter between an adult and a minor under the age of fifteen, aiming
|
| 268 |
+
at the commitment of the crimes described in par. 1 and 2 of art. 339 and 348Α,
|
| 269 |
+
is sentenced to an imprisonment of at least two years and a fine of fifty to two
|
| 270 |
+
hundred thousand Euros, when the proposal is followed by further actions which
|
| 271 |
+
lead in the commitment of such crimes.
|
| 272 |
+
|
| 273 |
+
'
|
| 274 |
+
- source_sentence: Who should provide authorisation when safeguards are detailed in
|
| 275 |
+
non-legally binding administrative arrangements?
|
| 276 |
+
sentences:
|
| 277 |
+
- In the absence of an adequacy decision, the controller or processor should take
|
| 278 |
+
measures to compensate for the lack of data protection in a third country by way
|
| 279 |
+
of appropriate safeguards for the data subject. Such appropriate safeguards may
|
| 280 |
+
consist of making use of binding corporate rules, standard data protection clauses
|
| 281 |
+
adopted by the Commission, standard data protection clauses adopted by a supervisory
|
| 282 |
+
authority or contractual clauses authorised by a supervisory authority. Those
|
| 283 |
+
safeguards should ensure compliance with data protection requirements and the
|
| 284 |
+
rights of the data subjects appropriate to processing within the Union, including
|
| 285 |
+
the availability of enforceable data subject rights and of effective legal remedies,
|
| 286 |
+
including to obtain effective administrative or judicial redress and to claim
|
| 287 |
+
compensation, in the Union or in a third country. They should relate in particular
|
| 288 |
+
to compliance with the general principles relating to personal data processing,
|
| 289 |
+
the principles of data protection by design and by default. Transfers may also
|
| 290 |
+
be carried out by public authorities or bodies with public authorities or bodies
|
| 291 |
+
in third countries or with international organisations with corresponding duties
|
| 292 |
+
or functions, including on the basis of provisions to be inserted into administrative
|
| 293 |
+
arrangements, such as a memorandum of understanding, providing for enforceable
|
| 294 |
+
and effective rights for data subjects. Authorisation by the competent supervisory
|
| 295 |
+
authority should be obtained when the safeguards are provided for in administrative
|
| 296 |
+
arrangements that are not legally binding.
|
| 297 |
+
- '**Court (Civil/Criminal): Civil**
|
| 298 |
+
|
| 299 |
+
|
| 300 |
+
**Provisions:**
|
| 301 |
+
|
| 302 |
+
|
| 303 |
+
**Time of commission of the act:**
|
| 304 |
+
|
| 305 |
+
|
| 306 |
+
**Outcome (not guilty, guilty):**
|
| 307 |
+
|
| 308 |
+
|
| 309 |
+
**Rationale:**
|
| 310 |
+
|
| 311 |
+
|
| 312 |
+
**Facts:**
|
| 313 |
+
|
| 314 |
+
The plaintiff holds credit card number ............ with the defendant banking
|
| 315 |
+
corporation. Based on the application for alternative networks dated 19/7/2015
|
| 316 |
+
with number ......... submitted at a branch of the defendant, he was granted access
|
| 317 |
+
to the electronic banking service (e-banking) to conduct banking transactions
|
| 318 |
+
(debit, credit, updates, payments) remotely. On 30/11/2020, the plaintiff fell
|
| 319 |
+
victim to electronic fraud through the "phishing" method, whereby an unknown perpetrator
|
| 320 |
+
managed to withdraw a total amount of €3,121.75 from the aforementioned credit
|
| 321 |
+
card. Specifically, the plaintiff received an email at 1:35 PM on 29/11/2020 from
|
| 322 |
+
sender ...... with address ........, informing him that due to an impending system
|
| 323 |
+
change, he needed to verify the mobile phone number linked to the credit card,
|
| 324 |
+
urging him to complete the verification process within the next 24 hours by following
|
| 325 |
+
a link titled ........; otherwise, his account would be locked for security reasons.
|
| 326 |
+
The plaintiff read this email on the afternoon of 30 November 2020 and, believing
|
| 327 |
+
it was from the defendant, followed the instructions and proceeded via the provided
|
| 328 |
+
link to a website that was identical (a clone) to that of the defendant. On this
|
| 329 |
+
page, he was asked to enter the six-digit security code (.........) that had just
|
| 330 |
+
been sent to his mobile phone by the defendant at 3:41 PM, with the note that
|
| 331 |
+
it was an activation code for his ........ card at ........., which he entered.
|
| 332 |
+
|
| 333 |
+
|
| 334 |
+
Subsequently, the plaintiff received, according to his statements, a new email
|
| 335 |
+
(not submitted), which requested him to enter the details of the aforementioned
|
| 336 |
+
credit card, specifically the name of the cardholder and the card number, not
|
| 337 |
+
the PIN, which he also entered, convinced that he was within the online environment
|
| 338 |
+
of the defendant. Then, at 3:47 PM, he received a message on his mobile phone
|
| 339 |
+
from the defendant containing the exact same content as the one he received at
|
| 340 |
+
3:41 PM, while at 3:50 PM he received a message stating that the activation of
|
| 341 |
+
his ......... card at ....... had been completed. Once the plaintiff read this,
|
| 342 |
+
he became concerned that something was not right, and immediately called (at 4:41
|
| 343 |
+
PM) the defendant''s call center to inform them. There, the employees, with whom
|
| 344 |
+
he finally connected at 5:04 PM due to high call center volume, advised him to
|
| 345 |
+
delete the relevant emails, cancel his credit card, change his access passwords
|
| 346 |
+
for the service, and submit a dispute request regarding the conducted transactions.
|
| 347 |
+
The plaintiff electronically sent this request to the defendant, disputing the
|
| 348 |
+
detailed transactions amounting to €3,121.75, which were conducted on 30/11/2020
|
| 349 |
+
during the time frame of 16:37:45-16:43:34 PM, arguing that he had neither performed
|
| 350 |
+
them himself nor authorized anyone else to do so. The plaintiff specifically disputed
|
| 351 |
+
the following transactions, as evidenced by the account activity of the disputed
|
| 352 |
+
credit card during the aforementioned timeframe: a) transaction number .........
|
| 353 |
+
amounting to €150.62 conducted on 30/11/2020 at 4:43:34 PM, b) transaction number
|
| 354 |
+
........ amounting to €293.20 conducted on 30/11/2020 at 4:42:40 PM, c) transaction
|
| 355 |
+
number ............ amounting to €295.21 conducted on 30/11/2020 at 4:42:10 PM,
|
| 356 |
+
d) transaction number .......... amounting to €299.22 conducted on 30/11/2020
|
| 357 |
+
at 4:41:31 PM, e) transaction number ........ amounting to €297.21 conducted on
|
| 358 |
+
30/11/2020 at 4:41:01 PM, f) transaction number ........ amounting to €299.22
|
| 359 |
+
conducted on 30/11/2020 at 4:40:27 PM, g) transaction number ....... amounting
|
| 360 |
+
to €299.22 conducted on 30/11/2020 at 4:39:55 PM, h) transaction number ......
|
| 361 |
+
amounting to €299.22 conducted on 30/11/2020 at 4:39:22 PM, i) transaction number
|
| 362 |
+
......... amounting to €297.22 conducted on 30/11/2020 at 4:38:52 PM, j) transaction
|
| 363 |
+
number ......... amounting to €295.21 conducted on 30/11/2020 at 4:38:17 PM, and
|
| 364 |
+
k) transaction number ......... amounting to €296.21 conducted on 30/11/2020 at
|
| 365 |
+
4:37:45 PM. In its response letter dated 21/12/2020, the defendant denied responsibility
|
| 366 |
+
for the costs of the aforementioned transactions, placing the entire blame on
|
| 367 |
+
the plaintiff for the leak of his card details and security code to the fraudulent
|
| 368 |
+
page. The plaintiff, completely denying any fault for the conducted transactions,
|
| 369 |
+
repeatedly contacted the defendant, both by phone and via email (see emails dated
|
| 370 |
+
15/1/2021 and 11/2/2021), while on 2/3/2021, he electronically sent a report dated
|
| 371 |
+
1/03/2021 to the Consumer Advocate’s email address, recounting the events and
|
| 372 |
+
requesting that the aforementioned Independent Authority intervene to have the
|
| 373 |
+
disputed debt canceled. In its letter with reference number ...../27.04.2021,
|
| 374 |
+
the aforementioned Independent Authority informed the plaintiff that the case
|
| 375 |
+
was outside its mediating role and was therefore archived. Subsequently, the plaintiff
|
| 376 |
+
sent the defendant on 5/3/2021 his extrajudicial statement dated 4/3/2021, calling
|
| 377 |
+
upon it to fully cancel the debt of €3,121.75 that had been unjustly incurred
|
| 378 |
+
against him within two days and to immediately instruct the representatives of
|
| 379 |
+
the collection agency working with it to cease contacting him regarding the disputed
|
| 380 |
+
case. The defendant sent the plaintiff a message on his mobile phone on 20/04/2021
|
| 381 |
+
informing him that his case was still being processed due to lengthy operational
|
| 382 |
+
requirements, while on 23/04/2021, via email, it informed him that considering
|
| 383 |
+
their good cooperation and his efforts to keep them updated, it had reviewed his
|
| 384 |
+
case and decided to refund him the amounts of the transactions that were conducted
|
| 385 |
+
after his contact with their representatives on 30/11/2020 at 4:41 PM, totaling
|
| 386 |
+
€1,038.25, specifically the following: a) transaction of €150.62 conducted on
|
| 387 |
+
30/11/2020 at 4:43 PM, b) transaction of €295.21 conducted on 30/11/2020 at 4:42
|
| 388 |
+
PM, c) transaction of €293.20 conducted on 30/11/2020 at 4:42 PM, and d) transaction
|
| 389 |
+
of €299.22 conducted on 30/11/2020 at 4:41 PM. Beyond this, the defendant refused
|
| 390 |
+
to refund the plaintiff the amount of the remaining transactions conducted on
|
| 391 |
+
30/11/2020, totaling €2,376.08 (and not €2,376.48 as incorrectly stated by the
|
| 392 |
+
plaintiff in his lawsuit), which the plaintiff ultimately fully paid, transferring
|
| 393 |
+
€2,342.77 to the defendant on 7/06/2021 and €33.31 on 15/06/2021 (see related
|
| 394 |
+
deposit receipts).'
|
| 395 |
+
- "Court (Civil/Criminal): Civil \nProvisions: \nTime of commission: July 21,\
|
| 396 |
+
\ 2020 \nOutcome (innocent, guilty): Partially accepts the lawsuit against the\
|
| 397 |
+
\ Bank. \nReasoning: Alongside the bank's responsibility for the ineffective\
|
| 398 |
+
\ protection of its systems against the continually changing and evolving methods\
|
| 399 |
+
\ of deception that affect them, leading to financial damage for its clients who\
|
| 400 |
+
\ entrusted it, which constitutes a breach of its contractual obligations and\
|
| 401 |
+
\ generates contractual liability, there is also the personal responsibility of\
|
| 402 |
+
\ the plaintiff, who did not safeguard, as required, his sensitive banking information\
|
| 403 |
+
\ and disclosed it when he should not have, even though the message that misled\
|
| 404 |
+
\ him came from the context of an SMS conversation with the defendant, even if\
|
| 405 |
+
\ he was directed through the link to a website resembling that of the defendant,\
|
| 406 |
+
\ because he overlooked the relevant instructions and strict recommendations of\
|
| 407 |
+
\ the bank, violating his duty to safeguard them. Therefore, in light of the above,\
|
| 408 |
+
\ the court must partially accept the lawsuit regarding its substance, and with\
|
| 409 |
+
\ the defendant's objection regarding the plaintiff's fault being accepted at\
|
| 410 |
+
\ a rate of 1/6 of the damage suffered, it must be acknowledged – following the\
|
| 411 |
+
\ admissible and lawful modification of the lawsuit's request from a dismissive\
|
| 412 |
+
\ to a declaratory nature as proposed – the defendant's obligation to pay him\
|
| 413 |
+
\ the amount of €2,500, with legal interest, as specified in the operative part.\
|
| 414 |
+
\ Regarding the request to recognize the defendant's obligation to pay him €1,000\
|
| 415 |
+
\ as compensation for the moral damage he suffered from the fraud committed against\
|
| 416 |
+
\ him, this is deemed dismissible as unfounded, because the defendant's liability\
|
| 417 |
+
\ is contractual and not tortious, and there are no special conditions justifying\
|
| 418 |
+
\ the treatment of this specific non-contractual behavior as tortious, making\
|
| 419 |
+
\ it possible to attribute moral damage to the plaintiff from the defendant. \
|
| 420 |
+
\ \nFacts: The plaintiff maintained a joint bank account with his wife and had\
|
| 421 |
+
\ access to the defendant bank's e-banking. On July 21, 2020, following successful\
|
| 422 |
+
\ identification via the agreed-upon credentials (userID, password, OTP), a request\
|
| 423 |
+
\ was made to change the mobile phone number for receiving OTPs, which was completed\
|
| 424 |
+
\ through the bank's platform. However, this change was not made by the plaintiff\
|
| 425 |
+
\ himself, but by a third party who had previously deceived him using the phishing\
|
| 426 |
+
\ method, obtaining his banking details through a misleading SMS. Following the\
|
| 427 |
+
\ phone number change, on July 31, 2020, a transfer of €3,000 was made to a third\
|
| 428 |
+
\ party's account. The transaction was conducted using the necessary credentials\
|
| 429 |
+
\ and OTP sent to the new mobile phone, resulting in the bank considering the\
|
| 430 |
+
\ order valid and executing it. Once the plaintiff realized the transfer, he immediately\
|
| 431 |
+
\ contacted the bank and informed them that he had not given such an order himself.\
|
| 432 |
+
\ Despite the initial assurance that the funds could be recovered, they were ultimately\
|
| 433 |
+
\ not returned, as they had been transferred to a third party's account, and the\
|
| 434 |
+
\ bank denied any responsibility for the loss."
|
| 435 |
+
- source_sentence: When will the periodic review mechanism be conducted?
|
| 436 |
+
sentences:
|
| 437 |
+
- The Commission should monitor the functioning of decisions on the level of protection
|
| 438 |
+
in a third country, a territory or specified sector within a third country, or
|
| 439 |
+
an international organisation, and monitor the functioning of decisions adopted
|
| 440 |
+
on the basis of Article 25(6) or Article 26(4) of Directive 95/46/EC. In its adequacy
|
| 441 |
+
decisions, the Commission should provide for a periodic review mechanism of their
|
| 442 |
+
functioning. That periodic review should be conducted in consultation with the
|
| 443 |
+
third country or international organisation in question and take into account
|
| 444 |
+
all relevant developments in the third country or international organisation.
|
| 445 |
+
For the purposes of monitoring and of carrying out the periodic reviews, the Commission
|
| 446 |
+
should take into consideration the views and findings of the European Parliament
|
| 447 |
+
and of the Council as well as of other relevant bodies and sources. The Commission
|
| 448 |
+
should evaluate, within a reasonable time, the functioning of the latter decisions
|
| 449 |
+
and report any relevant findings to the Committee within the meaning of Regulation
|
| 450 |
+
(EU) No 182/2011 of the European Parliament and of the Council (1) as established
|
| 451 |
+
under this Regulation, to the European Parliament and to the Council.
|
| 452 |
+
- "**Court (Civil/Criminal): Civil** \n**Provisions:** \n**Time of commission\
|
| 453 |
+
\ of the act:** \n**Outcome (not guilty, guilty):** \n**Reasoning:** Partially\
|
| 454 |
+
\ accepts the lawsuit. \n**Facts:** The plaintiff, who works as a lawyer, maintains\
|
| 455 |
+
\ a savings account with the defendant banking corporation under account number\
|
| 456 |
+
\ GR.............. Pursuant to a contract dated June 11, 2010, established in\
|
| 457 |
+
\ Thessaloniki between the defendant and the plaintiff, the plaintiff was granted\
|
| 458 |
+
\ access to the electronic banking system (e-banking) to conduct banking transactions\
|
| 459 |
+
\ remotely. On October 10, 2020, the plaintiff fell victim to electronic fraud\
|
| 460 |
+
\ through the \"phishing\" method, whereby an unknown perpetrator managed to extract\
|
| 461 |
+
\ and transfer €3,000.00 from the plaintiff’s account to another account of the\
|
| 462 |
+
\ same bank. Specifically, on that day at 6:51 a.m., the plaintiff received an\
|
| 463 |
+
\ email from the sender \".........\", with the address ..........., informing\
|
| 464 |
+
\ him that his debit card had been suspended and that online payments and cash\
|
| 465 |
+
\ withdrawals could not be made until the issue was resolved. The email urged\
|
| 466 |
+
\ him to confirm his details within the next 72 hours by following a link titled\
|
| 467 |
+
\ \"card activation.\" \nThe plaintiff read the above email on his mobile phone\
|
| 468 |
+
\ around 8:00 a.m., and believing it came from the defendant, he followed the\
|
| 469 |
+
\ instructions and accessed a website that was identical (a clone) to that of\
|
| 470 |
+
\ the defendant. On this page, he was asked to enter his login credentials to\
|
| 471 |
+
\ connect to the service, which he did, and he was subsequently asked to input\
|
| 472 |
+
\ his debit card details for the alleged activation, which he also provided. Then,\
|
| 473 |
+
\ to complete the process, a number was sent to his mobile phone at 8:07 a.m.\
|
| 474 |
+
\ from the sender ........, which he entered, and two minutes later he received\
|
| 475 |
+
\ a message from the same sender in English stating that the quick access code\
|
| 476 |
+
\ had been activated on his mobile. A few minutes later, at 8:18 a.m., he received\
|
| 477 |
+
\ an email from the defendant informing him of the transfer of €3,000.00 from\
|
| 478 |
+
\ his account to account number GR ........... held at the same bank, with the\
|
| 479 |
+
\ beneficiary's details being .......... As soon as the plaintiff read this, he\
|
| 480 |
+
\ immediately called the defendant's call center and canceled his debit card,\
|
| 481 |
+
\ the access codes for the service ......., and locked the application ..........\
|
| 482 |
+
\ At the same time, he verbally submitted a request to dispute and cancel the\
|
| 483 |
+
\ contested transaction, and in a subsequent phone call, he also canceled his\
|
| 484 |
+
\ credit card. On the same day, he also sent an email to the defendant informing\
|
| 485 |
+
\ them in writing of the above and requesting the cancellation of the transaction\
|
| 486 |
+
\ and the return of the amount of €3,000.00 to his account, as this transfer was\
|
| 487 |
+
\ not made by him but by an unknown perpetrator through electronic fraud and was\
|
| 488 |
+
\ not approved by him. It should also be noted that the plaintiff, as the sole\
|
| 489 |
+
\ beneficiary according to the aforementioned contract for using the defendant's\
|
| 490 |
+
\ Internet Banking service, never received any update via SMS or the VIBER application\
|
| 491 |
+
\ from the bank regarding the transaction details before its completion, nor did\
|
| 492 |
+
\ he receive a one-time code (OTP) to approve the contested transaction. He subsequently\
|
| 493 |
+
\ filed a complaint against unknown persons at the Cyber Crime Division for the\
|
| 494 |
+
\ crime of fraud. The defendant sent an email to the plaintiff on October 16,\
|
| 495 |
+
\ 2020, informing him that his request had been forwarded to the appropriate department\
|
| 496 |
+
\ of the bank for investigation, stating that the bank would never send him an\
|
| 497 |
+
\ email or SMS asking him to enter his personal data and that as of October 7,\
|
| 498 |
+
\ 2020, there was a notice posted for its customers regarding malicious attempts\
|
| 499 |
+
\ to steal personal data in the \"Our News\" section on ....... A month after\
|
| 500 |
+
\ the disputed incident, on November 10, 2020, an amount of €2,296.82 was transferred\
|
| 501 |
+
\ to the plaintiff's account from the account to which the fraudulent credit had\
|
| 502 |
+
\ been made. The plaintiff immediately sent an email to the defendant asking to\
|
| 503 |
+
\ be informed whether this transfer was a return of part of the amount that had\
|
| 504 |
+
\ been illegally withdrawn from his account and requested the return of the remaining\
|
| 505 |
+
\ amount of €703.18. In its response dated January 13, 2021, the defendant confirmed\
|
| 506 |
+
\ that the aforementioned amount indeed came from the account to which the fraudulent\
|
| 507 |
+
\ credit had been made, following a freeze of that account initiated by the defendant\
|
| 508 |
+
\ during the investigation of the incident, but refused to return the remaining\
|
| 509 |
+
\ amount, claiming it bore no responsibility for the leak of the personal codes\
|
| 510 |
+
\ to third parties, according to the terms of the service contract established\
|
| 511 |
+
\ between them. \nFrom the entirety of the evidence presented to the court, there\
|
| 512 |
+
\ is no indication of the authenticity of the contested transaction, as the plaintiff\
|
| 513 |
+
\ did not give his consent for the execution of the transfer of the amount of\
|
| 514 |
+
\ €3,000.00, especially in light of the provision in Article 72 paragraph 2 of\
|
| 515 |
+
\ Law 4537/2018 stating that the mere use of the Internet Banking service by the\
|
| 516 |
+
\ plaintiff does not necessarily constitute sufficient evidence that the payer\
|
| 517 |
+
\ approved the payment action. Specifically, it was proven that the contested\
|
| 518 |
+
\ transaction was not carried out following a strong identification of the plaintiff\
|
| 519 |
+
\ – the sole beneficiary of the account – and his approval, as the latter may\
|
| 520 |
+
\ have entered his personal codes on the counterfeit website; however, he was\
|
| 521 |
+
\ never informed, before the completion of the contested transaction, of the amount\
|
| 522 |
+
\ that would be transferred from his account to a third-party account, nor did\
|
| 523 |
+
\ he receive on his mobile phone, either via SMS or through the VIBER application\
|
| 524 |
+
\ or any other means, the one-time code - extra PIN for its completion, which\
|
| 525 |
+
\ he was required to enter to approve the contested transaction (payment action)\
|
| 526 |
+
\ and thus complete his identification, a fact that was not countered by any evidence\
|
| 527 |
+
\ from the defendant. Furthermore, it is noted that the defendant's claims that\
|
| 528 |
+
\ it bears no responsibility under the terms of the banking services contract,\
|
| 529 |
+
\ whereby it is not liable for any damage to its customer in cases of unauthorized\
|
| 530 |
+
\ use of their personal access codes to the Internet Banking service, are to be\
|
| 531 |
+
\ rejected as fundamentally unfounded. This is because the aforementioned contractual\
|
| 532 |
+
\ terms are invalid according to the provision of Article 103 of Law 4537/2018,\
|
| 533 |
+
\ as they contradict the provisions of Articles 71, 73, and 92 of the same Law,\
|
| 534 |
+
\ which provide for the provider's universal liability and its exemption only\
|
| 535 |
+
\ for unusual and unforeseen circumstances that are beyond the control of the\
|
| 536 |
+
\ party invoking them and whose consequences could not have been avoided despite\
|
| 537 |
+
\ all efforts to the contrary; these provisions establish mandatory law in favor\
|
| 538 |
+
\ of users, as according to Article 103 of Law 4537/2018, payment service providers\
|
| 539 |
+
\ are prohibited from deviating from the provisions to the detriment of payment\
|
| 540 |
+
\ service users, unless the possibility of deviation is explicitly provided and\
|
| 541 |
+
\ they can decide to offer only more favorable terms to payment service users;\
|
| 542 |
+
\ the aforementioned contractual terms do not constitute more favorable terms\
|
| 543 |
+
\ but rather disadvantageous terms for the payment service user. In this case,\
|
| 544 |
+
\ however, the defendant did not prove the authenticity of the transaction and\
|
| 545 |
+
\ its approval by the plaintiff and did not invoke, nor did any unusual and unforeseen\
|
| 546 |
+
\ circumstances beyond its control, the consequences of which could not have been\
|
| 547 |
+
\ avoided despite all efforts to the contrary, come to light. Therefore, the contested\
|
| 548 |
+
\ transaction transferring the amount of €3,000.00 is considered, in the absence\
|
| 549 |
+
\ of demonstrable consent from the plaintiff, unapproved according to the provisions\
|
| 550 |
+
\ of Article 64 of Law 4537/2018, and the defendant's contrary claims are rejected,\
|
| 551 |
+
\ especially since the plaintiff proceeded, according to Article 71 paragraph\
|
| 552 |
+
\ 1 of Law 4537/2018, without undue delay to notify the defendant regarding the\
|
| 553 |
+
\ contested unapproved payment action. Consequently, the defendant is liable for\
|
| 554 |
+
\ compensating the plaintiff for the positive damage he suffered under Article\
|
| 555 |
+
\ 73 of Law 4537/2018 and is obliged to pay him the requested amount of €703.18,\
|
| 556 |
+
\ while the plaintiff’s fault in the occurrence of this damage cannot be established,\
|
| 557 |
+
\ as he entered his personal details in an online environment that was a faithful\
|
| 558 |
+
\ imitation of that of the defendant, as evidenced by the comparison of the screenshots\
|
| 559 |
+
\ of the fake website and the real website provided by the plaintiff, a fact that\
|
| 560 |
+
\ he could not have known while being fully convinced that he was transacting\
|
| 561 |
+
\ with the defendant. Furthermore, the defendant’s liability to compensate the\
|
| 562 |
+
\ plaintiff is based on the provision of Article 8 of Law 2251/1994, which applies\
|
| 563 |
+
\ in this case, as the plaintiff's damage resulted from inadequate fulfillment\
|
| 564 |
+
\ of its obligations in the context of providing its services, but also on the\
|
| 565 |
+
\ provision of Article 914 of the Civil Code in the sense of omission on its part\
|
| 566 |
+
\ of unlawfully and culpably imposed actions. In this case, given that during\
|
| 567 |
+
\ the relevant period there had been a multitude of similar incidents of fraud\
|
| 568 |
+
\ against the defendant's customers, the latter, as a service provider to the\
|
| 569 |
+
\ consumer public and bearing transactional obligations of care and security towards\
|
| 570 |
+
\ them, displayed gross negligence regarding the security provided for electronic\
|
| 571 |
+
\ transaction services, which was compromised by the fraudulent theft of funds,\
|
| 572 |
+
\ as it did not comply with all required high-security measures for executing\
|
| 573 |
+
\ the contested transaction, failing to implement the strict customer identification\
|
| 574 |
+
\ verification process and to check the authenticity of the account to which the\
|
| 575 |
+
\ funds were sent, thus not assuming the suspicious nature of the transaction,\
|
| 576 |
+
\ did not adopt comprehensive and improved protective measures to fully protect\
|
| 577 |
+
\ its customers against malicious attacks and online fraud and to prevent the\
|
| 578 |
+
\ infiltration of unauthorized third parties, nor did it fulfill its obligations\
|
| 579 |
+
\ to inform, accurately inform, and warn its consumers - customers, as it failed\
|
| 580 |
+
\ to adequately inform them of attempts to steal their personal data through the\
|
| 581 |
+
\ sending of informative emails or SMS, while merely posting in a section rather\
|
| 582 |
+
\ than on a central banner (as it later did) does not constitute adequate information\
|
| 583 |
+
\ such that it meets the requirement of protecting its customers and the increased\
|
| 584 |
+
\ safeguarding of their interests. Although the plaintiff acted promptly and informed\
|
| 585 |
+
\ the defendant on the same day about the contested incident, the defendant did\
|
| 586 |
+
\ not act as promptly regarding the investigation of the incident and the freezing\
|
| 587 |
+
\ of the account that held the fraudulent credit to prevent the plaintiff's loss,\
|
| 588 |
+
\ but only returned part of the funds to the plaintiff a month later. This behavior,\
|
| 589 |
+
\ beyond being culpable due to gross negligence, was also unlawful, as it would\
|
| 590 |
+
\ have been illegal even without the contractual relationship, as contrary to\
|
| 591 |
+
\ the provisions of Law 4537/2018 and Law 2251/1994, regarding the lack of security\
|
| 592 |
+
\ of the services that the consumer is legitimately entitled to expect, as well\
|
| 593 |
+
\ as the building of trust that is essential in banking transactions, elements\
|
| 594 |
+
\ that it was obligated to provide within the sphere of the services offered,\
|
| 595 |
+
\ and contrary to the principles of good faith and commercial ethics, as crystallized\
|
| 596 |
+
\ in the provision of Article 288 of the Civil Code, as well as the general duty\
|
| 597 |
+
\ imposed by Article 914 of the Civil Code not to cause harm to another culpably.\
|
| 598 |
+
\ This resulted not only in positive damage to the plaintiff but also in causing\
|
| 599 |
+
\ him moral harm consisting of his mental distress and the disruption, agitation,\
|
| 600 |
+
\ and sorrow he experienced, for which he must be awarded financial compensation.\
|
| 601 |
+
\ Taking into account all the general circumstances of the case, the extent of\
|
| 602 |
+
\ the plaintiff's damage, the severity of the defendant's fault, the mental distress\
|
| 603 |
+
\ suffered by the plaintiff, the insecurity he felt regarding his deposits, the\
|
| 604 |
+
\ sorrow he experienced, and the stress caused by his financial loss, which occurred\
|
| 605 |
+
\ during the pandemic period when his earnings from his professional activity\
|
| 606 |
+
\ had significantly decreased, as well as the financial and social situation of\
|
| 607 |
+
\ the parties, it is the court's opinion that he should be granted, as financial\
|
| 608 |
+
\ compensation for his moral harm, an amount of €250.00, which is deemed reasonable\
|
| 609 |
+
\ and fair. Therefore, the total monetary amount that the plaintiff is entitled\
|
| 610 |
+
\ to for his positive damage and financial compensation for the moral harm suffered\
|
| 611 |
+
\ amounts to a total of (€703.18 + €250.00) = €953.18."
|
| 612 |
+
- 'Failure to notify the Authority of file establishment or permit changes is punished
|
| 613 |
+
by up to three years’ imprisonment and a fine of one to five million Drachmas.
|
| 614 |
+
|
| 615 |
+
Maintaining a file without a permit or violating permit terms is punished by at
|
| 616 |
+
least one year’s imprisonment and a fine of one to five million Drachmas.
|
| 617 |
+
|
| 618 |
+
File interconnection that is unauthorized or carried out without a permit is punished by up to three
|
| 619 |
+
years’ imprisonment and a fine of one to five million Drachmas.
|
| 620 |
+
|
| 621 |
+
Unlawful interference with personal data is punished by imprisonment and a fine;
|
| 622 |
+
for sensitive data, at least one year’s imprisonment and a fine of one to ten
|
| 623 |
+
million Drachmas.
|
| 624 |
+
|
| 625 |
+
Controllers who fail to comply with Authority decisions or violate data transfer
|
| 626 |
+
rules face at least two years’ imprisonment and a fine of one to five million
|
| 627 |
+
Drachmas.
|
| 628 |
+
|
| 629 |
+
If acts were committed for unlawful benefit or to cause harm, punishment is up
|
| 630 |
+
to ten years’ imprisonment and a fine of two to ten million Drachmas.
|
| 631 |
+
|
| 632 |
+
If acts jeopardize democratic governance or national security, punishment is confinement
|
| 633 |
+
in a penitentiary and a fine of five to ten million Drachmas.
|
| 634 |
+
|
| 635 |
+
Acts committed due to negligence result in at least three months’ imprisonment
|
| 636 |
+
and a fine.
|
| 637 |
+
|
| 638 |
+
If the Controller is not a natural person, the responsible party is the representative
|
| 639 |
+
or head of the organization with administrative or managerial duties.
|
| 640 |
+
|
| 641 |
+
Authorized members of the Authority may carry out preliminary investigations even
|
| 642 |
+
without a Prosecutor’s order for certain offenses.
|
| 643 |
+
|
| 644 |
+
The Authority''s President must notify the Public Prosecutor of any offenses under
|
| 645 |
+
investigation, forwarding all relevant evidence.
|
| 646 |
+
|
| 647 |
+
Preliminary investigations must conclude within two months of charges, and trial
|
| 648 |
+
must begin within three months of completion.
|
| 649 |
+
|
| 650 |
+
Continuation of proceedings is allowed only once and for extremely important reasons,
|
| 651 |
+
with adjournment not exceeding two months.
|
| 652 |
+
|
| 653 |
+
Felonies under this law fall under the jurisdiction of the Court of Appeal.
|
| 654 |
+
|
| 655 |
+
'
|
| 656 |
+
- source_sentence: Who must facilitate the exercise of data subject rights?
|
| 657 |
+
sentences:
|
| 658 |
+
- '1.Processing of personal data revealing racial or ethnic origin, political opinions,
|
| 659 |
+
religious or philosophical beliefs, or trade union membership, and the processing
|
| 660 |
+
of genetic data, biometric data for the purpose of uniquely identifying a natural
|
| 661 |
+
person, data concerning health or data concerning a natural person''s sex life
|
| 662 |
+
or sexual orientation shall be prohibited.
|
| 663 |
+
|
| 664 |
+
2.Paragraph 1 shall not apply if one of the following applies: (a) the data subject
|
| 665 |
+
has given explicit consent to the processing of those personal data for one or
|
| 666 |
+
more specified purposes, except where Union or Member State law provide that the
|
| 667 |
+
prohibition referred to in paragraph 1 may not be lifted by the data subject;
|
| 668 |
+
(b) processing is necessary for the purposes of carrying out the obligations
|
| 669 |
+
and exercising specific rights of the controller or of the data subject in the
|
| 670 |
+
field of employment and social security and social protection law in so far as
|
| 671 |
+
it is authorised by Union or Member State law or a collective agreement pursuant
|
| 672 |
+
to Member State law providing for appropriate safeguards for the fundamental rights
|
| 673 |
+
and the interests of the data subject; (c) processing is necessary to protect
|
| 674 |
+
the vital interests of the data subject or of another natural person where the
|
| 675 |
+
data subject is physically or legally incapable of giving consent; (d) processing
|
| 676 |
+
is carried out in the course of its legitimate activities with appropriate safeguards
|
| 677 |
+
by a foundation, association or any other not-for-profit body with a political,
|
| 678 |
+
philosophical, religious or trade union aim and on condition that the processing
|
| 679 |
+
relates solely to the members or to former members of the body or to persons who
|
| 680 |
+
have regular contact with it in connection with its purposes and that the personal
|
| 681 |
+
data are not disclosed outside that body without the consent of the data subjects;
|
| 682 |
+
(e) processing relates to personal data which are manifestly made public by the
|
| 683 |
+
data subject; (f) processing is necessary for the establishment, exercise or
|
| 684 |
+
defence of legal claims or whenever courts are acting in their judicial capacity;
|
| 685 |
+
(g) processing is necessary for reasons of substantial public interest, on the
|
| 686 |
+
basis of Union or Member State law which shall be proportionate to the aim pursued,
|
| 687 |
+
respect the essence of the right to data protection and provide for suitable and
|
| 688 |
+
specific measures to safeguard the fundamental rights and the interests of the
|
| 689 |
+
data subject; (h) processing is necessary for the purposes of preventive or occupational
|
| 690 |
+
medicine, for the assessment of the working capacity of the employee, medical
|
| 691 |
+
diagnosis, the provision of health or social care or treatment or the management
|
| 692 |
+
of health or social care systems and services on the basis of Union or Member
|
| 693 |
+
State law or pursuant to contract with a health professional and subject to the
|
| 694 |
+
conditions and safeguards referred to in paragraph 3; (i) processing is necessary
|
| 695 |
+
for reasons of public interest in the area of public health, such as protecting
|
| 696 |
+
against serious cross-border threats to health or ensuring high standards of quality
|
| 697 |
+
and safety of health care and of medicinal products or medical devices, on the
|
| 698 |
+
basis of Union or Member State law which provides for suitable and specific measures
|
| 699 |
+
to safeguard the rights and freedoms of the data subject, in particular professional
|
| 700 |
+
secrecy; 4.5.2016 L 119/38 (j) processing is necessary for archiving purposes
|
| 701 |
+
in the public interest, scientific or historical research purposes or statistical
|
| 702 |
+
purposes in accordance with Article 89(1) based on Union or Member State law which
|
| 703 |
+
shall be proportionate to the aim pursued, respect the essence of the right to
|
| 704 |
+
data protection and provide for suitable and specific measures to safeguard the
|
| 705 |
+
fundamental rights and the interests of the data subject.
|
| 706 |
+
|
| 707 |
+
3.Personal data referred to in paragraph 1 may be processed for the purposes referred
|
| 708 |
+
to in point (h) of paragraph 2 when those data are processed by or under the responsibility
|
| 709 |
+
of a professional subject to the obligation of professional secrecy under Union
|
| 710 |
+
or Member State law or rules established by national competent bodies or by another
|
| 711 |
+
person also subject to an obligation of secrecy under Union or Member State law
|
| 712 |
+
or rules established by national competent bodies.
|
| 713 |
+
|
| 714 |
+
4.Member States may maintain or introduce further conditions, including limitations,
|
| 715 |
+
with regard to the processing of genetic data, biometric data or data concerning
|
| 716 |
+
health.'
|
| 717 |
+
- Regulation (EC) No 45/2001 of the European Parliament and of the Council (2) applies
|
| 718 |
+
to the processing of personal data by the Union institutions, bodies, offices
|
| 719 |
+
and agencies. Regulation (EC) No 45/2001 and other Union legal acts applicable
|
| 720 |
+
to such processing of personal data should be adapted to the principles and rules
|
| 721 |
+
established in this Regulation and applied in the light of this Regulation. In
|
| 722 |
+
order to provide a strong and coherent data protection framework in the Union,
|
| 723 |
+
the necessary adaptations of Regulation (EC) No 45/2001 should follow after the
|
| 724 |
+
adoption of this Regulation, in order to allow application at the same time as
|
| 725 |
+
this Regulation.
|
| 726 |
+
- "1.The controller shall take appropriate measures to provide any information referred\
|
| 727 |
+
\ to in Articles 13 and 14 and any communication under Articles 15 to 22 and 34\
|
| 728 |
+
\ relating to processing to the data subject in a concise, transparent, intelligible\
|
| 729 |
+
\ and easily accessible form, using clear and plain language, in particular for\
|
| 730 |
+
\ any information addressed specifically to a child. The information shall be\
|
| 731 |
+
\ provided in writing, or by other means, including, where appropriate, by electronic\
|
| 732 |
+
\ means. When requested by the data subject, the information may be provided orally,\
|
| 733 |
+
\ provided that the identity of the data subject is proven by other means. 4.5.2016\
|
| 734 |
+
\ L 119/39 \n2.The controller shall facilitate the exercise of data subject rights\
|
| 735 |
+
\ under Articles 15 to 22. In the cases referred to in Article 11(2), the controller\
|
| 736 |
+
\ shall not refuse to act on the request of the data subject for exercising his\
|
| 737 |
+
\ or her rights under Articles 15 to 22, unless the controller demonstrates that\
|
| 738 |
+
\ it is not in a position to identify the data subject.\n3.The controller shall\
|
| 739 |
+
\ provide information on action taken on a request under Articles 15 to 22 to\
|
| 740 |
+
\ the data subject without undue delay and in any event within one month of receipt\
|
| 741 |
+
\ of the request. That period may be extended by two further months where necessary,\
|
| 742 |
+
\ taking into account the complexity and number of the requests. The controller\
|
| 743 |
+
\ shall inform the data subject of any such extension within one month of receipt\
|
| 744 |
+
\ of the request, together with the reasons for the delay. Where the data subject\
|
| 745 |
+
\ makes the request by electronic form means, the information shall be provided\
|
| 746 |
+
\ by electronic means where possible, unless otherwise requested by the data subject.\n\
|
| 747 |
+
4.If the controller does not take action on the request of the data subject, the\
|
| 748 |
+
\ controller shall inform the data subject without delay and at the latest within\
|
| 749 |
+
\ one month of receipt of the request of the reasons for not taking action and\
|
| 750 |
+
\ on the possibility of lodging a complaint with a supervisory authority and seeking\
|
| 751 |
+
\ a judicial remedy.\n5.Information provided under Articles 13 and 14 and any\
|
| 752 |
+
\ communication and any actions taken under Articles 15 to 22 and 34 shall be\
|
| 753 |
+
\ provided free of charge. Where requests from a data subject are manifestly unfounded\
|
| 754 |
+
\ or excessive, in particular because of their repetitive character, the controller\
|
| 755 |
+
\ may either: (a) charge a reasonable fee taking into account the administrative\
|
| 756 |
+
\ costs of providing the information or communication or taking the action requested;\
|
| 757 |
+
\ or (b) refuse to act on the request. The controller shall bear the burden of\
|
| 758 |
+
\ demonstrating the manifestly unfounded or excessive character of the request.\n\
|
| 759 |
+
6.Without prejudice to Article 11, where the controller has reasonable doubts\
|
| 760 |
+
\ concerning the identity of the natural person making the request referred to\
|
| 761 |
+
\ in Articles 15 to 21, the controller may request the provision of additional\
|
| 762 |
+
\ information necessary to confirm the identity of the data subject.\n7.The information\
|
| 763 |
+
\ to be provided to data subjects pursuant to Articles 13 and 14 may be provided\
|
| 764 |
+
\ in combination with standardised icons in order to give in an easily visible,\
|
| 765 |
+
\ intelligible and clearly legible manner a meaningful overview of the intended\
|
| 766 |
+
\ processing. Where the icons are presented electronically they shall be machine-readable.\n\
|
| 767 |
+
8.The Commission shall be empowered to adopt delegated acts in accordance with\
|
| 768 |
+
\ Article 92 for the purpose of determining the information to be presented by\
|
| 769 |
+
\ the icons and the procedures for providing standardised icons. Section 2 Information\
|
| 770 |
+
\ and access to personal data"
|
| 771 |
+
pipeline_tag: sentence-similarity
|
| 772 |
+
library_name: sentence-transformers
|
| 773 |
+
metrics:
|
| 774 |
+
- cosine_accuracy@1
|
| 775 |
+
- cosine_accuracy@3
|
| 776 |
+
- cosine_accuracy@5
|
| 777 |
+
- cosine_accuracy@10
|
| 778 |
+
- cosine_precision@1
|
| 779 |
+
- cosine_precision@3
|
| 780 |
+
- cosine_precision@5
|
| 781 |
+
- cosine_precision@10
|
| 782 |
+
- cosine_recall@1
|
| 783 |
+
- cosine_recall@3
|
| 784 |
+
- cosine_recall@5
|
| 785 |
+
- cosine_recall@10
|
| 786 |
+
- cosine_ndcg@10
|
| 787 |
+
- cosine_mrr@10
|
| 788 |
+
- cosine_map@100
|
| 789 |
+
model-index:
|
| 790 |
+
- name: multilingual-e5-large
|
| 791 |
+
results:
|
| 792 |
+
- task:
|
| 793 |
+
type: information-retrieval
|
| 794 |
+
name: Information Retrieval
|
| 795 |
+
dataset:
|
| 796 |
+
name: dim 1024
|
| 797 |
+
type: dim_1024
|
| 798 |
+
metrics:
|
| 799 |
+
- type: cosine_accuracy@1
|
| 800 |
+
value: 0.4180537772087068
|
| 801 |
+
name: Cosine Accuracy@1
|
| 802 |
+
- type: cosine_accuracy@3
|
| 803 |
+
value: 0.42189500640204863
|
| 804 |
+
name: Cosine Accuracy@3
|
| 805 |
+
- type: cosine_accuracy@5
|
| 806 |
+
value: 0.4500640204865557
|
| 807 |
+
name: Cosine Accuracy@5
|
| 808 |
+
- type: cosine_accuracy@10
|
| 809 |
+
value: 0.49039692701664533
|
| 810 |
+
name: Cosine Accuracy@10
|
| 811 |
+
- type: cosine_precision@1
|
| 812 |
+
value: 0.4180537772087068
|
| 813 |
+
name: Cosine Precision@1
|
| 814 |
+
- type: cosine_precision@3
|
| 815 |
+
value: 0.4163465642338881
|
| 816 |
+
name: Cosine Precision@3
|
| 817 |
+
- type: cosine_precision@5
|
| 818 |
+
value: 0.4043533930857874
|
| 819 |
+
name: Cosine Precision@5
|
| 820 |
+
- type: cosine_precision@10
|
| 821 |
+
value: 0.36869398207426374
|
| 822 |
+
name: Cosine Precision@10
|
| 823 |
+
- type: cosine_recall@1
|
| 824 |
+
value: 0.04734422767263886
|
| 825 |
+
name: Cosine Recall@1
|
| 826 |
+
- type: cosine_recall@3
|
| 827 |
+
value: 0.138064233626932
|
| 828 |
+
name: Cosine Recall@3
|
| 829 |
+
- type: cosine_recall@5
|
| 830 |
+
value: 0.2069980430010945
|
| 831 |
+
name: Cosine Recall@5
|
| 832 |
+
- type: cosine_recall@10
|
| 833 |
+
value: 0.308531274625124
|
| 834 |
+
name: Cosine Recall@10
|
| 835 |
+
- type: cosine_ndcg@10
|
| 836 |
+
value: 0.44178501209869797
|
| 837 |
+
name: Cosine Ndcg@10
|
| 838 |
+
- type: cosine_mrr@10
|
| 839 |
+
value: 0.42985717334308843
|
| 840 |
+
name: Cosine Mrr@10
|
| 841 |
+
- type: cosine_map@100
|
| 842 |
+
value: 0.506794523350519
|
| 843 |
+
name: Cosine Map@100
|
| 844 |
+
- task:
|
| 845 |
+
type: information-retrieval
|
| 846 |
+
name: Information Retrieval
|
| 847 |
+
dataset:
|
| 848 |
+
name: dim 768
|
| 849 |
+
type: dim_768
|
| 850 |
+
metrics:
|
| 851 |
+
- type: cosine_accuracy@1
|
| 852 |
+
value: 0.41037131882202305
|
| 853 |
+
name: Cosine Accuracy@1
|
| 854 |
+
- type: cosine_accuracy@3
|
| 855 |
+
value: 0.4142125480153649
|
| 856 |
+
name: Cosine Accuracy@3
|
| 857 |
+
- type: cosine_accuracy@5
|
| 858 |
+
value: 0.44430217669654287
|
| 859 |
+
name: Cosine Accuracy@5
|
| 860 |
+
- type: cosine_accuracy@10
|
| 861 |
+
value: 0.4833546734955186
|
| 862 |
+
name: Cosine Accuracy@10
|
| 863 |
+
- type: cosine_precision@1
|
| 864 |
+
value: 0.41037131882202305
|
| 865 |
+
name: Cosine Precision@1
|
| 866 |
+
- type: cosine_precision@3
|
| 867 |
+
value: 0.4086641058472044
|
| 868 |
+
name: Cosine Precision@3
|
| 869 |
+
- type: cosine_precision@5
|
| 870 |
+
value: 0.3969270166453265
|
| 871 |
+
name: Cosine Precision@5
|
| 872 |
+
- type: cosine_precision@10
|
| 873 |
+
value: 0.36165172855313704
|
| 874 |
+
name: Cosine Precision@10
|
| 875 |
+
- type: cosine_recall@1
|
| 876 |
+
value: 0.047186779325657804
|
| 877 |
+
name: Cosine Recall@1
|
| 878 |
+
- type: cosine_recall@3
|
| 879 |
+
value: 0.1375709294981283
|
| 880 |
+
name: Cosine Recall@3
|
| 881 |
+
- type: cosine_recall@5
|
| 882 |
+
value: 0.20603724780478358
|
| 883 |
+
name: Cosine Recall@5
|
| 884 |
+
- type: cosine_recall@10
|
| 885 |
+
value: 0.30540044861465576
|
| 886 |
+
name: Cosine Recall@10
|
| 887 |
+
- type: cosine_ndcg@10
|
| 888 |
+
value: 0.4349862241563486
|
| 889 |
+
name: Cosine Ndcg@10
|
| 890 |
+
- type: cosine_mrr@10
|
| 891 |
+
value: 0.4224889742495374
|
| 892 |
+
name: Cosine Mrr@10
|
| 893 |
+
- type: cosine_map@100
|
| 894 |
+
value: 0.500478306774528
|
| 895 |
+
name: Cosine Map@100
|
| 896 |
+
- task:
|
| 897 |
+
type: information-retrieval
|
| 898 |
+
name: Information Retrieval
|
| 899 |
+
dataset:
|
| 900 |
+
name: dim 512
|
| 901 |
+
type: dim_512
|
| 902 |
+
metrics:
|
| 903 |
+
- type: cosine_accuracy@1
|
| 904 |
+
value: 0.4065300896286812
|
| 905 |
+
name: Cosine Accuracy@1
|
| 906 |
+
- type: cosine_accuracy@3
|
| 907 |
+
value: 0.41229193341869397
|
| 908 |
+
name: Cosine Accuracy@3
|
| 909 |
+
- type: cosine_accuracy@5
|
| 910 |
+
value: 0.44494238156209986
|
| 911 |
+
name: Cosine Accuracy@5
|
| 912 |
+
- type: cosine_accuracy@10
|
| 913 |
+
value: 0.4814340588988476
|
| 914 |
+
name: Cosine Accuracy@10
|
| 915 |
+
- type: cosine_precision@1
|
| 916 |
+
value: 0.4065300896286812
|
| 917 |
+
name: Cosine Precision@1
|
| 918 |
+
- type: cosine_precision@3
|
| 919 |
+
value: 0.4054630815194195
|
| 920 |
+
name: Cosine Precision@3
|
| 921 |
+
- type: cosine_precision@5
|
| 922 |
+
value: 0.3947503201024327
|
| 923 |
+
name: Cosine Precision@5
|
| 924 |
+
- type: cosine_precision@10
|
| 925 |
+
value: 0.3596030729833547
|
| 926 |
+
name: Cosine Precision@10
|
| 927 |
+
- type: cosine_recall@1
|
| 928 |
+
value: 0.047372341735862133
|
| 929 |
+
name: Cosine Recall@1
|
| 930 |
+
- type: cosine_recall@3
|
| 931 |
+
value: 0.1383106496582531
|
| 932 |
+
name: Cosine Recall@3
|
| 933 |
+
- type: cosine_recall@5
|
| 934 |
+
value: 0.20757258542171747
|
| 935 |
+
name: Cosine Recall@5
|
| 936 |
+
- type: cosine_recall@10
|
| 937 |
+
value: 0.3071623578952262
|
| 938 |
+
name: Cosine Recall@10
|
| 939 |
+
- type: cosine_ndcg@10
|
| 940 |
+
value: 0.4329095460408428
|
| 941 |
+
name: Cosine Ndcg@10
|
| 942 |
+
- type: cosine_mrr@10
|
| 943 |
+
value: 0.41950236774180394
|
| 944 |
+
name: Cosine Mrr@10
|
| 945 |
+
- type: cosine_map@100
|
| 946 |
+
value: 0.49555759572196095
|
| 947 |
+
name: Cosine Map@100
|
| 948 |
+
- task:
|
| 949 |
+
type: information-retrieval
|
| 950 |
+
name: Information Retrieval
|
| 951 |
+
dataset:
|
| 952 |
+
name: dim 256
|
| 953 |
+
type: dim_256
|
| 954 |
+
metrics:
|
| 955 |
+
- type: cosine_accuracy@1
|
| 956 |
+
value: 0.38348271446862997
|
| 957 |
+
name: Cosine Accuracy@1
|
| 958 |
+
- type: cosine_accuracy@3
|
| 959 |
+
value: 0.3886043533930858
|
| 960 |
+
name: Cosine Accuracy@3
|
| 961 |
+
- type: cosine_accuracy@5
|
| 962 |
+
value: 0.4206145966709347
|
| 963 |
+
name: Cosine Accuracy@5
|
| 964 |
+
- type: cosine_accuracy@10
|
| 965 |
+
value: 0.4551856594110115
|
| 966 |
+
name: Cosine Accuracy@10
|
| 967 |
+
- type: cosine_precision@1
|
| 968 |
+
value: 0.38348271446862997
|
| 969 |
+
name: Cosine Precision@1
|
| 970 |
+
- type: cosine_precision@3
|
| 971 |
+
value: 0.382202304737516
|
| 972 |
+
name: Cosine Precision@3
|
| 973 |
+
- type: cosine_precision@5
|
| 974 |
+
value: 0.3718309859154929
|
| 975 |
+
name: Cosine Precision@5
|
| 976 |
+
- type: cosine_precision@10
|
| 977 |
+
value: 0.33886043533930854
|
| 978 |
+
name: Cosine Precision@10
|
| 979 |
+
- type: cosine_recall@1
|
| 980 |
+
value: 0.04466034705404223
|
| 981 |
+
name: Cosine Recall@1
|
| 982 |
+
- type: cosine_recall@3
|
| 983 |
+
value: 0.1301795023253766
|
| 984 |
+
name: Cosine Recall@3
|
| 985 |
+
- type: cosine_recall@5
|
| 986 |
+
value: 0.19500340584044382
|
| 987 |
+
name: Cosine Recall@5
|
| 988 |
+
- type: cosine_recall@10
|
| 989 |
+
value: 0.2892016292717267
|
| 990 |
+
name: Cosine Recall@10
|
| 991 |
+
- type: cosine_ndcg@10
|
| 992 |
+
value: 0.4087462230477571
|
| 993 |
+
name: Cosine Ndcg@10
|
| 994 |
+
- type: cosine_mrr@10
|
| 995 |
+
value: 0.3957850639188662
|
| 996 |
+
name: Cosine Mrr@10
|
| 997 |
+
- type: cosine_map@100
|
| 998 |
+
value: 0.4709582085612654
|
| 999 |
+
name: Cosine Map@100
|
| 1000 |
+
- task:
|
| 1001 |
+
type: information-retrieval
|
| 1002 |
+
name: Information Retrieval
|
| 1003 |
+
dataset:
|
| 1004 |
+
name: dim 128
|
| 1005 |
+
type: dim_128
|
| 1006 |
+
metrics:
|
| 1007 |
+
- type: cosine_accuracy@1
|
| 1008 |
+
value: 0.34699103713188223
|
| 1009 |
+
name: Cosine Accuracy@1
|
| 1010 |
+
- type: cosine_accuracy@3
|
| 1011 |
+
value: 0.35147247119078107
|
| 1012 |
+
name: Cosine Accuracy@3
|
| 1013 |
+
- type: cosine_accuracy@5
|
| 1014 |
+
value: 0.37900128040973113
|
| 1015 |
+
name: Cosine Accuracy@5
|
| 1016 |
+
- type: cosine_accuracy@10
|
| 1017 |
+
value: 0.4212548015364917
|
| 1018 |
+
name: Cosine Accuracy@10
|
| 1019 |
+
- type: cosine_precision@1
|
| 1020 |
+
value: 0.34699103713188223
|
| 1021 |
+
name: Cosine Precision@1
|
| 1022 |
+
- type: cosine_precision@3
|
| 1023 |
+
value: 0.34571062740076824
|
| 1024 |
+
name: Cosine Precision@3
|
| 1025 |
+
- type: cosine_precision@5
|
| 1026 |
+
value: 0.3352112676056338
|
| 1027 |
+
name: Cosine Precision@5
|
| 1028 |
+
- type: cosine_precision@10
|
| 1029 |
+
value: 0.3042893725992318
|
| 1030 |
+
name: Cosine Precision@10
|
| 1031 |
+
- type: cosine_recall@1
|
| 1032 |
+
value: 0.04217848526747235
|
| 1033 |
+
name: Cosine Recall@1
|
| 1034 |
+
- type: cosine_recall@3
|
| 1035 |
+
value: 0.12288848071178002
|
| 1036 |
+
name: Cosine Recall@3
|
| 1037 |
+
- type: cosine_recall@5
|
| 1038 |
+
value: 0.18344012521240954
|
| 1039 |
+
name: Cosine Recall@5
|
| 1040 |
+
- type: cosine_recall@10
|
| 1041 |
+
value: 0.2706183968947745
|
| 1042 |
+
name: Cosine Recall@10
|
| 1043 |
+
- type: cosine_ndcg@10
|
| 1044 |
+
value: 0.37139192897263235
|
| 1045 |
+
name: Cosine Ndcg@10
|
| 1046 |
+
- type: cosine_mrr@10
|
| 1047 |
+
value: 0.35916305916305874
|
| 1048 |
+
name: Cosine Mrr@10
|
| 1049 |
+
- type: cosine_map@100
|
| 1050 |
+
value: 0.4338211299784659
|
| 1051 |
+
name: Cosine Map@100
|
| 1052 |
+
- task:
|
| 1053 |
+
type: information-retrieval
|
| 1054 |
+
name: Information Retrieval
|
| 1055 |
+
dataset:
|
| 1056 |
+
name: dim 64
|
| 1057 |
+
type: dim_64
|
| 1058 |
+
metrics:
|
| 1059 |
+
- type: cosine_accuracy@1
|
| 1060 |
+
value: 0.3207426376440461
|
| 1061 |
+
name: Cosine Accuracy@1
|
| 1062 |
+
- type: cosine_accuracy@3
|
| 1063 |
+
value: 0.322663252240717
|
| 1064 |
+
name: Cosine Accuracy@3
|
| 1065 |
+
- type: cosine_accuracy@5
|
| 1066 |
+
value: 0.3405889884763124
|
| 1067 |
+
name: Cosine Accuracy@5
|
| 1068 |
+
- type: cosine_accuracy@10
|
| 1069 |
+
value: 0.3725992317541613
|
| 1070 |
+
name: Cosine Accuracy@10
|
| 1071 |
+
- type: cosine_precision@1
|
| 1072 |
+
value: 0.3207426376440461
|
| 1073 |
+
name: Cosine Precision@1
|
| 1074 |
+
- type: cosine_precision@3
|
| 1075 |
+
value: 0.3188220230473751
|
| 1076 |
+
name: Cosine Precision@3
|
| 1077 |
+
- type: cosine_precision@5
|
| 1078 |
+
value: 0.3088348271446863
|
| 1079 |
+
name: Cosine Precision@5
|
| 1080 |
+
- type: cosine_precision@10
|
| 1081 |
+
value: 0.2797055057618438
|
| 1082 |
+
name: Cosine Precision@10
|
| 1083 |
+
- type: cosine_recall@1
|
| 1084 |
+
value: 0.036318765090758674
|
| 1085 |
+
name: Cosine Recall@1
|
| 1086 |
+
- type: cosine_recall@3
|
| 1087 |
+
value: 0.10562189493083342
|
| 1088 |
+
name: Cosine Recall@3
|
| 1089 |
+
- type: cosine_recall@5
|
| 1090 |
+
value: 0.15867125525021739
|
| 1091 |
+
name: Cosine Recall@5
|
| 1092 |
+
- type: cosine_recall@10
|
| 1093 |
+
value: 0.23840960718091392
|
| 1094 |
+
name: Cosine Recall@10
|
| 1095 |
+
- type: cosine_ndcg@10
|
| 1096 |
+
value: 0.3371953828075091
|
| 1097 |
+
name: Cosine Ndcg@10
|
| 1098 |
+
- type: cosine_mrr@10
|
| 1099 |
+
value: 0.32884732638253733
|
| 1100 |
+
name: Cosine Mrr@10
|
| 1101 |
+
- type: cosine_map@100
|
| 1102 |
+
value: 0.3933467041096336
|
| 1103 |
+
name: Cosine Map@100
|
| 1104 |
+
---
|
| 1105 |
+
|
| 1106 |
+
# multilingual-e5-large
|
| 1107 |
+
|
| 1108 |
+
This is a [sentence-transformers](https://www.SBERT.net) model fine-tuned from [intfloat/multilingual-e5-large](https://huggingface.co/intfloat/multilingual-e5-large). It maps sentences and paragraphs to a 1024-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more. The `model-index` metadata above also reports retrieval metrics on evaluation sets named `dim_768`, `dim_512`, `dim_256`, `dim_128` and `dim_64`, alongside `dim_1024`.
|
| 1109 |
+
|
| 1110 |
+
## Model Details
|
| 1111 |
+
|
| 1112 |
+
### Model Description
|
| 1113 |
+
- **Model Type:** Sentence Transformer
|
| 1114 |
+
- **Base model:** [intfloat/multilingual-e5-large](https://huggingface.co/intfloat/multilingual-e5-large) <!-- at revision 0dc5580a448e4284468b8909bae50fa925907bc5 -->
|
| 1115 |
+
- **Maximum Sequence Length:** 512 tokens
|
| 1116 |
+
- **Output Dimensionality:** 1024 dimensions
|
| 1117 |
+
- **Similarity Function:** Cosine Similarity
|
| 1118 |
+
<!-- - **Training Dataset:** Unknown -->
|
| 1119 |
+
- **Language:** en
|
| 1120 |
+
- **License:** apache-2.0
|
| 1121 |
+
|
| 1122 |
+
### Model Sources
|
| 1123 |
+
|
| 1124 |
+
- **Documentation:** [Sentence Transformers Documentation](https://sbert.net)
|
| 1125 |
+
- **Repository:** [Sentence Transformers on GitHub](https://github.com/UKPLab/sentence-transformers)
|
| 1126 |
+
- **Hugging Face:** [Sentence Transformers on Hugging Face](https://huggingface.co/models?library=sentence-transformers)
|
| 1127 |
+
|
| 1128 |
+
### Full Model Architecture
|
| 1129 |
+
|
| 1130 |
+
```
|
| 1131 |
+
SentenceTransformer(
|
| 1132 |
+
(0): Transformer({'max_seq_length': 512, 'do_lower_case': False, 'architecture': 'XLMRobertaModel'})
|
| 1133 |
+
(1): Pooling({'word_embedding_dimension': 1024, 'pooling_mode_cls_token': False, 'pooling_mode_mean_tokens': True, 'pooling_mode_max_tokens': False, 'pooling_mode_mean_sqrt_len_tokens': False, 'pooling_mode_weightedmean_tokens': False, 'pooling_mode_lasttoken': False, 'include_prompt': True})
|
| 1134 |
+
(2): Normalize()
|
| 1135 |
+
)
|
| 1136 |
+
```
|
| 1137 |
+
|
| 1138 |
+
## Usage
|
| 1139 |
+
|
| 1140 |
+
### Direct Usage (Sentence Transformers)
|
| 1141 |
+
|
| 1142 |
+
First install the Sentence Transformers library:
|
| 1143 |
+
|
| 1144 |
+
```bash
|
| 1145 |
+
pip install -U sentence-transformers
|
| 1146 |
+
```
|
| 1147 |
+
|
| 1148 |
+
Then you can load this model and run inference.
|
| 1149 |
+
```python
|
| 1150 |
+
from sentence_transformers import SentenceTransformer
|
| 1151 |
+
|
| 1152 |
+
# Download from the 🤗 Hub
|
| 1153 |
+
model = SentenceTransformer("sentence_transformers_model_id")
|
| 1154 |
+
# Run inference
|
| 1155 |
+
sentences = [
|
| 1156 |
+
'Who must facilitate the exercise of data subject rights?',
|
| 1157 |
+
'1.The controller shall take appropriate measures to provide any information referred to in Articles 13 and 14 and any communication under Articles 15 to 22 and 34 relating to processing to the data subject in a concise, transparent, intelligible and easily accessible form, using clear and plain language, in particular for any information addressed specifically to a child. The information shall be provided in writing, or by other means, including, where appropriate, by electronic means. When requested by the data subject, the information may be provided orally, provided that the identity of the data subject is proven by other means. 4.5.2016 L 119/39 \n2.The controller shall facilitate the exercise of data subject rights under Articles 15 to 22. In the cases referred to in Article 11(2), the controller shall not refuse to act on the request of the data subject for exercising his or her rights under Articles 15 to 22, unless the controller demonstrates that it is not in a position to identify the data subject.\n3.The controller shall provide information on action taken on a request under Articles 15 to 22 to the data subject without undue delay and in any event within one month of receipt of the request. That period may be extended by two further months where necessary, taking into account the complexity and number of the requests. The controller shall inform the data subject of any such extension within one month of receipt of the request, together with the reasons for the delay. Where the data subject makes the request by electronic form means, the information shall be provided by electronic means where possible, unless otherwise requested by the data subject.\n4.If the controller does not take action on the request of the data subject, the controller shall inform the data subject without delay and at the latest within one month of receipt of the request of the reasons for not taking action and on the possibility of lodging a complaint with a supervisory authority and seeking a judicial remedy.\n5.Information provided under Articles 13 and 14 and any communication and any actions taken under Articles 15 to 22 and 34 shall be provided free of charge. Where requests from a data subject are manifestly unfounded or excessive, in particular because of their repetitive character, the controller may either: (a) charge a reasonable fee taking into account the administrative costs of providing the information or communication or taking the action requested; or (b) refuse to act on the request. The controller shall bear the burden of demonstrating the manifestly unfounded or excessive character of the request.\n6.Without prejudice to Article 11, where the controller has reasonable doubts concerning the identity of the natural person making the request referred to in Articles 15 to 21, the controller may request the provision of additional information necessary to confirm the identity of the data subject.\n7.The information to be provided to data subjects pursuant to Articles 13 and 14 may be provided in combination with standardised icons in order to give in an easily visible, intelligible and clearly legible manner a meaningful overview of the intended processing. Where the icons are presented electronically they shall be machine-readable.\n8.The Commission shall be empowered to adopt delegated acts in accordance with Article 92 for the purpose of determining the information to be presented by the icons and the procedures for providing standardised icons. Section 2 Information and access to personal data',
|
| 1158 |
+
'Regulation (EC) No 45/2001 of the European Parliament and of the Council (2) applies to the processing of personal data by the Union institutions, bodies, offices and agencies. Regulation (EC) No 45/2001 and other Union legal acts applicable to such processing of personal data should be adapted to the principles and rules established in this Regulation and applied in the light of this Regulation. In order to provide a strong and coherent data protection framework in the Union, the necessary adaptations of Regulation (EC) No 45/2001 should follow after the adoption of this Regulation, in order to allow application at the same time as this Regulation.',
|
| 1159 |
+
]
|
| 1160 |
+
embeddings = model.encode(sentences)
|
| 1161 |
+
print(embeddings.shape)
|
| 1162 |
+
# (3, 1024)
|
| 1163 |
+
|
| 1164 |
+
# Get the similarity scores for the embeddings
|
| 1165 |
+
similarities = model.similarity(embeddings, embeddings)
|
| 1166 |
+
print(similarities)
|
| 1167 |
+
# tensor([[1.0000, 0.5748, 0.4790],
|
| 1168 |
+
# [0.5748, 1.0000, 0.3993],
|
| 1169 |
+
# [0.4790, 0.3993, 1.0000]])
|
| 1170 |
+
```
|
| 1171 |
+
|
| 1172 |
+
<!--
|
| 1173 |
+
### Direct Usage (Transformers)
|
| 1174 |
+
|
| 1175 |
+
<details><summary>Click to see the direct usage in Transformers</summary>
|
| 1176 |
+
|
| 1177 |
+
</details>
|
| 1178 |
+
-->
|
| 1179 |
+
|
| 1180 |
+
<!--
|
| 1181 |
+
### Downstream Usage (Sentence Transformers)
|
| 1182 |
+
|
| 1183 |
+
You can finetune this model on your own dataset.
|
| 1184 |
+
|
| 1185 |
+
<details><summary>Click to expand</summary>
|
| 1186 |
+
|
| 1187 |
+
</details>
|
| 1188 |
+
-->
|
| 1189 |
+
|
| 1190 |
+
<!--
|
| 1191 |
+
### Out-of-Scope Use
|
| 1192 |
+
|
| 1193 |
+
*List how the model may foreseeably be misused and address what users ought not to do with the model.*
|
| 1194 |
+
-->
|
| 1195 |
+
|
| 1196 |
+
## Evaluation
|
| 1197 |
+
|
| 1198 |
+
### Metrics
|
| 1199 |
+
|
| 1200 |
+
#### Information Retrieval
|
| 1201 |
+
|
| 1202 |
+
* Dataset: `dim_1024`
|
| 1203 |
+
* Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
|
| 1204 |
+
```json
|
| 1205 |
+
{
|
| 1206 |
+
"truncate_dim": 1024
|
| 1207 |
+
}
|
| 1208 |
+
```
|
| 1209 |
+
|
| 1210 |
+
| Metric | Value |
|
| 1211 |
+
|:--------------------|:-----------|
|
| 1212 |
+
| cosine_accuracy@1 | 0.4181 |
|
| 1213 |
+
| cosine_accuracy@3 | 0.4219 |
|
| 1214 |
+
| cosine_accuracy@5 | 0.4501 |
|
| 1215 |
+
| cosine_accuracy@10 | 0.4904 |
|
| 1216 |
+
| cosine_precision@1 | 0.4181 |
|
| 1217 |
+
| cosine_precision@3 | 0.4163 |
|
| 1218 |
+
| cosine_precision@5 | 0.4044 |
|
| 1219 |
+
| cosine_precision@10 | 0.3687 |
|
| 1220 |
+
| cosine_recall@1 | 0.0473 |
|
| 1221 |
+
| cosine_recall@3 | 0.1381 |
|
| 1222 |
+
| cosine_recall@5 | 0.207 |
|
| 1223 |
+
| cosine_recall@10 | 0.3085 |
|
| 1224 |
+
| **cosine_ndcg@10** | **0.4418** |
|
| 1225 |
+
| cosine_mrr@10 | 0.4299 |
|
| 1226 |
+
| cosine_map@100 | 0.5068 |
|
| 1227 |
+
|
| 1228 |
+
#### Information Retrieval
|
| 1229 |
+
|
| 1230 |
+
* Dataset: `dim_768`
|
| 1231 |
+
* Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
|
| 1232 |
+
```json
|
| 1233 |
+
{
|
| 1234 |
+
"truncate_dim": 768
|
| 1235 |
+
}
|
| 1236 |
+
```
|
| 1237 |
+
|
| 1238 |
+
| Metric | Value |
|
| 1239 |
+
|:--------------------|:----------|
|
| 1240 |
+
| cosine_accuracy@1 | 0.4104 |
|
| 1241 |
+
| cosine_accuracy@3 | 0.4142 |
|
| 1242 |
+
| cosine_accuracy@5 | 0.4443 |
|
| 1243 |
+
| cosine_accuracy@10 | 0.4834 |
|
| 1244 |
+
| cosine_precision@1 | 0.4104 |
|
| 1245 |
+
| cosine_precision@3 | 0.4087 |
|
| 1246 |
+
| cosine_precision@5 | 0.3969 |
|
| 1247 |
+
| cosine_precision@10 | 0.3617 |
|
| 1248 |
+
| cosine_recall@1 | 0.0472 |
|
| 1249 |
+
| cosine_recall@3 | 0.1376 |
|
| 1250 |
+
| cosine_recall@5 | 0.206 |
|
| 1251 |
+
| cosine_recall@10 | 0.3054 |
|
| 1252 |
+
| **cosine_ndcg@10** | **0.435** |
|
| 1253 |
+
| cosine_mrr@10 | 0.4225 |
|
| 1254 |
+
| cosine_map@100 | 0.5005 |
|
| 1255 |
+
|
| 1256 |
+
#### Information Retrieval
|
| 1257 |
+
|
| 1258 |
+
* Dataset: `dim_512`
|
| 1259 |
+
* Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
|
| 1260 |
+
```json
|
| 1261 |
+
{
|
| 1262 |
+
"truncate_dim": 512
|
| 1263 |
+
}
|
| 1264 |
+
```
|
| 1265 |
+
|
| 1266 |
+
| Metric | Value |
|
| 1267 |
+
|:--------------------|:-----------|
|
| 1268 |
+
| cosine_accuracy@1 | 0.4065 |
|
| 1269 |
+
| cosine_accuracy@3 | 0.4123 |
|
| 1270 |
+
| cosine_accuracy@5 | 0.4449 |
|
| 1271 |
+
| cosine_accuracy@10 | 0.4814 |
|
| 1272 |
+
| cosine_precision@1 | 0.4065 |
|
| 1273 |
+
| cosine_precision@3 | 0.4055 |
|
| 1274 |
+
| cosine_precision@5 | 0.3948 |
|
| 1275 |
+
| cosine_precision@10 | 0.3596 |
|
| 1276 |
+
| cosine_recall@1 | 0.0474 |
|
| 1277 |
+
| cosine_recall@3 | 0.1383 |
|
| 1278 |
+
| cosine_recall@5 | 0.2076 |
|
| 1279 |
+
| cosine_recall@10 | 0.3072 |
|
| 1280 |
+
| **cosine_ndcg@10** | **0.4329** |
|
| 1281 |
+
| cosine_mrr@10 | 0.4195 |
|
| 1282 |
+
| cosine_map@100 | 0.4956 |
|
| 1283 |
+
|
| 1284 |
+
#### Information Retrieval
|
| 1285 |
+
|
| 1286 |
+
* Dataset: `dim_256`
|
| 1287 |
+
* Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
|
| 1288 |
+
```json
|
| 1289 |
+
{
|
| 1290 |
+
"truncate_dim": 256
|
| 1291 |
+
}
|
| 1292 |
+
```
|
| 1293 |
+
|
| 1294 |
+
| Metric | Value |
|
| 1295 |
+
|:--------------------|:-----------|
|
| 1296 |
+
| cosine_accuracy@1 | 0.3835 |
|
| 1297 |
+
| cosine_accuracy@3 | 0.3886 |
|
| 1298 |
+
| cosine_accuracy@5 | 0.4206 |
|
| 1299 |
+
| cosine_accuracy@10 | 0.4552 |
|
| 1300 |
+
| cosine_precision@1 | 0.3835 |
|
| 1301 |
+
| cosine_precision@3 | 0.3822 |
|
| 1302 |
+
| cosine_precision@5 | 0.3718 |
|
| 1303 |
+
| cosine_precision@10 | 0.3389 |
|
| 1304 |
+
| cosine_recall@1 | 0.0447 |
|
| 1305 |
+
| cosine_recall@3 | 0.1302 |
|
| 1306 |
+
| cosine_recall@5 | 0.195 |
|
| 1307 |
+
| cosine_recall@10 | 0.2892 |
|
| 1308 |
+
| **cosine_ndcg@10** | **0.4087** |
|
| 1309 |
+
| cosine_mrr@10 | 0.3958 |
|
| 1310 |
+
| cosine_map@100 | 0.471 |
|
| 1311 |
+
|
| 1312 |
+
#### Information Retrieval
|
| 1313 |
+
|
| 1314 |
+
* Dataset: `dim_128`
|
| 1315 |
+
* Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
|
| 1316 |
+
```json
|
| 1317 |
+
{
|
| 1318 |
+
"truncate_dim": 128
|
| 1319 |
+
}
|
| 1320 |
+
```
|
| 1321 |
+
|
| 1322 |
+
| Metric | Value |
|
| 1323 |
+
|:--------------------|:-----------|
|
| 1324 |
+
| cosine_accuracy@1 | 0.347 |
|
| 1325 |
+
| cosine_accuracy@3 | 0.3515 |
|
| 1326 |
+
| cosine_accuracy@5 | 0.379 |
|
| 1327 |
+
| cosine_accuracy@10 | 0.4213 |
|
| 1328 |
+
| cosine_precision@1 | 0.347 |
|
| 1329 |
+
| cosine_precision@3 | 0.3457 |
|
| 1330 |
+
| cosine_precision@5 | 0.3352 |
|
| 1331 |
+
| cosine_precision@10 | 0.3043 |
|
| 1332 |
+
| cosine_recall@1 | 0.0422 |
|
| 1333 |
+
| cosine_recall@3 | 0.1229 |
|
| 1334 |
+
| cosine_recall@5 | 0.1834 |
|
| 1335 |
+
| cosine_recall@10 | 0.2706 |
|
| 1336 |
+
| **cosine_ndcg@10** | **0.3714** |
|
| 1337 |
+
| cosine_mrr@10 | 0.3592 |
|
| 1338 |
+
| cosine_map@100 | 0.4338 |
|
| 1339 |
+
|
| 1340 |
+
#### Information Retrieval
|
| 1341 |
+
|
| 1342 |
+
* Dataset: `dim_64`
|
| 1343 |
+
* Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
|
| 1344 |
+
```json
|
| 1345 |
+
{
|
| 1346 |
+
"truncate_dim": 64
|
| 1347 |
+
}
|
| 1348 |
+
```
|
| 1349 |
+
|
| 1350 |
+
| Metric | Value |
|
| 1351 |
+
|:--------------------|:-----------|
|
| 1352 |
+
| cosine_accuracy@1 | 0.3207 |
|
| 1353 |
+
| cosine_accuracy@3 | 0.3227 |
|
| 1354 |
+
| cosine_accuracy@5 | 0.3406 |
|
| 1355 |
+
| cosine_accuracy@10 | 0.3726 |
|
| 1356 |
+
| cosine_precision@1 | 0.3207 |
|
| 1357 |
+
| cosine_precision@3 | 0.3188 |
|
| 1358 |
+
| cosine_precision@5 | 0.3088 |
|
| 1359 |
+
| cosine_precision@10 | 0.2797 |
|
| 1360 |
+
| cosine_recall@1 | 0.0363 |
|
| 1361 |
+
| cosine_recall@3 | 0.1056 |
|
| 1362 |
+
| cosine_recall@5 | 0.1587 |
|
| 1363 |
+
| cosine_recall@10 | 0.2384 |
|
| 1364 |
+
| **cosine_ndcg@10** | **0.3372** |
|
| 1365 |
+
| cosine_mrr@10 | 0.3288 |
|
| 1366 |
+
| cosine_map@100 | 0.3933 |
|
| 1367 |
+
|
| 1368 |
+
<!--
|
| 1369 |
+
## Bias, Risks and Limitations
|
| 1370 |
+
|
| 1371 |
+
*What are the known or foreseeable issues stemming from this model? You could also flag here known failure cases or weaknesses of the model.*
|
| 1372 |
+
-->
|
| 1373 |
+
|
| 1374 |
+
<!--
|
| 1375 |
+
### Recommendations
|
| 1376 |
+
|
| 1377 |
+
*What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
|
| 1378 |
+
-->
|
| 1379 |
+
|
| 1380 |
+
## Training Details
|
| 1381 |
+
|
| 1382 |
+
### Training Dataset
|
| 1383 |
+
|
| 1384 |
+
#### Unnamed Dataset
|
| 1385 |
+
|
| 1386 |
+
* Size: 391 training samples
|
| 1387 |
+
* Columns: <code>anchor</code> and <code>positive</code>
|
| 1388 |
+
* Approximate statistics based on the first 391 samples:
|
| 1389 |
+
| | anchor | positive |
|
| 1390 |
+
|:--------|:----------------------------------------------------------------------------------|:-------------------------------------------------------------------------------------|
|
| 1391 |
+
| type | string | string |
|
| 1392 |
+
| details | <ul><li>min: 8 tokens</li><li>mean: 17.16 tokens</li><li>max: 32 tokens</li></ul> | <ul><li>min: 27 tokens</li><li>mean: 377.93 tokens</li><li>max: 512 tokens</li></ul> |
|
| 1393 |
+
* Samples:
|
| 1394 |
+
| anchor | positive |
|
| 1395 |
+
|:-------------------------------------------------------------------------------------------------------------------------------|:---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|
|
| 1396 |
+
| <code>What measures must be taken according to Article 32?</code> | <code>1.Where processing is to be carried out on behalf of a controller, the controller shall use only processors providing sufficient guarantees to implement appropriate technical and organisational measures in such a manner that processing will meet the requirements of this Regulation and ensure the protection of the rights of the data subject.<br>2.The processor shall not engage another processor without prior specific or general written authorisation of the controller. In the case of general written authorisation, the processor shall inform the controller of any intended changes concerning the addition or replacement of other processors, thereby giving the controller the opportunity to object to such changes.<br>3.Processing by a processor shall be governed by a contract or other legal act under Union or Member State law, that is binding on the processor with regard to the controller and that sets out the subject-matter and duration of the processing, the nature and purpose of the processing, ...</code> |
|
| 1397 |
+
| <code>What is the responsibility of assisting and advising the data subjects in exercising their rights?</code> | <code>1.A transfer of personal data to a third country or an international organisation may take place where the Commission has decided that the third country, a territory or one or more specified sectors within that third country, or the international organisation in question ensures an adequate level of protection. Such a transfer shall not require any specific authorisation.<br>2.When assessing the adequacy of the level of protection, the Commission shall, in particular, take account of the following elements: (a) the rule of law, respect for human rights and fundamental freedoms, relevant legislation, both general and sectoral, including concerning public security, defence, national security and criminal law and the access of public authorities to personal data, as well as the implementation of such legislation, data protection rules, professional rules and security measures, including rules for the onward transfer of personal data to another third country or international organisation whi...</code> |
|
| 1398 |
+
| <code>What should Member States be authorized to provide for regarding personal data processing for archiving purposes?</code> | <code>Where personal data are processed for archiving purposes, this Regulation should also apply to that processing, bearing in mind that this Regulation should not apply to deceased persons. Public authorities or public or private bodies that hold records of public interest should be services which, pursuant to Union or Member State law, have a legal obligation to acquire, preserve, appraise, arrange, describe, communicate, promote, disseminate and provide access to records of enduring value for general public interest. Member States should also be authorised to provide for the further processing of personal data for archiving purposes, for example with a view to providing specific information related to the political behaviour under former totalitarian state regimes, genocide, crimes against humanity, in particular the Holocaust, or war crimes. 4.5.2016 L 119/29 Official Journal of the European Union EN</code> |
|
| 1399 |
+
* Loss: [<code>MatryoshkaLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#matryoshkaloss) with these parameters:
|
| 1400 |
+
```json
|
| 1401 |
+
{
|
| 1402 |
+
"loss": "MultipleNegativesRankingLoss",
|
| 1403 |
+
"matryoshka_dims": [
|
| 1404 |
+
1024,
|
| 1405 |
+
768,
|
| 1406 |
+
512,
|
| 1407 |
+
256,
|
| 1408 |
+
128,
|
| 1409 |
+
64
|
| 1410 |
+
],
|
| 1411 |
+
"matryoshka_weights": [
|
| 1412 |
+
1,
|
| 1413 |
+
1,
|
| 1414 |
+
1,
|
| 1415 |
+
1,
|
| 1416 |
+
1,
|
| 1417 |
+
1
|
| 1418 |
+
],
|
| 1419 |
+
"n_dims_per_step": -1
|
| 1420 |
+
}
|
| 1421 |
+
```
|
| 1422 |
+
|
| 1423 |
+
### Training Hyperparameters
|
| 1424 |
+
#### Non-Default Hyperparameters
|
| 1425 |
+
|
| 1426 |
+
- `eval_strategy`: epoch
|
| 1427 |
+
- `per_device_eval_batch_size`: 16
|
| 1428 |
+
- `gradient_accumulation_steps`: 4
|
| 1429 |
+
- `learning_rate`: 2e-05
|
| 1430 |
+
- `num_train_epochs`: 20
|
| 1431 |
+
- `lr_scheduler_type`: cosine
|
| 1432 |
+
- `warmup_ratio`: 0.1
|
| 1433 |
+
- `bf16`: True
|
| 1434 |
+
- `load_best_model_at_end`: True
|
| 1435 |
+
- `optim`: adamw_torch_fused
|
| 1436 |
+
- `batch_sampler`: no_duplicates
|
| 1437 |
+
|
| 1438 |
+
#### All Hyperparameters
|
| 1439 |
+
<details><summary>Click to expand</summary>
|
| 1440 |
+
|
| 1441 |
+
- `overwrite_output_dir`: False
|
| 1442 |
+
- `do_predict`: False
|
| 1443 |
+
- `eval_strategy`: epoch
|
| 1444 |
+
- `prediction_loss_only`: True
|
| 1445 |
+
- `per_device_train_batch_size`: 8
|
| 1446 |
+
- `per_device_eval_batch_size`: 16
|
| 1447 |
+
- `per_gpu_train_batch_size`: None
|
| 1448 |
+
- `per_gpu_eval_batch_size`: None
|
| 1449 |
+
- `gradient_accumulation_steps`: 4
|
| 1450 |
+
- `eval_accumulation_steps`: None
|
| 1451 |
+
- `torch_empty_cache_steps`: None
|
| 1452 |
+
- `learning_rate`: 2e-05
|
| 1453 |
+
- `weight_decay`: 0.0
|
| 1454 |
+
- `adam_beta1`: 0.9
|
| 1455 |
+
- `adam_beta2`: 0.999
|
| 1456 |
+
- `adam_epsilon`: 1e-08
|
| 1457 |
+
- `max_grad_norm`: 1.0
|
| 1458 |
+
- `num_train_epochs`: 20
|
| 1459 |
+
- `max_steps`: -1
|
| 1460 |
+
- `lr_scheduler_type`: cosine
|
| 1461 |
+
- `lr_scheduler_kwargs`: {}
|
| 1462 |
+
- `warmup_ratio`: 0.1
|
| 1463 |
+
- `warmup_steps`: 0
|
| 1464 |
+
- `log_level`: passive
|
| 1465 |
+
- `log_level_replica`: warning
|
| 1466 |
+
- `log_on_each_node`: True
|
| 1467 |
+
- `logging_nan_inf_filter`: True
|
| 1468 |
+
- `save_safetensors`: True
|
| 1469 |
+
- `save_on_each_node`: False
|
| 1470 |
+
- `save_only_model`: False
|
| 1471 |
+
- `restore_callback_states_from_checkpoint`: False
|
| 1472 |
+
- `no_cuda`: False
|
| 1473 |
+
- `use_cpu`: False
|
| 1474 |
+
- `use_mps_device`: False
|
| 1475 |
+
- `seed`: 42
|
| 1476 |
+
- `data_seed`: None
|
| 1477 |
+
- `jit_mode_eval`: False
|
| 1478 |
+
- `use_ipex`: False
|
| 1479 |
+
- `bf16`: True
|
| 1480 |
+
- `fp16`: False
|
| 1481 |
+
- `fp16_opt_level`: O1
|
| 1482 |
+
- `half_precision_backend`: auto
|
| 1483 |
+
- `bf16_full_eval`: False
|
| 1484 |
+
- `fp16_full_eval`: False
|
| 1485 |
+
- `tf32`: None
|
| 1486 |
+
- `local_rank`: 0
|
| 1487 |
+
- `ddp_backend`: None
|
| 1488 |
+
- `tpu_num_cores`: None
|
| 1489 |
+
- `tpu_metrics_debug`: False
|
| 1490 |
+
- `debug`: []
|
| 1491 |
+
- `dataloader_drop_last`: False
|
| 1492 |
+
- `dataloader_num_workers`: 0
|
| 1493 |
+
- `dataloader_prefetch_factor`: None
|
| 1494 |
+
- `past_index`: -1
|
| 1495 |
+
- `disable_tqdm`: False
|
| 1496 |
+
- `remove_unused_columns`: True
|
| 1497 |
+
- `label_names`: None
|
| 1498 |
+
- `load_best_model_at_end`: True
|
| 1499 |
+
- `ignore_data_skip`: False
|
| 1500 |
+
- `fsdp`: []
|
| 1501 |
+
- `fsdp_min_num_params`: 0
|
| 1502 |
+
- `fsdp_config`: {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}
|
| 1503 |
+
- `tp_size`: 0
|
| 1504 |
+
- `fsdp_transformer_layer_cls_to_wrap`: None
|
| 1505 |
+
- `accelerator_config`: {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}
|
| 1506 |
+
- `deepspeed`: None
|
| 1507 |
+
- `label_smoothing_factor`: 0.0
|
| 1508 |
+
- `optim`: adamw_torch_fused
|
| 1509 |
+
- `optim_args`: None
|
| 1510 |
+
- `adafactor`: False
|
| 1511 |
+
- `group_by_length`: False
|
| 1512 |
+
- `length_column_name`: length
|
| 1513 |
+
- `ddp_find_unused_parameters`: None
|
| 1514 |
+
- `ddp_bucket_cap_mb`: None
|
| 1515 |
+
- `ddp_broadcast_buffers`: False
|
| 1516 |
+
- `dataloader_pin_memory`: True
|
| 1517 |
+
- `dataloader_persistent_workers`: False
|
| 1518 |
+
- `skip_memory_metrics`: True
|
| 1519 |
+
- `use_legacy_prediction_loop`: False
|
| 1520 |
+
- `push_to_hub`: False
|
| 1521 |
+
- `resume_from_checkpoint`: None
|
| 1522 |
+
- `hub_model_id`: None
|
| 1523 |
+
- `hub_strategy`: every_save
|
| 1524 |
+
- `hub_private_repo`: None
|
| 1525 |
+
- `hub_always_push`: False
|
| 1526 |
+
- `gradient_checkpointing`: False
|
| 1527 |
+
- `gradient_checkpointing_kwargs`: None
|
| 1528 |
+
- `include_inputs_for_metrics`: False
|
| 1529 |
+
- `include_for_metrics`: []
|
| 1530 |
+
- `eval_do_concat_batches`: True
|
| 1531 |
+
- `fp16_backend`: auto
|
| 1532 |
+
- `push_to_hub_model_id`: None
|
| 1533 |
+
- `push_to_hub_organization`: None
|
| 1534 |
+
- `mp_parameters`:
|
| 1535 |
+
- `auto_find_batch_size`: False
|
| 1536 |
+
- `full_determinism`: False
|
| 1537 |
+
- `torchdynamo`: None
|
| 1538 |
+
- `ray_scope`: last
|
| 1539 |
+
- `ddp_timeout`: 1800
|
| 1540 |
+
- `torch_compile`: False
|
| 1541 |
+
- `torch_compile_backend`: None
|
| 1542 |
+
- `torch_compile_mode`: None
|
| 1543 |
+
- `include_tokens_per_second`: False
|
| 1544 |
+
- `include_num_input_tokens_seen`: False
|
| 1545 |
+
- `neftune_noise_alpha`: None
|
| 1546 |
+
- `optim_target_modules`: None
|
| 1547 |
+
- `batch_eval_metrics`: False
|
| 1548 |
+
- `eval_on_start`: False
|
| 1549 |
+
- `use_liger_kernel`: False
|
| 1550 |
+
- `eval_use_gather_object`: False
|
| 1551 |
+
- `average_tokens_across_devices`: False
|
| 1552 |
+
- `prompts`: None
|
| 1553 |
+
- `batch_sampler`: no_duplicates
|
| 1554 |
+
- `multi_dataset_batch_sampler`: proportional
|
| 1555 |
+
- `router_mapping`: {}
|
| 1556 |
+
- `learning_rate_mapping`: {}
|
| 1557 |
+
|
| 1558 |
+
</details>
|
| 1559 |
+
|
| 1560 |
+
### Training Logs
|
| 1561 |
+
| Epoch | Step | Training Loss | dim_1024_cosine_ndcg@10 | dim_768_cosine_ndcg@10 | dim_512_cosine_ndcg@10 | dim_256_cosine_ndcg@10 | dim_128_cosine_ndcg@10 | dim_64_cosine_ndcg@10 |
|
| 1562 |
+
|:------:|:----:|:-------------:|:-----------------------:|:----------------------:|:----------------------:|:----------------------:|:----------------------:|:---------------------:|
|
| 1563 |
+
| 0.8163 | 10 | 31.5155 | - | - | - | - | - | - |
|
| 1564 |
+
| 1.0 | 13 | - | 0.4494 | 0.4446 | 0.4364 | 0.3947 | 0.3362 | 0.2621 |
|
| 1565 |
+
| 1.5714 | 20 | 19.0409 | - | - | - | - | - | - |
|
| 1566 |
+
| 2.0 | 26 | - | 0.4065 | 0.4004 | 0.4013 | 0.3692 | 0.3418 | 0.2882 |
|
| 1567 |
+
| 2.3265 | 30 | 14.5314 | - | - | - | - | - | - |
|
| 1568 |
+
| 3.0 | 39 | - | 0.4418 | 0.4350 | 0.4329 | 0.4087 | 0.3714 | 0.3372 |
|
| 1569 |
+
|
| 1570 |
+
|
| 1571 |
+
### Framework Versions
|
| 1572 |
+
- Python: 3.12.11
|
| 1573 |
+
- Sentence Transformers: 5.1.0
|
| 1574 |
+
- Transformers: 4.51.3
|
| 1575 |
+
- PyTorch: 2.8.0+cu126
|
| 1576 |
+
- Accelerate: 1.10.1
|
| 1577 |
+
- Datasets: 4.0.0
|
| 1578 |
+
- Tokenizers: 0.21.4
|
| 1579 |
+
|
| 1580 |
+
## Citation
|
| 1581 |
+
|
| 1582 |
+
### BibTeX
|
| 1583 |
+
|
| 1584 |
+
#### Sentence Transformers
|
| 1585 |
+
```bibtex
|
| 1586 |
+
@inproceedings{reimers-2019-sentence-bert,
|
| 1587 |
+
title = "Sentence-BERT: Sentence Embeddings using Siamese BERT-Networks",
|
| 1588 |
+
author = "Reimers, Nils and Gurevych, Iryna",
|
| 1589 |
+
booktitle = "Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing",
|
| 1590 |
+
month = "11",
|
| 1591 |
+
year = "2019",
|
| 1592 |
+
publisher = "Association for Computational Linguistics",
|
| 1593 |
+
url = "https://arxiv.org/abs/1908.10084",
|
| 1594 |
+
}
|
| 1595 |
+
```
|
| 1596 |
+
|
| 1597 |
+
#### MatryoshkaLoss
|
| 1598 |
+
```bibtex
|
| 1599 |
+
@misc{kusupati2024matryoshka,
|
| 1600 |
+
title={Matryoshka Representation Learning},
|
| 1601 |
+
author={Aditya Kusupati and Gantavya Bhatt and Aniket Rege and Matthew Wallingford and Aditya Sinha and Vivek Ramanujan and William Howard-Snyder and Kaifeng Chen and Sham Kakade and Prateek Jain and Ali Farhadi},
|
| 1602 |
+
year={2024},
|
| 1603 |
+
eprint={2205.13147},
|
| 1604 |
+
archivePrefix={arXiv},
|
| 1605 |
+
primaryClass={cs.LG}
|
| 1606 |
+
}
|
| 1607 |
+
```
|
| 1608 |
+
|
| 1609 |
+
#### MultipleNegativesRankingLoss
|
| 1610 |
+
```bibtex
|
| 1611 |
+
@misc{henderson2017efficient,
|
| 1612 |
+
title={Efficient Natural Language Response Suggestion for Smart Reply},
|
| 1613 |
+
author={Matthew Henderson and Rami Al-Rfou and Brian Strope and Yun-hsuan Sung and Laszlo Lukacs and Ruiqi Guo and Sanjiv Kumar and Balint Miklos and Ray Kurzweil},
|
| 1614 |
+
year={2017},
|
| 1615 |
+
eprint={1705.00652},
|
| 1616 |
+
archivePrefix={arXiv},
|
| 1617 |
+
primaryClass={cs.CL}
|
| 1618 |
+
}
|
| 1619 |
+
```
|
| 1620 |
+
|
| 1621 |
+
<!--
|
| 1622 |
+
## Glossary
|
| 1623 |
+
|
| 1624 |
+
*Clearly define terms in order to be accessible across audiences.*
|
| 1625 |
+
-->
|
| 1626 |
+
|
| 1627 |
+
<!--
|
| 1628 |
+
## Model Card Authors
|
| 1629 |
+
|
| 1630 |
+
*Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
|
| 1631 |
+
-->
|
| 1632 |
+
|
| 1633 |
+
<!--
|
| 1634 |
+
## Model Card Contact
|
| 1635 |
+
|
| 1636 |
+
*Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
|
| 1637 |
+
-->
|
checkpoint-39/config.json
ADDED
|
@@ -0,0 +1,27 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architectures": [
|
| 3 |
+
"XLMRobertaModel"
|
| 4 |
+
],
|
| 5 |
+
"attention_probs_dropout_prob": 0.1,
|
| 6 |
+
"bos_token_id": 0,
|
| 7 |
+
"classifier_dropout": null,
|
| 8 |
+
"eos_token_id": 2,
|
| 9 |
+
"hidden_act": "gelu",
|
| 10 |
+
"hidden_dropout_prob": 0.1,
|
| 11 |
+
"hidden_size": 1024,
|
| 12 |
+
"initializer_range": 0.02,
|
| 13 |
+
"intermediate_size": 4096,
|
| 14 |
+
"layer_norm_eps": 1e-05,
|
| 15 |
+
"max_position_embeddings": 514,
|
| 16 |
+
"model_type": "xlm-roberta",
|
| 17 |
+
"num_attention_heads": 16,
|
| 18 |
+
"num_hidden_layers": 24,
|
| 19 |
+
"output_past": true,
|
| 20 |
+
"pad_token_id": 1,
|
| 21 |
+
"position_embedding_type": "absolute",
|
| 22 |
+
"torch_dtype": "float32",
|
| 23 |
+
"transformers_version": "4.51.3",
|
| 24 |
+
"type_vocab_size": 1,
|
| 25 |
+
"use_cache": true,
|
| 26 |
+
"vocab_size": 250002
|
| 27 |
+
}
|
checkpoint-39/config_sentence_transformers.json
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"model_type": "SentenceTransformer",
|
| 3 |
+
"__version__": {
|
| 4 |
+
"sentence_transformers": "5.1.0",
|
| 5 |
+
"transformers": "4.51.3",
|
| 6 |
+
"pytorch": "2.8.0+cu126"
|
| 7 |
+
},
|
| 8 |
+
"prompts": {
|
| 9 |
+
"query": "",
|
| 10 |
+
"document": ""
|
| 11 |
+
},
|
| 12 |
+
"default_prompt_name": null,
|
| 13 |
+
"similarity_fn_name": "cosine"
|
| 14 |
+
}
|
checkpoint-39/model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:606517f0bbfd9d0965e1f76f2da0525a6ed6a2c70afc1966a9b0134b9474e775
|
| 3 |
+
size 2239607176
|
checkpoint-39/modules.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"idx": 0,
|
| 4 |
+
"name": "0",
|
| 5 |
+
"path": "",
|
| 6 |
+
"type": "sentence_transformers.models.Transformer"
|
| 7 |
+
},
|
| 8 |
+
{
|
| 9 |
+
"idx": 1,
|
| 10 |
+
"name": "1",
|
| 11 |
+
"path": "1_Pooling",
|
| 12 |
+
"type": "sentence_transformers.models.Pooling"
|
| 13 |
+
},
|
| 14 |
+
{
|
| 15 |
+
"idx": 2,
|
| 16 |
+
"name": "2",
|
| 17 |
+
"path": "2_Normalize",
|
| 18 |
+
"type": "sentence_transformers.models.Normalize"
|
| 19 |
+
}
|
| 20 |
+
]
|
checkpoint-39/optimizer.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a9c909a2d90a6be41dec525d4f69773b1b7ef98feaaad0925b99faff29a123cb
|
| 3 |
+
size 4471067142
|
checkpoint-39/rng_state.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b43253bbaef563ee65793ca453e451021b8a647dbc8d80b82193bbfb19542943
|
| 3 |
+
size 14645
|
checkpoint-39/scheduler.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bbe9b9462c0e6409f0e0b402c3d44d048e656208116af5441a4baa2dfc585878
|
| 3 |
+
size 1465
|
checkpoint-39/sentence_bert_config.json
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"max_seq_length": 512,
|
| 3 |
+
"do_lower_case": false
|
| 4 |
+
}
|
checkpoint-39/sentencepiece.bpe.model
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865
|
| 3 |
+
size 5069051
|
checkpoint-39/special_tokens_map.json
ADDED
|
@@ -0,0 +1,51 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"bos_token": {
|
| 3 |
+
"content": "<s>",
|
| 4 |
+
"lstrip": false,
|
| 5 |
+
"normalized": false,
|
| 6 |
+
"rstrip": false,
|
| 7 |
+
"single_word": false
|
| 8 |
+
},
|
| 9 |
+
"cls_token": {
|
| 10 |
+
"content": "<s>",
|
| 11 |
+
"lstrip": false,
|
| 12 |
+
"normalized": false,
|
| 13 |
+
"rstrip": false,
|
| 14 |
+
"single_word": false
|
| 15 |
+
},
|
| 16 |
+
"eos_token": {
|
| 17 |
+
"content": "</s>",
|
| 18 |
+
"lstrip": false,
|
| 19 |
+
"normalized": false,
|
| 20 |
+
"rstrip": false,
|
| 21 |
+
"single_word": false
|
| 22 |
+
},
|
| 23 |
+
"mask_token": {
|
| 24 |
+
"content": "<mask>",
|
| 25 |
+
"lstrip": true,
|
| 26 |
+
"normalized": false,
|
| 27 |
+
"rstrip": false,
|
| 28 |
+
"single_word": false
|
| 29 |
+
},
|
| 30 |
+
"pad_token": {
|
| 31 |
+
"content": "<pad>",
|
| 32 |
+
"lstrip": false,
|
| 33 |
+
"normalized": false,
|
| 34 |
+
"rstrip": false,
|
| 35 |
+
"single_word": false
|
| 36 |
+
},
|
| 37 |
+
"sep_token": {
|
| 38 |
+
"content": "</s>",
|
| 39 |
+
"lstrip": false,
|
| 40 |
+
"normalized": false,
|
| 41 |
+
"rstrip": false,
|
| 42 |
+
"single_word": false
|
| 43 |
+
},
|
| 44 |
+
"unk_token": {
|
| 45 |
+
"content": "<unk>",
|
| 46 |
+
"lstrip": false,
|
| 47 |
+
"normalized": false,
|
| 48 |
+
"rstrip": false,
|
| 49 |
+
"single_word": false
|
| 50 |
+
}
|
| 51 |
+
}
|
checkpoint-39/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:883b037111086fd4dfebbbc9b7cee11e1517b5e0c0514879478661440f137085
|
| 3 |
+
size 17082987
|
checkpoint-39/tokenizer_config.json
ADDED
|
@@ -0,0 +1,55 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"added_tokens_decoder": {
|
| 3 |
+
"0": {
|
| 4 |
+
"content": "<s>",
|
| 5 |
+
"lstrip": false,
|
| 6 |
+
"normalized": false,
|
| 7 |
+
"rstrip": false,
|
| 8 |
+
"single_word": false,
|
| 9 |
+
"special": true
|
| 10 |
+
},
|
| 11 |
+
"1": {
|
| 12 |
+
"content": "<pad>",
|
| 13 |
+
"lstrip": false,
|
| 14 |
+
"normalized": false,
|
| 15 |
+
"rstrip": false,
|
| 16 |
+
"single_word": false,
|
| 17 |
+
"special": true
|
| 18 |
+
},
|
| 19 |
+
"2": {
|
| 20 |
+
"content": "</s>",
|
| 21 |
+
"lstrip": false,
|
| 22 |
+
"normalized": false,
|
| 23 |
+
"rstrip": false,
|
| 24 |
+
"single_word": false,
|
| 25 |
+
"special": true
|
| 26 |
+
},
|
| 27 |
+
"3": {
|
| 28 |
+
"content": "<unk>",
|
| 29 |
+
"lstrip": false,
|
| 30 |
+
"normalized": false,
|
| 31 |
+
"rstrip": false,
|
| 32 |
+
"single_word": false,
|
| 33 |
+
"special": true
|
| 34 |
+
},
|
| 35 |
+
"250001": {
|
| 36 |
+
"content": "<mask>",
|
| 37 |
+
"lstrip": true,
|
| 38 |
+
"normalized": false,
|
| 39 |
+
"rstrip": false,
|
| 40 |
+
"single_word": false,
|
| 41 |
+
"special": true
|
| 42 |
+
}
|
| 43 |
+
},
|
| 44 |
+
"bos_token": "<s>",
|
| 45 |
+
"clean_up_tokenization_spaces": true,
|
| 46 |
+
"cls_token": "<s>",
|
| 47 |
+
"eos_token": "</s>",
|
| 48 |
+
"extra_special_tokens": {},
|
| 49 |
+
"mask_token": "<mask>",
|
| 50 |
+
"model_max_length": 512,
|
| 51 |
+
"pad_token": "<pad>",
|
| 52 |
+
"sep_token": "</s>",
|
| 53 |
+
"tokenizer_class": "XLMRobertaTokenizer",
|
| 54 |
+
"unk_token": "<unk>"
|
| 55 |
+
}
|
checkpoint-39/trainer_state.json
ADDED
|
@@ -0,0 +1,358 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"best_global_step": 39,
|
| 3 |
+
"best_metric": 0.37139192897263235,
|
| 4 |
+
"best_model_checkpoint": "intfloat/multilingual-e5-large/checkpoint-39",
|
| 5 |
+
"epoch": 3.0,
|
| 6 |
+
"eval_steps": 500,
|
| 7 |
+
"global_step": 39,
|
| 8 |
+
"is_hyper_param_search": false,
|
| 9 |
+
"is_local_process_zero": true,
|
| 10 |
+
"is_world_process_zero": true,
|
| 11 |
+
"log_history": [
|
| 12 |
+
{
|
| 13 |
+
"epoch": 0.8163265306122449,
|
| 14 |
+
"grad_norm": 307.08624267578125,
|
| 15 |
+
"learning_rate": 7.500000000000001e-06,
|
| 16 |
+
"loss": 31.5155,
|
| 17 |
+
"step": 10
|
| 18 |
+
},
|
| 19 |
+
{
|
| 20 |
+
"epoch": 1.0,
|
| 21 |
+
"eval_dim_1024_cosine_accuracy@1": 0.42509603072983354,
|
| 22 |
+
"eval_dim_1024_cosine_accuracy@10": 0.49295774647887325,
|
| 23 |
+
"eval_dim_1024_cosine_accuracy@3": 0.43085787451984636,
|
| 24 |
+
"eval_dim_1024_cosine_accuracy@5": 0.46030729833546735,
|
| 25 |
+
"eval_dim_1024_cosine_map@100": 0.508986346237021,
|
| 26 |
+
"eval_dim_1024_cosine_mrr@10": 0.4369535394183281,
|
| 27 |
+
"eval_dim_1024_cosine_ndcg@10": 0.4493804868009024,
|
| 28 |
+
"eval_dim_1024_cosine_precision@1": 0.42509603072983354,
|
| 29 |
+
"eval_dim_1024_cosine_precision@10": 0.376056338028169,
|
| 30 |
+
"eval_dim_1024_cosine_precision@3": 0.42402902262057185,
|
| 31 |
+
"eval_dim_1024_cosine_precision@5": 0.4133162612035851,
|
| 32 |
+
"eval_dim_1024_cosine_recall@1": 0.04813624827530403,
|
| 33 |
+
"eval_dim_1024_cosine_recall@10": 0.3150476790176975,
|
| 34 |
+
"eval_dim_1024_cosine_recall@3": 0.1404092551990217,
|
| 35 |
+
"eval_dim_1024_cosine_recall@5": 0.21147403835662126,
|
| 36 |
+
"eval_dim_128_cosine_accuracy@1": 0.31370038412291934,
|
| 37 |
+
"eval_dim_128_cosine_accuracy@10": 0.38156209987195905,
|
| 38 |
+
"eval_dim_128_cosine_accuracy@3": 0.31946222791293216,
|
| 39 |
+
"eval_dim_128_cosine_accuracy@5": 0.34571062740076824,
|
| 40 |
+
"eval_dim_128_cosine_map@100": 0.3991669558616212,
|
| 41 |
+
"eval_dim_128_cosine_mrr@10": 0.32517427799117904,
|
| 42 |
+
"eval_dim_128_cosine_ndcg@10": 0.33618283481296385,
|
| 43 |
+
"eval_dim_128_cosine_precision@1": 0.31370038412291934,
|
| 44 |
+
"eval_dim_128_cosine_precision@10": 0.2764404609475032,
|
| 45 |
+
"eval_dim_128_cosine_precision@3": 0.31284677763551,
|
| 46 |
+
"eval_dim_128_cosine_precision@5": 0.30422535211267604,
|
| 47 |
+
"eval_dim_128_cosine_recall@1": 0.037933385936292925,
|
| 48 |
+
"eval_dim_128_cosine_recall@10": 0.24798465115464788,
|
| 49 |
+
"eval_dim_128_cosine_recall@3": 0.11100168654049715,
|
| 50 |
+
"eval_dim_128_cosine_recall@5": 0.1670926413559068,
|
| 51 |
+
"eval_dim_256_cosine_accuracy@1": 0.36427656850192064,
|
| 52 |
+
"eval_dim_256_cosine_accuracy@10": 0.44814340588988477,
|
| 53 |
+
"eval_dim_256_cosine_accuracy@3": 0.36939820742637647,
|
| 54 |
+
"eval_dim_256_cosine_accuracy@5": 0.4090909090909091,
|
| 55 |
+
"eval_dim_256_cosine_map@100": 0.45841270037343096,
|
| 56 |
+
"eval_dim_256_cosine_mrr@10": 0.37879397597707415,
|
| 57 |
+
"eval_dim_256_cosine_ndcg@10": 0.3947006636735062,
|
| 58 |
+
"eval_dim_256_cosine_precision@1": 0.36427656850192064,
|
| 59 |
+
"eval_dim_256_cosine_precision@10": 0.3289372599231754,
|
| 60 |
+
"eval_dim_256_cosine_precision@3": 0.36363636363636365,
|
| 61 |
+
"eval_dim_256_cosine_precision@5": 0.3560819462227913,
|
| 62 |
+
"eval_dim_256_cosine_recall@1": 0.04277277943657814,
|
| 63 |
+
"eval_dim_256_cosine_recall@10": 0.28617844199333936,
|
| 64 |
+
"eval_dim_256_cosine_recall@3": 0.1253991943934714,
|
| 65 |
+
"eval_dim_256_cosine_recall@5": 0.18947388504512186,
|
| 66 |
+
"eval_dim_512_cosine_accuracy@1": 0.4084507042253521,
|
| 67 |
+
"eval_dim_512_cosine_accuracy@10": 0.4871959026888604,
|
| 68 |
+
"eval_dim_512_cosine_accuracy@3": 0.41357234314980795,
|
| 69 |
+
"eval_dim_512_cosine_accuracy@5": 0.4519846350832266,
|
| 70 |
+
"eval_dim_512_cosine_map@100": 0.495554245202425,
|
| 71 |
+
"eval_dim_512_cosine_mrr@10": 0.42213127248338495,
|
| 72 |
+
"eval_dim_512_cosine_ndcg@10": 0.43644305450989757,
|
| 73 |
+
"eval_dim_512_cosine_precision@1": 0.4084507042253521,
|
| 74 |
+
"eval_dim_512_cosine_precision@10": 0.36606914212548014,
|
| 75 |
+
"eval_dim_512_cosine_precision@3": 0.40738369611609043,
|
| 76 |
+
"eval_dim_512_cosine_precision@5": 0.39846350832266325,
|
| 77 |
+
"eval_dim_512_cosine_recall@1": 0.04628035514721453,
|
| 78 |
+
"eval_dim_512_cosine_recall@10": 0.30419701916496145,
|
| 79 |
+
"eval_dim_512_cosine_recall@3": 0.13522898183596205,
|
| 80 |
+
"eval_dim_512_cosine_recall@5": 0.20394662187726964,
|
| 81 |
+
"eval_dim_64_cosine_accuracy@1": 0.24199743918053776,
|
| 82 |
+
"eval_dim_64_cosine_accuracy@10": 0.29641485275288093,
|
| 83 |
+
"eval_dim_64_cosine_accuracy@3": 0.24775928297055058,
|
| 84 |
+
"eval_dim_64_cosine_accuracy@5": 0.26952624839948786,
|
| 85 |
+
"eval_dim_64_cosine_map@100": 0.31803601064541553,
|
| 86 |
+
"eval_dim_64_cosine_mrr@10": 0.25159771761884414,
|
| 87 |
+
"eval_dim_64_cosine_ndcg@10": 0.2620553065689597,
|
| 88 |
+
"eval_dim_64_cosine_precision@1": 0.24199743918053776,
|
| 89 |
+
"eval_dim_64_cosine_precision@10": 0.21568501920614594,
|
| 90 |
+
"eval_dim_64_cosine_precision@3": 0.24199743918053776,
|
| 91 |
+
"eval_dim_64_cosine_precision@5": 0.23649167733674775,
|
| 92 |
+
"eval_dim_64_cosine_recall@1": 0.029110868794154622,
|
| 93 |
+
"eval_dim_64_cosine_recall@10": 0.19521971714475267,
|
| 94 |
+
"eval_dim_64_cosine_recall@3": 0.08524734139651896,
|
| 95 |
+
"eval_dim_64_cosine_recall@5": 0.12921904680249943,
|
| 96 |
+
"eval_dim_768_cosine_accuracy@1": 0.4193341869398207,
|
| 97 |
+
"eval_dim_768_cosine_accuracy@10": 0.4910371318822023,
|
| 98 |
+
"eval_dim_768_cosine_accuracy@3": 0.4238156209987196,
|
| 99 |
+
"eval_dim_768_cosine_accuracy@5": 0.4551856594110115,
|
| 100 |
+
"eval_dim_768_cosine_map@100": 0.5037778776293926,
|
| 101 |
+
"eval_dim_768_cosine_mrr@10": 0.4315339003719285,
|
| 102 |
+
"eval_dim_768_cosine_ndcg@10": 0.44456410503401034,
|
| 103 |
+
"eval_dim_768_cosine_precision@1": 0.4193341869398207,
|
| 104 |
+
"eval_dim_768_cosine_precision@10": 0.37272727272727274,
|
| 105 |
+
"eval_dim_768_cosine_precision@3": 0.4180537772087068,
|
| 106 |
+
"eval_dim_768_cosine_precision@5": 0.4076824583866837,
|
| 107 |
+
"eval_dim_768_cosine_recall@1": 0.04699592881851732,
|
| 108 |
+
"eval_dim_768_cosine_recall@10": 0.3107289399017082,
|
| 109 |
+
"eval_dim_768_cosine_recall@3": 0.13721565163348118,
|
| 110 |
+
"eval_dim_768_cosine_recall@5": 0.20710427114944024,
|
| 111 |
+
"eval_runtime": 98.6525,
|
| 112 |
+
"eval_samples_per_second": 0.0,
|
| 113 |
+
"eval_sequential_score": 0.2620553065689597,
|
| 114 |
+
"eval_steps_per_second": 0.0,
|
| 115 |
+
"step": 13
|
| 116 |
+
},
|
| 117 |
+
{
|
| 118 |
+
"epoch": 1.5714285714285714,
|
| 119 |
+
"grad_norm": 280.07818603515625,
|
| 120 |
+
"learning_rate": 1.5833333333333333e-05,
|
| 121 |
+
"loss": 19.0409,
|
| 122 |
+
"step": 20
|
| 123 |
+
},
|
| 124 |
+
{
|
| 125 |
+
"epoch": 2.0,
|
| 126 |
+
"eval_dim_1024_cosine_accuracy@1": 0.3854033290653009,
|
| 127 |
+
"eval_dim_1024_cosine_accuracy@10": 0.45454545454545453,
|
| 128 |
+
"eval_dim_1024_cosine_accuracy@3": 0.3886043533930858,
|
| 129 |
+
"eval_dim_1024_cosine_accuracy@5": 0.41101152368758004,
|
| 130 |
+
"eval_dim_1024_cosine_map@100": 0.47259820099791205,
|
| 131 |
+
"eval_dim_1024_cosine_mrr@10": 0.39624870434729537,
|
| 132 |
+
"eval_dim_1024_cosine_ndcg@10": 0.4065329035406967,
|
| 133 |
+
"eval_dim_1024_cosine_precision@1": 0.3854033290653009,
|
| 134 |
+
"eval_dim_1024_cosine_precision@10": 0.3357874519846351,
|
| 135 |
+
"eval_dim_1024_cosine_precision@3": 0.3839095177123346,
|
| 136 |
+
"eval_dim_1024_cosine_precision@5": 0.3713188220230474,
|
| 137 |
+
"eval_dim_1024_cosine_recall@1": 0.0451686782205082,
|
| 138 |
+
"eval_dim_1024_cosine_recall@10": 0.2918225395020212,
|
| 139 |
+
"eval_dim_1024_cosine_recall@3": 0.13200270380544088,
|
| 140 |
+
"eval_dim_1024_cosine_recall@5": 0.19735476247586825,
|
| 141 |
+
"eval_dim_128_cosine_accuracy@1": 0.31562099871959026,
|
| 142 |
+
"eval_dim_128_cosine_accuracy@10": 0.39180537772087065,
|
| 143 |
+
"eval_dim_128_cosine_accuracy@3": 0.3207426376440461,
|
| 144 |
+
"eval_dim_128_cosine_accuracy@5": 0.352112676056338,
|
| 145 |
+
"eval_dim_128_cosine_map@100": 0.40471008477532144,
|
| 146 |
+
"eval_dim_128_cosine_mrr@10": 0.32839105339105285,
|
| 147 |
+
"eval_dim_128_cosine_ndcg@10": 0.34177784905202935,
|
| 148 |
+
"eval_dim_128_cosine_precision@1": 0.31562099871959026,
|
| 149 |
+
"eval_dim_128_cosine_precision@10": 0.280729833546735,
|
| 150 |
+
"eval_dim_128_cosine_precision@3": 0.31455399061032857,
|
| 151 |
+
"eval_dim_128_cosine_precision@5": 0.30640204865556975,
|
| 152 |
+
"eval_dim_128_cosine_recall@1": 0.03888088094516579,
|
| 153 |
+
"eval_dim_128_cosine_recall@10": 0.2550464126190524,
|
| 154 |
+
"eval_dim_128_cosine_recall@3": 0.11341113256173359,
|
| 155 |
+
"eval_dim_128_cosine_recall@5": 0.17046484922169536,
|
| 156 |
+
"eval_dim_256_cosine_accuracy@1": 0.3418693982074264,
|
| 157 |
+
"eval_dim_256_cosine_accuracy@10": 0.4238156209987196,
|
| 158 |
+
"eval_dim_256_cosine_accuracy@3": 0.34763124199743917,
|
| 159 |
+
"eval_dim_256_cosine_accuracy@5": 0.38092189500640206,
|
| 160 |
+
"eval_dim_256_cosine_map@100": 0.43770217754051305,
|
| 161 |
+
"eval_dim_256_cosine_mrr@10": 0.35596482938032165,
|
| 162 |
+
"eval_dim_256_cosine_ndcg@10": 0.36923043791328775,
|
| 163 |
+
"eval_dim_256_cosine_precision@1": 0.3418693982074264,
|
| 164 |
+
"eval_dim_256_cosine_precision@10": 0.30441741357234314,
|
| 165 |
+
"eval_dim_256_cosine_precision@3": 0.34165599658557405,
|
| 166 |
+
"eval_dim_256_cosine_precision@5": 0.3322663252240717,
|
| 167 |
+
"eval_dim_256_cosine_recall@1": 0.041410929155814194,
|
| 168 |
+
"eval_dim_256_cosine_recall@10": 0.2705196189189818,
|
| 169 |
+
"eval_dim_256_cosine_recall@3": 0.1212642412965687,
|
| 170 |
+
"eval_dim_256_cosine_recall@5": 0.18173918651563936,
|
| 171 |
+
"eval_dim_512_cosine_accuracy@1": 0.37708066581306016,
|
| 172 |
+
"eval_dim_512_cosine_accuracy@10": 0.4532650448143406,
|
| 173 |
+
"eval_dim_512_cosine_accuracy@3": 0.38092189500640206,
|
| 174 |
+
"eval_dim_512_cosine_accuracy@5": 0.4084507042253521,
|
| 175 |
+
"eval_dim_512_cosine_map@100": 0.4678017780580059,
|
| 176 |
+
"eval_dim_512_cosine_mrr@10": 0.3893670101416575,
|
| 177 |
+
"eval_dim_512_cosine_ndcg@10": 0.40127522003513455,
|
| 178 |
+
"eval_dim_512_cosine_precision@1": 0.37708066581306016,
|
| 179 |
+
"eval_dim_512_cosine_precision@10": 0.33156209987195906,
|
| 180 |
+
"eval_dim_512_cosine_precision@3": 0.37537345283824153,
|
| 181 |
+
"eval_dim_512_cosine_precision@5": 0.36402048655569774,
|
| 182 |
+
"eval_dim_512_cosine_recall@1": 0.04457309853297402,
|
| 183 |
+
"eval_dim_512_cosine_recall@10": 0.2883968018428671,
|
| 184 |
+
"eval_dim_512_cosine_recall@3": 0.13007205872054822,
|
| 185 |
+
"eval_dim_512_cosine_recall@5": 0.19449520589871025,
|
| 186 |
+
"eval_dim_64_cosine_accuracy@1": 0.26696542893725994,
|
| 187 |
+
"eval_dim_64_cosine_accuracy@10": 0.33098591549295775,
|
| 188 |
+
"eval_dim_64_cosine_accuracy@3": 0.27208706786171577,
|
| 189 |
+
"eval_dim_64_cosine_accuracy@5": 0.293213828425096,
|
| 190 |
+
"eval_dim_64_cosine_map@100": 0.34719730722747555,
|
| 191 |
+
"eval_dim_64_cosine_mrr@10": 0.2776957197731842,
|
| 192 |
+
"eval_dim_64_cosine_ndcg@10": 0.2881905192612941,
|
| 193 |
+
"eval_dim_64_cosine_precision@1": 0.26696542893725994,
|
| 194 |
+
"eval_dim_64_cosine_precision@10": 0.237708066581306,
|
| 195 |
+
"eval_dim_64_cosine_precision@3": 0.26717883055911223,
|
| 196 |
+
"eval_dim_64_cosine_precision@5": 0.2596670934699104,
|
| 197 |
+
"eval_dim_64_cosine_recall@1": 0.031692344067516816,
|
| 198 |
+
"eval_dim_64_cosine_recall@10": 0.21473974122936995,
|
| 199 |
+
"eval_dim_64_cosine_recall@3": 0.09327455064654774,
|
| 200 |
+
"eval_dim_64_cosine_recall@5": 0.14131510912407144,
|
| 201 |
+
"eval_dim_768_cosine_accuracy@1": 0.37451984635083224,
|
| 202 |
+
"eval_dim_768_cosine_accuracy@10": 0.4539052496798976,
|
| 203 |
+
"eval_dim_768_cosine_accuracy@3": 0.37900128040973113,
|
| 204 |
+
"eval_dim_768_cosine_accuracy@5": 0.40973111395646605,
|
| 205 |
+
"eval_dim_768_cosine_map@100": 0.4672061011440217,
|
| 206 |
+
"eval_dim_768_cosine_mrr@10": 0.38746671950897227,
|
| 207 |
+
"eval_dim_768_cosine_ndcg@10": 0.4004027303245026,
|
| 208 |
+
"eval_dim_768_cosine_precision@1": 0.37451984635083224,
|
| 209 |
+
"eval_dim_768_cosine_precision@10": 0.3318181818181818,
|
| 210 |
+
"eval_dim_768_cosine_precision@3": 0.3734528382415706,
|
| 211 |
+
"eval_dim_768_cosine_precision@5": 0.3632522407170295,
|
| 212 |
+
"eval_dim_768_cosine_recall@1": 0.04413921317349132,
|
| 213 |
+
"eval_dim_768_cosine_recall@10": 0.28955317519546525,
|
| 214 |
+
"eval_dim_768_cosine_recall@3": 0.12896663310051748,
|
| 215 |
+
"eval_dim_768_cosine_recall@5": 0.19376203165061448,
|
| 216 |
+
"eval_runtime": 98.4244,
|
| 217 |
+
"eval_samples_per_second": 0.0,
|
| 218 |
+
"eval_sequential_score": 0.2881905192612941,
|
| 219 |
+
"eval_steps_per_second": 0.0,
|
| 220 |
+
"step": 26
|
| 221 |
+
},
|
| 222 |
+
{
|
| 223 |
+
"epoch": 2.326530612244898,
|
| 224 |
+
"grad_norm": 305.66259765625,
|
| 225 |
+
"learning_rate": 1.9973569167005725e-05,
|
| 226 |
+
"loss": 14.5314,
|
| 227 |
+
"step": 30
|
| 228 |
+
},
|
| 229 |
+
{
|
| 230 |
+
"epoch": 3.0,
|
| 231 |
+
"eval_dim_1024_cosine_accuracy@1": 0.4180537772087068,
|
| 232 |
+
"eval_dim_1024_cosine_accuracy@10": 0.49039692701664533,
|
| 233 |
+
"eval_dim_1024_cosine_accuracy@3": 0.42189500640204863,
|
| 234 |
+
"eval_dim_1024_cosine_accuracy@5": 0.4500640204865557,
|
| 235 |
+
"eval_dim_1024_cosine_map@100": 0.506794523350519,
|
| 236 |
+
"eval_dim_1024_cosine_mrr@10": 0.42985717334308843,
|
| 237 |
+
"eval_dim_1024_cosine_ndcg@10": 0.44178501209869797,
|
| 238 |
+
"eval_dim_1024_cosine_precision@1": 0.4180537772087068,
|
| 239 |
+
"eval_dim_1024_cosine_precision@10": 0.36869398207426374,
|
| 240 |
+
"eval_dim_1024_cosine_precision@3": 0.4163465642338881,
|
| 241 |
+
"eval_dim_1024_cosine_precision@5": 0.4043533930857874,
|
| 242 |
+
"eval_dim_1024_cosine_recall@1": 0.04734422767263886,
|
| 243 |
+
"eval_dim_1024_cosine_recall@10": 0.308531274625124,
|
| 244 |
+
"eval_dim_1024_cosine_recall@3": 0.138064233626932,
|
| 245 |
+
"eval_dim_1024_cosine_recall@5": 0.2069980430010945,
|
| 246 |
+
"eval_dim_128_cosine_accuracy@1": 0.34699103713188223,
|
| 247 |
+
"eval_dim_128_cosine_accuracy@10": 0.4212548015364917,
|
| 248 |
+
"eval_dim_128_cosine_accuracy@3": 0.35147247119078107,
|
| 249 |
+
"eval_dim_128_cosine_accuracy@5": 0.37900128040973113,
|
| 250 |
+
"eval_dim_128_cosine_map@100": 0.4338211299784659,
|
| 251 |
+
"eval_dim_128_cosine_mrr@10": 0.35916305916305874,
|
| 252 |
+
"eval_dim_128_cosine_ndcg@10": 0.37139192897263235,
|
| 253 |
+
"eval_dim_128_cosine_precision@1": 0.34699103713188223,
|
| 254 |
+
"eval_dim_128_cosine_precision@10": 0.3042893725992318,
|
| 255 |
+
"eval_dim_128_cosine_precision@3": 0.34571062740076824,
|
| 256 |
+
"eval_dim_128_cosine_precision@5": 0.3352112676056338,
|
| 257 |
+
"eval_dim_128_cosine_recall@1": 0.04217848526747235,
|
| 258 |
+
"eval_dim_128_cosine_recall@10": 0.2706183968947745,
|
| 259 |
+
"eval_dim_128_cosine_recall@3": 0.12288848071178002,
|
| 260 |
+
"eval_dim_128_cosine_recall@5": 0.18344012521240954,
|
| 261 |
+
"eval_dim_256_cosine_accuracy@1": 0.38348271446862997,
|
| 262 |
+
"eval_dim_256_cosine_accuracy@10": 0.4551856594110115,
|
| 263 |
+
"eval_dim_256_cosine_accuracy@3": 0.3886043533930858,
|
| 264 |
+
"eval_dim_256_cosine_accuracy@5": 0.4206145966709347,
|
| 265 |
+
"eval_dim_256_cosine_map@100": 0.4709582085612654,
|
| 266 |
+
"eval_dim_256_cosine_mrr@10": 0.3957850639188662,
|
| 267 |
+
"eval_dim_256_cosine_ndcg@10": 0.4087462230477571,
|
| 268 |
+
"eval_dim_256_cosine_precision@1": 0.38348271446862997,
|
| 269 |
+
"eval_dim_256_cosine_precision@10": 0.33886043533930854,
|
| 270 |
+
"eval_dim_256_cosine_precision@3": 0.382202304737516,
|
| 271 |
+
"eval_dim_256_cosine_precision@5": 0.3718309859154929,
|
| 272 |
+
"eval_dim_256_cosine_recall@1": 0.04466034705404223,
|
| 273 |
+
"eval_dim_256_cosine_recall@10": 0.2892016292717267,
|
| 274 |
+
"eval_dim_256_cosine_recall@3": 0.1301795023253766,
|
| 275 |
+
"eval_dim_256_cosine_recall@5": 0.19500340584044382,
|
| 276 |
+
"eval_dim_512_cosine_accuracy@1": 0.4065300896286812,
|
| 277 |
+
"eval_dim_512_cosine_accuracy@10": 0.4814340588988476,
|
| 278 |
+
"eval_dim_512_cosine_accuracy@3": 0.41229193341869397,
|
| 279 |
+
"eval_dim_512_cosine_accuracy@5": 0.44494238156209986,
|
| 280 |
+
"eval_dim_512_cosine_map@100": 0.49555759572196095,
|
| 281 |
+
"eval_dim_512_cosine_mrr@10": 0.41950236774180394,
|
| 282 |
+
"eval_dim_512_cosine_ndcg@10": 0.4329095460408428,
|
| 283 |
+
"eval_dim_512_cosine_precision@1": 0.4065300896286812,
|
| 284 |
+
"eval_dim_512_cosine_precision@10": 0.3596030729833547,
|
| 285 |
+
"eval_dim_512_cosine_precision@3": 0.4054630815194195,
|
| 286 |
+
"eval_dim_512_cosine_precision@5": 0.3947503201024327,
|
| 287 |
+
"eval_dim_512_cosine_recall@1": 0.047372341735862133,
|
| 288 |
+
"eval_dim_512_cosine_recall@10": 0.3071623578952262,
|
| 289 |
+
"eval_dim_512_cosine_recall@3": 0.1383106496582531,
|
| 290 |
+
"eval_dim_512_cosine_recall@5": 0.20757258542171747,
|
| 291 |
+
"eval_dim_64_cosine_accuracy@1": 0.3207426376440461,
|
| 292 |
+
"eval_dim_64_cosine_accuracy@10": 0.3725992317541613,
|
| 293 |
+
"eval_dim_64_cosine_accuracy@3": 0.322663252240717,
|
| 294 |
+
"eval_dim_64_cosine_accuracy@5": 0.3405889884763124,
|
| 295 |
+
"eval_dim_64_cosine_map@100": 0.3933467041096336,
|
| 296 |
+
"eval_dim_64_cosine_mrr@10": 0.32884732638253733,
|
| 297 |
+
"eval_dim_64_cosine_ndcg@10": 0.3371953828075091,
|
| 298 |
+
"eval_dim_64_cosine_precision@1": 0.3207426376440461,
|
| 299 |
+
"eval_dim_64_cosine_precision@10": 0.2797055057618438,
|
| 300 |
+
"eval_dim_64_cosine_precision@3": 0.3188220230473751,
|
| 301 |
+
"eval_dim_64_cosine_precision@5": 0.3088348271446863,
|
| 302 |
+
"eval_dim_64_cosine_recall@1": 0.036318765090758674,
|
| 303 |
+
"eval_dim_64_cosine_recall@10": 0.23840960718091392,
|
| 304 |
+
"eval_dim_64_cosine_recall@3": 0.10562189493083342,
|
| 305 |
+
"eval_dim_64_cosine_recall@5": 0.15867125525021739,
|
| 306 |
+
"eval_dim_768_cosine_accuracy@1": 0.41037131882202305,
|
| 307 |
+
"eval_dim_768_cosine_accuracy@10": 0.4833546734955186,
|
| 308 |
+
"eval_dim_768_cosine_accuracy@3": 0.4142125480153649,
|
| 309 |
+
"eval_dim_768_cosine_accuracy@5": 0.44430217669654287,
|
| 310 |
+
"eval_dim_768_cosine_map@100": 0.500478306774528,
|
| 311 |
+
"eval_dim_768_cosine_mrr@10": 0.4224889742495374,
|
| 312 |
+
"eval_dim_768_cosine_ndcg@10": 0.4349862241563486,
|
| 313 |
+
"eval_dim_768_cosine_precision@1": 0.41037131882202305,
|
| 314 |
+
"eval_dim_768_cosine_precision@10": 0.36165172855313704,
|
| 315 |
+
"eval_dim_768_cosine_precision@3": 0.4086641058472044,
|
| 316 |
+
"eval_dim_768_cosine_precision@5": 0.3969270166453265,
|
| 317 |
+
"eval_dim_768_cosine_recall@1": 0.047186779325657804,
|
| 318 |
+
"eval_dim_768_cosine_recall@10": 0.30540044861465576,
|
| 319 |
+
"eval_dim_768_cosine_recall@3": 0.1375709294981283,
|
| 320 |
+
"eval_dim_768_cosine_recall@5": 0.20603724780478358,
|
| 321 |
+
"eval_runtime": 98.5908,
|
| 322 |
+
"eval_samples_per_second": 0.0,
|
| 323 |
+
"eval_sequential_score": 0.3371953828075091,
|
| 324 |
+
"eval_steps_per_second": 0.0,
|
| 325 |
+
"step": 39
|
| 326 |
+
}
|
| 327 |
+
],
|
| 328 |
+
"logging_steps": 10,
|
| 329 |
+
"max_steps": 240,
|
| 330 |
+
"num_input_tokens_seen": 0,
|
| 331 |
+
"num_train_epochs": 20,
|
| 332 |
+
"save_steps": 500,
|
| 333 |
+
"stateful_callbacks": {
|
| 334 |
+
"EarlyStoppingCallback": {
|
| 335 |
+
"args": {
|
| 336 |
+
"early_stopping_patience": 2,
|
| 337 |
+
"early_stopping_threshold": 0.0
|
| 338 |
+
},
|
| 339 |
+
"attributes": {
|
| 340 |
+
"early_stopping_patience_counter": 0
|
| 341 |
+
}
|
| 342 |
+
},
|
| 343 |
+
"TrainerControl": {
|
| 344 |
+
"args": {
|
| 345 |
+
"should_epoch_stop": false,
|
| 346 |
+
"should_evaluate": false,
|
| 347 |
+
"should_log": false,
|
| 348 |
+
"should_save": true,
|
| 349 |
+
"should_training_stop": false
|
| 350 |
+
},
|
| 351 |
+
"attributes": {}
|
| 352 |
+
}
|
| 353 |
+
},
|
| 354 |
+
"total_flos": 0.0,
|
| 355 |
+
"train_batch_size": 8,
|
| 356 |
+
"trial_name": null,
|
| 357 |
+
"trial_params": null
|
| 358 |
+
}
|
checkpoint-39/training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dd906d94b017c1a7fa871b608776d19ecf4218c10c253401fe78ba8ce84435be
|
| 3 |
+
size 6097
|
checkpoint-52/1_Pooling/config.json
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"word_embedding_dimension": 1024,
|
| 3 |
+
"pooling_mode_cls_token": false,
|
| 4 |
+
"pooling_mode_mean_tokens": true,
|
| 5 |
+
"pooling_mode_max_tokens": false,
|
| 6 |
+
"pooling_mode_mean_sqrt_len_tokens": false,
|
| 7 |
+
"pooling_mode_weightedmean_tokens": false,
|
| 8 |
+
"pooling_mode_lasttoken": false,
|
| 9 |
+
"include_prompt": true
|
| 10 |
+
}
|
checkpoint-52/README.md
ADDED
|
@@ -0,0 +1,1640 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
language:
|
| 3 |
+
- en
|
| 4 |
+
license: apache-2.0
|
| 5 |
+
tags:
|
| 6 |
+
- sentence-transformers
|
| 7 |
+
- sentence-similarity
|
| 8 |
+
- feature-extraction
|
| 9 |
+
- dense
|
| 10 |
+
- generated_from_trainer
|
| 11 |
+
- dataset_size:391
|
| 12 |
+
- loss:MatryoshkaLoss
|
| 13 |
+
- loss:MultipleNegativesRankingLoss
|
| 14 |
+
base_model: intfloat/multilingual-e5-large
|
| 15 |
+
widget:
|
| 16 |
+
- source_sentence: What is the responsibility of assisting and advising the data subjects
|
| 17 |
+
in exercising their rights?
|
| 18 |
+
sentences:
|
| 19 |
+
- '1.Personal data shall be: (a) processed lawfully, fairly and in a transparent
|
| 20 |
+
manner in relation to the data subject (‘lawfulness, fairness and transparency’);
|
| 21 |
+
(b) collected for specified, explicit and legitimate purposes and not further
|
| 22 |
+
processed in a manner that is incompatible with those purposes; further processing
|
| 23 |
+
for archiving purposes in the public interest, scientific or historical research
|
| 24 |
+
purposes or statistical purposes shall, in accordance with Article 89(1), not
|
| 25 |
+
be considered to be incompatible with the initial purposes (‘purpose limitation’);
|
| 26 |
+
(c) adequate, relevant and limited to what is necessary in relation to the purposes
|
| 27 |
+
for which they are processed (‘data minimisation’); (d) accurate and, where necessary,
|
| 28 |
+
kept up to date; every reasonable step must be taken to ensure that personal data
|
| 29 |
+
that are inaccurate, having regard to the purposes for which they are processed,
|
| 30 |
+
are erased or rectified without delay (‘accuracy’); 4.5.2016 L 119/35 (1) Directive
|
| 31 |
+
(EU) 2015/1535 of the European Parliament and of the Council of 9 September 2015
|
| 32 |
+
laying down a procedure for the provision of information in the field of technical
|
| 33 |
+
regulations and of rules on Information Society services (OJ L 241, 17.9.2015,
|
| 34 |
+
p. 1). (e) kept in a form which permits identification of data subjects for no
|
| 35 |
+
longer than is necessary for the purposes for which the personal data are processed;
|
| 36 |
+
personal data may be stored for longer periods insofar as the personal data will
|
| 37 |
+
be processed solely for archiving purposes in the public interest, scientific
|
| 38 |
+
or historical research purposes or statistical purposes in accordance with Article
|
| 39 |
+
89(1) subject to implementation of the appropriate technical and organisational
|
| 40 |
+
measures required by this Regulation in order to safeguard the rights and freedoms
|
| 41 |
+
of the data subject (‘storage limitation’); (f) processed in a manner that ensures
|
| 42 |
+
appropriate security of the personal data, including protection against unauthorised
|
| 43 |
+
or unlawful processing and against accidental loss, destruction or damage, using
|
| 44 |
+
appropriate technical or organisational measures (‘integrity and confidentiality’).
|
| 45 |
+
|
| 46 |
+
2.The controller shall be responsible for, and be able to demonstrate compliance
|
| 47 |
+
with, paragraph 1 (‘accountability’).'
|
| 48 |
+
- '1.A transfer of personal data to a third country or an international organisation
|
| 49 |
+
may take place where the Commission has decided that the third country, a territory
|
| 50 |
+
or one or more specified sectors within that third country, or the international
|
| 51 |
+
organisation in question ensures an adequate level of protection. Such a transfer
|
| 52 |
+
shall not require any specific authorisation.
|
| 53 |
+
|
| 54 |
+
2.When assessing the adequacy of the level of protection, the Commission shall,
|
| 55 |
+
in particular, take account of the following elements: (a) the rule of law, respect
|
| 56 |
+
for human rights and fundamental freedoms, relevant legislation, both general
|
| 57 |
+
and sectoral, including concerning public security, defence, national security
|
| 58 |
+
and criminal law and the access of public authorities to personal data, as well
|
| 59 |
+
as the implementation of such legislation, data protection rules, professional
|
| 60 |
+
rules and security measures, including rules for the onward transfer of personal
|
| 61 |
+
data to another third country or international organisation which are complied
|
| 62 |
+
with in that country or international organisation, case-law, as well as effective
|
| 63 |
+
and enforceable data subject rights and effective administrative and judicial
|
| 64 |
+
redress for the data subjects whose personal data are being transferred; (b) the
|
| 65 |
+
existence and effective functioning of one or more independent supervisory authorities
|
| 66 |
+
in the third country or to which an international organisation is subject, with
|
| 67 |
+
responsibility for ensuring and enforcing compliance with the data protection
|
| 68 |
+
rules, including adequate enforcement powers, for assisting and advising the data
|
| 69 |
+
subjects in exercising their rights and for cooperation with the supervisory authorities
|
| 70 |
+
of the Member States; and (c) the international commitments the third country
|
| 71 |
+
or international organisation concerned has entered into, or other obligations
|
| 72 |
+
arising from legally binding conventions or instruments as well as from its participation
|
| 73 |
+
in multilateral or regional systems, in particular in relation to the protection
|
| 74 |
+
of personal data.
|
| 75 |
+
|
| 76 |
+
3.The Commission, after assessing the adequacy of the level of protection, may
|
| 77 |
+
decide, by means of implementing act, that a third country, a territory or one
|
| 78 |
+
or more specified sectors within a third country, or an international organisation
|
| 79 |
+
ensures an adequate level of protection within the meaning of paragraph 2 of this
|
| 80 |
+
Article. The implementing act shall provide for a mechanism for a periodic review,
|
| 81 |
+
at least every four years, which shall take into account all relevant developments
|
| 82 |
+
in the third country or international organisation. The implementing act shall
|
| 83 |
+
specify its territorial and sectoral application and, where applicable, identify
|
| 84 |
+
the supervisory authority or authorities referred to in point (b) of paragraph
|
| 85 |
+
2 of this Article. The implementing act shall be adopted in accordance with the
|
| 86 |
+
examination procedure referred to in Article 93(2).
|
| 87 |
+
|
| 88 |
+
4.The Commission shall, on an ongoing basis, monitor developments in third countries
|
| 89 |
+
and international organisations that could affect the functioning of decisions
|
| 90 |
+
adopted pursuant to paragraph 3 of this Article and decisions adopted on the basis
|
| 91 |
+
of Article 25(6) of Directive 95/46/EC.
|
| 92 |
+
|
| 93 |
+
5.The Commission shall, where available information reveals, in particular following
|
| 94 |
+
the review referred to in paragraph 3 of this Article, that a third country, a
|
| 95 |
+
territory or one or more specified sectors within a third country, or an international
|
| 96 |
+
organisation no longer ensures an adequate level of protection within the meaning
|
| 97 |
+
of paragraph 2 of this Article, to the extent necessary, repeal, amend or suspend
|
| 98 |
+
the decision referred to in paragraph 3 of this Article by means of implementing
|
| 99 |
+
acts without retro-active effect. Those implementing acts shall be adopted in
|
| 100 |
+
accordance with the examination procedure referred to in Article 93(2). On duly
|
| 101 |
+
justified imperative grounds of urgency, the Commission shall adopt immediately
|
| 102 |
+
applicable implementing acts in accordance with the procedure referred to in Article
|
| 103 |
+
93(3).
|
| 104 |
+
|
| 105 |
+
6.The Commission shall enter into consultations with the third country or international
|
| 106 |
+
organisation with a view to remedying the situation giving rise to the decision
|
| 107 |
+
made pursuant to paragraph 5
|
| 108 |
+
|
| 109 |
+
7.A decision pursuant to paragraph 5 of this Article is without prejudice to transfers
|
| 110 |
+
of personal data to the third country, a territory or one or more specified sectors
|
| 111 |
+
within that third country, or the international organisation in question pursuant
|
| 112 |
+
to Articles 46 to 49
|
| 113 |
+
|
| 114 |
+
8.The Commission shall publish in the Official Journal of the European Union and
|
| 115 |
+
on its website a list of the third countries, territories and specified sectors
|
| 116 |
+
within a third country and international organisations for which it has decided
|
| 117 |
+
that an adequate level of protection is or is no longer ensured.
|
| 118 |
+
|
| 119 |
+
9.Decisions adopted by the Commission on the basis of Article 25(6) of Directive
|
| 120 |
+
95/46/EC shall remain in force until amended, replaced or repealed by a Commission
|
| 121 |
+
Decision adopted in accordance with paragraph 3 or 5 of this Article.'
|
| 122 |
+
- The legal systems of Denmark and Estonia do not allow for administrative fines
|
| 123 |
+
as set out in this Regulation. The rules on administrative fines may be applied
|
| 124 |
+
in such a manner that in Denmark the fine is imposed by competent national courts
|
| 125 |
+
as a criminal penalty and in Estonia the fine is imposed by the supervisory authority
|
| 126 |
+
in the framework of a misdemeanour procedure, provided that such an application
|
| 127 |
+
of the rules in those Member States has an equivalent effect to administrative
|
| 128 |
+
fines imposed by supervisory authorities. Therefore the competent national courts
|
| 129 |
+
should take into account the recommendation by the supervisory authority initiating
|
| 130 |
+
the fine. In any event, the fines imposed should be effective, proportionate and
|
| 131 |
+
dissuasive.
|
| 132 |
+
- source_sentence: Is the fine mandatory for the described offense?
|
| 133 |
+
sentences:
|
| 134 |
+
- "1.Each supervisory authority shall ensure that the imposition of administrative\
|
| 135 |
+
\ fines pursuant to this Article in respect of infringements of this Regulation\
|
| 136 |
+
\ referred to in paragraphs 4, 5 and 6 shall in each individual case be effective,\
|
| 137 |
+
\ proportionate and dissuasive.\n2.Administrative fines shall, depending on the\
|
| 138 |
+
\ circumstances of each individual case, be imposed in addition to, or instead\
|
| 139 |
+
\ of, measures referred to in points (a) to (h) and (j) of Article 58(2). When\
|
| 140 |
+
\ deciding whether to impose an administrative fine and deciding on the amount\
|
| 141 |
+
\ of the administrative fine in each individual case due regard shall be given\
|
| 142 |
+
\ to the following: (a) the nature, gravity and duration of the infringement\
|
| 143 |
+
\ taking into account the nature scope or purpose of the processing concerned\
|
| 144 |
+
\ as well as the number of data subjects affected and the level of damage suffered\
|
| 145 |
+
\ by them; (b) the intentional or negligent character of the infringement; (c)\
|
| 146 |
+
\ any action taken by the controller or processor to mitigate the damage suffered\
|
| 147 |
+
\ by data subjects; (d) the degree of responsibility of the controller or processor\
|
| 148 |
+
\ taking into account technical and organisational measures implemented by them\
|
| 149 |
+
\ pursuant to Articles 25 and 32; (e) any relevant previous infringements by\
|
| 150 |
+
\ the controller or processor; (f) the degree of cooperation with the supervisory\
|
| 151 |
+
\ authority, in order to remedy the infringement and mitigate the possible adverse\
|
| 152 |
+
\ effects of the infringement; (g) the categories of personal data affected by\
|
| 153 |
+
\ the infringement; (h) the manner in which the infringement became known to\
|
| 154 |
+
\ the supervisory authority, in particular whether, and if so to what extent,\
|
| 155 |
+
\ the controller or processor notified the infringement; (i) where measures referred\
|
| 156 |
+
\ to in Article 58(2) have previously been ordered against the controller or processor\
|
| 157 |
+
\ concerned with regard to the same subject-matter, compliance with those measures;\
|
| 158 |
+
\ (j) adherence to approved codes of conduct pursuant to Article 40 or approved\
|
| 159 |
+
\ certification mechanisms pursuant to Article 42; and (k) any other aggravating\
|
| 160 |
+
\ or mitigating factor applicable to the circumstances of the case, such as financial\
|
| 161 |
+
\ benefits gained, or losses avoided, directly or indirectly, from the infringement.\n\
|
| 162 |
+
3.If a controller or processor intentionally or negligently, for the same or linked\
|
| 163 |
+
\ processing operations, infringes several provisions of this Regulation, the\
|
| 164 |
+
\ total amount of the administrative fine shall not exceed the amount specified\
|
| 165 |
+
\ for the gravest infringement.\n4.Infringements of the following provisions shall,\
|
| 166 |
+
\ in accordance with paragraph 2, be subject to administrative fines up to 10\
|
| 167 |
+
\ 000 000 EUR, or in the case of an undertaking, up to 2 % of the total worldwide\
|
| 168 |
+
\ annual turnover of the preceding financial year, whichever is higher: (a) the\
|
| 169 |
+
\ obligations of the controller and the processor pursuant to Articles 8, 11,\
|
| 170 |
+
\ 25 to 39 and 42 and 43; (b) the obligations of the certification body pursuant\
|
| 171 |
+
\ to Articles 42 and 43; (c) the obligations of the monitoring body pursuant\
|
| 172 |
+
\ to Article 41(4). 4.5.2016 L 119/82 \n5.Infringements of the following provisions\
|
| 173 |
+
\ shall, in accordance with paragraph 2, be subject to administrative fines up\
|
| 174 |
+
\ to 20 000 000 EUR, or in the case of an undertaking, up to 4 % of the total\
|
| 175 |
+
\ worldwide annual turnover of the preceding financial year, whichever is higher:\
|
| 176 |
+
\ (a) the basic principles for processing, including conditions for consent,\
|
| 177 |
+
\ pursuant to Articles 5, 6, 7 and 9; (b) the data subjects' rights pursuant\
|
| 178 |
+
\ to Articles 12 to 22; (c) the transfers of personal data to a recipient in\
|
| 179 |
+
\ a third country or an international organisation pursuant to Articles 44 to\
|
| 180 |
+
\ 49; (d) any obligations pursuant to Member State law adopted under Chapter\
|
| 181 |
+
\ IX; (e) non-compliance with an order or a temporary or definitive limitation\
|
| 182 |
+
\ on processing or the suspension of data flows by the supervisory authority pursuant\
|
| 183 |
+
\ to Article 58(2) or failure to provide access in violation of Article 58(1).\n\
|
| 184 |
+
6.Non-compliance with an order by the supervisory authority as referred to in\
|
| 185 |
+
\ Article 58(2) shall, in accordance with paragraph 2 of this Article, be subject\
|
| 186 |
+
\ to administrative fines up to 20 000 000 EUR, or in the case of an undertaking,\
|
| 187 |
+
\ up to 4 % of the total worldwide annual turnover of the preceding financial\
|
| 188 |
+
\ year, whichever is higher.\n7.Without prejudice to the corrective powers of\
|
| 189 |
+
\ supervisory authorities pursuant to Article 58(2), each Member State may lay\
|
| 190 |
+
\ down the rules on whether and to what extent administrative fines may be imposed\
|
| 191 |
+
\ on public authorities and bodies established in that Member State.\n8.The exercise\
|
| 192 |
+
\ by the supervisory authority of its powers under this Article shall be subject\
|
| 193 |
+
\ to appropriate procedural safeguards in accordance with Union and Member State\
|
| 194 |
+
\ law, including effective judicial remedy and due process.\n9.Where the legal\
|
| 195 |
+
\ system of the Member State does not provide for administrative fines, this Article\
|
| 196 |
+
\ may be applied in such a manner that the fine is initiated by the competent\
|
| 197 |
+
\ supervisory authority and imposed by competent national courts, while ensuring\
|
| 198 |
+
\ that those legal remedies are effective and have an equivalent effect to the\
|
| 199 |
+
\ administrative fines imposed by supervisory authorities. In any event, the fines\
|
| 200 |
+
\ imposed shall be effective, proportionate and dissuasive. Those Member States\
|
| 201 |
+
\ shall notify to the Commission the provisions of their laws which they adopt\
|
| 202 |
+
\ pursuant to this paragraph by 25 May 2018 and, without delay, any subsequent\
|
| 203 |
+
\ amendment law or amendment affecting them."
|
| 204 |
+
- "Court (Civil/Criminal): Criminal \nProvisions: Article 386 of the Penal Code\
|
| 205 |
+
\ \nTime of commission of the act: \nResult (innocent, guilty): \nReasoning:\
|
| 206 |
+
\ Conviction for computer fraud committed repeatedly and professionally with a\
|
| 207 |
+
\ total benefit and damage exceeding €30,000. According to the majority opinion,\
|
| 208 |
+
\ the charge is substantiated in both its objective and subjective aspects, and\
|
| 209 |
+
\ the defendant must be declared guilty of the aforementioned criminal acts of\
|
| 210 |
+
\ fraud by means of a computer, committed repeatedly by a perpetrator acting professionally,\
|
| 211 |
+
\ where the total financial benefit and corresponding damage exceed the amount\
|
| 212 |
+
\ of €30,000, as well as for repeated embezzlement.\n\nFacts: The defendant accessed\
|
| 213 |
+
\ a website using a computer, employing, without the knowledge and consent of\
|
| 214 |
+
\ the complainants, the access codes for the electronic management system of the\
|
| 215 |
+
\ bank accounts held by the complainants at a Bank, and transferred money through\
|
| 216 |
+
\ electronically transmitted orders from the complainants' accounts to her own\
|
| 217 |
+
\ account. Specifically, during the period from June 2007 to June 2008, after\
|
| 218 |
+
\ unlawfully acquiring the aforementioned STICK containing the access codes, she\
|
| 219 |
+
\ accessed a website maintained by ..., using, without the complainants' knowledge\
|
| 220 |
+
\ (without their consent or approval), the access codes for the electronic management\
|
| 221 |
+
\ system of the bank accounts held at the aforementioned Bank, transferring through\
|
| 222 |
+
\ electronically transmitted orders to the joint account number ... of the complainants\
|
| 223 |
+
\ from bank accounts numbered ..., ..., and ..., the total amount of €55,710,\
|
| 224 |
+
\ as detailed in the orders, and subsequently, using an ATM card, she gradually\
|
| 225 |
+
\ withdrew from the aforementioned account number ..., the total amount of €55,710,\
|
| 226 |
+
\ making 84 individual withdrawals from automatic teller machines. In addition,\
|
| 227 |
+
\ the defendant, during the period from June 2008 to November 2008, in the same\
|
| 228 |
+
\ exact manner (through the electronic management system of the bank accounts),\
|
| 229 |
+
\ transferred through electronically transmitted orders to account number ...,\
|
| 230 |
+
\ which she had opened at ..., from the complainants' bank accounts numbered ...,\
|
| 231 |
+
\ ..., ..., ..., and ..., the total amount of €73,942, as detailed in the orders\
|
| 232 |
+
\ regarding the transfers of these amounts. Furthermore, during the period from\
|
| 233 |
+
\ February 2008 to November 2008, through multiple acts constituting a continuation\
|
| 234 |
+
\ of the crime, although she had received from the first complainant ... the amounts\
|
| 235 |
+
\ of €695.04, €695.04, and €845.04, in order to pay his insurance contributions\
|
| 236 |
+
\ to O.A.E.E. for the periods of January-February 2008, May-June 2008, and September-October\
|
| 237 |
+
\ 2008, as well as the amounts of €250 and €280, in order to settle credit card\
|
| 238 |
+
\ bills for \"...\", respectively, and from the second complainant ... she received\
|
| 239 |
+
\ the amounts of €283.64, €419.26, and €385.38, to pay the latter's insurance\
|
| 240 |
+
\ contributions to O.A.E.E. for the periods of July-August 2007, May-June 2008,\
|
| 241 |
+
\ September-October 2008, and November-December 2008, as well as the amount of\
|
| 242 |
+
\ €1,888.03 for the settlement of VAT, she never paid the above amounts to settle\
|
| 243 |
+
\ the aforementioned obligations, nor did she return them to the complainants,\
|
| 244 |
+
\ despite being urged to do so, but incorporated them into her assets and wrongfully\
|
| 245 |
+
\ appropriated them. The defendant denies the charges against her and claims that\
|
| 246 |
+
\ the withdrawals were made by the second complainant and that all the amounts\
|
| 247 |
+
\ transferred to her account were transferred to cover the company's expenses\
|
| 248 |
+
\ and their personal expenses, due to her cohabitation with the second complainant\
|
| 249 |
+
\ and with his knowledge, with whom she intended to marry. However, this claim\
|
| 250 |
+
\ is not supported by any evidence; on the contrary, it emerged that she conducted\
|
| 251 |
+
\ the transfers of the money and withdrawals without the complainants' knowledge,\
|
| 252 |
+
\ and when she learned that they had been informed about the account movements\
|
| 253 |
+
\ and met at the Bank, her behavior and demeanor indicated guilt, according to\
|
| 254 |
+
\ the testimony of the prosecution witness ..., an employee of the Pangrati branch\
|
| 255 |
+
\ of ..., who saw her on the same day at the aforementioned Bank when she met\
|
| 256 |
+
\ with the complainants. The ongoing act of fraud using a computer was committed\
|
| 257 |
+
\ by the defendant professionally, as evidenced by her repeated commission of\
|
| 258 |
+
\ the act, as well as the infrastructure she had established with the intent of\
|
| 259 |
+
\ repeated commission, based on a specific plan and methodology (transferring\
|
| 260 |
+
\ smaller amounts to a joint account of the complainants from the remaining accounts\
|
| 261 |
+
\ of the latter, and then withdrawing the transferred amounts with an ATM card,\
|
| 262 |
+
\ as well as directly transferring smaller amounts from the complainants' accounts\
|
| 263 |
+
\ to her personal account she had opened at the same bank), indicating her purpose\
|
| 264 |
+
\ to generate income, with the financial benefit she gained, corresponding to\
|
| 265 |
+
\ the complainants' damage, exceeding a total of €30,000."
|
| 266 |
+
- 'Any person who intentionally, through the technology of information and communication,
|
| 267 |
+
suggests an encounter between an adult and a minor under the age of fifteen, aiming
|
| 268 |
+
at the commitment of the crimes described in par. 1 and 2 of art. 339 and 348Α,
|
| 269 |
+
is sentenced to an imprisonment of at least two years and a fine of fifty to two
|
| 270 |
+
hundred thousand Euros, when the proposal is followed by further actions which
|
| 271 |
+
lead in the commitment of such crimes.
|
| 272 |
+
|
| 273 |
+
'
|
| 274 |
+
- source_sentence: Who should provide authorisation when safeguards are detailed in
|
| 275 |
+
non-legally binding administrative arrangements?
|
| 276 |
+
sentences:
|
| 277 |
+
- In the absence of an adequacy decision, the controller or processor should take
|
| 278 |
+
measures to compensate for the lack of data protection in a third country by way
|
| 279 |
+
of appropriate safeguards for the data subject. Such appropriate safeguards may
|
| 280 |
+
consist of making use of binding corporate rules, standard data protection clauses
|
| 281 |
+
adopted by the Commission, standard data protection clauses adopted by a supervisory
|
| 282 |
+
authority or contractual clauses authorised by a supervisory authority. Those
|
| 283 |
+
safeguards should ensure compliance with data protection requirements and the
|
| 284 |
+
rights of the data subjects appropriate to processing within the Union, including
|
| 285 |
+
the availability of enforceable data subject rights and of effective legal remedies,
|
| 286 |
+
including to obtain effective administrative or judicial redress and to claim
|
| 287 |
+
compensation, in the Union or in a third country. They should relate in particular
|
| 288 |
+
to compliance with the general principles relating to personal data processing,
|
| 289 |
+
the principles of data protection by design and by default. Transfers may also
|
| 290 |
+
be carried out by public authorities or bodies with public authorities or bodies
|
| 291 |
+
in third countries or with international organisations with corresponding duties
|
| 292 |
+
or functions, including on the basis of provisions to be inserted into administrative
|
| 293 |
+
arrangements, such as a memorandum of understanding, providing for enforceable
|
| 294 |
+
and effective rights for data subjects. Authorisation by the competent supervisory
|
| 295 |
+
authority should be obtained when the safeguards are provided for in administrative
|
| 296 |
+
arrangements that are not legally binding.
|
| 297 |
+
- '**Court (Civil/Criminal): Civil**
|
| 298 |
+
|
| 299 |
+
|
| 300 |
+
**Provisions:**
|
| 301 |
+
|
| 302 |
+
|
| 303 |
+
**Time of commission of the act:**
|
| 304 |
+
|
| 305 |
+
|
| 306 |
+
**Outcome (not guilty, guilty):**
|
| 307 |
+
|
| 308 |
+
|
| 309 |
+
**Rationale:**
|
| 310 |
+
|
| 311 |
+
|
| 312 |
+
**Facts:**
|
| 313 |
+
|
| 314 |
+
The plaintiff holds credit card number ............ with the defendant banking
|
| 315 |
+
corporation. Based on the application for alternative networks dated 19/7/2015
|
| 316 |
+
with number ......... submitted at a branch of the defendant, he was granted access
|
| 317 |
+
to the electronic banking service (e-banking) to conduct banking transactions
|
| 318 |
+
(debit, credit, updates, payments) remotely. On 30/11/2020, the plaintiff fell
|
| 319 |
+
victim to electronic fraud through the "phishing" method, whereby an unknown perpetrator
|
| 320 |
+
managed to withdraw a total amount of €3,121.75 from the aforementioned credit
|
| 321 |
+
card. Specifically, the plaintiff received an email at 1:35 PM on 29/11/2020 from
|
| 322 |
+
sender ...... with address ........, informing him that due to an impending system
|
| 323 |
+
change, he needed to verify the mobile phone number linked to the credit card,
|
| 324 |
+
urging him to complete the verification process within the next 24 hours by following
|
| 325 |
+
a link titled ........; otherwise, his account would be locked for security reasons.
|
| 326 |
+
The plaintiff read this email on the afternoon of 30 November 2020 and, believing
|
| 327 |
+
it was from the defendant, followed the instructions and proceeded via the provided
|
| 328 |
+
link to a website that was identical (a clone) to that of the defendant. On this
|
| 329 |
+
page, he was asked to enter the six-digit security code (.........) that had just
|
| 330 |
+
been sent to his mobile phone by the defendant at 3:41 PM, with the note that
|
| 331 |
+
it was an activation code for his ........ card at ........., which he entered.
|
| 332 |
+
|
| 333 |
+
|
| 334 |
+
Subsequently, the plaintiff received, according to his statements, a new email
|
| 335 |
+
(not submitted), which requested him to enter the details of the aforementioned
|
| 336 |
+
credit card, specifically the name of the cardholder and the card number, not
|
| 337 |
+
the PIN, which he also entered, convinced that he was within the online environment
|
| 338 |
+
of the defendant. Then, at 3:47 PM, he received a message on his mobile phone
|
| 339 |
+
from the defendant containing the exact same content as the one he received at
|
| 340 |
+
3:41 PM, while at 3:50 PM he received a message stating that the activation of
|
| 341 |
+
his ......... card at ....... had been completed. Once the plaintiff read this,
|
| 342 |
+
he became concerned that something was not right, and immediately called (at 4:41
|
| 343 |
+
PM) the defendant''s call center to inform them. There, the employees, with whom
|
| 344 |
+
he finally connected at 5:04 PM due to high call center volume, advised him to
|
| 345 |
+
delete the relevant emails, cancel his credit card, change his access passwords
|
| 346 |
+
for the service, and submit a dispute request regarding the conducted transactions.
|
| 347 |
+
The plaintiff electronically sent this request to the defendant, disputing the
|
| 348 |
+
detailed transactions amounting to €3,121.75, which were conducted on 30/11/2020
|
| 349 |
+
during the time frame of 4:37:45-4:43:34 PM, arguing that he had neither performed
|
| 350 |
+
them himself nor authorized anyone else to do so. The plaintiff specifically disputed
|
| 351 |
+
the following transactions, as evidenced by the account activity of the disputed
|
| 352 |
+
credit card during the aforementioned timeframe: a) transaction number .........
|
| 353 |
+
amounting to €150.62 conducted on 30/11/2020 at 4:43:34 PM, b) transaction number
|
| 354 |
+
........ amounting to €293.20 conducted on 30/11/2020 at 4:42:40 PM, c) transaction
|
| 355 |
+
number ............ amounting to €295.21 conducted on 30/11/2020 at 4:42:10 PM,
|
| 356 |
+
d) transaction number .......... amounting to €299.22 conducted on 30/11/2020
|
| 357 |
+
at 4:41:31 PM, e) transaction number ........ amounting to €297.21 conducted on
|
| 358 |
+
30/11/2020 at 4:41:01 PM, f) transaction number ........ amounting to €299.22
|
| 359 |
+
conducted on 30/11/2020 at 4:40:27 PM, g) transaction number ....... amounting
|
| 360 |
+
to €299.22 conducted on 30/11/2020 at 4:39:55 PM, h) transaction number ......
|
| 361 |
+
amounting to €299.22 conducted on 30/11/2020 at 4:39:22 PM, i) transaction number
|
| 362 |
+
......... amounting to €297.22 conducted on 30/11/2020 at 4:38:52 PM, j) transaction
|
| 363 |
+
number ......... amounting to €295.21 conducted on 30/11/2020 at 4:38:17 PM, and
|
| 364 |
+
k) transaction number ......... amounting to €296.21 conducted on 30/11/2020 at
|
| 365 |
+
4:37:45 PM. In its response letter dated 21/12/2020, the defendant denied responsibility
|
| 366 |
+
for the costs of the aforementioned transactions, placing the entire blame on
|
| 367 |
+
the plaintiff for the leak of his card details and security code to the fraudulent
|
| 368 |
+
page. The plaintiff, completely denying any fault for the conducted transactions,
|
| 369 |
+
repeatedly contacted the defendant, both by phone and via email (see emails dated
|
| 370 |
+
15/1/2021 and 11/2/2021), while on 2/3/2021, he electronically sent a report dated
|
| 371 |
+
1/03/2021 to the Consumer Advocate’s email address, recounting the events and
|
| 372 |
+
requesting that the aforementioned Independent Authority intervene to have the
|
| 373 |
+
disputed debt canceled. In its letter with reference number ...../27.04.2021,
|
| 374 |
+
the aforementioned Independent Authority informed the plaintiff that the case
|
| 375 |
+
was outside its mediating role and was therefore archived. Subsequently, the plaintiff
|
| 376 |
+
sent the defendant on 5/3/2021 his extrajudicial statement dated 4/3/2021, calling
|
| 377 |
+
upon it to fully cancel the debt of €3,121.75 that had been unjustly incurred
|
| 378 |
+
against him within two days and to immediately instruct the representatives of
|
| 379 |
+
the collection agency working with it to cease contacting him regarding the disputed
|
| 380 |
+
case. The defendant sent the plaintiff a message on his mobile phone on 20/04/2021
|
| 381 |
+
informing him that his case was still being processed due to lengthy operational
|
| 382 |
+
requirements, while on 23/04/2021, via email, it informed him that considering
|
| 383 |
+
their good cooperation and his efforts to keep them updated, it had reviewed his
|
| 384 |
+
case and decided to refund him the amounts of the transactions that were conducted
|
| 385 |
+
after his contact with their representatives on 30/11/2020 at 4:41 PM, totaling
|
| 386 |
+
€1,038.25, specifically the following: a) transaction of €150.62 conducted on
|
| 387 |
+
30/11/2020 at 4:43 PM, b) transaction of €295.21 conducted on 30/11/2020 at 4:42
|
| 388 |
+
PM, c) transaction of €293.20 conducted on 30/11/2020 at 4:42 PM, and d) transaction
|
| 389 |
+
of €299.22 conducted on 30/11/2020 at 4:41 PM. Beyond this, the defendant refused
|
| 390 |
+
to refund the plaintiff the amount of the remaining transactions conducted on
|
| 391 |
+
30/11/2020, totaling €2,376.08 (and not €2,376.48 as incorrectly stated by the
|
| 392 |
+
plaintiff in his lawsuit), which the plaintiff ultimately fully paid, transferring
|
| 393 |
+
€2,342.77 to the defendant on 7/06/2021 and €33.31 on 15/06/2021 (see related
|
| 394 |
+
deposit receipts).'
|
| 395 |
+
- "Court (Civil/Criminal): Civil \nProvisions: \nTime of commission: July 21,\
|
| 396 |
+
\ 2020 \nOutcome (innocent, guilty): Partially accepts the lawsuit against the\
|
| 397 |
+
\ Bank. \nReasoning: Alongside the bank's responsibility for the ineffective\
|
| 398 |
+
\ protection of its systems against the continually changing and evolving methods\
|
| 399 |
+
\ of deception that affect them, leading to financial damage for its clients who\
|
| 400 |
+
\ entrusted it, which constitutes a breach of its contractual obligations and\
|
| 401 |
+
\ generates contractual liability, there is also the personal responsibility of\
|
| 402 |
+
\ the plaintiff, who did not safeguard, as required, his sensitive banking information\
|
| 403 |
+
\ and disclosed it when he should not have, even though the message that misled\
|
| 404 |
+
\ him came from the context of an SMS conversation with the defendant, even if\
|
| 405 |
+
\ he was directed through the link to a website resembling that of the defendant,\
|
| 406 |
+
\ because he overlooked the relevant instructions and strict recommendations of\
|
| 407 |
+
\ the bank, violating his duty to safeguard them. Therefore, in light of the above,\
|
| 408 |
+
\ the court must partially accept the lawsuit regarding its substance, and with\
|
| 409 |
+
\ the defendant's objection regarding the plaintiff's fault being accepted at\
|
| 410 |
+
\ a rate of 1/6 of the damage suffered, it must be acknowledged – following the\
|
| 411 |
+
\ admissible and lawful modification of the lawsuit's request from a condemnatory\
|
| 412 |
+
\ to a declaratory nature as proposed – the defendant's obligation to pay him\
|
| 413 |
+
\ the amount of €2,500, with legal interest, as specified in the operative part.\
|
| 414 |
+
\ Regarding the request to recognize the defendant's obligation to pay him €1,000\
|
| 415 |
+
\ as compensation for the moral damage he suffered from the fraud committed against\
|
| 416 |
+
\ him, this is deemed dismissible as unfounded, because the defendant's liability\
|
| 417 |
+
\ is contractual and not tortious, and there are no special conditions justifying\
|
| 418 |
+
\ the treatment of this specific contractual breach as tortious, which would make\
|
| 419 |
+
\ it possible to award the plaintiff compensation for moral damage from the defendant. \
|
| 420 |
+
\ \nFacts: The plaintiff maintained a joint bank account with his wife and had\
|
| 421 |
+
\ access to the defendant bank's e-banking. On July 21, 2020, following successful\
|
| 422 |
+
\ identification via the agreed-upon credentials (userID, password, OTP), a request\
|
| 423 |
+
\ was made to change the mobile phone number for receiving OTPs, which was completed\
|
| 424 |
+
\ through the bank's platform. However, this change was not made by the plaintiff\
|
| 425 |
+
\ himself, but by a third party who had previously deceived him using the phishing\
|
| 426 |
+
\ method, obtaining his banking details through a misleading SMS. Following the\
|
| 427 |
+
\ phone number change, on July 31, 2020, a transfer of €3,000 was made to a third\
|
| 428 |
+
\ party's account. The transaction was conducted using the necessary credentials\
|
| 429 |
+
\ and OTP sent to the new mobile phone, resulting in the bank considering the\
|
| 430 |
+
\ order valid and executing it. Once the plaintiff realized the transfer, he immediately\
|
| 431 |
+
\ contacted the bank and informed them that he had not given such an order himself.\
|
| 432 |
+
\ Despite the initial assurance that the funds could be recovered, they were ultimately\
|
| 433 |
+
\ not returned, as they had been transferred to a third party's account, and the\
|
| 434 |
+
\ bank denied any responsibility for the loss."
|
| 435 |
+
- source_sentence: When will the periodic review mechanism be conducted?
|
| 436 |
+
sentences:
|
| 437 |
+
- The Commission should monitor the functioning of decisions on the level of protection
|
| 438 |
+
in a third country, a territory or specified sector within a third country, or
|
| 439 |
+
an international organisation, and monitor the functioning of decisions adopted
|
| 440 |
+
on the basis of Article 25(6) or Article 26(4) of Directive 95/46/EC. In its adequacy
|
| 441 |
+
decisions, the Commission should provide for a periodic review mechanism of their
|
| 442 |
+
functioning. That periodic review should be conducted in consultation with the
|
| 443 |
+
third country or international organisation in question and take into account
|
| 444 |
+
all relevant developments in the third country or international organisation.
|
| 445 |
+
For the purposes of monitoring and of carrying out the periodic reviews, the Commission
|
| 446 |
+
should take into consideration the views and findings of the European Parliament
|
| 447 |
+
and of the Council as well as of other relevant bodies and sources. The Commission
|
| 448 |
+
should evaluate, within a reasonable time, the functioning of the latter decisions
|
| 449 |
+
and report any relevant findings to the Committee within the meaning of Regulation
|
| 450 |
+
(EU) No 182/2011 of the European Parliament and of the Council (1) as established
|
| 451 |
+
under this Regulation, to the European Parliament and to the Council.
|
| 452 |
+
- "**Court (Civil/Criminal): Civil** \n**Provisions:** \n**Time of commission\
|
| 453 |
+
\ of the act:** \n**Outcome (not guilty, guilty):** \n**Reasoning:** Partially\
|
| 454 |
+
\ accepts the lawsuit. \n**Facts:** The plaintiff, who works as a lawyer, maintains\
|
| 455 |
+
\ a savings account with the defendant banking corporation under account number\
|
| 456 |
+
\ GR.............. Pursuant to a contract dated June 11, 2010, established in\
|
| 457 |
+
\ Thessaloniki between the defendant and the plaintiff, the plaintiff was granted\
|
| 458 |
+
\ access to the electronic banking system (e-banking) to conduct banking transactions\
|
| 459 |
+
\ remotely. On October 10, 2020, the plaintiff fell victim to electronic fraud\
|
| 460 |
+
\ through the \"phishing\" method, whereby an unknown perpetrator managed to extract\
|
| 461 |
+
\ and transfer €3,000.00 from the plaintiff’s account to another account of the\
|
| 462 |
+
\ same bank. Specifically, on that day at 6:51 a.m., the plaintiff received an\
|
| 463 |
+
\ email from the sender \".........\", with the address ..........., informing\
|
| 464 |
+
\ him that his debit card had been suspended and that online payments and cash\
|
| 465 |
+
\ withdrawals could not be made until the issue was resolved. The email urged\
|
| 466 |
+
\ him to confirm his details within the next 72 hours by following a link titled\
|
| 467 |
+
\ \"card activation.\" \nThe plaintiff read the above email on his mobile phone\
|
| 468 |
+
\ around 8:00 a.m., and believing it came from the defendant, he followed the\
|
| 469 |
+
\ instructions and accessed a website that was identical (a clone) to that of\
|
| 470 |
+
\ the defendant. On this page, he was asked to enter his login credentials to\
|
| 471 |
+
\ connect to the service, which he did, and he was subsequently asked to input\
|
| 472 |
+
\ his debit card details for the alleged activation, which he also provided. Then,\
|
| 473 |
+
\ to complete the process, a number was sent to his mobile phone at 8:07 a.m.\
|
| 474 |
+
\ from the sender ........, which he entered, and two minutes later he received\
|
| 475 |
+
\ a message from the same sender in English stating that the quick access code\
|
| 476 |
+
\ had been activated on his mobile. A few minutes later, at 8:18 a.m., he received\
|
| 477 |
+
\ an email from the defendant informing him of the transfer of €3,000.00 from\
|
| 478 |
+
\ his account to account number GR ........... held at the same bank, with the\
|
| 479 |
+
\ beneficiary's details being .......... As soon as the plaintiff read this, he\
|
| 480 |
+
\ immediately called the defendant's call center and canceled his debit card,\
|
| 481 |
+
\ the access codes for the service ......., and locked the application ..........\
|
| 482 |
+
\ At the same time, he verbally submitted a request to dispute and cancel the\
|
| 483 |
+
\ contested transaction, and in a subsequent phone call, he also canceled his\
|
| 484 |
+
\ credit card. On the same day, he also sent an email to the defendant informing\
|
| 485 |
+
\ them in writing of the above and requesting the cancellation of the transaction\
|
| 486 |
+
\ and the return of the amount of €3,000.00 to his account, as this transfer was\
|
| 487 |
+
\ not made by him but by an unknown perpetrator through electronic fraud and was\
|
| 488 |
+
\ not approved by him. It should also be noted that the plaintiff, as the sole\
|
| 489 |
+
\ beneficiary according to the aforementioned contract for using the defendant's\
|
| 490 |
+
\ Internet Banking service, never received any update via SMS or the VIBER application\
|
| 491 |
+
\ from the bank regarding the transaction details before its completion, nor did\
|
| 492 |
+
\ he receive a one-time code (OTP) to approve the contested transaction. He subsequently\
|
| 493 |
+
\ filed a complaint against unknown persons at the Cyber Crime Division for the\
|
| 494 |
+
\ crime of fraud. The defendant sent an email to the plaintiff on October 16,\
|
| 495 |
+
\ 2020, informing him that his request had been forwarded to the appropriate department\
|
| 496 |
+
\ of the bank for investigation, stating that the bank would never send him an\
|
| 497 |
+
\ email or SMS asking him to enter his personal data and that as of October 7,\
|
| 498 |
+
\ 2020, there was a notice posted for its customers regarding malicious attempts\
|
| 499 |
+
\ to steal personal data in the \"Our News\" section on ....... A month after\
|
| 500 |
+
\ the disputed incident, on November 10, 2020, an amount of €2,296.82 was transferred\
|
| 501 |
+
\ to the plaintiff's account from the account to which the fraudulent credit had\
|
| 502 |
+
\ been made. The plaintiff immediately sent an email to the defendant asking to\
|
| 503 |
+
\ be informed whether this transfer was a return of part of the amount that had\
|
| 504 |
+
\ been illegally withdrawn from his account and requested the return of the remaining\
|
| 505 |
+
\ amount of €703.18. In its response dated January 13, 2021, the defendant confirmed\
|
| 506 |
+
\ that the aforementioned amount indeed came from the account to which the fraudulent\
|
| 507 |
+
\ credit had been made, following a freeze of that account initiated by the defendant\
|
| 508 |
+
\ during the investigation of the incident, but refused to return the remaining\
|
| 509 |
+
\ amount, claiming it bore no responsibility for the leak of the personal codes\
|
| 510 |
+
\ to third parties, according to the terms of the service contract established\
|
| 511 |
+
\ between them. \nFrom the entirety of the evidence presented to the court, there\
|
| 512 |
+
\ is no indication of the authenticity of the contested transaction, as the plaintiff\
|
| 513 |
+
\ did not give his consent for the execution of the transfer of the amount of\
|
| 514 |
+
\ €3,000.00, especially in light of the provision in Article 72 paragraph 2 of\
|
| 515 |
+
\ Law 4537/2018 stating that the mere use of the Internet Banking service by the\
|
| 516 |
+
\ plaintiff does not necessarily constitute sufficient evidence that the payer\
|
| 517 |
+
\ approved the payment action. Specifically, it was proven that the contested\
|
| 518 |
+
\ transaction was not carried out following a strong identification of the plaintiff\
|
| 519 |
+
\ – the sole beneficiary of the account – and his approval, as the latter may\
|
| 520 |
+
\ have entered his personal codes on the counterfeit website; however, he was\
|
| 521 |
+
\ never informed, before the completion of the contested transaction, of the amount\
|
| 522 |
+
\ that would be transferred from his account to a third-party account, nor did\
|
| 523 |
+
\ he receive on his mobile phone, either via SMS or through the VIBER application\
|
| 524 |
+
\ or any other means, the one-time code - extra PIN for its completion, which\
|
| 525 |
+
\ he was required to enter to approve the contested transaction (payment action)\
|
| 526 |
+
\ and thus complete his identification, a fact that was not countered by any evidence\
|
| 527 |
+
\ from the defendant. Furthermore, it is noted that the defendant's claims that\
|
| 528 |
+
\ it bears no responsibility under the terms of the banking services contract,\
|
| 529 |
+
\ whereby it is not liable for any damage to its customer in cases of unauthorized\
|
| 530 |
+
\ use of their personal access codes to the Internet Banking service, are to be\
|
| 531 |
+
\ rejected as fundamentally unfounded. This is because the aforementioned contractual\
|
| 532 |
+
\ terms are invalid according to the provision of Article 103 of Law 4537/2018,\
|
| 533 |
+
\ as they contradict the provisions of Articles 71, 73, and 92 of the same Law,\
|
| 534 |
+
\ which provide for the provider's universal liability and its exemption only\
|
| 535 |
+
\ for unusual and unforeseen circumstances that are beyond the control of the\
|
| 536 |
+
\ party invoking them and whose consequences could not have been avoided despite\
|
| 537 |
+
\ all efforts to the contrary; these provisions establish mandatory law in favor\
|
| 538 |
+
\ of users, as according to Article 103 of Law 4537/2018, payment service providers\
|
| 539 |
+
\ are prohibited from deviating from the provisions to the detriment of payment\
|
| 540 |
+
\ service users, unless the possibility of deviation is explicitly provided and\
|
| 541 |
+
\ they can decide to offer only more favorable terms to payment service users;\
|
| 542 |
+
\ the aforementioned contractual terms do not constitute more favorable terms\
|
| 543 |
+
\ but rather disadvantageous terms for the payment service user. In this case,\
|
| 544 |
+
\ however, the defendant did not prove the authenticity of the transaction and\
|
| 545 |
+
\ its approval by the plaintiff and did not invoke, nor did any unusual and unforeseen\
|
| 546 |
+
\ circumstances beyond its control, the consequences of which could not have been\
|
| 547 |
+
\ avoided despite all efforts to the contrary, come to light. Therefore, the contested\
|
| 548 |
+
\ transaction transferring the amount of €3,000.00 is considered, in the absence\
|
| 549 |
+
\ of demonstrable consent from the plaintiff, unapproved according to the provisions\
|
| 550 |
+
\ of Article 64 of Law 4537/2018, and the defendant's contrary claims are rejected,\
|
| 551 |
+
\ especially since the plaintiff proceeded, according to Article 71 paragraph\
|
| 552 |
+
\ 1 of Law 4537/2018, without undue delay to notify the defendant regarding the\
|
| 553 |
+
\ contested unapproved payment action. Consequently, the defendant is liable for\
|
| 554 |
+
\ compensating the plaintiff for the positive damage he suffered under Article\
|
| 555 |
+
\ 73 of Law 4537/2018 and is obliged to pay him the requested amount of €703.18,\
|
| 556 |
+
\ while the plaintiff’s fault in the occurrence of this damage cannot be established,\
|
| 557 |
+
\ as he entered his personal details in an online environment that was a faithful\
|
| 558 |
+
\ imitation of that of the defendant, as evidenced by the comparison of the screenshots\
|
| 559 |
+
\ of the fake website and the real website provided by the plaintiff, a fact that\
|
| 560 |
+
\ he could not have known while being fully convinced that he was transacting\
|
| 561 |
+
\ with the defendant. Furthermore, the defendant’s liability to compensate the\
|
| 562 |
+
\ plaintiff is based on the provision of Article 8 of Law 2251/1994, which applies\
|
| 563 |
+
\ in this case, as the plaintiff's damage resulted from inadequate fulfillment\
|
| 564 |
+
\ of its obligations in the context of providing its services, but also on the\
|
| 565 |
+
\ provision of Article 914 of the Civil Code, in the sense of its unlawful and culpable\
|
| 566 |
+
\ omission of actions it was obliged to take. In this case, given that during\
|
| 567 |
+
\ the relevant period there had been a multitude of similar incidents of fraud\
|
| 568 |
+
\ against the defendant's customers, the latter, as a service provider to the\
|
| 569 |
+
\ consumer public and bearing transactional obligations of care and security towards\
|
| 570 |
+
\ them, displayed gross negligence regarding the security provided for electronic\
|
| 571 |
+
\ transaction services, which was compromised by the fraudulent theft of funds,\
|
| 572 |
+
\ as it did not comply with all required high-security measures for executing\
|
| 573 |
+
\ the contested transaction, failing to implement the strict customer identification\
|
| 574 |
+
\ verification process and to check the authenticity of the account to which the\
|
| 575 |
+
\ funds were sent, thus not assuming the suspicious nature of the transaction,\
|
| 576 |
+
\ did not adopt comprehensive and improved protective measures to fully protect\
|
| 577 |
+
\ its customers against malicious attacks and online fraud and to prevent the\
|
| 578 |
+
\ infiltration of unauthorized third parties, nor did it fulfill its obligations\
|
| 579 |
+
\ to inform, accurately inform, and warn its consumers - customers, as it failed\
|
| 580 |
+
\ to adequately inform them of attempts to steal their personal data through the\
|
| 581 |
+
\ sending of informative emails or SMS, while merely posting in a section rather\
|
| 582 |
+
\ than on a central banner (as it later did) does not constitute adequate information\
|
| 583 |
+
\ such that it meets the requirement of protecting its customers and the increased\
|
| 584 |
+
\ safeguarding of their interests. Although the plaintiff acted promptly and informed\
|
| 585 |
+
\ the defendant on the same day about the contested incident, the defendant did\
|
| 586 |
+
\ not act as promptly regarding the investigation of the incident and the freezing\
|
| 587 |
+
\ of the account that held the fraudulent credit to prevent the plaintiff's loss,\
|
| 588 |
+
\ but only returned part of the funds to the plaintiff a month later. This behavior,\
|
| 589 |
+
\ beyond being culpable due to gross negligence, was also unlawful, as it would\
|
| 590 |
+
\ have been illegal even without the contractual relationship, as contrary to\
|
| 591 |
+
\ the provisions of Law 4537/2018 and Law 2251/1994, regarding the lack of security\
|
| 592 |
+
\ of the services that the consumer is legitimately entitled to expect, as well\
|
| 593 |
+
\ as the building of trust that is essential in banking transactions, elements\
|
| 594 |
+
\ that it was obligated to provide within the sphere of the services offered,\
|
| 595 |
+
\ and contrary to the principles of good faith and commercial ethics, as crystallized\
|
| 596 |
+
\ in the provision of Article 288 of the Civil Code, as well as the general duty\
|
| 597 |
+
\ imposed by Article 914 of the Civil Code not to cause harm to another culpably.\
|
| 598 |
+
\ This resulted not only in positive damage to the plaintiff but also in causing\
|
| 599 |
+
\ him moral harm consisting of his mental distress and the disruption, agitation,\
|
| 600 |
+
\ and sorrow he experienced, for which he must be awarded financial compensation.\
|
| 601 |
+
\ Taking into account all the general circumstances of the case, the extent of\
|
| 602 |
+
\ the plaintiff's damage, the severity of the defendant's fault, the mental distress\
|
| 603 |
+
\ suffered by the plaintiff, the insecurity he felt regarding his deposits, the\
|
| 604 |
+
\ sorrow he experienced, and the stress caused by his financial loss, which occurred\
|
| 605 |
+
\ during the pandemic period when his earnings from his professional activity\
|
| 606 |
+
\ had significantly decreased, as well as the financial and social situation of\
|
| 607 |
+
\ the parties, it is the court's opinion that he should be granted, as financial\
|
| 608 |
+
\ compensation for his moral harm, an amount of €250.00, which is deemed reasonable\
|
| 609 |
+
\ and fair. Therefore, the total monetary amount that the plaintiff is entitled\
|
| 610 |
+
\ to for his positive damage and financial compensation for the moral harm suffered\
|
| 611 |
+
\ amounts to a total of (€703.18 + €250.00) = €953.18."
|
| 612 |
+
- 'Failure to notify the Authority of file establishment or permit changes is punished
|
| 613 |
+
by up to three years’ imprisonment and a fine of one to five million Drachmas.
|
| 614 |
+
|
| 615 |
+
Maintaining a file without a permit or violating permit terms is punished by at
|
| 616 |
+
least one year’s imprisonment and a fine of one to five million Drachmas.
|
| 617 |
+
|
| 618 |
+
Unauthorized file interconnection, or interconnection without a permit, is punished by up to three
|
| 619 |
+
years’ imprisonment and a fine of one to five million Drachmas.
|
| 620 |
+
|
| 621 |
+
Unlawful interference with personal data is punished by imprisonment and a fine;
|
| 622 |
+
for sensitive data, at least one year’s imprisonment and a fine of one to ten
|
| 623 |
+
million Drachmas.
|
| 624 |
+
|
| 625 |
+
Controllers who fail to comply with Authority decisions or violate data transfer
|
| 626 |
+
rules face at least two years’ imprisonment and a fine of one to five million
|
| 627 |
+
Drachmas.
|
| 628 |
+
|
| 629 |
+
If acts were committed for unlawful benefit or to cause harm, punishment is up
|
| 630 |
+
to ten years’ imprisonment and a fine of two to ten million Drachmas.
|
| 631 |
+
|
| 632 |
+
If acts jeopardize democratic governance or national security, punishment is confinement
|
| 633 |
+
in a penitentiary and a fine of five to ten million Drachmas.
|
| 634 |
+
|
| 635 |
+
Acts committed due to negligence result in at least three months’ imprisonment
|
| 636 |
+
and a fine.
|
| 637 |
+
|
| 638 |
+
If the Controller is not a natural person, the responsible party is the representative
|
| 639 |
+
or head of the organization with administrative or managerial duties.
|
| 640 |
+
|
| 641 |
+
Authorized members of the Authority may carry out preliminary investigations even
|
| 642 |
+
without Prosecutor’s order for certain offenses.
|
| 643 |
+
|
| 644 |
+
The Authority''s President must notify the Public Prosecutor of any offenses under
|
| 645 |
+
investigation, forwarding all relevant evidence.
|
| 646 |
+
|
| 647 |
+
Preliminary investigations must conclude within two months of charges, and trial
|
| 648 |
+
must begin within three months of completion.
|
| 649 |
+
|
| 650 |
+
Continuation of proceedings is allowed only once and for extremely important reasons,
|
| 651 |
+
with adjournment not exceeding two months.
|
| 652 |
+
|
| 653 |
+
Felonies under this law fall under the jurisdiction of the Court of Appeal.
|
| 654 |
+
|
| 655 |
+
'
|
| 656 |
+
- source_sentence: Who must facilitate the exercise of data subject rights?
|
| 657 |
+
sentences:
|
| 658 |
+
- '1.Processing of personal data revealing racial or ethnic origin, political opinions,
|
| 659 |
+
religious or philosophical beliefs, or trade union membership, and the processing
|
| 660 |
+
of genetic data, biometric data for the purpose of uniquely identifying a natural
|
| 661 |
+
person, data concerning health or data concerning a natural person''s sex life
|
| 662 |
+
or sexual orientation shall be prohibited.
|
| 663 |
+
|
| 664 |
+
2.Paragraph 1 shall not apply if one of the following applies: (a) the data subject
|
| 665 |
+
has given explicit consent to the processing of those personal data for one or
|
| 666 |
+
more specified purposes, except where Union or Member State law provide that the
|
| 667 |
+
prohibition referred to in paragraph 1 may not be lifted by the data subject;
|
| 668 |
+
(b) processing is necessary for the purposes of carrying out the obligations
|
| 669 |
+
and exercising specific rights of the controller or of the data subject in the
|
| 670 |
+
field of employment and social security and social protection law in so far as
|
| 671 |
+
it is authorised by Union or Member State law or a collective agreement pursuant
|
| 672 |
+
to Member State law providing for appropriate safeguards for the fundamental rights
|
| 673 |
+
and the interests of the data subject; (c) processing is necessary to protect
|
| 674 |
+
the vital interests of the data subject or of another natural person where the
|
| 675 |
+
data subject is physically or legally incapable of giving consent; (d) processing
|
| 676 |
+
is carried out in the course of its legitimate activities with appropriate safeguards
|
| 677 |
+
by a foundation, association or any other not-for-profit body with a political,
|
| 678 |
+
philosophical, religious or trade union aim and on condition that the processing
|
| 679 |
+
relates solely to the members or to former members of the body or to persons who
|
| 680 |
+
have regular contact with it in connection with its purposes and that the personal
|
| 681 |
+
data are not disclosed outside that body without the consent of the data subjects;
|
| 682 |
+
(e) processing relates to personal data which are manifestly made public by the
|
| 683 |
+
data subject; (f) processing is necessary for the establishment, exercise or
|
| 684 |
+
defence of legal claims or whenever courts are acting in their judicial capacity;
|
| 685 |
+
(g) processing is necessary for reasons of substantial public interest, on the
|
| 686 |
+
basis of Union or Member State law which shall be proportionate to the aim pursued,
|
| 687 |
+
respect the essence of the right to data protection and provide for suitable and
|
| 688 |
+
specific measures to safeguard the fundamental rights and the interests of the
|
| 689 |
+
data subject; (h) processing is necessary for the purposes of preventive or occupational
|
| 690 |
+
medicine, for the assessment of the working capacity of the employee, medical
|
| 691 |
+
diagnosis, the provision of health or social care or treatment or the management
|
| 692 |
+
of health or social care systems and services on the basis of Union or Member
|
| 693 |
+
State law or pursuant to contract with a health professional and subject to the
|
| 694 |
+
conditions and safeguards referred to in paragraph 3; (i) processing is necessary
|
| 695 |
+
for reasons of public interest in the area of public health, such as protecting
|
| 696 |
+
against serious cross-border threats to health or ensuring high standards of quality
|
| 697 |
+
and safety of health care and of medicinal products or medical devices, on the
|
| 698 |
+
basis of Union or Member State law which provides for suitable and specific measures
|
| 699 |
+
to safeguard the rights and freedoms of the data subject, in particular professional
|
| 700 |
+
secrecy; (j) processing is necessary for archiving purposes
|
| 701 |
+
in the public interest, scientific or historical research purposes or statistical
|
| 702 |
+
purposes in accordance with Article 89(1) based on Union or Member State law which
|
| 703 |
+
shall be proportionate to the aim pursued, respect the essence of the right to
|
| 704 |
+
data protection and provide for suitable and specific measures to safeguard the
|
| 705 |
+
fundamental rights and the interests of the data subject.
|
| 706 |
+
|
| 707 |
+
3. Personal data referred to in paragraph 1 may be processed for the purposes referred
|
| 708 |
+
to in point (h) of paragraph 2 when those data are processed by or under the responsibility
|
| 709 |
+
of a professional subject to the obligation of professional secrecy under Union
|
| 710 |
+
or Member State law or rules established by national competent bodies or by another
|
| 711 |
+
person also subject to an obligation of secrecy under Union or Member State law
|
| 712 |
+
or rules established by national competent bodies.
|
| 713 |
+
|
| 714 |
+
4. Member States may maintain or introduce further conditions, including limitations,
|
| 715 |
+
with regard to the processing of genetic data, biometric data or data concerning
|
| 716 |
+
health.'
|
| 717 |
+
- Regulation (EC) No 45/2001 of the European Parliament and of the Council (2) applies
|
| 718 |
+
to the processing of personal data by the Union institutions, bodies, offices
|
| 719 |
+
and agencies. Regulation (EC) No 45/2001 and other Union legal acts applicable
|
| 720 |
+
to such processing of personal data should be adapted to the principles and rules
|
| 721 |
+
established in this Regulation and applied in the light of this Regulation. In
|
| 722 |
+
order to provide a strong and coherent data protection framework in the Union,
|
| 723 |
+
the necessary adaptations of Regulation (EC) No 45/2001 should follow after the
|
| 724 |
+
adoption of this Regulation, in order to allow application at the same time as
|
| 725 |
+
this Regulation.
|
| 726 |
+
- "1.The controller shall take appropriate measures to provide any information referred\
|
| 727 |
+
\ to in Articles 13 and 14 and any communication under Articles 15 to 22 and 34\
|
| 728 |
+
\ relating to processing to the data subject in a concise, transparent, intelligible\
|
| 729 |
+
\ and easily accessible form, using clear and plain language, in particular for\
|
| 730 |
+
\ any information addressed specifically to a child. The information shall be\
|
| 731 |
+
\ provided in writing, or by other means, including, where appropriate, by electronic\
|
| 732 |
+
\ means. When requested by the data subject, the information may be provided orally,\
|
| 733 |
+
\ provided that the identity of the data subject is proven by other means.\
|
| 734 |
+
\n2.The controller shall facilitate the exercise of data subject rights\
|
| 735 |
+
\ under Articles 15 to 22. In the cases referred to in Article 11(2), the controller\
|
| 736 |
+
\ shall not refuse to act on the request of the data subject for exercising his\
|
| 737 |
+
\ or her rights under Articles 15 to 22, unless the controller demonstrates that\
|
| 738 |
+
\ it is not in a position to identify the data subject.\n3.The controller shall\
|
| 739 |
+
\ provide information on action taken on a request under Articles 15 to 22 to\
|
| 740 |
+
\ the data subject without undue delay and in any event within one month of receipt\
|
| 741 |
+
\ of the request. That period may be extended by two further months where necessary,\
|
| 742 |
+
\ taking into account the complexity and number of the requests. The controller\
|
| 743 |
+
\ shall inform the data subject of any such extension within one month of receipt\
|
| 744 |
+
\ of the request, together with the reasons for the delay. Where the data subject\
|
| 745 |
+
\ makes the request by electronic form means, the information shall be provided\
|
| 746 |
+
\ by electronic means where possible, unless otherwise requested by the data subject.\n\
|
| 747 |
+
4.If the controller does not take action on the request of the data subject, the\
|
| 748 |
+
\ controller shall inform the data subject without delay and at the latest within\
|
| 749 |
+
\ one month of receipt of the request of the reasons for not taking action and\
|
| 750 |
+
\ on the possibility of lodging a complaint with a supervisory authority and seeking\
|
| 751 |
+
\ a judicial remedy.\n5.Information provided under Articles 13 and 14 and any\
|
| 752 |
+
\ communication and any actions taken under Articles 15 to 22 and 34 shall be\
|
| 753 |
+
\ provided free of charge. Where requests from a data subject are manifestly unfounded\
|
| 754 |
+
\ or excessive, in particular because of their repetitive character, the controller\
|
| 755 |
+
\ may either: (a) charge a reasonable fee taking into account the administrative\
|
| 756 |
+
\ costs of providing the information or communication or taking the action requested;\
|
| 757 |
+
\ or (b) refuse to act on the request. The controller shall bear the burden of\
|
| 758 |
+
\ demonstrating the manifestly unfounded or excessive character of the request.\n\
|
| 759 |
+
6.Without prejudice to Article 11, where the controller has reasonable doubts\
|
| 760 |
+
\ concerning the identity of the natural person making the request referred to\
|
| 761 |
+
\ in Articles 15 to 21, the controller may request the provision of additional\
|
| 762 |
+
\ information necessary to confirm the identity of the data subject.\n7.The information\
|
| 763 |
+
\ to be provided to data subjects pursuant to Articles 13 and 14 may be provided\
|
| 764 |
+
\ in combination with standardised icons in order to give in an easily visible,\
|
| 765 |
+
\ intelligible and clearly legible manner a meaningful overview of the intended\
|
| 766 |
+
\ processing. Where the icons are presented electronically they shall be machine-readable.\n\
|
| 767 |
+
8.The Commission shall be empowered to adopt delegated acts in accordance with\
|
| 768 |
+
\ Article 92 for the purpose of determining the information to be presented by\
|
| 769 |
+
\ the icons and the procedures for providing standardised icons. Section 2 Information\
|
| 770 |
+
\ and access to personal data"
|
| 771 |
+
pipeline_tag: sentence-similarity
|
| 772 |
+
library_name: sentence-transformers
|
| 773 |
+
metrics:
|
| 774 |
+
- cosine_accuracy@1
|
| 775 |
+
- cosine_accuracy@3
|
| 776 |
+
- cosine_accuracy@5
|
| 777 |
+
- cosine_accuracy@10
|
| 778 |
+
- cosine_precision@1
|
| 779 |
+
- cosine_precision@3
|
| 780 |
+
- cosine_precision@5
|
| 781 |
+
- cosine_precision@10
|
| 782 |
+
- cosine_recall@1
|
| 783 |
+
- cosine_recall@3
|
| 784 |
+
- cosine_recall@5
|
| 785 |
+
- cosine_recall@10
|
| 786 |
+
- cosine_ndcg@10
|
| 787 |
+
- cosine_mrr@10
|
| 788 |
+
- cosine_map@100
|
| 789 |
+
model-index:
|
| 790 |
+
- name: multilingual-e5-large
|
| 791 |
+
results:
|
| 792 |
+
- task:
|
| 793 |
+
type: information-retrieval
|
| 794 |
+
name: Information Retrieval
|
| 795 |
+
dataset:
|
| 796 |
+
name: dim 1024
|
| 797 |
+
type: dim_1024
|
| 798 |
+
metrics:
|
| 799 |
+
- type: cosine_accuracy@1
|
| 800 |
+
value: 0.4046094750320102
|
| 801 |
+
name: Cosine Accuracy@1
|
| 802 |
+
- type: cosine_accuracy@3
|
| 803 |
+
value: 0.4090909090909091
|
| 804 |
+
name: Cosine Accuracy@3
|
| 805 |
+
- type: cosine_accuracy@5
|
| 806 |
+
value: 0.43918053777208704
|
| 807 |
+
name: Cosine Accuracy@5
|
| 808 |
+
- type: cosine_accuracy@10
|
| 809 |
+
value: 0.47823303457106275
|
| 810 |
+
name: Cosine Accuracy@10
|
| 811 |
+
- type: cosine_precision@1
|
| 812 |
+
value: 0.4046094750320102
|
| 813 |
+
name: Cosine Precision@1
|
| 814 |
+
- type: cosine_precision@3
|
| 815 |
+
value: 0.40311566367904395
|
| 816 |
+
name: Cosine Precision@3
|
| 817 |
+
- type: cosine_precision@5
|
| 818 |
+
value: 0.39180537772087065
|
| 819 |
+
name: Cosine Precision@5
|
| 820 |
+
- type: cosine_precision@10
|
| 821 |
+
value: 0.3565941101152369
|
| 822 |
+
name: Cosine Precision@10
|
| 823 |
+
- type: cosine_recall@1
|
| 824 |
+
value: 0.04660606778759063
|
| 825 |
+
name: Cosine Recall@1
|
| 826 |
+
- type: cosine_recall@3
|
| 827 |
+
value: 0.13592596883673455
|
| 828 |
+
name: Cosine Recall@3
|
| 829 |
+
- type: cosine_recall@5
|
| 830 |
+
value: 0.20379253880710943
|
| 831 |
+
name: Cosine Recall@5
|
| 832 |
+
- type: cosine_recall@10
|
| 833 |
+
value: 0.3014663479400921
|
| 834 |
+
name: Cosine Recall@10
|
| 835 |
+
- type: cosine_ndcg@10
|
| 836 |
+
value: 0.42913551824501384
|
| 837 |
+
name: Cosine Ndcg@10
|
| 838 |
+
- type: cosine_mrr@10
|
| 839 |
+
value: 0.4168417068064951
|
| 840 |
+
name: Cosine Mrr@10
|
| 841 |
+
- type: cosine_map@100
|
| 842 |
+
value: 0.490599623630225
|
| 843 |
+
name: Cosine Map@100
|
| 844 |
+
- task:
|
| 845 |
+
type: information-retrieval
|
| 846 |
+
name: Information Retrieval
|
| 847 |
+
dataset:
|
| 848 |
+
name: dim 768
|
| 849 |
+
type: dim_768
|
| 850 |
+
metrics:
|
| 851 |
+
- type: cosine_accuracy@1
|
| 852 |
+
value: 0.3994878361075544
|
| 853 |
+
name: Cosine Accuracy@1
|
| 854 |
+
- type: cosine_accuracy@3
|
| 855 |
+
value: 0.4046094750320102
|
| 856 |
+
name: Cosine Accuracy@3
|
| 857 |
+
- type: cosine_accuracy@5
|
| 858 |
+
value: 0.4359795134443022
|
| 859 |
+
name: Cosine Accuracy@5
|
| 860 |
+
- type: cosine_accuracy@10
|
| 861 |
+
value: 0.4737516005121639
|
| 862 |
+
name: Cosine Accuracy@10
|
| 863 |
+
- type: cosine_precision@1
|
| 864 |
+
value: 0.3994878361075544
|
| 865 |
+
name: Cosine Precision@1
|
| 866 |
+
- type: cosine_precision@3
|
| 867 |
+
value: 0.39820742637644047
|
| 868 |
+
name: Cosine Precision@3
|
| 869 |
+
- type: cosine_precision@5
|
| 870 |
+
value: 0.3868117797695263
|
| 871 |
+
name: Cosine Precision@5
|
| 872 |
+
- type: cosine_precision@10
|
| 873 |
+
value: 0.352752880921895
|
| 874 |
+
name: Cosine Precision@10
|
| 875 |
+
- type: cosine_recall@1
|
| 876 |
+
value: 0.046132270416131195
|
| 877 |
+
name: Cosine Recall@1
|
| 878 |
+
- type: cosine_recall@3
|
| 879 |
+
value: 0.13453018491697852
|
| 880 |
+
name: Cosine Recall@3
|
| 881 |
+
- type: cosine_recall@5
|
| 882 |
+
value: 0.20078864250336506
|
| 883 |
+
name: Cosine Recall@5
|
| 884 |
+
- type: cosine_recall@10
|
| 885 |
+
value: 0.29681183299989666
|
| 886 |
+
name: Cosine Recall@10
|
| 887 |
+
- type: cosine_ndcg@10
|
| 888 |
+
value: 0.4244383191680289
|
| 889 |
+
name: Cosine Ndcg@10
|
| 890 |
+
- type: cosine_mrr@10
|
| 891 |
+
value: 0.41201019246793846
|
| 892 |
+
name: Cosine Mrr@10
|
| 893 |
+
- type: cosine_map@100
|
| 894 |
+
value: 0.48680507317454147
|
| 895 |
+
name: Cosine Map@100
|
| 896 |
+
- task:
|
| 897 |
+
type: information-retrieval
|
| 898 |
+
name: Information Retrieval
|
| 899 |
+
dataset:
|
| 900 |
+
name: dim 512
|
| 901 |
+
type: dim_512
|
| 902 |
+
metrics:
|
| 903 |
+
- type: cosine_accuracy@1
|
| 904 |
+
value: 0.39884763124199746
|
| 905 |
+
name: Cosine Accuracy@1
|
| 906 |
+
- type: cosine_accuracy@3
|
| 907 |
+
value: 0.4052496798975672
|
| 908 |
+
name: Cosine Accuracy@3
|
| 909 |
+
- type: cosine_accuracy@5
|
| 910 |
+
value: 0.44558258642765686
|
| 911 |
+
name: Cosine Accuracy@5
|
| 912 |
+
- type: cosine_accuracy@10
|
| 913 |
+
value: 0.47823303457106275
|
| 914 |
+
name: Cosine Accuracy@10
|
| 915 |
+
- type: cosine_precision@1
|
| 916 |
+
value: 0.39884763124199746
|
| 917 |
+
name: Cosine Precision@1
|
| 918 |
+
- type: cosine_precision@3
|
| 919 |
+
value: 0.3975672215108835
|
| 920 |
+
name: Cosine Precision@3
|
| 921 |
+
- type: cosine_precision@5
|
| 922 |
+
value: 0.3888604353393086
|
| 923 |
+
name: Cosine Precision@5
|
| 924 |
+
- type: cosine_precision@10
|
| 925 |
+
value: 0.35793854033290645
|
| 926 |
+
name: Cosine Precision@10
|
| 927 |
+
- type: cosine_recall@1
|
| 928 |
+
value: 0.04570727180608771
|
| 929 |
+
name: Cosine Recall@1
|
| 930 |
+
- type: cosine_recall@3
|
| 931 |
+
value: 0.13329368345632836
|
| 932 |
+
name: Cosine Recall@3
|
| 933 |
+
- type: cosine_recall@5
|
| 934 |
+
value: 0.2006035854063678
|
| 935 |
+
name: Cosine Recall@5
|
| 936 |
+
- type: cosine_recall@10
|
| 937 |
+
value: 0.2993652309972795
|
| 938 |
+
name: Cosine Recall@10
|
| 939 |
+
- type: cosine_ndcg@10
|
| 940 |
+
value: 0.42824151108259556
|
| 941 |
+
name: Cosine Ndcg@10
|
| 942 |
+
- type: cosine_mrr@10
|
| 943 |
+
value: 0.41307745462675005
|
| 944 |
+
name: Cosine Mrr@10
|
| 945 |
+
- type: cosine_map@100
|
| 946 |
+
value: 0.4876319198894288
|
| 947 |
+
name: Cosine Map@100
|
| 948 |
+
- task:
|
| 949 |
+
type: information-retrieval
|
| 950 |
+
name: Information Retrieval
|
| 951 |
+
dataset:
|
| 952 |
+
name: dim 256
|
| 953 |
+
type: dim_256
|
| 954 |
+
metrics:
|
| 955 |
+
- type: cosine_accuracy@1
|
| 956 |
+
value: 0.3738796414852753
|
| 957 |
+
name: Cosine Accuracy@1
|
| 958 |
+
- type: cosine_accuracy@3
|
| 959 |
+
value: 0.37772087067861715
|
| 960 |
+
name: Cosine Accuracy@3
|
| 961 |
+
- type: cosine_accuracy@5
|
| 962 |
+
value: 0.40717029449423814
|
| 963 |
+
name: Cosine Accuracy@5
|
| 964 |
+
- type: cosine_accuracy@10
|
| 965 |
+
value: 0.44558258642765686
|
| 966 |
+
name: Cosine Accuracy@10
|
| 967 |
+
- type: cosine_precision@1
|
| 968 |
+
value: 0.3738796414852753
|
| 969 |
+
name: Cosine Precision@1
|
| 970 |
+
- type: cosine_precision@3
|
| 971 |
+
value: 0.37238583013230897
|
| 972 |
+
name: Cosine Precision@3
|
| 973 |
+
- type: cosine_precision@5
|
| 974 |
+
value: 0.3615877080665813
|
| 975 |
+
name: Cosine Precision@5
|
| 976 |
+
- type: cosine_precision@10
|
| 977 |
+
value: 0.3297695262483995
|
| 978 |
+
name: Cosine Precision@10
|
| 979 |
+
- type: cosine_recall@1
|
| 980 |
+
value: 0.043086085492826574
|
| 981 |
+
name: Cosine Recall@1
|
| 982 |
+
- type: cosine_recall@3
|
| 983 |
+
value: 0.125747799799009
|
| 984 |
+
name: Cosine Recall@3
|
| 985 |
+
- type: cosine_recall@5
|
| 986 |
+
value: 0.18837022600852496
|
| 987 |
+
name: Cosine Recall@5
|
| 988 |
+
- type: cosine_recall@10
|
| 989 |
+
value: 0.2792649180924836
|
| 990 |
+
name: Cosine Recall@10
|
| 991 |
+
- type: cosine_ndcg@10
|
| 992 |
+
value: 0.3980442434686935
|
| 993 |
+
name: Cosine Ndcg@10
|
| 994 |
+
- type: cosine_mrr@10
|
| 995 |
+
value: 0.38572571794402755
|
| 996 |
+
name: Cosine Mrr@10
|
| 997 |
+
- type: cosine_map@100
|
| 998 |
+
value: 0.45855798848430374
|
| 999 |
+
name: Cosine Map@100
|
| 1000 |
+
- task:
|
| 1001 |
+
type: information-retrieval
|
| 1002 |
+
name: Information Retrieval
|
| 1003 |
+
dataset:
|
| 1004 |
+
name: dim 128
|
| 1005 |
+
type: dim_128
|
| 1006 |
+
metrics:
|
| 1007 |
+
- type: cosine_accuracy@1
|
| 1008 |
+
value: 0.34314980793854033
|
| 1009 |
+
name: Cosine Accuracy@1
|
| 1010 |
+
- type: cosine_accuracy@3
|
| 1011 |
+
value: 0.34763124199743917
|
| 1012 |
+
name: Cosine Accuracy@3
|
| 1013 |
+
- type: cosine_accuracy@5
|
| 1014 |
+
value: 0.37708066581306016
|
| 1015 |
+
name: Cosine Accuracy@5
|
| 1016 |
+
- type: cosine_accuracy@10
|
| 1017 |
+
value: 0.4148527528809219
|
| 1018 |
+
name: Cosine Accuracy@10
|
| 1019 |
+
- type: cosine_precision@1
|
| 1020 |
+
value: 0.34314980793854033
|
| 1021 |
+
name: Cosine Precision@1
|
| 1022 |
+
- type: cosine_precision@3
|
| 1023 |
+
value: 0.3418693982074264
|
| 1024 |
+
name: Cosine Precision@3
|
| 1025 |
+
- type: cosine_precision@5
|
| 1026 |
+
value: 0.3322663252240717
|
| 1027 |
+
name: Cosine Precision@5
|
| 1028 |
+
- type: cosine_precision@10
|
| 1029 |
+
value: 0.302752880921895
|
| 1030 |
+
name: Cosine Precision@10
|
| 1031 |
+
- type: cosine_recall@1
|
| 1032 |
+
value: 0.040652627677675406
|
| 1033 |
+
name: Cosine Recall@1
|
| 1034 |
+
- type: cosine_recall@3
|
| 1035 |
+
value: 0.1184519992454523
|
| 1036 |
+
name: Cosine Recall@3
|
| 1037 |
+
- type: cosine_recall@5
|
| 1038 |
+
value: 0.1774839552040709
|
| 1039 |
+
name: Cosine Recall@5
|
| 1040 |
+
- type: cosine_recall@10
|
| 1041 |
+
value: 0.26330336421247125
|
| 1042 |
+
name: Cosine Recall@10
|
| 1043 |
+
- type: cosine_ndcg@10
|
| 1044 |
+
value: 0.36765573601526275
|
| 1045 |
+
name: Cosine Ndcg@10
|
| 1046 |
+
- type: cosine_mrr@10
|
| 1047 |
+
value: 0.35513180090644836
|
| 1048 |
+
name: Cosine Mrr@10
|
| 1049 |
+
- type: cosine_map@100
|
| 1050 |
+
value: 0.4276696379169563
|
| 1051 |
+
name: Cosine Map@100
|
| 1052 |
+
- task:
|
| 1053 |
+
type: information-retrieval
|
| 1054 |
+
name: Information Retrieval
|
| 1055 |
+
dataset:
|
| 1056 |
+
name: dim 64
|
| 1057 |
+
type: dim_64
|
| 1058 |
+
metrics:
|
| 1059 |
+
- type: cosine_accuracy@1
|
| 1060 |
+
value: 0.3079385403329065
|
| 1061 |
+
name: Cosine Accuracy@1
|
| 1062 |
+
- type: cosine_accuracy@3
|
| 1063 |
+
value: 0.31241997439180536
|
| 1064 |
+
name: Cosine Accuracy@3
|
| 1065 |
+
- type: cosine_accuracy@5
|
| 1066 |
+
value: 0.33290653008962867
|
| 1067 |
+
name: Cosine Accuracy@5
|
| 1068 |
+
- type: cosine_accuracy@10
|
| 1069 |
+
value: 0.36555697823303457
|
| 1070 |
+
name: Cosine Accuracy@10
|
| 1071 |
+
- type: cosine_precision@1
|
| 1072 |
+
value: 0.3079385403329065
|
| 1073 |
+
name: Cosine Precision@1
|
| 1074 |
+
- type: cosine_precision@3
|
| 1075 |
+
value: 0.3070849338454972
|
| 1076 |
+
name: Cosine Precision@3
|
| 1077 |
+
- type: cosine_precision@5
|
| 1078 |
+
value: 0.29820742637644043
|
| 1079 |
+
name: Cosine Precision@5
|
| 1080 |
+
- type: cosine_precision@10
|
| 1081 |
+
value: 0.27215108834827145
|
| 1082 |
+
name: Cosine Precision@10
|
| 1083 |
+
- type: cosine_recall@1
|
| 1084 |
+
value: 0.03504677697523653
|
| 1085 |
+
name: Cosine Recall@1
|
| 1086 |
+
- type: cosine_recall@3
|
| 1087 |
+
value: 0.10211269541567973
|
| 1088 |
+
name: Cosine Recall@3
|
| 1089 |
+
- type: cosine_recall@5
|
| 1090 |
+
value: 0.15297976910096123
|
| 1091 |
+
name: Cosine Recall@5
|
| 1092 |
+
- type: cosine_recall@10
|
| 1093 |
+
value: 0.23026653514933906
|
| 1094 |
+
name: Cosine Recall@10
|
| 1095 |
+
- type: cosine_ndcg@10
|
| 1096 |
+
value: 0.3275369456141822
|
| 1097 |
+
name: Cosine Ndcg@10
|
| 1098 |
+
- type: cosine_mrr@10
|
| 1099 |
+
value: 0.31748394406845065
|
| 1100 |
+
name: Cosine Mrr@10
|
| 1101 |
+
- type: cosine_map@100
|
| 1102 |
+
value: 0.38184314430829974
|
| 1103 |
+
name: Cosine Map@100
|
| 1104 |
+
---
|
| 1105 |
+
|
| 1106 |
+
# multilingual-e5-large
|
| 1107 |
+
|
| 1108 |
+
This is a [sentence-transformers](https://www.SBERT.net) model finetuned from [intfloat/multilingual-e5-large](https://huggingface.co/intfloat/multilingual-e5-large). It maps sentences & paragraphs to a 1024-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
|
| 1109 |
+
|
| 1110 |
+
## Model Details
|
| 1111 |
+
|
| 1112 |
+
### Model Description
|
| 1113 |
+
- **Model Type:** Sentence Transformer
|
| 1114 |
+
- **Base model:** [intfloat/multilingual-e5-large](https://huggingface.co/intfloat/multilingual-e5-large) <!-- at revision 0dc5580a448e4284468b8909bae50fa925907bc5 -->
|
| 1115 |
+
- **Maximum Sequence Length:** 512 tokens
|
| 1116 |
+
- **Output Dimensionality:** 1024 dimensions
|
| 1117 |
+
- **Similarity Function:** Cosine Similarity
|
| 1118 |
+
<!-- - **Training Dataset:** Unknown -->
|
| 1119 |
+
- **Language:** en
|
| 1120 |
+
- **License:** apache-2.0
|
| 1121 |
+
|
| 1122 |
+
### Model Sources
|
| 1123 |
+
|
| 1124 |
+
- **Documentation:** [Sentence Transformers Documentation](https://sbert.net)
|
| 1125 |
+
- **Repository:** [Sentence Transformers on GitHub](https://github.com/UKPLab/sentence-transformers)
|
| 1126 |
+
- **Hugging Face:** [Sentence Transformers on Hugging Face](https://huggingface.co/models?library=sentence-transformers)
|
| 1127 |
+
|
| 1128 |
+
### Full Model Architecture
|
| 1129 |
+
|
| 1130 |
+
```
|
| 1131 |
+
SentenceTransformer(
|
| 1132 |
+
(0): Transformer({'max_seq_length': 512, 'do_lower_case': False, 'architecture': 'XLMRobertaModel'})
|
| 1133 |
+
(1): Pooling({'word_embedding_dimension': 1024, 'pooling_mode_cls_token': False, 'pooling_mode_mean_tokens': True, 'pooling_mode_max_tokens': False, 'pooling_mode_mean_sqrt_len_tokens': False, 'pooling_mode_weightedmean_tokens': False, 'pooling_mode_lasttoken': False, 'include_prompt': True})
|
| 1134 |
+
(2): Normalize()
|
| 1135 |
+
)
|
| 1136 |
+
```
|
| 1137 |
+
|
| 1138 |
+
## Usage
|
| 1139 |
+
|
| 1140 |
+
### Direct Usage (Sentence Transformers)
|
| 1141 |
+
|
| 1142 |
+
First install the Sentence Transformers library:
|
| 1143 |
+
|
| 1144 |
+
```bash
|
| 1145 |
+
pip install -U sentence-transformers
|
| 1146 |
+
```
|
| 1147 |
+
|
| 1148 |
+
Then you can load this model and run inference.
|
| 1149 |
+
```python
|
| 1150 |
+
from sentence_transformers import SentenceTransformer
|
| 1151 |
+
|
| 1152 |
+
# Download from the 🤗 Hub
|
| 1153 |
+
model = SentenceTransformer("sentence_transformers_model_id")
|
| 1154 |
+
# Run inference
|
| 1155 |
+
sentences = [
|
| 1156 |
+
'Who must facilitate the exercise of data subject rights?',
|
| 1157 |
+
'1.The controller shall take appropriate measures to provide any information referred to in Articles 13 and 14 and any communication under Articles 15 to 22 and 34 relating to processing to the data subject in a concise, transparent, intelligible and easily accessible form, using clear and plain language, in particular for any information addressed specifically to a child. The information shall be provided in writing, or by other means, including, where appropriate, by electronic means. When requested by the data subject, the information may be provided orally, provided that the identity of the data subject is proven by other means. 4.5.2016 L 119/39 \n2.The controller shall facilitate the exercise of data subject rights under Articles 15 to 22. In the cases referred to in Article 11(2), the controller shall not refuse to act on the request of the data subject for exercising his or her rights under Articles 15 to 22, unless the controller demonstrates that it is not in a position to identify the data subject.\n3.The controller shall provide information on action taken on a request under Articles 15 to 22 to the data subject without undue delay and in any event within one month of receipt of the request. That period may be extended by two further months where necessary, taking into account the complexity and number of the requests. The controller shall inform the data subject of any such extension within one month of receipt of the request, together with the reasons for the delay. 
Where the data subject makes the request by electronic form means, the information shall be provided by electronic means where possible, unless otherwise requested by the data subject.\n4.If the controller does not take action on the request of the data subject, the controller shall inform the data subject without delay and at the latest within one month of receipt of the request of the reasons for not taking action and on the possibility of lodging a complaint with a supervisory authority and seeking a judicial remedy.\n5.Information provided under Articles 13 and 14 and any communication and any actions taken under Articles 15 to 22 and 34 shall be provided free of charge. Where requests from a data subject are manifestly unfounded or excessive, in particular because of their repetitive character, the controller may either: (a) charge a reasonable fee taking into account the administrative costs of providing the information or communication or taking the action requested; or (b) refuse to act on the request. The controller shall bear the burden of demonstrating the manifestly unfounded or excessive character of the request.\n6.Without prejudice to Article 11, where the controller has reasonable doubts concerning the identity of the natural person making the request referred to in Articles 15 to 21, the controller may request the provision of additional information necessary to confirm the identity of the data subject.\n7.The information to be provided to data subjects pursuant to Articles 13 and 14 may be provided in combination with standardised icons in order to give in an easily visible, intelligible and clearly legible manner a meaningful overview of the intended processing. 
Where the icons are presented electronically they shall be machine-readable.\n8.The Commission shall be empowered to adopt delegated acts in accordance with Article 92 for the purpose of determining the information to be presented by the icons and the procedures for providing standardised icons. Section 2 Information and access to personal data',
|
| 1158 |
+
'Regulation (EC) No 45/2001 of the European Parliament and of the Council (2) applies to the processing of personal data by the Union institutions, bodies, offices and agencies. Regulation (EC) No 45/2001 and other Union legal acts applicable to such processing of personal data should be adapted to the principles and rules established in this Regulation and applied in the light of this Regulation. In order to provide a strong and coherent data protection framework in the Union, the necessary adaptations of Regulation (EC) No 45/2001 should follow after the adoption of this Regulation, in order to allow application at the same time as this Regulation.',
|
| 1159 |
+
]
|
| 1160 |
+
embeddings = model.encode(sentences)
|
| 1161 |
+
print(embeddings.shape)
|
| 1162 |
+
# [3, 1024]
|
| 1163 |
+
|
| 1164 |
+
# Get the similarity scores for the embeddings
|
| 1165 |
+
similarities = model.similarity(embeddings, embeddings)
|
| 1166 |
+
print(similarities)
|
| 1167 |
+
# tensor([[1.0000, 0.6418, 0.3512],
|
| 1168 |
+
# [0.6418, 1.0000, 0.3027],
|
| 1169 |
+
# [0.3512, 0.3027, 1.0000]])
|
| 1170 |
+
```
|
| 1171 |
+
|
| 1172 |
+
<!--
|
| 1173 |
+
### Direct Usage (Transformers)
|
| 1174 |
+
|
| 1175 |
+
<details><summary>Click to see the direct usage in Transformers</summary>
|
| 1176 |
+
|
| 1177 |
+
</details>
|
| 1178 |
+
-->
|
| 1179 |
+
|
| 1180 |
+
<!--
|
| 1181 |
+
### Downstream Usage (Sentence Transformers)
|
| 1182 |
+
|
| 1183 |
+
You can finetune this model on your own dataset.
|
| 1184 |
+
|
| 1185 |
+
<details><summary>Click to expand</summary>
|
| 1186 |
+
|
| 1187 |
+
</details>
|
| 1188 |
+
-->
|
| 1189 |
+
|
| 1190 |
+
<!--
|
| 1191 |
+
### Out-of-Scope Use
|
| 1192 |
+
|
| 1193 |
+
*List how the model may foreseeably be misused and address what users ought not to do with the model.*
|
| 1194 |
+
-->
|
| 1195 |
+
|
| 1196 |
+
## Evaluation
|
| 1197 |
+
|
| 1198 |
+
### Metrics
|
| 1199 |
+
|
| 1200 |
+
#### Information Retrieval
|
| 1201 |
+
|
| 1202 |
+
* Dataset: `dim_1024`
|
| 1203 |
+
* Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
|
| 1204 |
+
```json
|
| 1205 |
+
{
|
| 1206 |
+
"truncate_dim": 1024
|
| 1207 |
+
}
|
| 1208 |
+
```
|
| 1209 |
+
|
| 1210 |
+
| Metric | Value |
|
| 1211 |
+
|:--------------------|:-----------|
|
| 1212 |
+
| cosine_accuracy@1 | 0.4046 |
|
| 1213 |
+
| cosine_accuracy@3 | 0.4091 |
|
| 1214 |
+
| cosine_accuracy@5 | 0.4392 |
|
| 1215 |
+
| cosine_accuracy@10 | 0.4782 |
|
| 1216 |
+
| cosine_precision@1 | 0.4046 |
|
| 1217 |
+
| cosine_precision@3 | 0.4031 |
|
| 1218 |
+
| cosine_precision@5 | 0.3918 |
|
| 1219 |
+
| cosine_precision@10 | 0.3566 |
|
| 1220 |
+
| cosine_recall@1 | 0.0466 |
|
| 1221 |
+
| cosine_recall@3 | 0.1359 |
|
| 1222 |
+
| cosine_recall@5 | 0.2038 |
|
| 1223 |
+
| cosine_recall@10 | 0.3015 |
|
| 1224 |
+
| **cosine_ndcg@10** | **0.4291** |
|
| 1225 |
+
| cosine_mrr@10 | 0.4168 |
|
| 1226 |
+
| cosine_map@100 | 0.4906 |
|
| 1227 |
+
|
| 1228 |
+
#### Information Retrieval
|
| 1229 |
+
|
| 1230 |
+
* Dataset: `dim_768`
|
| 1231 |
+
* Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
|
| 1232 |
+
```json
|
| 1233 |
+
{
|
| 1234 |
+
"truncate_dim": 768
|
| 1235 |
+
}
|
| 1236 |
+
```
|
| 1237 |
+
|
| 1238 |
+
| Metric | Value |
|
| 1239 |
+
|:--------------------|:-----------|
|
| 1240 |
+
| cosine_accuracy@1 | 0.3995 |
|
| 1241 |
+
| cosine_accuracy@3 | 0.4046 |
|
| 1242 |
+
| cosine_accuracy@5 | 0.436 |
|
| 1243 |
+
| cosine_accuracy@10 | 0.4738 |
|
| 1244 |
+
| cosine_precision@1 | 0.3995 |
|
| 1245 |
+
| cosine_precision@3 | 0.3982 |
|
| 1246 |
+
| cosine_precision@5 | 0.3868 |
|
| 1247 |
+
| cosine_precision@10 | 0.3528 |
|
| 1248 |
+
| cosine_recall@1 | 0.0461 |
|
| 1249 |
+
| cosine_recall@3 | 0.1345 |
|
| 1250 |
+
| cosine_recall@5 | 0.2008 |
|
| 1251 |
+
| cosine_recall@10 | 0.2968 |
|
| 1252 |
+
| **cosine_ndcg@10** | **0.4244** |
|
| 1253 |
+
| cosine_mrr@10 | 0.412 |
|
| 1254 |
+
| cosine_map@100 | 0.4868 |
|
| 1255 |
+
|
| 1256 |
+
#### Information Retrieval
|
| 1257 |
+
|
| 1258 |
+
* Dataset: `dim_512`
|
| 1259 |
+
* Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
|
| 1260 |
+
```json
|
| 1261 |
+
{
|
| 1262 |
+
"truncate_dim": 512
|
| 1263 |
+
}
|
| 1264 |
+
```
|
| 1265 |
+
|
| 1266 |
+
| Metric | Value |
|
| 1267 |
+
|:--------------------|:-----------|
|
| 1268 |
+
| cosine_accuracy@1 | 0.3988 |
|
| 1269 |
+
| cosine_accuracy@3 | 0.4052 |
|
| 1270 |
+
| cosine_accuracy@5 | 0.4456 |
|
| 1271 |
+
| cosine_accuracy@10 | 0.4782 |
|
| 1272 |
+
| cosine_precision@1 | 0.3988 |
|
| 1273 |
+
| cosine_precision@3 | 0.3976 |
|
| 1274 |
+
| cosine_precision@5 | 0.3889 |
|
| 1275 |
+
| cosine_precision@10 | 0.3579 |
|
| 1276 |
+
| cosine_recall@1 | 0.0457 |
|
| 1277 |
+
| cosine_recall@3 | 0.1333 |
|
| 1278 |
+
| cosine_recall@5 | 0.2006 |
|
| 1279 |
+
| cosine_recall@10 | 0.2994 |
|
| 1280 |
+
| **cosine_ndcg@10** | **0.4282** |
|
| 1281 |
+
| cosine_mrr@10 | 0.4131 |
|
| 1282 |
+
| cosine_map@100 | 0.4876 |
|
| 1283 |
+
|
| 1284 |
+
#### Information Retrieval
|
| 1285 |
+
|
| 1286 |
+
* Dataset: `dim_256`
|
| 1287 |
+
* Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
|
| 1288 |
+
```json
|
| 1289 |
+
{
|
| 1290 |
+
"truncate_dim": 256
|
| 1291 |
+
}
|
| 1292 |
+
```
|
| 1293 |
+
|
| 1294 |
+
| Metric | Value |
|
| 1295 |
+
|:--------------------|:----------|
|
| 1296 |
+
| cosine_accuracy@1 | 0.3739 |
|
| 1297 |
+
| cosine_accuracy@3 | 0.3777 |
|
| 1298 |
+
| cosine_accuracy@5 | 0.4072 |
|
| 1299 |
+
| cosine_accuracy@10 | 0.4456 |
|
| 1300 |
+
| cosine_precision@1 | 0.3739 |
|
| 1301 |
+
| cosine_precision@3 | 0.3724 |
|
| 1302 |
+
| cosine_precision@5 | 0.3616 |
|
| 1303 |
+
| cosine_precision@10 | 0.3298 |
|
| 1304 |
+
| cosine_recall@1 | 0.0431 |
|
| 1305 |
+
| cosine_recall@3 | 0.1257 |
|
| 1306 |
+
| cosine_recall@5 | 0.1884 |
|
| 1307 |
+
| cosine_recall@10 | 0.2793 |
|
| 1308 |
+
| **cosine_ndcg@10** | **0.398** |
|
| 1309 |
+
| cosine_mrr@10 | 0.3857 |
|
| 1310 |
+
| cosine_map@100 | 0.4586 |
|
| 1311 |
+
|
| 1312 |
+
#### Information Retrieval
|
| 1313 |
+
|
| 1314 |
+
* Dataset: `dim_128`
|
| 1315 |
+
* Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
|
| 1316 |
+
```json
|
| 1317 |
+
{
|
| 1318 |
+
"truncate_dim": 128
|
| 1319 |
+
}
|
| 1320 |
+
```
|
| 1321 |
+
|
| 1322 |
+
| Metric | Value |
|
| 1323 |
+
|:--------------------|:-----------|
|
| 1324 |
+
| cosine_accuracy@1 | 0.3431 |
|
| 1325 |
+
| cosine_accuracy@3 | 0.3476 |
|
| 1326 |
+
| cosine_accuracy@5 | 0.3771 |
|
| 1327 |
+
| cosine_accuracy@10 | 0.4149 |
|
| 1328 |
+
| cosine_precision@1 | 0.3431 |
|
| 1329 |
+
| cosine_precision@3 | 0.3419 |
|
| 1330 |
+
| cosine_precision@5 | 0.3323 |
|
| 1331 |
+
| cosine_precision@10 | 0.3028 |
|
| 1332 |
+
| cosine_recall@1 | 0.0407 |
|
| 1333 |
+
| cosine_recall@3 | 0.1185 |
|
| 1334 |
+
| cosine_recall@5 | 0.1775 |
|
| 1335 |
+
| cosine_recall@10 | 0.2633 |
|
| 1336 |
+
| **cosine_ndcg@10** | **0.3677** |
|
| 1337 |
+
| cosine_mrr@10 | 0.3551 |
|
| 1338 |
+
| cosine_map@100 | 0.4277 |
|
| 1339 |
+
|
| 1340 |
+
#### Information Retrieval
|
| 1341 |
+
|
| 1342 |
+
* Dataset: `dim_64`
|
| 1343 |
+
* Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
|
| 1344 |
+
```json
|
| 1345 |
+
{
|
| 1346 |
+
"truncate_dim": 64
|
| 1347 |
+
}
|
| 1348 |
+
```
|
| 1349 |
+
|
| 1350 |
+
| Metric | Value |
|
| 1351 |
+
|:--------------------|:-----------|
|
| 1352 |
+
| cosine_accuracy@1 | 0.3079 |
|
| 1353 |
+
| cosine_accuracy@3 | 0.3124 |
|
| 1354 |
+
| cosine_accuracy@5 | 0.3329 |
|
| 1355 |
+
| cosine_accuracy@10 | 0.3656 |
|
| 1356 |
+
| cosine_precision@1 | 0.3079 |
|
| 1357 |
+
| cosine_precision@3 | 0.3071 |
|
| 1358 |
+
| cosine_precision@5 | 0.2982 |
|
| 1359 |
+
| cosine_precision@10 | 0.2722 |
|
| 1360 |
+
| cosine_recall@1 | 0.035 |
|
| 1361 |
+
| cosine_recall@3 | 0.1021 |
|
| 1362 |
+
| cosine_recall@5 | 0.153 |
|
| 1363 |
+
| cosine_recall@10 | 0.2303 |
|
| 1364 |
+
| **cosine_ndcg@10** | **0.3275** |
|
| 1365 |
+
| cosine_mrr@10 | 0.3175 |
|
| 1366 |
+
| cosine_map@100 | 0.3818 |
|
| 1367 |
+
|
| 1368 |
+
<!--
|
| 1369 |
+
## Bias, Risks and Limitations
|
| 1370 |
+
|
| 1371 |
+
*What are the known or foreseeable issues stemming from this model? You could also flag here known failure cases or weaknesses of the model.*
|
| 1372 |
+
-->
|
| 1373 |
+
|
| 1374 |
+
<!--
|
| 1375 |
+
### Recommendations
|
| 1376 |
+
|
| 1377 |
+
*What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
|
| 1378 |
+
-->
|
| 1379 |
+
|
| 1380 |
+
## Training Details
|
| 1381 |
+
|
| 1382 |
+
### Training Dataset
|
| 1383 |
+
|
| 1384 |
+
#### Unnamed Dataset
|
| 1385 |
+
|
| 1386 |
+
* Size: 391 training samples
|
| 1387 |
+
* Columns: <code>anchor</code> and <code>positive</code>
|
| 1388 |
+
* Approximate statistics based on the first 391 samples:
|
| 1389 |
+
| | anchor | positive |
|
| 1390 |
+
|:--------|:----------------------------------------------------------------------------------|:-------------------------------------------------------------------------------------|
|
| 1391 |
+
| type | string | string |
|
| 1392 |
+
| details | <ul><li>min: 8 tokens</li><li>mean: 17.16 tokens</li><li>max: 32 tokens</li></ul> | <ul><li>min: 27 tokens</li><li>mean: 377.93 tokens</li><li>max: 512 tokens</li></ul> |
|
| 1393 |
+
* Samples:
|
| 1394 |
+
| anchor | positive |
|
| 1395 |
+
|:-------------------------------------------------------------------------------------------------------------------------------|:---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|
|
| 1396 |
+
| <code>What measures must be taken according to Article 32?</code> | <code>1.Where processing is to be carried out on behalf of a controller, the controller shall use only processors providing sufficient guarantees to implement appropriate technical and organisational measures in such a manner that processing will meet the requirements of this Regulation and ensure the protection of the rights of the data subject.<br>2.The processor shall not engage another processor without prior specific or general written authorisation of the controller. In the case of general written authorisation, the processor shall inform the controller of any intended changes concerning the addition or replacement of other processors, thereby giving the controller the opportunity to object to such changes.<br>3.Processing by a processor shall be governed by a contract or other legal act under Union or Member State law, that is binding on the processor with regard to the controller and that sets out the subject-matter and duration of the processing, the nature and purpose of the processing, ...</code> |
|
| 1397 |
+
| <code>What is the responsibility of assisting and advising the data subjects in exercising their rights?</code> | <code>1.A transfer of personal data to a third country or an international organisation may take place where the Commission has decided that the third country, a territory or one or more specified sectors within that third country, or the international organisation in question ensures an adequate level of protection. Such a transfer shall not require any specific authorisation.<br>2.When assessing the adequacy of the level of protection, the Commission shall, in particular, take account of the following elements: (a) the rule of law, respect for human rights and fundamental freedoms, relevant legislation, both general and sectoral, including concerning public security, defence, national security and criminal law and the access of public authorities to personal data, as well as the implementation of such legislation, data protection rules, professional rules and security measures, including rules for the onward transfer of personal data to another third country or international organisation whi...</code> |
|
| 1398 |
+
| <code>What should Member States be authorized to provide for regarding personal data processing for archiving purposes?</code> | <code>Where personal data are processed for archiving purposes, this Regulation should also apply to that processing, bearing in mind that this Regulation should not apply to deceased persons. Public authorities or public or private bodies that hold records of public interest should be services which, pursuant to Union or Member State law, have a legal obligation to acquire, preserve, appraise, arrange, describe, communicate, promote, disseminate and provide access to records of enduring value for general public interest. Member States should also be authorised to provide for the further processing of personal data for archiving purposes, for example with a view to providing specific information related to the political behaviour under former totalitarian state regimes, genocide, crimes against humanity, in particular the Holocaust, or war crimes. 4.5.2016 L 119/29 Official Journal of the European Union EN</code> |
|
| 1399 |
+
* Loss: [<code>MatryoshkaLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#matryoshkaloss) with these parameters:
|
| 1400 |
+
```json
|
| 1401 |
+
{
|
| 1402 |
+
"loss": "MultipleNegativesRankingLoss",
|
| 1403 |
+
"matryoshka_dims": [
|
| 1404 |
+
1024,
|
| 1405 |
+
768,
|
| 1406 |
+
512,
|
| 1407 |
+
256,
|
| 1408 |
+
128,
|
| 1409 |
+
64
|
| 1410 |
+
],
|
| 1411 |
+
"matryoshka_weights": [
|
| 1412 |
+
1,
|
| 1413 |
+
1,
|
| 1414 |
+
1,
|
| 1415 |
+
1,
|
| 1416 |
+
1,
|
| 1417 |
+
1
|
| 1418 |
+
],
|
| 1419 |
+
"n_dims_per_step": -1
|
| 1420 |
+
}
|
| 1421 |
+
```
|
| 1422 |
+
|
| 1423 |
+
### Training Hyperparameters
|
| 1424 |
+
#### Non-Default Hyperparameters
|
| 1425 |
+
|
| 1426 |
+
- `eval_strategy`: epoch
|
| 1427 |
+
- `per_device_eval_batch_size`: 16
|
| 1428 |
+
- `gradient_accumulation_steps`: 4
|
| 1429 |
+
- `learning_rate`: 2e-05
|
| 1430 |
+
- `num_train_epochs`: 20
|
| 1431 |
+
- `lr_scheduler_type`: cosine
|
| 1432 |
+
- `warmup_ratio`: 0.1
|
| 1433 |
+
- `bf16`: True
|
| 1434 |
+
- `load_best_model_at_end`: True
|
| 1435 |
+
- `optim`: adamw_torch_fused
|
| 1436 |
+
- `batch_sampler`: no_duplicates
|
| 1437 |
+
|
| 1438 |
+
#### All Hyperparameters
|
| 1439 |
+
<details><summary>Click to expand</summary>
|
| 1440 |
+
|
| 1441 |
+
- `overwrite_output_dir`: False
|
| 1442 |
+
- `do_predict`: False
|
| 1443 |
+
- `eval_strategy`: epoch
|
| 1444 |
+
- `prediction_loss_only`: True
|
| 1445 |
+
- `per_device_train_batch_size`: 8
|
| 1446 |
+
- `per_device_eval_batch_size`: 16
|
| 1447 |
+
- `per_gpu_train_batch_size`: None
|
| 1448 |
+
- `per_gpu_eval_batch_size`: None
|
| 1449 |
+
- `gradient_accumulation_steps`: 4
|
| 1450 |
+
- `eval_accumulation_steps`: None
|
| 1451 |
+
- `torch_empty_cache_steps`: None
|
| 1452 |
+
- `learning_rate`: 2e-05
|
| 1453 |
+
- `weight_decay`: 0.0
|
| 1454 |
+
- `adam_beta1`: 0.9
|
| 1455 |
+
- `adam_beta2`: 0.999
|
| 1456 |
+
- `adam_epsilon`: 1e-08
|
| 1457 |
+
- `max_grad_norm`: 1.0
|
| 1458 |
+
- `num_train_epochs`: 20
|
| 1459 |
+
- `max_steps`: -1
|
| 1460 |
+
- `lr_scheduler_type`: cosine
|
| 1461 |
+
- `lr_scheduler_kwargs`: {}
|
| 1462 |
+
- `warmup_ratio`: 0.1
|
| 1463 |
+
- `warmup_steps`: 0
|
| 1464 |
+
- `log_level`: passive
|
| 1465 |
+
- `log_level_replica`: warning
|
| 1466 |
+
- `log_on_each_node`: True
|
| 1467 |
+
- `logging_nan_inf_filter`: True
|
| 1468 |
+
- `save_safetensors`: True
|
| 1469 |
+
- `save_on_each_node`: False
|
| 1470 |
+
- `save_only_model`: False
|
| 1471 |
+
- `restore_callback_states_from_checkpoint`: False
|
| 1472 |
+
- `no_cuda`: False
|
| 1473 |
+
- `use_cpu`: False
|
| 1474 |
+
- `use_mps_device`: False
|
| 1475 |
+
- `seed`: 42
|
| 1476 |
+
- `data_seed`: None
|
| 1477 |
+
- `jit_mode_eval`: False
|
| 1478 |
+
- `use_ipex`: False
|
| 1479 |
+
- `bf16`: True
|
| 1480 |
+
- `fp16`: False
|
| 1481 |
+
- `fp16_opt_level`: O1
|
| 1482 |
+
- `half_precision_backend`: auto
|
| 1483 |
+
- `bf16_full_eval`: False
|
| 1484 |
+
- `fp16_full_eval`: False
|
| 1485 |
+
- `tf32`: None
|
| 1486 |
+
- `local_rank`: 0
|
| 1487 |
+
- `ddp_backend`: None
|
| 1488 |
+
- `tpu_num_cores`: None
|
| 1489 |
+
- `tpu_metrics_debug`: False
|
| 1490 |
+
- `debug`: []
|
| 1491 |
+
- `dataloader_drop_last`: False
|
| 1492 |
+
- `dataloader_num_workers`: 0
|
| 1493 |
+
- `dataloader_prefetch_factor`: None
|
| 1494 |
+
- `past_index`: -1
|
| 1495 |
+
- `disable_tqdm`: False
|
| 1496 |
+
- `remove_unused_columns`: True
|
| 1497 |
+
- `label_names`: None
|
| 1498 |
+
- `load_best_model_at_end`: True
|
| 1499 |
+
- `ignore_data_skip`: False
|
| 1500 |
+
- `fsdp`: []
|
| 1501 |
+
- `fsdp_min_num_params`: 0
|
| 1502 |
+
- `fsdp_config`: {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}
|
| 1503 |
+
- `tp_size`: 0
|
| 1504 |
+
- `fsdp_transformer_layer_cls_to_wrap`: None
|
| 1505 |
+
- `accelerator_config`: {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}
|
| 1506 |
+
- `deepspeed`: None
|
| 1507 |
+
- `label_smoothing_factor`: 0.0
|
| 1508 |
+
- `optim`: adamw_torch_fused
|
| 1509 |
+
- `optim_args`: None
|
| 1510 |
+
- `adafactor`: False
|
| 1511 |
+
- `group_by_length`: False
|
| 1512 |
+
- `length_column_name`: length
|
| 1513 |
+
- `ddp_find_unused_parameters`: None
|
| 1514 |
+
- `ddp_bucket_cap_mb`: None
|
| 1515 |
+
- `ddp_broadcast_buffers`: False
|
| 1516 |
+
- `dataloader_pin_memory`: True
|
| 1517 |
+
- `dataloader_persistent_workers`: False
|
| 1518 |
+
- `skip_memory_metrics`: True
|
| 1519 |
+
- `use_legacy_prediction_loop`: False
|
| 1520 |
+
- `push_to_hub`: False
|
| 1521 |
+
- `resume_from_checkpoint`: None
|
| 1522 |
+
- `hub_model_id`: None
|
| 1523 |
+
- `hub_strategy`: every_save
|
| 1524 |
+
- `hub_private_repo`: None
|
| 1525 |
+
- `hub_always_push`: False
|
| 1526 |
+
- `gradient_checkpointing`: False
|
| 1527 |
+
- `gradient_checkpointing_kwargs`: None
|
| 1528 |
+
- `include_inputs_for_metrics`: False
|
| 1529 |
+
- `include_for_metrics`: []
|
| 1530 |
+
- `eval_do_concat_batches`: True
|
| 1531 |
+
- `fp16_backend`: auto
|
| 1532 |
+
- `push_to_hub_model_id`: None
|
| 1533 |
+
- `push_to_hub_organization`: None
|
| 1534 |
+
- `mp_parameters`:
|
| 1535 |
+
- `auto_find_batch_size`: False
|
| 1536 |
+
- `full_determinism`: False
|
| 1537 |
+
- `torchdynamo`: None
|
| 1538 |
+
- `ray_scope`: last
|
| 1539 |
+
- `ddp_timeout`: 1800
|
| 1540 |
+
- `torch_compile`: False
|
| 1541 |
+
- `torch_compile_backend`: None
|
| 1542 |
+
- `torch_compile_mode`: None
|
| 1543 |
+
- `include_tokens_per_second`: False
|
| 1544 |
+
- `include_num_input_tokens_seen`: False
|
| 1545 |
+
- `neftune_noise_alpha`: None
|
| 1546 |
+
- `optim_target_modules`: None
|
| 1547 |
+
- `batch_eval_metrics`: False
|
| 1548 |
+
- `eval_on_start`: False
|
| 1549 |
+
- `use_liger_kernel`: False
|
| 1550 |
+
- `eval_use_gather_object`: False
|
| 1551 |
+
- `average_tokens_across_devices`: False
|
| 1552 |
+
- `prompts`: None
|
| 1553 |
+
- `batch_sampler`: no_duplicates
|
| 1554 |
+
- `multi_dataset_batch_sampler`: proportional
|
| 1555 |
+
- `router_mapping`: {}
|
| 1556 |
+
- `learning_rate_mapping`: {}
|
| 1557 |
+
|
| 1558 |
+
</details>
|
| 1559 |
+
|
| 1560 |
+
### Training Logs
|
| 1561 |
+
| Epoch | Step | Training Loss | dim_1024_cosine_ndcg@10 | dim_768_cosine_ndcg@10 | dim_512_cosine_ndcg@10 | dim_256_cosine_ndcg@10 | dim_128_cosine_ndcg@10 | dim_64_cosine_ndcg@10 |
|
| 1562 |
+
|:------:|:----:|:-------------:|:-----------------------:|:----------------------:|:----------------------:|:----------------------:|:----------------------:|:---------------------:|
|
| 1563 |
+
| 0.8163 | 10 | 31.5155 | - | - | - | - | - | - |
|
| 1564 |
+
| 1.0 | 13 | - | 0.4494 | 0.4446 | 0.4364 | 0.3947 | 0.3362 | 0.2621 |
|
| 1565 |
+
| 1.5714 | 20 | 19.0409 | - | - | - | - | - | - |
|
| 1566 |
+
| 2.0 | 26 | - | 0.4065 | 0.4004 | 0.4013 | 0.3692 | 0.3418 | 0.2882 |
|
| 1567 |
+
| 2.3265 | 30 | 14.5314 | - | - | - | - | - | - |
|
| 1568 |
+
| 3.0 | 39 | - | 0.4418 | 0.4350 | 0.4329 | 0.4087 | 0.3714 | 0.3372 |
|
| 1569 |
+
| 3.0816 | 40 | 8.6778 | - | - | - | - | - | - |
|
| 1570 |
+
| 3.8980 | 50 | 6.0257 | - | - | - | - | - | - |
|
| 1571 |
+
| 4.0 | 52 | - | 0.4291 | 0.4244 | 0.4282 | 0.3980 | 0.3677 | 0.3275 |
|
| 1572 |
+
|
| 1573 |
+
|
| 1574 |
+
### Framework Versions
|
| 1575 |
+
- Python: 3.12.11
|
| 1576 |
+
- Sentence Transformers: 5.1.0
|
| 1577 |
+
- Transformers: 4.51.3
|
| 1578 |
+
- PyTorch: 2.8.0+cu126
|
| 1579 |
+
- Accelerate: 1.10.1
|
| 1580 |
+
- Datasets: 4.0.0
|
| 1581 |
+
- Tokenizers: 0.21.4
|
| 1582 |
+
|
| 1583 |
+
## Citation
|
| 1584 |
+
|
| 1585 |
+
### BibTeX
|
| 1586 |
+
|
| 1587 |
+
#### Sentence Transformers
|
| 1588 |
+
```bibtex
|
| 1589 |
+
@inproceedings{reimers-2019-sentence-bert,
|
| 1590 |
+
title = "Sentence-BERT: Sentence Embeddings using Siamese BERT-Networks",
|
| 1591 |
+
author = "Reimers, Nils and Gurevych, Iryna",
|
| 1592 |
+
booktitle = "Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing",
|
| 1593 |
+
month = "11",
|
| 1594 |
+
year = "2019",
|
| 1595 |
+
publisher = "Association for Computational Linguistics",
|
| 1596 |
+
url = "https://arxiv.org/abs/1908.10084",
|
| 1597 |
+
}
|
| 1598 |
+
```
|
| 1599 |
+
|
| 1600 |
+
#### MatryoshkaLoss
|
| 1601 |
+
```bibtex
|
| 1602 |
+
@misc{kusupati2024matryoshka,
|
| 1603 |
+
title={Matryoshka Representation Learning},
|
| 1604 |
+
author={Aditya Kusupati and Gantavya Bhatt and Aniket Rege and Matthew Wallingford and Aditya Sinha and Vivek Ramanujan and William Howard-Snyder and Kaifeng Chen and Sham Kakade and Prateek Jain and Ali Farhadi},
|
| 1605 |
+
year={2024},
|
| 1606 |
+
eprint={2205.13147},
|
| 1607 |
+
archivePrefix={arXiv},
|
| 1608 |
+
primaryClass={cs.LG}
|
| 1609 |
+
}
|
| 1610 |
+
```
|
| 1611 |
+
|
| 1612 |
+
#### MultipleNegativesRankingLoss
|
| 1613 |
+
```bibtex
|
| 1614 |
+
@misc{henderson2017efficient,
|
| 1615 |
+
title={Efficient Natural Language Response Suggestion for Smart Reply},
|
| 1616 |
+
author={Matthew Henderson and Rami Al-Rfou and Brian Strope and Yun-hsuan Sung and Laszlo Lukacs and Ruiqi Guo and Sanjiv Kumar and Balint Miklos and Ray Kurzweil},
|
| 1617 |
+
year={2017},
|
| 1618 |
+
eprint={1705.00652},
|
| 1619 |
+
archivePrefix={arXiv},
|
| 1620 |
+
primaryClass={cs.CL}
|
| 1621 |
+
}
|
| 1622 |
+
```
|
| 1623 |
+
|
| 1624 |
+
<!--
|
| 1625 |
+
## Glossary
|
| 1626 |
+
|
| 1627 |
+
*Clearly define terms in order to be accessible across audiences.*
|
| 1628 |
+
-->
|
| 1629 |
+
|
| 1630 |
+
<!--
|
| 1631 |
+
## Model Card Authors
|
| 1632 |
+
|
| 1633 |
+
*Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
|
| 1634 |
+
-->
|
| 1635 |
+
|
| 1636 |
+
<!--
|
| 1637 |
+
## Model Card Contact
|
| 1638 |
+
|
| 1639 |
+
*Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
|
| 1640 |
+
-->
|
checkpoint-52/config.json
ADDED
|
@@ -0,0 +1,27 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architectures": [
|
| 3 |
+
"XLMRobertaModel"
|
| 4 |
+
],
|
| 5 |
+
"attention_probs_dropout_prob": 0.1,
|
| 6 |
+
"bos_token_id": 0,
|
| 7 |
+
"classifier_dropout": null,
|
| 8 |
+
"eos_token_id": 2,
|
| 9 |
+
"hidden_act": "gelu",
|
| 10 |
+
"hidden_dropout_prob": 0.1,
|
| 11 |
+
"hidden_size": 1024,
|
| 12 |
+
"initializer_range": 0.02,
|
| 13 |
+
"intermediate_size": 4096,
|
| 14 |
+
"layer_norm_eps": 1e-05,
|
| 15 |
+
"max_position_embeddings": 514,
|
| 16 |
+
"model_type": "xlm-roberta",
|
| 17 |
+
"num_attention_heads": 16,
|
| 18 |
+
"num_hidden_layers": 24,
|
| 19 |
+
"output_past": true,
|
| 20 |
+
"pad_token_id": 1,
|
| 21 |
+
"position_embedding_type": "absolute",
|
| 22 |
+
"torch_dtype": "float32",
|
| 23 |
+
"transformers_version": "4.51.3",
|
| 24 |
+
"type_vocab_size": 1,
|
| 25 |
+
"use_cache": true,
|
| 26 |
+
"vocab_size": 250002
|
| 27 |
+
}
|
checkpoint-52/config_sentence_transformers.json
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"model_type": "SentenceTransformer",
|
| 3 |
+
"__version__": {
|
| 4 |
+
"sentence_transformers": "5.1.0",
|
| 5 |
+
"transformers": "4.51.3",
|
| 6 |
+
"pytorch": "2.8.0+cu126"
|
| 7 |
+
},
|
| 8 |
+
"prompts": {
|
| 9 |
+
"query": "",
|
| 10 |
+
"document": ""
|
| 11 |
+
},
|
| 12 |
+
"default_prompt_name": null,
|
| 13 |
+
"similarity_fn_name": "cosine"
|
| 14 |
+
}
|
checkpoint-52/model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:12735f3a106f01897dc07522651bedf61ab577bc550f0ec0823f59ac498655a3
|
| 3 |
+
size 2239607176
|
checkpoint-52/modules.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"idx": 0,
|
| 4 |
+
"name": "0",
|
| 5 |
+
"path": "",
|
| 6 |
+
"type": "sentence_transformers.models.Transformer"
|
| 7 |
+
},
|
| 8 |
+
{
|
| 9 |
+
"idx": 1,
|
| 10 |
+
"name": "1",
|
| 11 |
+
"path": "1_Pooling",
|
| 12 |
+
"type": "sentence_transformers.models.Pooling"
|
| 13 |
+
},
|
| 14 |
+
{
|
| 15 |
+
"idx": 2,
|
| 16 |
+
"name": "2",
|
| 17 |
+
"path": "2_Normalize",
|
| 18 |
+
"type": "sentence_transformers.models.Normalize"
|
| 19 |
+
}
|
| 20 |
+
]
|
checkpoint-52/optimizer.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e985e11ca6344c991936a462d715ab4737a81f1e7ae1d7b9d5018c4289d6330a
|
| 3 |
+
size 4471067142
|
checkpoint-52/rng_state.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:97826e6974b5be8ca805050e2834698ca64f84d84dd6dafae567ebf4b5323c64
|
| 3 |
+
size 14645
|
checkpoint-52/scheduler.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:124a2148c993404cea26c3ac1105405f4d64009654d6294d1bcc583643552613
|
| 3 |
+
size 1465
|
checkpoint-52/sentence_bert_config.json
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"max_seq_length": 512,
|
| 3 |
+
"do_lower_case": false
|
| 4 |
+
}
|
checkpoint-52/sentencepiece.bpe.model
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865
|
| 3 |
+
size 5069051
|
checkpoint-52/special_tokens_map.json
ADDED
|
@@ -0,0 +1,51 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"bos_token": {
|
| 3 |
+
"content": "<s>",
|
| 4 |
+
"lstrip": false,
|
| 5 |
+
"normalized": false,
|
| 6 |
+
"rstrip": false,
|
| 7 |
+
"single_word": false
|
| 8 |
+
},
|
| 9 |
+
"cls_token": {
|
| 10 |
+
"content": "<s>",
|
| 11 |
+
"lstrip": false,
|
| 12 |
+
"normalized": false,
|
| 13 |
+
"rstrip": false,
|
| 14 |
+
"single_word": false
|
| 15 |
+
},
|
| 16 |
+
"eos_token": {
|
| 17 |
+
"content": "</s>",
|
| 18 |
+
"lstrip": false,
|
| 19 |
+
"normalized": false,
|
| 20 |
+
"rstrip": false,
|
| 21 |
+
"single_word": false
|
| 22 |
+
},
|
| 23 |
+
"mask_token": {
|
| 24 |
+
"content": "<mask>",
|
| 25 |
+
"lstrip": true,
|
| 26 |
+
"normalized": false,
|
| 27 |
+
"rstrip": false,
|
| 28 |
+
"single_word": false
|
| 29 |
+
},
|
| 30 |
+
"pad_token": {
|
| 31 |
+
"content": "<pad>",
|
| 32 |
+
"lstrip": false,
|
| 33 |
+
"normalized": false,
|
| 34 |
+
"rstrip": false,
|
| 35 |
+
"single_word": false
|
| 36 |
+
},
|
| 37 |
+
"sep_token": {
|
| 38 |
+
"content": "</s>",
|
| 39 |
+
"lstrip": false,
|
| 40 |
+
"normalized": false,
|
| 41 |
+
"rstrip": false,
|
| 42 |
+
"single_word": false
|
| 43 |
+
},
|
| 44 |
+
"unk_token": {
|
| 45 |
+
"content": "<unk>",
|
| 46 |
+
"lstrip": false,
|
| 47 |
+
"normalized": false,
|
| 48 |
+
"rstrip": false,
|
| 49 |
+
"single_word": false
|
| 50 |
+
}
|
| 51 |
+
}
|
checkpoint-52/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:883b037111086fd4dfebbbc9b7cee11e1517b5e0c0514879478661440f137085
|
| 3 |
+
size 17082987
|
checkpoint-52/tokenizer_config.json
ADDED
|
@@ -0,0 +1,55 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"added_tokens_decoder": {
|
| 3 |
+
"0": {
|
| 4 |
+
"content": "<s>",
|
| 5 |
+
"lstrip": false,
|
| 6 |
+
"normalized": false,
|
| 7 |
+
"rstrip": false,
|
| 8 |
+
"single_word": false,
|
| 9 |
+
"special": true
|
| 10 |
+
},
|
| 11 |
+
"1": {
|
| 12 |
+
"content": "<pad>",
|
| 13 |
+
"lstrip": false,
|
| 14 |
+
"normalized": false,
|
| 15 |
+
"rstrip": false,
|
| 16 |
+
"single_word": false,
|
| 17 |
+
"special": true
|
| 18 |
+
},
|
| 19 |
+
"2": {
|
| 20 |
+
"content": "</s>",
|
| 21 |
+
"lstrip": false,
|
| 22 |
+
"normalized": false,
|
| 23 |
+
"rstrip": false,
|
| 24 |
+
"single_word": false,
|
| 25 |
+
"special": true
|
| 26 |
+
},
|
| 27 |
+
"3": {
|
| 28 |
+
"content": "<unk>",
|
| 29 |
+
"lstrip": false,
|
| 30 |
+
"normalized": false,
|
| 31 |
+
"rstrip": false,
|
| 32 |
+
"single_word": false,
|
| 33 |
+
"special": true
|
| 34 |
+
},
|
| 35 |
+
"250001": {
|
| 36 |
+
"content": "<mask>",
|
| 37 |
+
"lstrip": true,
|
| 38 |
+
"normalized": false,
|
| 39 |
+
"rstrip": false,
|
| 40 |
+
"single_word": false,
|
| 41 |
+
"special": true
|
| 42 |
+
}
|
| 43 |
+
},
|
| 44 |
+
"bos_token": "<s>",
|
| 45 |
+
"clean_up_tokenization_spaces": true,
|
| 46 |
+
"cls_token": "<s>",
|
| 47 |
+
"eos_token": "</s>",
|
| 48 |
+
"extra_special_tokens": {},
|
| 49 |
+
"mask_token": "<mask>",
|
| 50 |
+
"model_max_length": 512,
|
| 51 |
+
"pad_token": "<pad>",
|
| 52 |
+
"sep_token": "</s>",
|
| 53 |
+
"tokenizer_class": "XLMRobertaTokenizer",
|
| 54 |
+
"unk_token": "<unk>"
|
| 55 |
+
}
|
checkpoint-52/trainer_state.json
ADDED
|
@@ -0,0 +1,470 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"best_global_step": 39,
|
| 3 |
+
"best_metric": 0.37139192897263235,
|
| 4 |
+
"best_model_checkpoint": "intfloat/multilingual-e5-large/checkpoint-39",
|
| 5 |
+
"epoch": 4.0,
|
| 6 |
+
"eval_steps": 500,
|
| 7 |
+
"global_step": 52,
|
| 8 |
+
"is_hyper_param_search": false,
|
| 9 |
+
"is_local_process_zero": true,
|
| 10 |
+
"is_world_process_zero": true,
|
| 11 |
+
"log_history": [
|
| 12 |
+
{
|
| 13 |
+
"epoch": 0.8163265306122449,
|
| 14 |
+
"grad_norm": 307.08624267578125,
|
| 15 |
+
"learning_rate": 7.500000000000001e-06,
|
| 16 |
+
"loss": 31.5155,
|
| 17 |
+
"step": 10
|
| 18 |
+
},
|
| 19 |
+
{
|
| 20 |
+
"epoch": 1.0,
|
| 21 |
+
"eval_dim_1024_cosine_accuracy@1": 0.42509603072983354,
|
| 22 |
+
"eval_dim_1024_cosine_accuracy@10": 0.49295774647887325,
|
| 23 |
+
"eval_dim_1024_cosine_accuracy@3": 0.43085787451984636,
|
| 24 |
+
"eval_dim_1024_cosine_accuracy@5": 0.46030729833546735,
|
| 25 |
+
"eval_dim_1024_cosine_map@100": 0.508986346237021,
|
| 26 |
+
"eval_dim_1024_cosine_mrr@10": 0.4369535394183281,
|
| 27 |
+
"eval_dim_1024_cosine_ndcg@10": 0.4493804868009024,
|
| 28 |
+
"eval_dim_1024_cosine_precision@1": 0.42509603072983354,
|
| 29 |
+
"eval_dim_1024_cosine_precision@10": 0.376056338028169,
|
| 30 |
+
"eval_dim_1024_cosine_precision@3": 0.42402902262057185,
|
| 31 |
+
"eval_dim_1024_cosine_precision@5": 0.4133162612035851,
|
| 32 |
+
"eval_dim_1024_cosine_recall@1": 0.04813624827530403,
|
| 33 |
+
"eval_dim_1024_cosine_recall@10": 0.3150476790176975,
|
| 34 |
+
"eval_dim_1024_cosine_recall@3": 0.1404092551990217,
|
| 35 |
+
"eval_dim_1024_cosine_recall@5": 0.21147403835662126,
|
| 36 |
+
"eval_dim_128_cosine_accuracy@1": 0.31370038412291934,
|
| 37 |
+
"eval_dim_128_cosine_accuracy@10": 0.38156209987195905,
|
| 38 |
+
"eval_dim_128_cosine_accuracy@3": 0.31946222791293216,
|
| 39 |
+
"eval_dim_128_cosine_accuracy@5": 0.34571062740076824,
|
| 40 |
+
"eval_dim_128_cosine_map@100": 0.3991669558616212,
|
| 41 |
+
"eval_dim_128_cosine_mrr@10": 0.32517427799117904,
|
| 42 |
+
"eval_dim_128_cosine_ndcg@10": 0.33618283481296385,
|
| 43 |
+
"eval_dim_128_cosine_precision@1": 0.31370038412291934,
|
| 44 |
+
"eval_dim_128_cosine_precision@10": 0.2764404609475032,
|
| 45 |
+
"eval_dim_128_cosine_precision@3": 0.31284677763551,
|
| 46 |
+
"eval_dim_128_cosine_precision@5": 0.30422535211267604,
|
| 47 |
+
"eval_dim_128_cosine_recall@1": 0.037933385936292925,
|
| 48 |
+
"eval_dim_128_cosine_recall@10": 0.24798465115464788,
|
| 49 |
+
"eval_dim_128_cosine_recall@3": 0.11100168654049715,
|
| 50 |
+
"eval_dim_128_cosine_recall@5": 0.1670926413559068,
|
| 51 |
+
"eval_dim_256_cosine_accuracy@1": 0.36427656850192064,
|
| 52 |
+
"eval_dim_256_cosine_accuracy@10": 0.44814340588988477,
|
| 53 |
+
"eval_dim_256_cosine_accuracy@3": 0.36939820742637647,
|
| 54 |
+
"eval_dim_256_cosine_accuracy@5": 0.4090909090909091,
|
| 55 |
+
"eval_dim_256_cosine_map@100": 0.45841270037343096,
|
| 56 |
+
"eval_dim_256_cosine_mrr@10": 0.37879397597707415,
|
| 57 |
+
"eval_dim_256_cosine_ndcg@10": 0.3947006636735062,
|
| 58 |
+
"eval_dim_256_cosine_precision@1": 0.36427656850192064,
|
| 59 |
+
"eval_dim_256_cosine_precision@10": 0.3289372599231754,
|
| 60 |
+
"eval_dim_256_cosine_precision@3": 0.36363636363636365,
|
| 61 |
+
"eval_dim_256_cosine_precision@5": 0.3560819462227913,
|
| 62 |
+
"eval_dim_256_cosine_recall@1": 0.04277277943657814,
|
| 63 |
+
"eval_dim_256_cosine_recall@10": 0.28617844199333936,
|
| 64 |
+
"eval_dim_256_cosine_recall@3": 0.1253991943934714,
|
| 65 |
+
"eval_dim_256_cosine_recall@5": 0.18947388504512186,
|
| 66 |
+
"eval_dim_512_cosine_accuracy@1": 0.4084507042253521,
|
| 67 |
+
"eval_dim_512_cosine_accuracy@10": 0.4871959026888604,
|
| 68 |
+
"eval_dim_512_cosine_accuracy@3": 0.41357234314980795,
|
| 69 |
+
"eval_dim_512_cosine_accuracy@5": 0.4519846350832266,
|
| 70 |
+
"eval_dim_512_cosine_map@100": 0.495554245202425,
|
| 71 |
+
"eval_dim_512_cosine_mrr@10": 0.42213127248338495,
|
| 72 |
+
"eval_dim_512_cosine_ndcg@10": 0.43644305450989757,
|
| 73 |
+
"eval_dim_512_cosine_precision@1": 0.4084507042253521,
|
| 74 |
+
"eval_dim_512_cosine_precision@10": 0.36606914212548014,
|
| 75 |
+
"eval_dim_512_cosine_precision@3": 0.40738369611609043,
|
| 76 |
+
"eval_dim_512_cosine_precision@5": 0.39846350832266325,
|
| 77 |
+
"eval_dim_512_cosine_recall@1": 0.04628035514721453,
|
| 78 |
+
"eval_dim_512_cosine_recall@10": 0.30419701916496145,
|
| 79 |
+
"eval_dim_512_cosine_recall@3": 0.13522898183596205,
|
| 80 |
+
"eval_dim_512_cosine_recall@5": 0.20394662187726964,
|
| 81 |
+
"eval_dim_64_cosine_accuracy@1": 0.24199743918053776,
|
| 82 |
+
"eval_dim_64_cosine_accuracy@10": 0.29641485275288093,
|
| 83 |
+
"eval_dim_64_cosine_accuracy@3": 0.24775928297055058,
|
| 84 |
+
"eval_dim_64_cosine_accuracy@5": 0.26952624839948786,
|
| 85 |
+
"eval_dim_64_cosine_map@100": 0.31803601064541553,
|
| 86 |
+
"eval_dim_64_cosine_mrr@10": 0.25159771761884414,
|
| 87 |
+
"eval_dim_64_cosine_ndcg@10": 0.2620553065689597,
|
| 88 |
+
"eval_dim_64_cosine_precision@1": 0.24199743918053776,
|
| 89 |
+
"eval_dim_64_cosine_precision@10": 0.21568501920614594,
|
| 90 |
+
"eval_dim_64_cosine_precision@3": 0.24199743918053776,
|
| 91 |
+
"eval_dim_64_cosine_precision@5": 0.23649167733674775,
|
| 92 |
+
"eval_dim_64_cosine_recall@1": 0.029110868794154622,
|
| 93 |
+
"eval_dim_64_cosine_recall@10": 0.19521971714475267,
|
| 94 |
+
"eval_dim_64_cosine_recall@3": 0.08524734139651896,
|
| 95 |
+
"eval_dim_64_cosine_recall@5": 0.12921904680249943,
|
| 96 |
+
"eval_dim_768_cosine_accuracy@1": 0.4193341869398207,
|
| 97 |
+
"eval_dim_768_cosine_accuracy@10": 0.4910371318822023,
|
| 98 |
+
"eval_dim_768_cosine_accuracy@3": 0.4238156209987196,
|
| 99 |
+
"eval_dim_768_cosine_accuracy@5": 0.4551856594110115,
|
| 100 |
+
"eval_dim_768_cosine_map@100": 0.5037778776293926,
|
| 101 |
+
"eval_dim_768_cosine_mrr@10": 0.4315339003719285,
|
| 102 |
+
"eval_dim_768_cosine_ndcg@10": 0.44456410503401034,
|
| 103 |
+
"eval_dim_768_cosine_precision@1": 0.4193341869398207,
|
| 104 |
+
"eval_dim_768_cosine_precision@10": 0.37272727272727274,
|
| 105 |
+
"eval_dim_768_cosine_precision@3": 0.4180537772087068,
|
| 106 |
+
"eval_dim_768_cosine_precision@5": 0.4076824583866837,
|
| 107 |
+
"eval_dim_768_cosine_recall@1": 0.04699592881851732,
|
| 108 |
+
"eval_dim_768_cosine_recall@10": 0.3107289399017082,
|
| 109 |
+
"eval_dim_768_cosine_recall@3": 0.13721565163348118,
|
| 110 |
+
"eval_dim_768_cosine_recall@5": 0.20710427114944024,
|
| 111 |
+
"eval_runtime": 98.6525,
|
| 112 |
+
"eval_samples_per_second": 0.0,
|
| 113 |
+
"eval_sequential_score": 0.2620553065689597,
|
| 114 |
+
"eval_steps_per_second": 0.0,
|
| 115 |
+
"step": 13
|
| 116 |
+
},
|
| 117 |
+
{
|
| 118 |
+
"epoch": 1.5714285714285714,
|
| 119 |
+
"grad_norm": 280.07818603515625,
|
| 120 |
+
"learning_rate": 1.5833333333333333e-05,
|
| 121 |
+
"loss": 19.0409,
|
| 122 |
+
"step": 20
|
| 123 |
+
},
|
| 124 |
+
{
|
| 125 |
+
"epoch": 2.0,
|
| 126 |
+
"eval_dim_1024_cosine_accuracy@1": 0.3854033290653009,
|
| 127 |
+
"eval_dim_1024_cosine_accuracy@10": 0.45454545454545453,
|
| 128 |
+
"eval_dim_1024_cosine_accuracy@3": 0.3886043533930858,
|
| 129 |
+
"eval_dim_1024_cosine_accuracy@5": 0.41101152368758004,
|
| 130 |
+
"eval_dim_1024_cosine_map@100": 0.47259820099791205,
|
| 131 |
+
"eval_dim_1024_cosine_mrr@10": 0.39624870434729537,
|
| 132 |
+
"eval_dim_1024_cosine_ndcg@10": 0.4065329035406967,
|
| 133 |
+
"eval_dim_1024_cosine_precision@1": 0.3854033290653009,
|
| 134 |
+
"eval_dim_1024_cosine_precision@10": 0.3357874519846351,
|
| 135 |
+
"eval_dim_1024_cosine_precision@3": 0.3839095177123346,
|
| 136 |
+
"eval_dim_1024_cosine_precision@5": 0.3713188220230474,
|
| 137 |
+
"eval_dim_1024_cosine_recall@1": 0.0451686782205082,
|
| 138 |
+
"eval_dim_1024_cosine_recall@10": 0.2918225395020212,
|
| 139 |
+
"eval_dim_1024_cosine_recall@3": 0.13200270380544088,
|
| 140 |
+
"eval_dim_1024_cosine_recall@5": 0.19735476247586825,
|
| 141 |
+
"eval_dim_128_cosine_accuracy@1": 0.31562099871959026,
|
| 142 |
+
"eval_dim_128_cosine_accuracy@10": 0.39180537772087065,
|
| 143 |
+
"eval_dim_128_cosine_accuracy@3": 0.3207426376440461,
|
| 144 |
+
"eval_dim_128_cosine_accuracy@5": 0.352112676056338,
|
| 145 |
+
"eval_dim_128_cosine_map@100": 0.40471008477532144,
|
| 146 |
+
"eval_dim_128_cosine_mrr@10": 0.32839105339105285,
|
| 147 |
+
"eval_dim_128_cosine_ndcg@10": 0.34177784905202935,
|
| 148 |
+
"eval_dim_128_cosine_precision@1": 0.31562099871959026,
|
| 149 |
+
"eval_dim_128_cosine_precision@10": 0.280729833546735,
|
| 150 |
+
"eval_dim_128_cosine_precision@3": 0.31455399061032857,
|
| 151 |
+
"eval_dim_128_cosine_precision@5": 0.30640204865556975,
|
| 152 |
+
"eval_dim_128_cosine_recall@1": 0.03888088094516579,
|
| 153 |
+
"eval_dim_128_cosine_recall@10": 0.2550464126190524,
|
| 154 |
+
"eval_dim_128_cosine_recall@3": 0.11341113256173359,
|
| 155 |
+
"eval_dim_128_cosine_recall@5": 0.17046484922169536,
|
| 156 |
+
"eval_dim_256_cosine_accuracy@1": 0.3418693982074264,
|
| 157 |
+
"eval_dim_256_cosine_accuracy@10": 0.4238156209987196,
|
| 158 |
+
"eval_dim_256_cosine_accuracy@3": 0.34763124199743917,
|
| 159 |
+
"eval_dim_256_cosine_accuracy@5": 0.38092189500640206,
|
| 160 |
+
"eval_dim_256_cosine_map@100": 0.43770217754051305,
|
| 161 |
+
"eval_dim_256_cosine_mrr@10": 0.35596482938032165,
|
| 162 |
+
"eval_dim_256_cosine_ndcg@10": 0.36923043791328775,
|
| 163 |
+
"eval_dim_256_cosine_precision@1": 0.3418693982074264,
|
| 164 |
+
"eval_dim_256_cosine_precision@10": 0.30441741357234314,
|
| 165 |
+
"eval_dim_256_cosine_precision@3": 0.34165599658557405,
|
| 166 |
+
"eval_dim_256_cosine_precision@5": 0.3322663252240717,
|
| 167 |
+
"eval_dim_256_cosine_recall@1": 0.041410929155814194,
|
| 168 |
+
"eval_dim_256_cosine_recall@10": 0.2705196189189818,
|
| 169 |
+
"eval_dim_256_cosine_recall@3": 0.1212642412965687,
|
| 170 |
+
"eval_dim_256_cosine_recall@5": 0.18173918651563936,
|
| 171 |
+
"eval_dim_512_cosine_accuracy@1": 0.37708066581306016,
|
| 172 |
+
"eval_dim_512_cosine_accuracy@10": 0.4532650448143406,
|
| 173 |
+
"eval_dim_512_cosine_accuracy@3": 0.38092189500640206,
|
| 174 |
+
"eval_dim_512_cosine_accuracy@5": 0.4084507042253521,
|
| 175 |
+
"eval_dim_512_cosine_map@100": 0.4678017780580059,
|
| 176 |
+
"eval_dim_512_cosine_mrr@10": 0.3893670101416575,
|
| 177 |
+
"eval_dim_512_cosine_ndcg@10": 0.40127522003513455,
|
| 178 |
+
"eval_dim_512_cosine_precision@1": 0.37708066581306016,
|
| 179 |
+
"eval_dim_512_cosine_precision@10": 0.33156209987195906,
|
| 180 |
+
"eval_dim_512_cosine_precision@3": 0.37537345283824153,
|
| 181 |
+
"eval_dim_512_cosine_precision@5": 0.36402048655569774,
|
| 182 |
+
"eval_dim_512_cosine_recall@1": 0.04457309853297402,
|
| 183 |
+
"eval_dim_512_cosine_recall@10": 0.2883968018428671,
|
| 184 |
+
"eval_dim_512_cosine_recall@3": 0.13007205872054822,
|
| 185 |
+
"eval_dim_512_cosine_recall@5": 0.19449520589871025,
|
| 186 |
+
"eval_dim_64_cosine_accuracy@1": 0.26696542893725994,
|
| 187 |
+
"eval_dim_64_cosine_accuracy@10": 0.33098591549295775,
|
| 188 |
+
"eval_dim_64_cosine_accuracy@3": 0.27208706786171577,
|
| 189 |
+
"eval_dim_64_cosine_accuracy@5": 0.293213828425096,
|
| 190 |
+
"eval_dim_64_cosine_map@100": 0.34719730722747555,
|
| 191 |
+
"eval_dim_64_cosine_mrr@10": 0.2776957197731842,
|
| 192 |
+
"eval_dim_64_cosine_ndcg@10": 0.2881905192612941,
|
| 193 |
+
"eval_dim_64_cosine_precision@1": 0.26696542893725994,
|
| 194 |
+
"eval_dim_64_cosine_precision@10": 0.237708066581306,
|
| 195 |
+
"eval_dim_64_cosine_precision@3": 0.26717883055911223,
|
| 196 |
+
"eval_dim_64_cosine_precision@5": 0.2596670934699104,
|
| 197 |
+
"eval_dim_64_cosine_recall@1": 0.031692344067516816,
|
| 198 |
+
"eval_dim_64_cosine_recall@10": 0.21473974122936995,
|
| 199 |
+
"eval_dim_64_cosine_recall@3": 0.09327455064654774,
|
| 200 |
+
"eval_dim_64_cosine_recall@5": 0.14131510912407144,
|
| 201 |
+
"eval_dim_768_cosine_accuracy@1": 0.37451984635083224,
|
| 202 |
+
"eval_dim_768_cosine_accuracy@10": 0.4539052496798976,
|
| 203 |
+
"eval_dim_768_cosine_accuracy@3": 0.37900128040973113,
|
| 204 |
+
"eval_dim_768_cosine_accuracy@5": 0.40973111395646605,
|
| 205 |
+
"eval_dim_768_cosine_map@100": 0.4672061011440217,
|
| 206 |
+
"eval_dim_768_cosine_mrr@10": 0.38746671950897227,
|
| 207 |
+
"eval_dim_768_cosine_ndcg@10": 0.4004027303245026,
|
| 208 |
+
"eval_dim_768_cosine_precision@1": 0.37451984635083224,
|
| 209 |
+
"eval_dim_768_cosine_precision@10": 0.3318181818181818,
|
| 210 |
+
"eval_dim_768_cosine_precision@3": 0.3734528382415706,
|
| 211 |
+
"eval_dim_768_cosine_precision@5": 0.3632522407170295,
|
| 212 |
+
"eval_dim_768_cosine_recall@1": 0.04413921317349132,
|
| 213 |
+
"eval_dim_768_cosine_recall@10": 0.28955317519546525,
|
| 214 |
+
"eval_dim_768_cosine_recall@3": 0.12896663310051748,
|
| 215 |
+
"eval_dim_768_cosine_recall@5": 0.19376203165061448,
|
| 216 |
+
"eval_runtime": 98.4244,
|
| 217 |
+
"eval_samples_per_second": 0.0,
|
| 218 |
+
"eval_sequential_score": 0.2881905192612941,
|
| 219 |
+
"eval_steps_per_second": 0.0,
|
| 220 |
+
"step": 26
|
| 221 |
+
},
|
| 222 |
+
{
|
| 223 |
+
"epoch": 2.326530612244898,
|
| 224 |
+
"grad_norm": 305.66259765625,
|
| 225 |
+
"learning_rate": 1.9973569167005725e-05,
|
| 226 |
+
"loss": 14.5314,
|
| 227 |
+
"step": 30
|
| 228 |
+
},
|
| 229 |
+
{
|
| 230 |
+
"epoch": 3.0,
|
| 231 |
+
"eval_dim_1024_cosine_accuracy@1": 0.4180537772087068,
|
| 232 |
+
"eval_dim_1024_cosine_accuracy@10": 0.49039692701664533,
|
| 233 |
+
"eval_dim_1024_cosine_accuracy@3": 0.42189500640204863,
|
| 234 |
+
"eval_dim_1024_cosine_accuracy@5": 0.4500640204865557,
|
| 235 |
+
"eval_dim_1024_cosine_map@100": 0.506794523350519,
|
| 236 |
+
"eval_dim_1024_cosine_mrr@10": 0.42985717334308843,
|
| 237 |
+
"eval_dim_1024_cosine_ndcg@10": 0.44178501209869797,
|
| 238 |
+
"eval_dim_1024_cosine_precision@1": 0.4180537772087068,
|
| 239 |
+
"eval_dim_1024_cosine_precision@10": 0.36869398207426374,
|
| 240 |
+
"eval_dim_1024_cosine_precision@3": 0.4163465642338881,
|
| 241 |
+
"eval_dim_1024_cosine_precision@5": 0.4043533930857874,
|
| 242 |
+
"eval_dim_1024_cosine_recall@1": 0.04734422767263886,
|
| 243 |
+
"eval_dim_1024_cosine_recall@10": 0.308531274625124,
|
| 244 |
+
"eval_dim_1024_cosine_recall@3": 0.138064233626932,
|
| 245 |
+
"eval_dim_1024_cosine_recall@5": 0.2069980430010945,
|
| 246 |
+
"eval_dim_128_cosine_accuracy@1": 0.34699103713188223,
|
| 247 |
+
"eval_dim_128_cosine_accuracy@10": 0.4212548015364917,
|
| 248 |
+
"eval_dim_128_cosine_accuracy@3": 0.35147247119078107,
|
| 249 |
+
"eval_dim_128_cosine_accuracy@5": 0.37900128040973113,
|
| 250 |
+
"eval_dim_128_cosine_map@100": 0.4338211299784659,
|
| 251 |
+
"eval_dim_128_cosine_mrr@10": 0.35916305916305874,
|
| 252 |
+
"eval_dim_128_cosine_ndcg@10": 0.37139192897263235,
|
| 253 |
+
"eval_dim_128_cosine_precision@1": 0.34699103713188223,
|
| 254 |
+
"eval_dim_128_cosine_precision@10": 0.3042893725992318,
|
| 255 |
+
"eval_dim_128_cosine_precision@3": 0.34571062740076824,
|
| 256 |
+
"eval_dim_128_cosine_precision@5": 0.3352112676056338,
|
| 257 |
+
"eval_dim_128_cosine_recall@1": 0.04217848526747235,
|
| 258 |
+
"eval_dim_128_cosine_recall@10": 0.2706183968947745,
|
| 259 |
+
"eval_dim_128_cosine_recall@3": 0.12288848071178002,
|
| 260 |
+
"eval_dim_128_cosine_recall@5": 0.18344012521240954,
|
| 261 |
+
"eval_dim_256_cosine_accuracy@1": 0.38348271446862997,
|
| 262 |
+
"eval_dim_256_cosine_accuracy@10": 0.4551856594110115,
|
| 263 |
+
"eval_dim_256_cosine_accuracy@3": 0.3886043533930858,
|
| 264 |
+
"eval_dim_256_cosine_accuracy@5": 0.4206145966709347,
|
| 265 |
+
"eval_dim_256_cosine_map@100": 0.4709582085612654,
|
| 266 |
+
"eval_dim_256_cosine_mrr@10": 0.3957850639188662,
|
| 267 |
+
"eval_dim_256_cosine_ndcg@10": 0.4087462230477571,
|
| 268 |
+
"eval_dim_256_cosine_precision@1": 0.38348271446862997,
|
| 269 |
+
"eval_dim_256_cosine_precision@10": 0.33886043533930854,
|
| 270 |
+
"eval_dim_256_cosine_precision@3": 0.382202304737516,
|
| 271 |
+
"eval_dim_256_cosine_precision@5": 0.3718309859154929,
|
| 272 |
+
"eval_dim_256_cosine_recall@1": 0.04466034705404223,
|
| 273 |
+
"eval_dim_256_cosine_recall@10": 0.2892016292717267,
|
| 274 |
+
"eval_dim_256_cosine_recall@3": 0.1301795023253766,
|
| 275 |
+
"eval_dim_256_cosine_recall@5": 0.19500340584044382,
|
| 276 |
+
"eval_dim_512_cosine_accuracy@1": 0.4065300896286812,
|
| 277 |
+
"eval_dim_512_cosine_accuracy@10": 0.4814340588988476,
|
| 278 |
+
"eval_dim_512_cosine_accuracy@3": 0.41229193341869397,
|
| 279 |
+
"eval_dim_512_cosine_accuracy@5": 0.44494238156209986,
|
| 280 |
+
"eval_dim_512_cosine_map@100": 0.49555759572196095,
|
| 281 |
+
"eval_dim_512_cosine_mrr@10": 0.41950236774180394,
|
| 282 |
+
"eval_dim_512_cosine_ndcg@10": 0.4329095460408428,
|
| 283 |
+
"eval_dim_512_cosine_precision@1": 0.4065300896286812,
|
| 284 |
+
"eval_dim_512_cosine_precision@10": 0.3596030729833547,
|
| 285 |
+
"eval_dim_512_cosine_precision@3": 0.4054630815194195,
|
| 286 |
+
"eval_dim_512_cosine_precision@5": 0.3947503201024327,
|
| 287 |
+
"eval_dim_512_cosine_recall@1": 0.047372341735862133,
|
| 288 |
+
"eval_dim_512_cosine_recall@10": 0.3071623578952262,
|
| 289 |
+
"eval_dim_512_cosine_recall@3": 0.1383106496582531,
|
| 290 |
+
"eval_dim_512_cosine_recall@5": 0.20757258542171747,
|
| 291 |
+
"eval_dim_64_cosine_accuracy@1": 0.3207426376440461,
|
| 292 |
+
"eval_dim_64_cosine_accuracy@10": 0.3725992317541613,
|
| 293 |
+
"eval_dim_64_cosine_accuracy@3": 0.322663252240717,
|
| 294 |
+
"eval_dim_64_cosine_accuracy@5": 0.3405889884763124,
|
| 295 |
+
"eval_dim_64_cosine_map@100": 0.3933467041096336,
|
| 296 |
+
"eval_dim_64_cosine_mrr@10": 0.32884732638253733,
|
| 297 |
+
"eval_dim_64_cosine_ndcg@10": 0.3371953828075091,
|
| 298 |
+
"eval_dim_64_cosine_precision@1": 0.3207426376440461,
|
| 299 |
+
"eval_dim_64_cosine_precision@10": 0.2797055057618438,
|
| 300 |
+
"eval_dim_64_cosine_precision@3": 0.3188220230473751,
|
| 301 |
+
"eval_dim_64_cosine_precision@5": 0.3088348271446863,
|
| 302 |
+
"eval_dim_64_cosine_recall@1": 0.036318765090758674,
|
| 303 |
+
"eval_dim_64_cosine_recall@10": 0.23840960718091392,
|
| 304 |
+
"eval_dim_64_cosine_recall@3": 0.10562189493083342,
|
| 305 |
+
"eval_dim_64_cosine_recall@5": 0.15867125525021739,
|
| 306 |
+
"eval_dim_768_cosine_accuracy@1": 0.41037131882202305,
|
| 307 |
+
"eval_dim_768_cosine_accuracy@10": 0.4833546734955186,
|
| 308 |
+
"eval_dim_768_cosine_accuracy@3": 0.4142125480153649,
|
| 309 |
+
"eval_dim_768_cosine_accuracy@5": 0.44430217669654287,
|
| 310 |
+
"eval_dim_768_cosine_map@100": 0.500478306774528,
|
| 311 |
+
"eval_dim_768_cosine_mrr@10": 0.4224889742495374,
|
| 312 |
+
"eval_dim_768_cosine_ndcg@10": 0.4349862241563486,
|
| 313 |
+
"eval_dim_768_cosine_precision@1": 0.41037131882202305,
|
| 314 |
+
"eval_dim_768_cosine_precision@10": 0.36165172855313704,
|
| 315 |
+
"eval_dim_768_cosine_precision@3": 0.4086641058472044,
|
| 316 |
+
"eval_dim_768_cosine_precision@5": 0.3969270166453265,
|
| 317 |
+
"eval_dim_768_cosine_recall@1": 0.047186779325657804,
|
| 318 |
+
"eval_dim_768_cosine_recall@10": 0.30540044861465576,
|
| 319 |
+
"eval_dim_768_cosine_recall@3": 0.1375709294981283,
|
| 320 |
+
"eval_dim_768_cosine_recall@5": 0.20603724780478358,
|
| 321 |
+
"eval_runtime": 98.5908,
|
| 322 |
+
"eval_samples_per_second": 0.0,
|
| 323 |
+
"eval_sequential_score": 0.3371953828075091,
|
| 324 |
+
"eval_steps_per_second": 0.0,
|
| 325 |
+
"step": 39
|
| 326 |
+
},
|
| 327 |
+
{
|
| 328 |
+
"epoch": 3.0816326530612246,
|
| 329 |
+
"grad_norm": 255.65982055664062,
|
| 330 |
+
"learning_rate": 1.9762960071199334e-05,
|
| 331 |
+
"loss": 8.6778,
|
| 332 |
+
"step": 40
|
| 333 |
+
},
|
| 334 |
+
{
|
| 335 |
+
"epoch": 3.8979591836734695,
|
| 336 |
+
"grad_norm": 470.4803771972656,
|
| 337 |
+
"learning_rate": 1.9346189253489888e-05,
|
| 338 |
+
"loss": 6.0257,
|
| 339 |
+
"step": 50
|
| 340 |
+
},
|
| 341 |
+
{
|
| 342 |
+
"epoch": 4.0,
|
| 343 |
+
"eval_dim_1024_cosine_accuracy@1": 0.4046094750320102,
|
| 344 |
+
"eval_dim_1024_cosine_accuracy@10": 0.47823303457106275,
|
| 345 |
+
"eval_dim_1024_cosine_accuracy@3": 0.4090909090909091,
|
| 346 |
+
"eval_dim_1024_cosine_accuracy@5": 0.43918053777208704,
|
| 347 |
+
"eval_dim_1024_cosine_map@100": 0.490599623630225,
|
| 348 |
+
"eval_dim_1024_cosine_mrr@10": 0.4168417068064951,
|
| 349 |
+
"eval_dim_1024_cosine_ndcg@10": 0.42913551824501384,
|
| 350 |
+
"eval_dim_1024_cosine_precision@1": 0.4046094750320102,
|
| 351 |
+
"eval_dim_1024_cosine_precision@10": 0.3565941101152369,
|
| 352 |
+
"eval_dim_1024_cosine_precision@3": 0.40311566367904395,
|
| 353 |
+
"eval_dim_1024_cosine_precision@5": 0.39180537772087065,
|
| 354 |
+
"eval_dim_1024_cosine_recall@1": 0.04660606778759063,
|
| 355 |
+
"eval_dim_1024_cosine_recall@10": 0.3014663479400921,
|
| 356 |
+
"eval_dim_1024_cosine_recall@3": 0.13592596883673455,
|
| 357 |
+
"eval_dim_1024_cosine_recall@5": 0.20379253880710943,
|
| 358 |
+
"eval_dim_128_cosine_accuracy@1": 0.34314980793854033,
|
| 359 |
+
"eval_dim_128_cosine_accuracy@10": 0.4148527528809219,
|
| 360 |
+
"eval_dim_128_cosine_accuracy@3": 0.34763124199743917,
|
| 361 |
+
"eval_dim_128_cosine_accuracy@5": 0.37708066581306016,
|
| 362 |
+
"eval_dim_128_cosine_map@100": 0.4276696379169563,
|
| 363 |
+
"eval_dim_128_cosine_mrr@10": 0.35513180090644836,
|
| 364 |
+
"eval_dim_128_cosine_ndcg@10": 0.36765573601526275,
|
| 365 |
+
"eval_dim_128_cosine_precision@1": 0.34314980793854033,
|
| 366 |
+
"eval_dim_128_cosine_precision@10": 0.302752880921895,
|
| 367 |
+
"eval_dim_128_cosine_precision@3": 0.3418693982074264,
|
| 368 |
+
"eval_dim_128_cosine_precision@5": 0.3322663252240717,
|
| 369 |
+
"eval_dim_128_cosine_recall@1": 0.040652627677675406,
|
| 370 |
+
"eval_dim_128_cosine_recall@10": 0.26330336421247125,
|
| 371 |
+
"eval_dim_128_cosine_recall@3": 0.1184519992454523,
|
| 372 |
+
"eval_dim_128_cosine_recall@5": 0.1774839552040709,
|
| 373 |
+
"eval_dim_256_cosine_accuracy@1": 0.3738796414852753,
|
| 374 |
+
"eval_dim_256_cosine_accuracy@10": 0.44558258642765686,
|
| 375 |
+
"eval_dim_256_cosine_accuracy@3": 0.37772087067861715,
|
| 376 |
+
"eval_dim_256_cosine_accuracy@5": 0.40717029449423814,
|
| 377 |
+
"eval_dim_256_cosine_map@100": 0.45855798848430374,
|
| 378 |
+
"eval_dim_256_cosine_mrr@10": 0.38572571794402755,
|
| 379 |
+
"eval_dim_256_cosine_ndcg@10": 0.3980442434686935,
|
| 380 |
+
"eval_dim_256_cosine_precision@1": 0.3738796414852753,
|
| 381 |
+
"eval_dim_256_cosine_precision@10": 0.3297695262483995,
|
| 382 |
+
"eval_dim_256_cosine_precision@3": 0.37238583013230897,
|
| 383 |
+
"eval_dim_256_cosine_precision@5": 0.3615877080665813,
|
| 384 |
+
"eval_dim_256_cosine_recall@1": 0.043086085492826574,
|
| 385 |
+
"eval_dim_256_cosine_recall@10": 0.2792649180924836,
|
| 386 |
+
"eval_dim_256_cosine_recall@3": 0.125747799799009,
|
| 387 |
+
"eval_dim_256_cosine_recall@5": 0.18837022600852496,
|
| 388 |
+
"eval_dim_512_cosine_accuracy@1": 0.39884763124199746,
|
| 389 |
+
"eval_dim_512_cosine_accuracy@10": 0.47823303457106275,
|
| 390 |
+
"eval_dim_512_cosine_accuracy@3": 0.4052496798975672,
|
| 391 |
+
"eval_dim_512_cosine_accuracy@5": 0.44558258642765686,
|
| 392 |
+
"eval_dim_512_cosine_map@100": 0.4876319198894288,
|
| 393 |
+
"eval_dim_512_cosine_mrr@10": 0.41307745462675005,
|
| 394 |
+
"eval_dim_512_cosine_ndcg@10": 0.42824151108259556,
|
| 395 |
+
"eval_dim_512_cosine_precision@1": 0.39884763124199746,
|
| 396 |
+
"eval_dim_512_cosine_precision@10": 0.35793854033290645,
|
| 397 |
+
"eval_dim_512_cosine_precision@3": 0.3975672215108835,
|
| 398 |
+
"eval_dim_512_cosine_precision@5": 0.3888604353393086,
|
| 399 |
+
"eval_dim_512_cosine_recall@1": 0.04570727180608771,
|
| 400 |
+
"eval_dim_512_cosine_recall@10": 0.2993652309972795,
|
| 401 |
+
"eval_dim_512_cosine_recall@3": 0.13329368345632836,
|
| 402 |
+
"eval_dim_512_cosine_recall@5": 0.2006035854063678,
|
| 403 |
+
"eval_dim_64_cosine_accuracy@1": 0.3079385403329065,
|
| 404 |
+
"eval_dim_64_cosine_accuracy@10": 0.36555697823303457,
|
| 405 |
+
"eval_dim_64_cosine_accuracy@3": 0.31241997439180536,
|
| 406 |
+
"eval_dim_64_cosine_accuracy@5": 0.33290653008962867,
|
| 407 |
+
"eval_dim_64_cosine_map@100": 0.38184314430829974,
|
| 408 |
+
"eval_dim_64_cosine_mrr@10": 0.31748394406845065,
|
| 409 |
+
"eval_dim_64_cosine_ndcg@10": 0.3275369456141822,
|
| 410 |
+
"eval_dim_64_cosine_precision@1": 0.3079385403329065,
|
| 411 |
+
"eval_dim_64_cosine_precision@10": 0.27215108834827145,
|
| 412 |
+
"eval_dim_64_cosine_precision@3": 0.3070849338454972,
|
| 413 |
+
"eval_dim_64_cosine_precision@5": 0.29820742637644043,
|
| 414 |
+
"eval_dim_64_cosine_recall@1": 0.03504677697523653,
|
| 415 |
+
"eval_dim_64_cosine_recall@10": 0.23026653514933906,
|
| 416 |
+
"eval_dim_64_cosine_recall@3": 0.10211269541567973,
|
| 417 |
+
"eval_dim_64_cosine_recall@5": 0.15297976910096123,
|
| 418 |
+
"eval_dim_768_cosine_accuracy@1": 0.3994878361075544,
|
| 419 |
+
"eval_dim_768_cosine_accuracy@10": 0.4737516005121639,
|
| 420 |
+
"eval_dim_768_cosine_accuracy@3": 0.4046094750320102,
|
| 421 |
+
"eval_dim_768_cosine_accuracy@5": 0.4359795134443022,
|
| 422 |
+
"eval_dim_768_cosine_map@100": 0.48680507317454147,
|
| 423 |
+
"eval_dim_768_cosine_mrr@10": 0.41201019246793846,
|
| 424 |
+
"eval_dim_768_cosine_ndcg@10": 0.4244383191680289,
|
| 425 |
+
"eval_dim_768_cosine_precision@1": 0.3994878361075544,
|
| 426 |
+
"eval_dim_768_cosine_precision@10": 0.352752880921895,
|
| 427 |
+
"eval_dim_768_cosine_precision@3": 0.39820742637644047,
|
| 428 |
+
"eval_dim_768_cosine_precision@5": 0.3868117797695263,
|
| 429 |
+
"eval_dim_768_cosine_recall@1": 0.046132270416131195,
|
| 430 |
+
"eval_dim_768_cosine_recall@10": 0.29681183299989666,
|
| 431 |
+
"eval_dim_768_cosine_recall@3": 0.13453018491697852,
|
| 432 |
+
"eval_dim_768_cosine_recall@5": 0.20078864250336506,
|
| 433 |
+
"eval_runtime": 98.6751,
|
| 434 |
+
"eval_samples_per_second": 0.0,
|
| 435 |
+
"eval_sequential_score": 0.3275369456141822,
|
| 436 |
+
"eval_steps_per_second": 0.0,
|
| 437 |
+
"step": 52
|
| 438 |
+
}
|
| 439 |
+
],
|
| 440 |
+
"logging_steps": 10,
|
| 441 |
+
"max_steps": 240,
|
| 442 |
+
"num_input_tokens_seen": 0,
|
| 443 |
+
"num_train_epochs": 20,
|
| 444 |
+
"save_steps": 500,
|
| 445 |
+
"stateful_callbacks": {
|
| 446 |
+
"EarlyStoppingCallback": {
|
| 447 |
+
"args": {
|
| 448 |
+
"early_stopping_patience": 2,
|
| 449 |
+
"early_stopping_threshold": 0.0
|
| 450 |
+
},
|
| 451 |
+
"attributes": {
|
| 452 |
+
"early_stopping_patience_counter": 1
|
| 453 |
+
}
|
| 454 |
+
},
|
| 455 |
+
"TrainerControl": {
|
| 456 |
+
"args": {
|
| 457 |
+
"should_epoch_stop": false,
|
| 458 |
+
"should_evaluate": false,
|
| 459 |
+
"should_log": false,
|
| 460 |
+
"should_save": true,
|
| 461 |
+
"should_training_stop": false
|
| 462 |
+
},
|
| 463 |
+
"attributes": {}
|
| 464 |
+
}
|
| 465 |
+
},
|
| 466 |
+
"total_flos": 0.0,
|
| 467 |
+
"train_batch_size": 8,
|
| 468 |
+
"trial_name": null,
|
| 469 |
+
"trial_params": null
|
| 470 |
+
}
|
checkpoint-52/training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dd906d94b017c1a7fa871b608776d19ecf4218c10c253401fe78ba8ce84435be
|
| 3 |
+
size 6097
|
checkpoint-65/1_Pooling/config.json
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"word_embedding_dimension": 1024,
|
| 3 |
+
"pooling_mode_cls_token": false,
|
| 4 |
+
"pooling_mode_mean_tokens": true,
|
| 5 |
+
"pooling_mode_max_tokens": false,
|
| 6 |
+
"pooling_mode_mean_sqrt_len_tokens": false,
|
| 7 |
+
"pooling_mode_weightedmean_tokens": false,
|
| 8 |
+
"pooling_mode_lasttoken": false,
|
| 9 |
+
"include_prompt": true
|
| 10 |
+
}
|
checkpoint-65/README.md
ADDED
|
@@ -0,0 +1,1642 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
language:
|
| 3 |
+
- en
|
| 4 |
+
license: apache-2.0
|
| 5 |
+
tags:
|
| 6 |
+
- sentence-transformers
|
| 7 |
+
- sentence-similarity
|
| 8 |
+
- feature-extraction
|
| 9 |
+
- dense
|
| 10 |
+
- generated_from_trainer
|
| 11 |
+
- dataset_size:391
|
| 12 |
+
- loss:MatryoshkaLoss
|
| 13 |
+
- loss:MultipleNegativesRankingLoss
|
| 14 |
+
base_model: intfloat/multilingual-e5-large
|
| 15 |
+
widget:
|
| 16 |
+
- source_sentence: What is the responsibility of assisting and advising the data subjects
|
| 17 |
+
in exercising their rights?
|
| 18 |
+
sentences:
|
| 19 |
+
- '1.Personal data shall be: (a) processed lawfully, fairly and in a transparent
|
| 20 |
+
manner in relation to the data subject (‘lawfulness, fairness and transparency’);
|
| 21 |
+
(b) collected for specified, explicit and legitimate purposes and not further
|
| 22 |
+
processed in a manner that is incompatible with those purposes; further processing
|
| 23 |
+
for archiving purposes in the public interest, scientific or historical research
|
| 24 |
+
purposes or statistical purposes shall, in accordance with Article 89(1), not
|
| 25 |
+
be considered to be incompatible with the initial purposes (‘purpose limitation’);
|
| 26 |
+
(c) adequate, relevant and limited to what is necessary in relation to the purposes
|
| 27 |
+
for which they are processed (‘data minimisation’); (d) accurate and, where necessary,
|
| 28 |
+
kept up to date; every reasonable step must be taken to ensure that personal data
|
| 29 |
+
that are inaccurate, having regard to the purposes for which they are processed,
|
| 30 |
+
are erased or rectified without delay (‘accuracy’); 4.5.2016 L 119/35 (1) Directive
|
| 31 |
+
(EU) 2015/1535 of the European Parliament and of the Council of 9 September 2015
|
| 32 |
+
laying down a procedure for the provision of information in the field of technical
|
| 33 |
+
regulations and of rules on Information Society services (OJ L 241, 17.9.2015,
|
| 34 |
+
p. 1). (e) kept in a form which permits identification of data subjects for no
|
| 35 |
+
longer than is necessary for the purposes for which the personal data are processed;
|
| 36 |
+
personal data may be stored for longer periods insofar as the personal data will
|
| 37 |
+
be processed solely for archiving purposes in the public interest, scientific
|
| 38 |
+
or historical research purposes or statistical purposes in accordance with Article
|
| 39 |
+
89(1) subject to implementation of the appropriate technical and organisational
|
| 40 |
+
measures required by this Regulation in order to safeguard the rights and freedoms
|
| 41 |
+
of the data subject (‘storage limitation’); (f) processed in a manner that ensures
|
| 42 |
+
appropriate security of the personal data, including protection against unauthorised
|
| 43 |
+
or unlawful processing and against accidental loss, destruction or damage, using
|
| 44 |
+
appropriate technical or organisational measures (‘integrity and confidentiality’).
|
| 45 |
+
|
| 46 |
+
2.The controller shall be responsible for, and be able to demonstrate compliance
|
| 47 |
+
with, paragraph 1 (‘accountability’).'
|
| 48 |
+
- '1.A transfer of personal data to a third country or an international organisation
|
| 49 |
+
may take place where the Commission has decided that the third country, a territory
|
| 50 |
+
or one or more specified sectors within that third country, or the international
|
| 51 |
+
organisation in question ensures an adequate level of protection. Such a transfer
|
| 52 |
+
shall not require any specific authorisation.
|
| 53 |
+
|
| 54 |
+
2.When assessing the adequacy of the level of protection, the Commission shall,
|
| 55 |
+
in particular, take account of the following elements: (a) the rule of law, respect
|
| 56 |
+
for human rights and fundamental freedoms, relevant legislation, both general
|
| 57 |
+
and sectoral, including concerning public security, defence, national security
|
| 58 |
+
and criminal law and the access of public authorities to personal data, as well
|
| 59 |
+
as the implementation of such legislation, data protection rules, professional
|
| 60 |
+
rules and security measures, including rules for the onward transfer of personal
|
| 61 |
+
data to another third country or international organisation which are complied
|
| 62 |
+
with in that country or international organisation, case-law, as well as effective
|
| 63 |
+
and enforceable data subject rights and effective administrative and judicial
|
| 64 |
+
redress for the data subjects whose personal data are being transferred; (b) the
|
| 65 |
+
existence and effective functioning of one or more independent supervisory authorities
|
| 66 |
+
in the third country or to which an international organisation is subject, with
|
| 67 |
+
responsibility for ensuring and enforcing compliance with the data protection
|
| 68 |
+
rules, including adequate enforcement powers, for assisting and advising the data
|
| 69 |
+
subjects in exercising their rights and for cooperation with the supervisory authorities
|
| 70 |
+
of the Member States; and (c) the international commitments the third country
|
| 71 |
+
or international organisation concerned has entered into, or other obligations
|
| 72 |
+
arising from legally binding conventions or instruments as well as from its participation
|
| 73 |
+
in multilateral or regional systems, in particular in relation to the protection
|
| 74 |
+
of personal data.
|
| 75 |
+
|
| 76 |
+
3.The Commission, after assessing the adequacy of the level of protection, may
|
| 77 |
+
decide, by means of implementing act, that a third country, a territory or one
|
| 78 |
+
or more specified sectors within a third country, or an international organisation
|
| 79 |
+
ensures an adequate level of protection within the meaning of paragraph 2 of this
|
| 80 |
+
Article. The implementing act shall provide for a mechanism for a periodic review,
|
| 81 |
+
at least every four years, which shall take into account all relevant developments
|
| 82 |
+
in the third country or international organisation. The implementing act shall
|
| 83 |
+
specify its territorial and sectoral application and, where applicable, identify
|
| 84 |
+
the supervisory authority or authorities referred to in point (b) of paragraph
|
| 85 |
+
2 of this Article. The implementing act shall be adopted in accordance with the
|
| 86 |
+
examination procedure referred to in Article 93(2).
|
| 87 |
+
|
| 88 |
+
4.The Commission shall, on an ongoing basis, monitor developments in third countries
|
| 89 |
+
and international organisations that could affect the functioning of decisions
|
| 90 |
+
adopted pursuant to paragraph 3 of this Article and decisions adopted on the basis
|
| 91 |
+
of Article 25(6) of Directive 95/46/EC.
|
| 92 |
+
|
| 93 |
+
5.The Commission shall, where available information reveals, in particular following
|
| 94 |
+
the review referred to in paragraph 3 of this Article, that a third country, a
|
| 95 |
+
territory or one or more specified sectors within a third country, or an international
|
| 96 |
+
organisation no longer ensures an adequate level of protection within the meaning
|
| 97 |
+
of paragraph 2 of this Article, to the extent necessary, repeal, amend or suspend
|
| 98 |
+
the decision referred to in paragraph 3 of this Article by means of implementing
|
| 99 |
+
acts without retro-active effect. Those implementing acts shall be adopted in
|
| 100 |
+
accordance with the examination procedure referred to in Article 93(2). On duly
|
| 101 |
+
justified imperative grounds of urgency, the Commission shall adopt immediately
|
| 102 |
+
applicable implementing acts in accordance with the procedure referred to in Article
|
| 103 |
+
93(3).
|
| 104 |
+
|
| 105 |
+
6.The Commission shall enter into consultations with the third country or international
|
| 106 |
+
organisation with a view to remedying the situation giving rise to the decision
|
| 107 |
+
made pursuant to paragraph 5
|
| 108 |
+
|
| 109 |
+
7.A decision pursuant to paragraph 5 of this Article is without prejudice to transfers
|
| 110 |
+
of personal data to the third country, a territory or one or more specified sectors
|
| 111 |
+
within that third country, or the international organisation in question pursuant
|
| 112 |
+
to Articles 46 to 49
|
| 113 |
+
|
| 114 |
+
8.The Commission shall publish in the Official Journal of the European Union and
|
| 115 |
+
on its website a list of the third countries, territories and specified sectors
|
| 116 |
+
within a third country and international organisations for which it has decided
|
| 117 |
+
that an adequate level of protection is or is no longer ensured.
|
| 118 |
+
|
| 119 |
+
9.Decisions adopted by the Commission on the basis of Article 25(6) of Directive
|
| 120 |
+
95/46/EC shall remain in force until amended, replaced or repealed by a Commission
|
| 121 |
+
Decision adopted in accordance with paragraph 3 or 5 of this Article.'
|
| 122 |
+
- The legal systems of Denmark and Estonia do not allow for administrative fines
|
| 123 |
+
as set out in this Regulation. The rules on administrative fines may be applied
|
| 124 |
+
in such a manner that in Denmark the fine is imposed by competent national courts
|
| 125 |
+
as a criminal penalty and in Estonia the fine is imposed by the supervisory authority
|
| 126 |
+
in the framework of a misdemeanour procedure, provided that such an application
|
| 127 |
+
of the rules in those Member States has an equivalent effect to administrative
|
| 128 |
+
fines imposed by supervisory authorities. Therefore the competent national courts
|
| 129 |
+
should take into account the recommendation by the supervisory authority initiating
|
| 130 |
+
the fine. In any event, the fines imposed should be effective, proportionate and
|
| 131 |
+
dissuasive.
|
| 132 |
+
- source_sentence: Is the fine mandatory for the described offense?
|
| 133 |
+
sentences:
|
| 134 |
+
- "1.Each supervisory authority shall ensure that the imposition of administrative\
|
| 135 |
+
\ fines pursuant to this Article in respect of infringements of this Regulation\
|
| 136 |
+
\ referred to in paragraphs 4, 5 and 6 shall in each individual case be effective,\
|
| 137 |
+
\ proportionate and dissuasive.\n2.Administrative fines shall, depending on the\
|
| 138 |
+
\ circumstances of each individual case, be imposed in addition to, or instead\
|
| 139 |
+
\ of, measures referred to in points (a) to (h) and (j) of Article 58(2). When\
|
| 140 |
+
\ deciding whether to impose an administrative fine and deciding on the amount\
|
| 141 |
+
\ of the administrative fine in each individual case due regard shall be given\
|
| 142 |
+
\ to the following: (a) the nature, gravity and duration of the infringement\
|
| 143 |
+
\ taking into account the nature scope or purpose of the processing concerned\
|
| 144 |
+
\ as well as the number of data subjects affected and the level of damage suffered\
|
| 145 |
+
\ by them; (b) the intentional or negligent character of the infringement; (c)\
|
| 146 |
+
\ any action taken by the controller or processor to mitigate the damage suffered\
|
| 147 |
+
\ by data subjects; (d) the degree of responsibility of the controller or processor\
|
| 148 |
+
\ taking into account technical and organisational measures implemented by them\
|
| 149 |
+
\ pursuant to Articles 25 and 32; (e) any relevant previous infringements by\
|
| 150 |
+
\ the controller or processor; (f) the degree of cooperation with the supervisory\
|
| 151 |
+
\ authority, in order to remedy the infringement and mitigate the possible adverse\
|
| 152 |
+
\ effects of the infringement; (g) the categories of personal data affected by\
|
| 153 |
+
\ the infringement; (h) the manner in which the infringement became known to\
|
| 154 |
+
\ the supervisory authority, in particular whether, and if so to what extent,\
|
| 155 |
+
\ the controller or processor notified the infringement; (i) where measures referred\
|
| 156 |
+
\ to in Article 58(2) have previously been ordered against the controller or processor\
|
| 157 |
+
\ concerned with regard to the same subject-matter, compliance with those measures;\
|
| 158 |
+
\ (j) adherence to approved codes of conduct pursuant to Article 40 or approved\
|
| 159 |
+
\ certification mechanisms pursuant to Article 42; and (k) any other aggravating\
|
| 160 |
+
\ or mitigating factor applicable to the circumstances of the case, such as financial\
|
| 161 |
+
\ benefits gained, or losses avoided, directly or indirectly, from the infringement.\n\
|
| 162 |
+
3.If a controller or processor intentionally or negligently, for the same or linked\
|
| 163 |
+
\ processing operations, infringes several provisions of this Regulation, the\
|
| 164 |
+
\ total amount of the administrative fine shall not exceed the amount specified\
|
| 165 |
+
\ for the gravest infringement.\n4.Infringements of the following provisions shall,\
|
| 166 |
+
\ in accordance with paragraph 2, be subject to administrative fines up to 10\
|
| 167 |
+
\ 000 000 EUR, or in the case of an undertaking, up to 2 % of the total worldwide\
|
| 168 |
+
\ annual turnover of the preceding financial year, whichever is higher: (a) the\
|
| 169 |
+
\ obligations of the controller and the processor pursuant to Articles 8, 11,\
|
| 170 |
+
\ 25 to 39 and 42 and 43; (b) the obligations of the certification body pursuant\
|
| 171 |
+
\ to Articles 42 and 43; (c) the obligations of the monitoring body pursuant\
|
| 172 |
+
\ to Article 41(4). 4.5.2016 L 119/82 \n5.Infringements of the following provisions\
|
| 173 |
+
\ shall, in accordance with paragraph 2, be subject to administrative fines up\
|
| 174 |
+
\ to 20 000 000 EUR, or in the case of an undertaking, up to 4 % of the total\
|
| 175 |
+
\ worldwide annual turnover of the preceding financial year, whichever is higher:\
|
| 176 |
+
\ (a) the basic principles for processing, including conditions for consent,\
|
| 177 |
+
\ pursuant to Articles 5, 6, 7 and 9; (b) the data subjects' rights pursuant\
|
| 178 |
+
\ to Articles 12 to 22; (c) the transfers of personal data to a recipient in\
|
| 179 |
+
\ a third country or an international organisation pursuant to Articles 44 to\
|
| 180 |
+
\ 49; (d) any obligations pursuant to Member State law adopted under Chapter\
|
| 181 |
+
\ IX; (e) non-compliance with an order or a temporary or definitive limitation\
|
| 182 |
+
\ on processing or the suspension of data flows by the supervisory authority pursuant\
|
| 183 |
+
\ to Article 58(2) or failure to provide access in violation of Article 58(1).\n\
|
| 184 |
+
6.Non-compliance with an order by the supervisory authority as referred to in\
|
| 185 |
+
\ Article 58(2) shall, in accordance with paragraph 2 of this Article, be subject\
|
| 186 |
+
\ to administrative fines up to 20 000 000 EUR, or in the case of an undertaking,\
|
| 187 |
+
\ up to 4 % of the total worldwide annual turnover of the preceding financial\
|
| 188 |
+
\ year, whichever is higher.\n7.Without prejudice to the corrective powers of\
|
| 189 |
+
\ supervisory authorities pursuant to Article 58(2), each Member State may lay\
|
| 190 |
+
\ down the rules on whether and to what extent administrative fines may be imposed\
|
| 191 |
+
\ on public authorities and bodies established in that Member State.\n8.The exercise\
|
| 192 |
+
\ by the supervisory authority of its powers under this Article shall be subject\
|
| 193 |
+
\ to appropriate procedural safeguards in accordance with Union and Member State\
|
| 194 |
+
\ law, including effective judicial remedy and due process.\n9.Where the legal\
|
| 195 |
+
\ system of the Member State does not provide for administrative fines, this Article\
|
| 196 |
+
\ may be applied in such a manner that the fine is initiated by the competent\
|
| 197 |
+
\ supervisory authority and imposed by competent national courts, while ensuring\
|
| 198 |
+
\ that those legal remedies are effective and have an equivalent effect to the\
|
| 199 |
+
\ administrative fines imposed by supervisory authorities. In any event, the fines\
|
| 200 |
+
\ imposed shall be effective, proportionate and dissuasive. Those Member States\
|
| 201 |
+
\ shall notify to the Commission the provisions of their laws which they adopt\
|
| 202 |
+
\ pursuant to this paragraph by 25 May 2018 and, without delay, any subsequent\
|
| 203 |
+
\ amendment law or amendment affecting them."
|
| 204 |
+
- "Court (Civil/Criminal): Criminal \nProvisions: Article 386 of the Penal Code\
|
| 205 |
+
\ \nTime of commission of the act: \nResult (innocent, guilty): \nReasoning:\
|
| 206 |
+
\ Conviction for computer fraud committed repeatedly and professionally with a\
|
| 207 |
+
\ total benefit and damage exceeding €30,000. According to the majority opinion,\
|
| 208 |
+
\ the charge is substantiated in both its objective and subjective aspects, and\
|
| 209 |
+
\ the defendant must be declared guilty of the aforementioned criminal acts of\
|
| 210 |
+
\ fraud by means of a computer, committed repeatedly by a perpetrator acting professionally,\
|
| 211 |
+
\ where the total financial benefit and corresponding damage exceed the amount\
|
| 212 |
+
\ of €30,000, as well as for repeated embezzlement.\n\nFacts: The defendant accessed\
|
| 213 |
+
\ a website using a computer, employing, without the knowledge and consent of\
|
| 214 |
+
\ the complainants, the access codes for the electronic management system of the\
|
| 215 |
+
\ bank accounts held by the complainants at a Bank, and transferred money through\
|
| 216 |
+
\ electronically transmitted orders from the complainants' accounts to her own\
|
| 217 |
+
\ account. Specifically, during the period from June 2007 to June 2008, after\
|
| 218 |
+
\ unlawfully acquiring the aforementioned STICK containing the access codes, she\
|
| 219 |
+
\ accessed a website maintained by ..., using, without the complainants' knowledge\
|
| 220 |
+
\ (without their consent or approval), the access codes for the electronic management\
|
| 221 |
+
\ system of the bank accounts held at the aforementioned Bank, transferring through\
|
| 222 |
+
\ electronically transmitted orders to the joint account number ... of the complainants\
|
| 223 |
+
\ from bank accounts numbered ..., ..., and ..., the total amount of €55,710,\
|
| 224 |
+
\ as detailed in the orders, and subsequently, using an ATM card, she gradually\
|
| 225 |
+
\ withdrew from the aforementioned account number ..., the total amount of €55,710,\
|
| 226 |
+
\ making 84 individual withdrawals from automatic teller machines. In addition,\
|
| 227 |
+
\ the defendant, during the period from June 2008 to November 2008, in the same\
|
| 228 |
+
\ exact manner (through the electronic management system of the bank accounts),\
|
| 229 |
+
\ transferred through electronically transmitted orders to account number ...,\
|
| 230 |
+
\ which she had opened at ..., from the complainants' bank accounts numbered ...,\
|
| 231 |
+
\ ..., ..., ..., and ..., the total amount of €73,942, as detailed in the orders\
|
| 232 |
+
\ regarding the transfers of these amounts. Furthermore, during the period from\
|
| 233 |
+
\ February 2008 to November 2008, through multiple acts constituting a continuation\
|
| 234 |
+
\ of the crime, although she had received from the first complainant ... the amounts\
|
| 235 |
+
\ of €695.04, €695.04, and €845.04, in order to pay his insurance contributions\
|
| 236 |
+
\ to O.A.E.E. for the periods of January-February 2008, May-June 2008, and September-October\
|
| 237 |
+
\ 2008, as well as the amounts of €250 and €280, in order to settle credit card\
|
| 238 |
+
\ bills for \"...\", respectively, and from the second complainant ... she received\
|
| 239 |
+
\ the amounts of €283.64, €419.26, and €385.38, to pay the latter's insurance\
|
| 240 |
+
\ contributions to O.A.E.E. for the periods of July-August 2007, May-June 2008,\
|
| 241 |
+
\ September-October 2008, and November-December 2008, as well as the amount of\
|
| 242 |
+
\ €1,888.03 for the settlement of VAT, she never paid the above amounts to settle\
|
| 243 |
+
\ the aforementioned obligations, nor did she return them to the complainants,\
|
| 244 |
+
\ despite being urged to do so, but incorporated them into her assets and wrongfully\
|
| 245 |
+
\ appropriated them. The defendant denies the charges against her and claims that\
|
| 246 |
+
\ the withdrawals were made by the second complainant and that all the amounts\
|
| 247 |
+
\ transferred to her account were transferred to cover the company's expenses\
|
| 248 |
+
\ and their personal expenses, due to her cohabitation with the second complainant\
|
| 249 |
+
\ and with his knowledge, with whom she intended to marry. However, this claim\
|
| 250 |
+
\ is not supported by any evidence; on the contrary, it emerged that she conducted\
|
| 251 |
+
\ the transfers of the money and withdrawals without the complainants' knowledge,\
|
| 252 |
+
\ and when she learned that they had been informed about the account movements\
|
| 253 |
+
\ and met at the Bank, her behavior and demeanor indicated guilt, according to\
|
| 254 |
+
\ the testimony of the prosecution witness ..., an employee of the Pangrati branch\
|
| 255 |
+
\ of ..., who saw her on the same day at the aforementioned Bank when she met\
|
| 256 |
+
\ with the complainants. The ongoing act of fraud using a computer was committed\
|
| 257 |
+
\ by the defendant professionally, as evidenced by her repeated commission of\
|
| 258 |
+
\ the act, as well as the infrastructure she had established with the intent of\
|
| 259 |
+
\ repeated commission, based on a specific plan and methodology (transferring\
|
| 260 |
+
\ smaller amounts to a joint account of the complainants from the remaining accounts\
|
| 261 |
+
\ of the latter, and then withdrawing the transferred amounts with an ATM card,\
|
| 262 |
+
\ as well as directly transferring smaller amounts from the complainants' accounts\
|
| 263 |
+
\ to her personal account she had opened at the same bank), indicating her purpose\
|
| 264 |
+
\ to generate income, with the financial benefit she gained, corresponding to\
|
| 265 |
+
\ the complainants' damage, exceeding a total of €30,000."
|
| 266 |
+
- 'Any person who intentionally, through the technology of information and communication,
|
| 267 |
+
suggests an encounter between an adult and a minor under the age of fifteen, aiming
|
| 268 |
+
at the commitment of the crimes described in par. 1 and 2 of art. 339 and 348Α,
|
| 269 |
+
is sentenced to an imprisonment of at least two years and a fine of fifty to two
|
| 270 |
+
hundred thousand Euros, when the proposal is followed by further actions which
|
| 271 |
+
lead in the commitment of such crimes.
|
| 272 |
+
|
| 273 |
+
'
|
| 274 |
+
- source_sentence: Who should provide authorisation when safeguards are detailed in
|
| 275 |
+
non-legally binding administrative arrangements?
|
| 276 |
+
sentences:
|
| 277 |
+
- In the absence of an adequacy decision, the controller or processor should take
|
| 278 |
+
measures to compensate for the lack of data protection in a third country by way
|
| 279 |
+
of appropriate safeguards for the data subject. Such appropriate safeguards may
|
| 280 |
+
consist of making use of binding corporate rules, standard data protection clauses
|
| 281 |
+
adopted by the Commission, standard data protection clauses adopted by a supervisory
|
| 282 |
+
authority or contractual clauses authorised by a supervisory authority. Those
|
| 283 |
+
safeguards should ensure compliance with data protection requirements and the
|
| 284 |
+
rights of the data subjects appropriate to processing within the Union, including
|
| 285 |
+
the availability of enforceable data subject rights and of effective legal remedies,
|
| 286 |
+
including to obtain effective administrative or judicial redress and to claim
|
| 287 |
+
compensation, in the Union or in a third country. They should relate in particular
|
| 288 |
+
to compliance with the general principles relating to personal data processing,
|
| 289 |
+
the principles of data protection by design and by default. Transfers may also
|
| 290 |
+
be carried out by public authorities or bodies with public authorities or bodies
|
| 291 |
+
in third countries or with international organisations with corresponding duties
|
| 292 |
+
or functions, including on the basis of provisions to be inserted into administrative
|
| 293 |
+
arrangements, such as a memorandum of understanding, providing for enforceable
|
| 294 |
+
and effective rights for data subjects. Authorisation by the competent supervisory
|
| 295 |
+
authority should be obtained when the safeguards are provided for in administrative
|
| 296 |
+
arrangements that are not legally binding.
|
| 297 |
+
- '**Court (Civil/Criminal): Civil**
|
| 298 |
+
|
| 299 |
+
|
| 300 |
+
**Provisions:**
|
| 301 |
+
|
| 302 |
+
|
| 303 |
+
**Time of commission of the act:**
|
| 304 |
+
|
| 305 |
+
|
| 306 |
+
**Outcome (not guilty, guilty):**
|
| 307 |
+
|
| 308 |
+
|
| 309 |
+
**Rationale:**
|
| 310 |
+
|
| 311 |
+
|
| 312 |
+
**Facts:**
|
| 313 |
+
|
| 314 |
+
The plaintiff holds credit card number ............ with the defendant banking
|
| 315 |
+
corporation. Based on the application for alternative networks dated 19/7/2015
|
| 316 |
+
with number ......... submitted at a branch of the defendant, he was granted access
|
| 317 |
+
to the electronic banking service (e-banking) to conduct banking transactions
|
| 318 |
+
(debit, credit, updates, payments) remotely. On 30/11/2020, the plaintiff fell
|
| 319 |
+
victim to electronic fraud through the "phishing" method, whereby an unknown perpetrator
|
| 320 |
+
managed to withdraw a total amount of €3,121.75 from the aforementioned credit
|
| 321 |
+
card. Specifically, the plaintiff received an email at 1:35 PM on 29/11/2020 from
|
| 322 |
+
sender ...... with address ........, informing him that due to an impending system
|
| 323 |
+
change, he needed to verify the mobile phone number linked to the credit card,
|
| 324 |
+
urging him to complete the verification process within the next 24 hours by following
|
| 325 |
+
a link titled ........; otherwise, his account would be locked for security reasons.
|
| 326 |
+
The plaintiff read this email on the afternoon of 30 November 2020 and, believing
|
| 327 |
+
it was from the defendant, followed the instructions and proceeded via the provided
|
| 328 |
+
link to a website that was identical (a clone) to that of the defendant. On this
|
| 329 |
+
page, he was asked to enter the six-digit security code (.........) that had just
|
| 330 |
+
been sent to his mobile phone by the defendant at 3:41 PM, with the note that
|
| 331 |
+
it was an activation code for his ........ card at ........., which he entered.
|
| 332 |
+
|
| 333 |
+
|
| 334 |
+
Subsequently, the plaintiff received, according to his statements, a new email
|
| 335 |
+
(not submitted), which requested him to enter the details of the aforementioned
|
| 336 |
+
credit card, specifically the name of the cardholder and the card number, not
|
| 337 |
+
the PIN, which he also entered, convinced that he was within the online environment
|
| 338 |
+
of the defendant. Then, at 3:47 PM, he received a message on his mobile phone
|
| 339 |
+
from the defendant containing the exact same content as the one he received at
|
| 340 |
+
3:41 PM, while at 3:50 PM he received a message stating that the activation of
|
| 341 |
+
his ......... card at ....... had been completed. Once the plaintiff read this,
|
| 342 |
+
he became concerned that something was not right, and immediately called (at 4:41
|
| 343 |
+
PM) the defendant''s call center to inform them. There, the employees, with whom
|
| 344 |
+
he finally connected at 5:04 PM due to high call center volume, advised him to
|
| 345 |
+
delete the relevant emails, cancel his credit card, change his access passwords
|
| 346 |
+
for the service, and submit a dispute request regarding the conducted transactions.
|
| 347 |
+
The plaintiff electronically sent this request to the defendant, disputing the
|
| 348 |
+
detailed transactions amounting to €3,121.75, which were conducted on 30/11/2020
|
| 349 |
+
during the time frame of 16:37:45-16:43:34 PM, arguing that he had neither performed
|
| 350 |
+
them himself nor authorized anyone else to do so. The plaintiff specifically disputed
|
| 351 |
+
the following transactions, as evidenced by the account activity of the disputed
|
| 352 |
+
credit card during the aforementioned timeframe: a) transaction number .........
|
| 353 |
+
amounting to €150.62 conducted on 30/11/2020 at 4:43:34 PM, b) transaction number
|
| 354 |
+
........ amounting to €293.20 conducted on 30/11/2020 at 4:42:40 PM, c) transaction
|
| 355 |
+
number ............ amounting to €295.21 conducted on 30/11/2020 at 4:42:10 PM,
|
| 356 |
+
d) transaction number .......... amounting to €299.22 conducted on 30/11/2020
|
| 357 |
+
at 4:41:31 PM, e) transaction number ........ amounting to €297.21 conducted on
|
| 358 |
+
30/11/2020 at 4:41:01 PM, f) transaction number ........ amounting to €299.22
|
| 359 |
+
conducted on 30/11/2020 at 4:40:27 PM, g) transaction number ....... amounting
|
| 360 |
+
to €299.22 conducted on 30/11/2020 at 4:39:55 PM, h) transaction number ......
|
| 361 |
+
amounting to €299.22 conducted on 30/11/2020 at 4:39:22 PM, i) transaction number
|
| 362 |
+
......... amounting to €297.22 conducted on 30/11/2020 at 4:38:52 PM, j) transaction
|
| 363 |
+
number ......... amounting to €295.21 conducted on 30/11/2020 at 4:38:17 PM, and
|
| 364 |
+
k) transaction number ......... amounting to €296.21 conducted on 30/11/2020 at
|
| 365 |
+
4:37:45 PM. In its response letter dated 21/12/2020, the defendant denied responsibility
|
| 366 |
+
for the costs of the aforementioned transactions, placing the entire blame on
|
| 367 |
+
the plaintiff for the leak of his card details and security code to the fraudulent
|
| 368 |
+
page. The plaintiff, completely denying any fault for the conducted transactions,
|
| 369 |
+
repeatedly contacted the defendant, both by phone and via email (see emails dated
|
| 370 |
+
15/1/2021 and 11/2/2021), while on 2/3/2021, he electronically sent a report dated
|
| 371 |
+
1/03/2021 to the Consumer Advocate’s email address, recounting the events and
|
| 372 |
+
requesting that the aforementioned Independent Authority intervene to have the
|
| 373 |
+
disputed debt canceled. In its letter with reference number ...../27.04.2021,
|
| 374 |
+
the aforementioned Independent Authority informed the plaintiff that the case
|
| 375 |
+
was outside its mediating role and was therefore archived. Subsequently, the plaintiff
|
| 376 |
+
sent the defendant on 5/3/2021 his extrajudicial statement dated 4/3/2021, calling
|
| 377 |
+
upon it to fully cancel the debt of €3,121.75 that had been unjustly incurred
|
| 378 |
+
against him within two days and to immediately instruct the representatives of
|
| 379 |
+
the collection agency working with it to cease contacting him regarding the disputed
|
| 380 |
+
case. The defendant sent the plaintiff a message on his mobile phone on 20/04/2021
|
| 381 |
+
informing him that his case was still being processed due to lengthy operational
|
| 382 |
+
requirements, while on 23/04/2021, via email, it informed him that considering
|
| 383 |
+
their good cooperation and his efforts to keep them updated, it had reviewed his
|
| 384 |
+
case and decided to refund him the amounts of the transactions that were conducted
|
| 385 |
+
after his contact with their representatives on 30/11/2020 at 4:41 PM, totaling
|
| 386 |
+
€1,038.25, specifically the following: a) transaction of €150.62 conducted on
|
| 387 |
+
30/11/2020 at 4:43 PM, b) transaction of €295.21 conducted on 30/11/2020 at 4:42
|
| 388 |
+
PM, c) transaction of €293.20 conducted on 30/11/2020 at 4:42 PM, and d) transaction
|
| 389 |
+
of €299.22 conducted on 30/11/2020 at 4:41 PM. Beyond this, the defendant refused
|
| 390 |
+
to refund the plaintiff the amount of the remaining transactions conducted on
|
| 391 |
+
30/11/2020, totaling €2,376.08 (and not €2,376.48 as incorrectly stated by the
|
| 392 |
+
plaintiff in his lawsuit), which the plaintiff ultimately fully paid, transferring
|
| 393 |
+
€2,342.77 to the defendant on 7/06/2021 and €33.31 on 15/06/2021 (see related
|
| 394 |
+
deposit receipts).'
|
| 395 |
+
- "Court (Civil/Criminal): Civil \nProvisions: \nTime of commission: July 21,\
|
| 396 |
+
\ 2020 \nOutcome (innocent, guilty): Partially accepts the lawsuit against the\
|
| 397 |
+
\ Bank. \nReasoning: Alongside the bank's responsibility for the ineffective\
|
| 398 |
+
\ protection of its systems against the continually changing and evolving methods\
|
| 399 |
+
\ of deception that affect them, leading to financial damage for its clients who\
|
| 400 |
+
\ entrusted it, which constitutes a breach of its contractual obligations and\
|
| 401 |
+
\ generates contractual liability, there is also the personal responsibility of\
|
| 402 |
+
\ the plaintiff, who did not safeguard, as required, his sensitive banking information\
|
| 403 |
+
\ and disclosed it when he should not have, even though the message that misled\
|
| 404 |
+
\ him came from the context of an SMS conversation with the defendant, even if\
|
| 405 |
+
\ he was directed through the link to a website resembling that of the defendant,\
|
| 406 |
+
\ because he overlooked the relevant instructions and strict recommendations of\
|
| 407 |
+
\ the bank, violating his duty to safeguard them. Therefore, in light of the above,\
|
| 408 |
+
\ the court must partially accept the lawsuit regarding its substance, and with\
|
| 409 |
+
\ the defendant's objection regarding the plaintiff's fault being accepted at\
|
| 410 |
+
\ a rate of 1/6 of the damage suffered, it must be acknowledged – following the\
|
| 411 |
+
\ admissible and lawful modification of the lawsuit's request from a dismissive\
|
| 412 |
+
\ to a declaratory nature as proposed – the defendant's obligation to pay him\
|
| 413 |
+
\ the amount of €2,500, with legal interest, as specified in the operative part.\
|
| 414 |
+
\ Regarding the request to recognize the defendant's obligation to pay him €1,000\
|
| 415 |
+
\ as compensation for the moral damage he suffered from the fraud committed against\
|
| 416 |
+
\ him, this is deemed dismissible as unfounded, because the defendant's liability\
|
| 417 |
+
\ is contractual and not tortious, and there are no special conditions justifying\
|
| 418 |
+
\ the treatment of this specific non-contractual behavior as tortious, making\
|
| 419 |
+
\ it possible to attribute moral damage to the plaintiff from the defendant. \
|
| 420 |
+
\ \nFacts: The plaintiff maintained a joint bank account with his wife and had\
|
| 421 |
+
\ access to the defendant bank's e-banking. On July 21, 2020, following successful\
|
| 422 |
+
\ identification via the agreed-upon credentials (userID, password, OTP), a request\
|
| 423 |
+
\ was made to change the mobile phone number for receiving OTPs, which was completed\
|
| 424 |
+
\ through the bank's platform. However, this change was not made by the plaintiff\
|
| 425 |
+
\ himself, but by a third party who had previously deceived him using the phishing\
|
| 426 |
+
\ method, obtaining his banking details through a misleading SMS. Following the\
|
| 427 |
+
\ phone number change, on July 31, 2020, a transfer of €3,000 was made to a third\
|
| 428 |
+
\ party's account. The transaction was conducted using the necessary credentials\
|
| 429 |
+
\ and OTP sent to the new mobile phone, resulting in the bank considering the\
|
| 430 |
+
\ order valid and executing it. Once the plaintiff realized the transfer, he immediately\
|
| 431 |
+
\ contacted the bank and informed them that he had not given such an order himself.\
|
| 432 |
+
\ Despite the initial assurance that the funds could be recovered, they were ultimately\
|
| 433 |
+
\ not returned, as they had been transferred to a third party's account, and the\
|
| 434 |
+
\ bank denied any responsibility for the loss."
|
| 435 |
+
- source_sentence: When will the periodic review mechanism be conducted?
|
| 436 |
+
sentences:
|
| 437 |
+
- The Commission should monitor the functioning of decisions on the level of protection
|
| 438 |
+
in a third country, a territory or specified sector within a third country, or
|
| 439 |
+
an international organisation, and monitor the functioning of decisions adopted
|
| 440 |
+
on the basis of Article 25(6) or Article 26(4) of Directive 95/46/EC. In its adequacy
|
| 441 |
+
decisions, the Commission should provide for a periodic review mechanism of their
|
| 442 |
+
functioning. That periodic review should be conducted in consultation with the
|
| 443 |
+
third country or international organisation in question and take into account
|
| 444 |
+
all relevant developments in the third country or international organisation.
|
| 445 |
+
For the purposes of monitoring and of carrying out the periodic reviews, the Commission
|
| 446 |
+
should take into consideration the views and findings of the European Parliament
|
| 447 |
+
and of the Council as well as of other relevant bodies and sources. The Commission
|
| 448 |
+
should evaluate, within a reasonable time, the functioning of the latter decisions
|
| 449 |
+
and report any relevant findings to the Committee within the meaning of Regulation
|
| 450 |
+
(EU) No 182/2011 of the European Parliament and of the Council (1) as established
|
| 451 |
+
under this Regulation, to the European Parliament and to the Council.
|
| 452 |
+
- "**Court (Civil/Criminal): Civil** \n**Provisions:** \n**Time of commission\
|
| 453 |
+
\ of the act:** \n**Outcome (not guilty, guilty):** \n**Reasoning:** Partially\
|
| 454 |
+
\ accepts the lawsuit. \n**Facts:** The plaintiff, who works as a lawyer, maintains\
|
| 455 |
+
\ a savings account with the defendant banking corporation under account number\
|
| 456 |
+
\ GR.............. Pursuant to a contract dated June 11, 2010, established in\
|
| 457 |
+
\ Thessaloniki between the defendant and the plaintiff, the plaintiff was granted\
|
| 458 |
+
\ access to the electronic banking system (e-banking) to conduct banking transactions\
|
| 459 |
+
\ remotely. On October 10, 2020, the plaintiff fell victim to electronic fraud\
|
| 460 |
+
\ through the \"phishing\" method, whereby an unknown perpetrator managed to extract\
|
| 461 |
+
\ and transfer €3,000.00 from the plaintiff’s account to another account of the\
|
| 462 |
+
\ same bank. Specifically, on that day at 6:51 a.m., the plaintiff received an\
|
| 463 |
+
\ email from the sender \".........\", with the address ..........., informing\
|
| 464 |
+
\ him that his debit card had been suspended and that online payments and cash\
|
| 465 |
+
\ withdrawals could not be made until the issue was resolved. The email urged\
|
| 466 |
+
\ him to confirm his details within the next 72 hours by following a link titled\
|
| 467 |
+
\ \"card activation.\" \nThe plaintiff read the above email on his mobile phone\
|
| 468 |
+
\ around 8:00 a.m., and believing it came from the defendant, he followed the\
|
| 469 |
+
\ instructions and accessed a website that was identical (a clone) to that of\
|
| 470 |
+
\ the defendant. On this page, he was asked to enter his login credentials to\
|
| 471 |
+
\ connect to the service, which he did, and he was subsequently asked to input\
|
| 472 |
+
\ his debit card details for the alleged activation, which he also provided. Then,\
|
| 473 |
+
\ to complete the process, a number was sent to his mobile phone at 8:07 a.m.\
|
| 474 |
+
\ from the sender ........, which he entered, and two minutes later he received\
|
| 475 |
+
\ a message from the same sender in English stating that the quick access code\
|
| 476 |
+
\ had been activated on his mobile. A few minutes later, at 8:18 a.m., he received\
|
| 477 |
+
\ an email from the defendant informing him of the transfer of €3,000.00 from\
|
| 478 |
+
\ his account to account number GR ........... held at the same bank, with the\
|
| 479 |
+
\ beneficiary's details being .......... As soon as the plaintiff read this, he\
|
| 480 |
+
\ immediately called the defendant's call center and canceled his debit card,\
|
| 481 |
+
\ the access codes for the service ......., and locked the application ..........\
|
| 482 |
+
\ At the same time, he verbally submitted a request to dispute and cancel the\
|
| 483 |
+
\ contested transaction, and in a subsequent phone call, he also canceled his\
|
| 484 |
+
\ credit card. On the same day, he also sent an email to the defendant informing\
|
| 485 |
+
\ them in writing of the above and requesting the cancellation of the transaction\
|
| 486 |
+
\ and the return of the amount of €3,000.00 to his account, as this transfer was\
|
| 487 |
+
\ not made by him but by an unknown perpetrator through electronic fraud and was\
|
| 488 |
+
\ not approved by him. It should also be noted that the plaintiff, as the sole\
|
| 489 |
+
\ beneficiary according to the aforementioned contract for using the defendant's\
|
| 490 |
+
\ Internet Banking service, never received any update via SMS or the VIBER application\
|
| 491 |
+
\ from the bank regarding the transaction details before its completion, nor did\
|
| 492 |
+
\ he receive a one-time code (OTP) to approve the contested transaction. He subsequently\
|
| 493 |
+
\ filed a complaint against unknown persons at the Cyber Crime Division for the\
|
| 494 |
+
\ crime of fraud. The defendant sent an email to the plaintiff on October 16,\
|
| 495 |
+
\ 2020, informing him that his request had been forwarded to the appropriate department\
|
| 496 |
+
\ of the bank for investigation, stating that the bank would never send him an\
|
| 497 |
+
\ email or SMS asking him to enter his personal data and that as of October 7,\
|
| 498 |
+
\ 2020, there was a notice posted for its customers regarding malicious attempts\
|
| 499 |
+
\ to steal personal data in the \"Our News\" section on ....... A month after\
|
| 500 |
+
\ the disputed incident, on November 10, 2020, an amount of €2,296.82 was transferred\
|
| 501 |
+
\ to the plaintiff's account from the account to which the fraudulent credit had\
|
| 502 |
+
\ been made. The plaintiff immediately sent an email to the defendant asking to\
|
| 503 |
+
\ be informed whether this transfer was a return of part of the amount that had\
|
| 504 |
+
\ been illegally withdrawn from his account and requested the return of the remaining\
|
| 505 |
+
\ amount of €703.18. In its response dated January 13, 2021, the defendant confirmed\
|
| 506 |
+
\ that the aforementioned amount indeed came from the account to which the fraudulent\
|
| 507 |
+
\ credit had been made, following a freeze of that account initiated by the defendant\
|
| 508 |
+
\ during the investigation of the incident, but refused to return the remaining\
|
| 509 |
+
\ amount, claiming it bore no responsibility for the leak of the personal codes\
|
| 510 |
+
\ to third parties, according to the terms of the service contract established\
|
| 511 |
+
\ between them. \nFrom the entirety of the evidence presented to the court, there\
|
| 512 |
+
\ is no indication of the authenticity of the contested transaction, as the plaintiff\
|
| 513 |
+
\ did not give his consent for the execution of the transfer of the amount of\
|
| 514 |
+
\ €3,000.00, especially in light of the provision in Article 72 paragraph 2 of\
|
| 515 |
+
\ Law 4537/2018 stating that the mere use of the Internet Banking service by the\
|
| 516 |
+
\ plaintiff does not necessarily constitute sufficient evidence that the payer\
|
| 517 |
+
\ approved the payment action. Specifically, it was proven that the contested\
|
| 518 |
+
\ transaction was not carried out following a strong identification of the plaintiff\
|
| 519 |
+
\ – the sole beneficiary of the account – and his approval, as the latter may\
|
| 520 |
+
\ have entered his personal codes on the counterfeit website; however, he was\
|
| 521 |
+
\ never informed, before the completion of the contested transaction, of the amount\
|
| 522 |
+
\ that would be transferred from his account to a third-party account, nor did\
|
| 523 |
+
\ he receive on his mobile phone, either via SMS or through the VIBER application\
|
| 524 |
+
\ or any other means, the one-time code - extra PIN for its completion, which\
|
| 525 |
+
\ he was required to enter to approve the contested transaction (payment action)\
|
| 526 |
+
\ and thus complete his identification, a fact that was not countered by any evidence\
|
| 527 |
+
\ from the defendant. Furthermore, it is noted that the defendant's claims that\
|
| 528 |
+
\ it bears no responsibility under the terms of the banking services contract,\
|
| 529 |
+
\ whereby it is not liable for any damage to its customer in cases of unauthorized\
|
| 530 |
+
\ use of their personal access codes to the Internet Banking service, are to be\
|
| 531 |
+
\ rejected as fundamentally unfounded. This is because the aforementioned contractual\
|
| 532 |
+
\ terms are invalid according to the provision of Article 103 of Law 4537/2018,\
|
| 533 |
+
\ as they contradict the provisions of Articles 71, 73, and 92 of the same Law,\
|
| 534 |
+
\ which provide for the provider's universal liability and its exemption only\
|
| 535 |
+
\ for unusual and unforeseen circumstances that are beyond the control of the\
|
| 536 |
+
\ party invoking them and whose consequences could not have been avoided despite\
|
| 537 |
+
\ all efforts to the contrary; these provisions establish mandatory law in favor\
|
| 538 |
+
\ of users, as according to Article 103 of Law 4537/2018, payment service providers\
|
| 539 |
+
\ are prohibited from deviating from the provisions to the detriment of payment\
|
| 540 |
+
\ service users, unless the possibility of deviation is explicitly provided and\
|
| 541 |
+
\ they can decide to offer only more favorable terms to payment service users;\
|
| 542 |
+
\ the aforementioned contractual terms do not constitute more favorable terms\
|
| 543 |
+
\ but rather disadvantageous terms for the payment service user. In this case,\
|
| 544 |
+
\ however, the defendant did not prove the authenticity of the transaction and\
|
| 545 |
+
\ its approval by the plaintiff and did not invoke, nor did any unusual and unforeseen\
|
| 546 |
+
\ circumstances beyond its control, the consequences of which could not have been\
|
| 547 |
+
\ avoided despite all efforts to the contrary, come to light. Therefore, the contested\
|
| 548 |
+
\ transaction transferring the amount of €3,000.00 is considered, in the absence\
|
| 549 |
+
\ of demonstrable consent from the plaintiff, unapproved according to the provisions\
|
| 550 |
+
\ of Article 64 of Law 4537/2018, and the defendant's contrary claims are rejected,\
|
| 551 |
+
\ especially since the plaintiff proceeded, according to Article 71 paragraph\
|
| 552 |
+
\ 1 of Law 4537/2018, without undue delay to notify the defendant regarding the\
|
| 553 |
+
\ contested unapproved payment action. Consequently, the defendant is liable for\
|
| 554 |
+
\ compensating the plaintiff for the positive damage he suffered under Article\
|
| 555 |
+
\ 73 of Law 4537/2018 and is obliged to pay him the requested amount of €703.18,\
|
| 556 |
+
\ while the plaintiff’s fault in the occurrence of this damage cannot be established,\
|
| 557 |
+
\ as he entered his personal details in an online environment that was a faithful\
|
| 558 |
+
\ imitation of that of the defendant, as evidenced by the comparison of the screenshots\
|
| 559 |
+
\ of the fake website and the real website provided by the plaintiff, a fact that\
|
| 560 |
+
\ he could not have known while being fully convinced that he was transacting\
|
| 561 |
+
\ with the defendant. Furthermore, the defendant’s liability to compensate the\
|
| 562 |
+
\ plaintiff is based on the provision of Article 8 of Law 2251/1994, which applies\
|
| 563 |
+
\ in this case, as the plaintiff's damage resulted from inadequate fulfillment\
|
| 564 |
+
\ of its obligations in the context of providing its services, but also on the\
|
| 565 |
+
\ provision of Article 914 of the Civil Code in the sense of omission on its part\
|
| 566 |
+
\ of unlawfully and culpably imposed actions. In this case, given that during\
|
| 567 |
+
\ the relevant period there had been a multitude of similar incidents of fraud\
|
| 568 |
+
\ against the defendant's customers, the latter, as a service provider to the\
|
| 569 |
+
\ consumer public and bearing transactional obligations of care and security towards\
|
| 570 |
+
\ them, displayed gross negligence regarding the security provided for electronic\
|
| 571 |
+
\ transaction services, which was compromised by the fraudulent theft of funds,\
|
| 572 |
+
\ as it did not comply with all required high-security measures for executing\
|
| 573 |
+
\ the contested transaction, failing to implement the strict customer identification\
|
| 574 |
+
\ verification process and to check the authenticity of the account to which the\
|
| 575 |
+
\ funds were sent, thus not assuming the suspicious nature of the transaction,\
|
| 576 |
+
\ did not adopt comprehensive and improved protective measures to fully protect\
|
| 577 |
+
\ its customers against malicious attacks and online fraud and to prevent the\
|
| 578 |
+
\ infiltration of unauthorized third parties, nor did it fulfill its obligations\
|
| 579 |
+
\ to inform, accurately inform, and warn its consumers - customers, as it failed\
|
| 580 |
+
\ to adequately inform them of attempts to steal their personal data through the\
|
| 581 |
+
\ sending of informative emails or SMS, while merely posting in a section rather\
|
| 582 |
+
\ than on a central banner (as it later did) does not constitute adequate information\
|
| 583 |
+
\ such that it meets the requirement of protecting its customers and the increased\
|
| 584 |
+
\ safeguarding of their interests. Although the plaintiff acted promptly and informed\
|
| 585 |
+
\ the defendant on the same day about the contested incident, the defendant did\
|
| 586 |
+
\ not act as promptly regarding the investigation of the incident and the freezing\
|
| 587 |
+
\ of the account that held the fraudulent credit to prevent the plaintiff's loss,\
|
| 588 |
+
\ but only returned part of the funds to the plaintiff a month later. This behavior,\
|
| 589 |
+
\ beyond being culpable due to gross negligence, was also unlawful, as it would\
|
| 590 |
+
\ have been illegal even without the contractual relationship, as contrary to\
|
| 591 |
+
\ the provisions of Law 4537/2018 and Law 2251/1994, regarding the lack of security\
|
| 592 |
+
\ of the services that the consumer is legitimately entitled to expect, as well\
|
| 593 |
+
\ as the building of trust that is essential in banking transactions, elements\
|
| 594 |
+
\ that it was obligated to provide within the sphere of the services offered,\
|
| 595 |
+
\ and contrary to the principles of good faith and commercial ethics, as crystallized\
|
| 596 |
+
\ in the provision of Article 288 of the Civil Code, as well as the general duty\
|
| 597 |
+
\ imposed by Article 914 of the Civil Code not to cause harm to another culpably.\
|
| 598 |
+
\ This resulted not only in positive damage to the plaintiff but also in causing\
|
| 599 |
+
\ him moral harm consisting of his mental distress and the disruption, agitation,\
|
| 600 |
+
\ and sorrow he experienced, for which he must be awarded financial compensation.\
|
| 601 |
+
\ Taking into account all the general circumstances of the case, the extent of\
|
| 602 |
+
\ the plaintiff's damage, the severity of the defendant's fault, the mental distress\
|
| 603 |
+
\ suffered by the plaintiff, the insecurity he felt regarding his deposits, the\
|
| 604 |
+
\ sorrow he experienced, and the stress caused by his financial loss, which occurred\
|
| 605 |
+
\ during the pandemic period when his earnings from his professional activity\
|
| 606 |
+
\ had significantly decreased, as well as the financial and social situation of\
|
| 607 |
+
\ the parties, it is the court's opinion that he should be granted, as financial\
|
| 608 |
+
\ compensation for his moral harm, an amount of €250.00, which is deemed reasonable\
|
| 609 |
+
\ and fair. Therefore, the total monetary amount that the plaintiff is entitled\
|
| 610 |
+
\ to for his positive damage and financial compensation for the moral harm suffered\
|
| 611 |
+
\ amounts to a total of (€703.18 + €250.00) = €953.18."
|
| 612 |
+
- 'Failure to notify the Authority of file establishment or permit changes is punished
|
| 613 |
+
by up to three years’ imprisonment and a fine of one to five million Drachmas.
|
| 614 |
+
|
| 615 |
+
Maintaining a file without a permit or violating permit terms is punished by at
|
| 616 |
+
least one year’s imprisonment and a fine of one to five million Drachmas.
|
| 617 |
+
|
| 618 |
+
Unauthorized file interconnection or without permit is punished by up to three
|
| 619 |
+
years’ imprisonment and a fine of one to five million Drachmas.
|
| 620 |
+
|
| 621 |
+
Unlawful interference with personal data is punished by imprisonment and a fine;
|
| 622 |
+
for sensitive data, at least one year’s imprisonment and a fine of one to ten
|
| 623 |
+
million Drachmas.
|
| 624 |
+
|
| 625 |
+
Controllers who fail to comply with Authority decisions or violate data transfer
|
| 626 |
+
rules face at least two years’ imprisonment and a fine of one to five million
|
| 627 |
+
Drachmas.
|
| 628 |
+
|
| 629 |
+
If acts were committed for unlawful benefit or to cause harm, punishment is up
|
| 630 |
+
to ten years’ imprisonment and a fine of two to ten million Drachmas.
|
| 631 |
+
|
| 632 |
+
If acts jeopardize democratic governance or national security, punishment is confinement
|
| 633 |
+
in a penitentiary and a fine of five to ten million Drachmas.
|
| 634 |
+
|
| 635 |
+
Acts committed due to negligence result in at least three months’ imprisonment
|
| 636 |
+
and a fine.
|
| 637 |
+
|
| 638 |
+
If the Controller is not a natural person, the responsible party is the representative
|
| 639 |
+
or head of the organization with administrative or managerial duties.
|
| 640 |
+
|
| 641 |
+
Authorized members of the Authority may carry out preliminary investigations even
|
| 642 |
+
without a Prosecutor’s order for certain offenses.
|
| 643 |
+
|
| 644 |
+
The Authority''s President must notify the Public Prosecutor of any offenses under
|
| 645 |
+
investigation, forwarding all relevant evidence.
|
| 646 |
+
|
| 647 |
+
Preliminary investigations must conclude within two months of charges, and trial
|
| 648 |
+
must begin within three months of completion.
|
| 649 |
+
|
| 650 |
+
Continuation of proceedings is allowed only once and for extremely important reasons,
|
| 651 |
+
with adjournment not exceeding two months.
|
| 652 |
+
|
| 653 |
+
Felonies under this law fall under the jurisdiction of the Court of Appeal.
|
| 654 |
+
|
| 655 |
+
'
|
| 656 |
+
- source_sentence: Who must facilitate the exercise of data subject rights?
|
| 657 |
+
sentences:
|
| 658 |
+
- '1.Processing of personal data revealing racial or ethnic origin, political opinions,
|
| 659 |
+
religious or philosophical beliefs, or trade union membership, and the processing
|
| 660 |
+
of genetic data, biometric data for the purpose of uniquely identifying a natural
|
| 661 |
+
person, data concerning health or data concerning a natural person''s sex life
|
| 662 |
+
or sexual orientation shall be prohibited.
|
| 663 |
+
|
| 664 |
+
2.Paragraph 1 shall not apply if one of the following applies: (a) the data subject
|
| 665 |
+
has given explicit consent to the processing of those personal data for one or
|
| 666 |
+
more specified purposes, except where Union or Member State law provide that the
|
| 667 |
+
prohibition referred to in paragraph 1 may not be lifted by the data subject;
|
| 668 |
+
(b) processing is necessary for the purposes of carrying out the obligations
|
| 669 |
+
and exercising specific rights of the controller or of the data subject in the
|
| 670 |
+
field of employment and social security and social protection law in so far as
|
| 671 |
+
it is authorised by Union or Member State law or a collective agreement pursuant
|
| 672 |
+
to Member State law providing for appropriate safeguards for the fundamental rights
|
| 673 |
+
and the interests of the data subject; (c) processing is necessary to protect
|
| 674 |
+
the vital interests of the data subject or of another natural person where the
|
| 675 |
+
data subject is physically or legally incapable of giving consent; (d) processing
|
| 676 |
+
is carried out in the course of its legitimate activities with appropriate safeguards
|
| 677 |
+
by a foundation, association or any other not-for-profit body with a political,
|
| 678 |
+
philosophical, religious or trade union aim and on condition that the processing
|
| 679 |
+
relates solely to the members or to former members of the body or to persons who
|
| 680 |
+
have regular contact with it in connection with its purposes and that the personal
|
| 681 |
+
data are not disclosed outside that body without the consent of the data subjects;
|
| 682 |
+
(e) processing relates to personal data which are manifestly made public by the
|
| 683 |
+
data subject; (f) processing is necessary for the establishment, exercise or
|
| 684 |
+
defence of legal claims or whenever courts are acting in their judicial capacity;
|
| 685 |
+
(g) processing is necessary for reasons of substantial public interest, on the
|
| 686 |
+
basis of Union or Member State law which shall be proportionate to the aim pursued,
|
| 687 |
+
respect the essence of the right to data protection and provide for suitable and
|
| 688 |
+
specific measures to safeguard the fundamental rights and the interests of the
|
| 689 |
+
data subject; (h) processing is necessary for the purposes of preventive or occupational
|
| 690 |
+
medicine, for the assessment of the working capacity of the employee, medical
|
| 691 |
+
diagnosis, the provision of health or social care or treatment or the management
|
| 692 |
+
of health or social care systems and services on the basis of Union or Member
|
| 693 |
+
State law or pursuant to contract with a health professional and subject to the
|
| 694 |
+
conditions and safeguards referred to in paragraph 3; (i) processing is necessary
|
| 695 |
+
for reasons of public interest in the area of public health, such as protecting
|
| 696 |
+
against serious cross-border threats to health or ensuring high standards of quality
|
| 697 |
+
and safety of health care and of medicinal products or medical devices, on the
|
| 698 |
+
basis of Union or Member State law which provides for suitable and specific measures
|
| 699 |
+
to safeguard the rights and freedoms of the data subject, in particular professional
|
| 700 |
+
secrecy; (j) processing is necessary for archiving purposes
|
| 701 |
+
in the public interest, scientific or historical research purposes or statistical
|
| 702 |
+
purposes in accordance with Article 89(1) based on Union or Member State law which
|
| 703 |
+
shall be proportionate to the aim pursued, respect the essence of the right to
|
| 704 |
+
data protection and provide for suitable and specific measures to safeguard the
|
| 705 |
+
fundamental rights and the interests of the data subject.
|
| 706 |
+
|
| 707 |
+
3.Personal data referred to in paragraph 1 may be processed for the purposes referred
|
| 708 |
+
to in point (h) of paragraph 2 when those data are processed by or under the responsibility
|
| 709 |
+
of a professional subject to the obligation of professional secrecy under Union
|
| 710 |
+
or Member State law or rules established by national competent bodies or by another
|
| 711 |
+
person also subject to an obligation of secrecy under Union or Member State law
|
| 712 |
+
or rules established by national competent bodies.
|
| 713 |
+
|
| 714 |
+
4.Member States may maintain or introduce further conditions, including limitations,
|
| 715 |
+
with regard to the processing of genetic data, biometric data or data concerning
|
| 716 |
+
health.'
|
| 717 |
+
- Regulation (EC) No 45/2001 of the European Parliament and of the Council (2) applies
|
| 718 |
+
to the processing of personal data by the Union institutions, bodies, offices
|
| 719 |
+
and agencies. Regulation (EC) No 45/2001 and other Union legal acts applicable
|
| 720 |
+
to such processing of personal data should be adapted to the principles and rules
|
| 721 |
+
established in this Regulation and applied in the light of this Regulation. In
|
| 722 |
+
order to provide a strong and coherent data protection framework in the Union,
|
| 723 |
+
the necessary adaptations of Regulation (EC) No 45/2001 should follow after the
|
| 724 |
+
adoption of this Regulation, in order to allow application at the same time as
|
| 725 |
+
this Regulation.
|
| 726 |
+
- "1.The controller shall take appropriate measures to provide any information referred\
|
| 727 |
+
\ to in Articles 13 and 14 and any communication under Articles 15 to 22 and 34\
|
| 728 |
+
\ relating to processing to the data subject in a concise, transparent, intelligible\
|
| 729 |
+
\ and easily accessible form, using clear and plain language, in particular for\
|
| 730 |
+
\ any information addressed specifically to a child. The information shall be\
|
| 731 |
+
\ provided in writing, or by other means, including, where appropriate, by electronic\
|
| 732 |
+
\ means. When requested by the data subject, the information may be provided orally,\
|
| 733 |
+
\ provided that the identity of the data subject is proven by other means. 4.5.2016\
|
| 734 |
+
\ L 119/39 \n2.The controller shall facilitate the exercise of data subject rights\
|
| 735 |
+
\ under Articles 15 to 22. In the cases referred to in Article 11(2), the controller\
|
| 736 |
+
\ shall not refuse to act on the request of the data subject for exercising his\
|
| 737 |
+
\ or her rights under Articles 15 to 22, unless the controller demonstrates that\
|
| 738 |
+
\ it is not in a position to identify the data subject.\n3.The controller shall\
|
| 739 |
+
\ provide information on action taken on a request under Articles 15 to 22 to\
|
| 740 |
+
\ the data subject without undue delay and in any event within one month of receipt\
|
| 741 |
+
\ of the request. That period may be extended by two further months where necessary,\
|
| 742 |
+
\ taking into account the complexity and number of the requests. The controller\
|
| 743 |
+
\ shall inform the data subject of any such extension within one month of receipt\
|
| 744 |
+
\ of the request, together with the reasons for the delay. Where the data subject\
|
| 745 |
+
\ makes the request by electronic form means, the information shall be provided\
|
| 746 |
+
\ by electronic means where possible, unless otherwise requested by the data subject.\n\
|
| 747 |
+
4.If the controller does not take action on the request of the data subject, the\
|
| 748 |
+
\ controller shall inform the data subject without delay and at the latest within\
|
| 749 |
+
\ one month of receipt of the request of the reasons for not taking action and\
|
| 750 |
+
\ on the possibility of lodging a complaint with a supervisory authority and seeking\
|
| 751 |
+
\ a judicial remedy.\n5.Information provided under Articles 13 and 14 and any\
|
| 752 |
+
\ communication and any actions taken under Articles 15 to 22 and 34 shall be\
|
| 753 |
+
\ provided free of charge. Where requests from a data subject are manifestly unfounded\
|
| 754 |
+
\ or excessive, in particular because of their repetitive character, the controller\
|
| 755 |
+
\ may either: (a) charge a reasonable fee taking into account the administrative\
|
| 756 |
+
\ costs of providing the information or communication or taking the action requested;\
|
| 757 |
+
\ or (b) refuse to act on the request. The controller shall bear the burden of\
|
| 758 |
+
\ demonstrating the manifestly unfounded or excessive character of the request.\n\
|
| 759 |
+
6.Without prejudice to Article 11, where the controller has reasonable doubts\
|
| 760 |
+
\ concerning the identity of the natural person making the request referred to\
|
| 761 |
+
\ in Articles 15 to 21, the controller may request the provision of additional\
|
| 762 |
+
\ information necessary to confirm the identity of the data subject.\n7.The information\
|
| 763 |
+
\ to be provided to data subjects pursuant to Articles 13 and 14 may be provided\
|
| 764 |
+
\ in combination with standardised icons in order to give in an easily visible,\
|
| 765 |
+
\ intelligible and clearly legible manner a meaningful overview of the intended\
|
| 766 |
+
\ processing. Where the icons are presented electronically they shall be machine-readable.\n\
|
| 767 |
+
8.The Commission shall be empowered to adopt delegated acts in accordance with\
|
| 768 |
+
\ Article 92 for the purpose of determining the information to be presented by\
|
| 769 |
+
\ the icons and the procedures for providing standardised icons. Section 2 Information\
|
| 770 |
+
\ and access to personal data"
|
| 771 |
+
pipeline_tag: sentence-similarity
|
| 772 |
+
library_name: sentence-transformers
|
| 773 |
+
metrics:
|
| 774 |
+
- cosine_accuracy@1
|
| 775 |
+
- cosine_accuracy@3
|
| 776 |
+
- cosine_accuracy@5
|
| 777 |
+
- cosine_accuracy@10
|
| 778 |
+
- cosine_precision@1
|
| 779 |
+
- cosine_precision@3
|
| 780 |
+
- cosine_precision@5
|
| 781 |
+
- cosine_precision@10
|
| 782 |
+
- cosine_recall@1
|
| 783 |
+
- cosine_recall@3
|
| 784 |
+
- cosine_recall@5
|
| 785 |
+
- cosine_recall@10
|
| 786 |
+
- cosine_ndcg@10
|
| 787 |
+
- cosine_mrr@10
|
| 788 |
+
- cosine_map@100
|
| 789 |
+
model-index:
|
| 790 |
+
- name: multilingual-e5-large
|
| 791 |
+
results:
|
| 792 |
+
- task:
|
| 793 |
+
type: information-retrieval
|
| 794 |
+
name: Information Retrieval
|
| 795 |
+
dataset:
|
| 796 |
+
name: dim 1024
|
| 797 |
+
type: dim_1024
|
| 798 |
+
metrics:
|
| 799 |
+
- type: cosine_accuracy@1
|
| 800 |
+
value: 0.3994878361075544
|
| 801 |
+
name: Cosine Accuracy@1
|
| 802 |
+
- type: cosine_accuracy@3
|
| 803 |
+
value: 0.40973111395646605
|
| 804 |
+
name: Cosine Accuracy@3
|
| 805 |
+
- type: cosine_accuracy@5
|
| 806 |
+
value: 0.44238156209987195
|
| 807 |
+
name: Cosine Accuracy@5
|
| 808 |
+
- type: cosine_accuracy@10
|
| 809 |
+
value: 0.4814340588988476
|
| 810 |
+
name: Cosine Accuracy@10
|
| 811 |
+
- type: cosine_precision@1
|
| 812 |
+
value: 0.3994878361075544
|
| 813 |
+
name: Cosine Precision@1
|
| 814 |
+
- type: cosine_precision@3
|
| 815 |
+
value: 0.3994878361075544
|
| 816 |
+
name: Cosine Precision@3
|
| 817 |
+
- type: cosine_precision@5
|
| 818 |
+
value: 0.3897567221510884
|
| 819 |
+
name: Cosine Precision@5
|
| 820 |
+
- type: cosine_precision@10
|
| 821 |
+
value: 0.3562099871959027
|
| 822 |
+
name: Cosine Precision@10
|
| 823 |
+
- type: cosine_recall@1
|
| 824 |
+
value: 0.046427253250942845
|
| 825 |
+
name: Cosine Recall@1
|
| 826 |
+
- type: cosine_recall@3
|
| 827 |
+
value: 0.1357642561296911
|
| 828 |
+
name: Cosine Recall@3
|
| 829 |
+
- type: cosine_recall@5
|
| 830 |
+
value: 0.20380194680388578
|
| 831 |
+
name: Cosine Recall@5
|
| 832 |
+
- type: cosine_recall@10
|
| 833 |
+
value: 0.30156152834977973
|
| 834 |
+
name: Cosine Recall@10
|
| 835 |
+
- type: cosine_ndcg@10
|
| 836 |
+
value: 0.42824330702763147
|
| 837 |
+
name: Cosine Ndcg@10
|
| 838 |
+
- type: cosine_mrr@10
|
| 839 |
+
value: 0.41413607910086736
|
| 840 |
+
name: Cosine Mrr@10
|
| 841 |
+
- type: cosine_map@100
|
| 842 |
+
value: 0.4960353530991054
|
| 843 |
+
name: Cosine Map@100
|
| 844 |
+
- task:
|
| 845 |
+
type: information-retrieval
|
| 846 |
+
name: Information Retrieval
|
| 847 |
+
dataset:
|
| 848 |
+
name: dim 768
|
| 849 |
+
type: dim_768
|
| 850 |
+
metrics:
|
| 851 |
+
- type: cosine_accuracy@1
|
| 852 |
+
value: 0.3892445582586428
|
| 853 |
+
name: Cosine Accuracy@1
|
| 854 |
+
- type: cosine_accuracy@3
|
| 855 |
+
value: 0.3994878361075544
|
| 856 |
+
name: Cosine Accuracy@3
|
| 857 |
+
- type: cosine_accuracy@5
|
| 858 |
+
value: 0.43661971830985913
|
| 859 |
+
name: Cosine Accuracy@5
|
| 860 |
+
- type: cosine_accuracy@10
|
| 861 |
+
value: 0.47823303457106275
|
| 862 |
+
name: Cosine Accuracy@10
|
| 863 |
+
- type: cosine_precision@1
|
| 864 |
+
value: 0.3892445582586428
|
| 865 |
+
name: Cosine Precision@1
|
| 866 |
+
- type: cosine_precision@3
|
| 867 |
+
value: 0.38988476312419973
|
| 868 |
+
name: Cosine Precision@3
|
| 869 |
+
- type: cosine_precision@5
|
| 870 |
+
value: 0.38156209987195905
|
| 871 |
+
name: Cosine Precision@5
|
| 872 |
+
- type: cosine_precision@10
|
| 873 |
+
value: 0.35147247119078107
|
| 874 |
+
name: Cosine Precision@10
|
| 875 |
+
- type: cosine_recall@1
|
| 876 |
+
value: 0.045140545184589424
|
| 877 |
+
name: Cosine Recall@1
|
| 878 |
+
- type: cosine_recall@3
|
| 879 |
+
value: 0.13218231618768836
|
| 880 |
+
name: Cosine Recall@3
|
| 881 |
+
- type: cosine_recall@5
|
| 882 |
+
value: 0.19882192649305613
|
| 883 |
+
name: Cosine Recall@5
|
| 884 |
+
- type: cosine_recall@10
|
| 885 |
+
value: 0.29727932103829957
|
| 886 |
+
name: Cosine Recall@10
|
| 887 |
+
- type: cosine_ndcg@10
|
| 888 |
+
value: 0.4211330537467249
|
| 889 |
+
name: Cosine Ndcg@10
|
| 890 |
+
- type: cosine_mrr@10
|
| 891 |
+
value: 0.4050812450460335
|
| 892 |
+
name: Cosine Mrr@10
|
| 893 |
+
- type: cosine_map@100
|
| 894 |
+
value: 0.48796722771226453
|
| 895 |
+
name: Cosine Map@100
|
| 896 |
+
- task:
|
| 897 |
+
type: information-retrieval
|
| 898 |
+
name: Information Retrieval
|
| 899 |
+
dataset:
|
| 900 |
+
name: dim 512
|
| 901 |
+
type: dim_512
|
| 902 |
+
metrics:
|
| 903 |
+
- type: cosine_accuracy@1
|
| 904 |
+
value: 0.39436619718309857
|
| 905 |
+
name: Cosine Accuracy@1
|
| 906 |
+
- type: cosine_accuracy@3
|
| 907 |
+
value: 0.4033290653008963
|
| 908 |
+
name: Cosine Accuracy@3
|
| 909 |
+
- type: cosine_accuracy@5
|
| 910 |
+
value: 0.4327784891165173
|
| 911 |
+
name: Cosine Accuracy@5
|
| 912 |
+
- type: cosine_accuracy@10
|
| 913 |
+
value: 0.471190781049936
|
| 914 |
+
name: Cosine Accuracy@10
|
| 915 |
+
- type: cosine_precision@1
|
| 916 |
+
value: 0.39436619718309857
|
| 917 |
+
name: Cosine Precision@1
|
| 918 |
+
- type: cosine_precision@3
|
| 919 |
+
value: 0.39436619718309857
|
| 920 |
+
name: Cosine Precision@3
|
| 921 |
+
- type: cosine_precision@5
|
| 922 |
+
value: 0.38373879641485276
|
| 923 |
+
name: Cosine Precision@5
|
| 924 |
+
- type: cosine_precision@10
|
| 925 |
+
value: 0.348719590268886
|
| 926 |
+
name: Cosine Precision@10
|
| 927 |
+
- type: cosine_recall@1
|
| 928 |
+
value: 0.046001271870766657
|
| 929 |
+
name: Cosine Recall@1
|
| 930 |
+
- type: cosine_recall@3
|
| 931 |
+
value: 0.13434589294029278
|
| 932 |
+
name: Cosine Recall@3
|
| 933 |
+
- type: cosine_recall@5
|
| 934 |
+
value: 0.2006372923557733
|
| 935 |
+
name: Cosine Recall@5
|
| 936 |
+
- type: cosine_recall@10
|
| 937 |
+
value: 0.29407016086576515
|
| 938 |
+
name: Cosine Recall@10
|
| 939 |
+
- type: cosine_ndcg@10
|
| 940 |
+
value: 0.4209567413561994
|
| 941 |
+
name: Cosine Ndcg@10
|
| 942 |
+
- type: cosine_mrr@10
|
| 943 |
+
value: 0.4078435258012718
|
| 944 |
+
name: Cosine Mrr@10
|
| 945 |
+
- type: cosine_map@100
|
| 946 |
+
value: 0.48375387985213597
|
| 947 |
+
name: Cosine Map@100
|
| 948 |
+
- task:
|
| 949 |
+
type: information-retrieval
|
| 950 |
+
name: Information Retrieval
|
| 951 |
+
dataset:
|
| 952 |
+
name: dim 256
|
| 953 |
+
type: dim_256
|
| 954 |
+
metrics:
|
| 955 |
+
- type: cosine_accuracy@1
|
| 956 |
+
value: 0.3764404609475032
|
| 957 |
+
name: Cosine Accuracy@1
|
| 958 |
+
- type: cosine_accuracy@3
|
| 959 |
+
value: 0.382202304737516
|
| 960 |
+
name: Cosine Accuracy@3
|
| 961 |
+
- type: cosine_accuracy@5
|
| 962 |
+
value: 0.41037131882202305
|
| 963 |
+
name: Cosine Accuracy@5
|
| 964 |
+
- type: cosine_accuracy@10
|
| 965 |
+
value: 0.4532650448143406
|
| 966 |
+
name: Cosine Accuracy@10
|
| 967 |
+
- type: cosine_precision@1
|
| 968 |
+
value: 0.3764404609475032
|
| 969 |
+
name: Cosine Precision@1
|
| 970 |
+
- type: cosine_precision@3
|
| 971 |
+
value: 0.3758002560819462
|
| 972 |
+
name: Cosine Precision@3
|
| 973 |
+
- type: cosine_precision@5
|
| 974 |
+
value: 0.365044814340589
|
| 975 |
+
name: Cosine Precision@5
|
| 976 |
+
- type: cosine_precision@10
|
| 977 |
+
value: 0.3325864276568502
|
| 978 |
+
name: Cosine Precision@10
|
| 979 |
+
- type: cosine_recall@1
|
| 980 |
+
value: 0.04345597060609991
|
| 981 |
+
name: Cosine Recall@1
|
| 982 |
+
- type: cosine_recall@3
|
| 983 |
+
value: 0.12739095919345977
|
| 984 |
+
name: Cosine Recall@3
|
| 985 |
+
- type: cosine_recall@5
|
| 986 |
+
value: 0.19108724610052447
|
| 987 |
+
name: Cosine Recall@5
|
| 988 |
+
- type: cosine_recall@10
|
| 989 |
+
value: 0.28270389457679657
|
| 990 |
+
name: Cosine Recall@10
|
| 991 |
+
- type: cosine_ndcg@10
|
| 992 |
+
value: 0.40161260018012396
|
| 993 |
+
name: Cosine Ndcg@10
|
| 994 |
+
- type: cosine_mrr@10
|
| 995 |
+
value: 0.3891762189297396
|
| 996 |
+
name: Cosine Mrr@10
|
| 997 |
+
- type: cosine_map@100
|
| 998 |
+
value: 0.46504361814337597
|
| 999 |
+
name: Cosine Map@100
|
| 1000 |
+
- task:
|
| 1001 |
+
type: information-retrieval
|
| 1002 |
+
name: Information Retrieval
|
| 1003 |
+
dataset:
|
| 1004 |
+
name: dim 128
|
| 1005 |
+
type: dim_128
|
| 1006 |
+
metrics:
|
| 1007 |
+
- type: cosine_accuracy@1
|
| 1008 |
+
value: 0.34699103713188223
|
| 1009 |
+
name: Cosine Accuracy@1
|
| 1010 |
+
- type: cosine_accuracy@3
|
| 1011 |
+
value: 0.3495518565941101
|
| 1012 |
+
name: Cosine Accuracy@3
|
| 1013 |
+
- type: cosine_accuracy@5
|
| 1014 |
+
value: 0.37900128040973113
|
| 1015 |
+
name: Cosine Accuracy@5
|
| 1016 |
+
- type: cosine_accuracy@10
|
| 1017 |
+
value: 0.41613316261203587
|
| 1018 |
+
name: Cosine Accuracy@10
|
| 1019 |
+
- type: cosine_precision@1
|
| 1020 |
+
value: 0.34699103713188223
|
| 1021 |
+
name: Cosine Precision@1
|
| 1022 |
+
- type: cosine_precision@3
|
| 1023 |
+
value: 0.34528382415706355
|
| 1024 |
+
name: Cosine Precision@3
|
| 1025 |
+
- type: cosine_precision@5
|
| 1026 |
+
value: 0.33533930857874517
|
| 1027 |
+
name: Cosine Precision@5
|
| 1028 |
+
- type: cosine_precision@10
|
| 1029 |
+
value: 0.30550576184379
|
| 1030 |
+
name: Cosine Precision@10
|
| 1031 |
+
- type: cosine_recall@1
|
| 1032 |
+
value: 0.04023580723646711
|
| 1033 |
+
name: Cosine Recall@1
|
| 1034 |
+
- type: cosine_recall@3
|
| 1035 |
+
value: 0.11713599313797275
|
| 1036 |
+
name: Cosine Recall@3
|
| 1037 |
+
- type: cosine_recall@5
|
| 1038 |
+
value: 0.17553870970060761
|
| 1039 |
+
name: Cosine Recall@5
|
| 1040 |
+
- type: cosine_recall@10
|
| 1041 |
+
value: 0.2604238007608957
|
| 1042 |
+
name: Cosine Recall@10
|
| 1043 |
+
- type: cosine_ndcg@10
|
| 1044 |
+
value: 0.36965214083548276
|
| 1045 |
+
name: Cosine Ndcg@10
|
| 1046 |
+
- type: cosine_mrr@10
|
| 1047 |
+
value: 0.35818293599983697
|
| 1048 |
+
name: Cosine Mrr@10
|
| 1049 |
+
- type: cosine_map@100
|
| 1050 |
+
value: 0.4291315309956839
|
| 1051 |
+
name: Cosine Map@100
|
| 1052 |
+
- task:
|
| 1053 |
+
type: information-retrieval
|
| 1054 |
+
name: Information Retrieval
|
| 1055 |
+
dataset:
|
| 1056 |
+
name: dim 64
|
| 1057 |
+
type: dim_64
|
| 1058 |
+
metrics:
|
| 1059 |
+
- type: cosine_accuracy@1
|
| 1060 |
+
value: 0.293854033290653
|
| 1061 |
+
name: Cosine Accuracy@1
|
| 1062 |
+
- type: cosine_accuracy@3
|
| 1063 |
+
value: 0.30153649167733676
|
| 1064 |
+
name: Cosine Accuracy@3
|
| 1065 |
+
- type: cosine_accuracy@5
|
| 1066 |
+
value: 0.32714468629961585
|
| 1067 |
+
name: Cosine Accuracy@5
|
| 1068 |
+
- type: cosine_accuracy@10
|
| 1069 |
+
value: 0.3591549295774648
|
| 1070 |
+
name: Cosine Accuracy@10
|
| 1071 |
+
- type: cosine_precision@1
|
| 1072 |
+
value: 0.293854033290653
|
| 1073 |
+
name: Cosine Precision@1
|
| 1074 |
+
- type: cosine_precision@3
|
| 1075 |
+
value: 0.29449423815621
|
| 1076 |
+
name: Cosine Precision@3
|
| 1077 |
+
- type: cosine_precision@5
|
| 1078 |
+
value: 0.288348271446863
|
| 1079 |
+
name: Cosine Precision@5
|
| 1080 |
+
- type: cosine_precision@10
|
| 1081 |
+
value: 0.2681177976952625
|
| 1082 |
+
name: Cosine Precision@10
|
| 1083 |
+
- type: cosine_recall@1
|
| 1084 |
+
value: 0.03212717718240556
|
| 1085 |
+
name: Cosine Recall@1
|
| 1086 |
+
- type: cosine_recall@3
|
| 1087 |
+
value: 0.0944529143897263
|
| 1088 |
+
name: Cosine Recall@3
|
| 1089 |
+
- type: cosine_recall@5
|
| 1090 |
+
value: 0.14311801944731944
|
| 1091 |
+
name: Cosine Recall@5
|
| 1092 |
+
- type: cosine_recall@10
|
| 1093 |
+
value: 0.221706864386852
|
| 1094 |
+
name: Cosine Recall@10
|
| 1095 |
+
- type: cosine_ndcg@10
|
| 1096 |
+
value: 0.3185372635267884
|
| 1097 |
+
name: Cosine Ndcg@10
|
| 1098 |
+
- type: cosine_mrr@10
|
| 1099 |
+
value: 0.30537518037517997
|
| 1100 |
+
name: Cosine Mrr@10
|
| 1101 |
+
- type: cosine_map@100
|
| 1102 |
+
value: 0.3744361264744976
|
| 1103 |
+
name: Cosine Map@100
|
| 1104 |
+
---
|
| 1105 |
+
|
| 1106 |
+
# multilingual-e5-large
|
| 1107 |
+
|
| 1108 |
+
This is a [sentence-transformers](https://www.SBERT.net) model finetuned from [intfloat/multilingual-e5-large](https://huggingface.co/intfloat/multilingual-e5-large). It maps sentences & paragraphs to a 1024-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
|
| 1109 |
+
|
| 1110 |
+
## Model Details
|
| 1111 |
+
|
| 1112 |
+
### Model Description
|
| 1113 |
+
- **Model Type:** Sentence Transformer
|
| 1114 |
+
- **Base model:** [intfloat/multilingual-e5-large](https://huggingface.co/intfloat/multilingual-e5-large) <!-- at revision 0dc5580a448e4284468b8909bae50fa925907bc5 -->
|
| 1115 |
+
- **Maximum Sequence Length:** 512 tokens
|
| 1116 |
+
- **Output Dimensionality:** 1024 dimensions
|
| 1117 |
+
- **Similarity Function:** Cosine Similarity
|
| 1118 |
+
<!-- - **Training Dataset:** Unknown -->
|
| 1119 |
+
- **Language:** en
|
| 1120 |
+
- **License:** apache-2.0
|
| 1121 |
+
|
| 1122 |
+
### Model Sources
|
| 1123 |
+
|
| 1124 |
+
- **Documentation:** [Sentence Transformers Documentation](https://sbert.net)
|
| 1125 |
+
- **Repository:** [Sentence Transformers on GitHub](https://github.com/UKPLab/sentence-transformers)
|
| 1126 |
+
- **Hugging Face:** [Sentence Transformers on Hugging Face](https://huggingface.co/models?library=sentence-transformers)
|
| 1127 |
+
|
| 1128 |
+
### Full Model Architecture
|
| 1129 |
+
|
| 1130 |
+
```
|
| 1131 |
+
SentenceTransformer(
|
| 1132 |
+
(0): Transformer({'max_seq_length': 512, 'do_lower_case': False, 'architecture': 'XLMRobertaModel'})
|
| 1133 |
+
(1): Pooling({'word_embedding_dimension': 1024, 'pooling_mode_cls_token': False, 'pooling_mode_mean_tokens': True, 'pooling_mode_max_tokens': False, 'pooling_mode_mean_sqrt_len_tokens': False, 'pooling_mode_weightedmean_tokens': False, 'pooling_mode_lasttoken': False, 'include_prompt': True})
|
| 1134 |
+
(2): Normalize()
|
| 1135 |
+
)
|
| 1136 |
+
```
|
| 1137 |
+
|
| 1138 |
+
## Usage
|
| 1139 |
+
|
| 1140 |
+
### Direct Usage (Sentence Transformers)
|
| 1141 |
+
|
| 1142 |
+
First install the Sentence Transformers library:
|
| 1143 |
+
|
| 1144 |
+
```bash
|
| 1145 |
+
pip install -U sentence-transformers
|
| 1146 |
+
```
|
| 1147 |
+
|
| 1148 |
+
Then you can load this model and run inference.
|
| 1149 |
+
```python
|
| 1150 |
+
from sentence_transformers import SentenceTransformer
|
| 1151 |
+
|
| 1152 |
+
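# Download from the 🤗 Hub (replace the placeholder "sentence_transformers_model_id" with this model's actual Hub ID or a local checkpoint path)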
|
| 1153 |
+
model = SentenceTransformer("sentence_transformers_model_id")
|
| 1154 |
+
# Run inference
|
| 1155 |
+
sentences = [
|
| 1156 |
+
'Who must facilitate the exercise of data subject rights?',
|
| 1157 |
+
'1.The controller shall take appropriate measures to provide any information referred to in Articles 13 and 14 and any communication under Articles 15 to 22 and 34 relating to processing to the data subject in a concise, transparent, intelligible and easily accessible form, using clear and plain language, in particular for any information addressed specifically to a child. The information shall be provided in writing, or by other means, including, where appropriate, by electronic means. When requested by the data subject, the information may be provided orally, provided that the identity of the data subject is proven by other means. 4.5.2016 L 119/39 \n2.The controller shall facilitate the exercise of data subject rights under Articles 15 to 22. In the cases referred to in Article 11(2), the controller shall not refuse to act on the request of the data subject for exercising his or her rights under Articles 15 to 22, unless the controller demonstrates that it is not in a position to identify the data subject.\n3.The controller shall provide information on action taken on a request under Articles 15 to 22 to the data subject without undue delay and in any event within one month of receipt of the request. That period may be extended by two further months where necessary, taking into account the complexity and number of the requests. The controller shall inform the data subject of any such extension within one month of receipt of the request, together with the reasons for the delay. 
Where the data subject makes the request by electronic form means, the information shall be provided by electronic means where possible, unless otherwise requested by the data subject.\n4.If the controller does not take action on the request of the data subject, the controller shall inform the data subject without delay and at the latest within one month of receipt of the request of the reasons for not taking action and on the possibility of lodging a complaint with a supervisory authority and seeking a judicial remedy.\n5.Information provided under Articles 13 and 14 and any communication and any actions taken under Articles 15 to 22 and 34 shall be provided free of charge. Where requests from a data subject are manifestly unfounded or excessive, in particular because of their repetitive character, the controller may either: (a) charge a reasonable fee taking into account the administrative costs of providing the information or communication or taking the action requested; or (b) refuse to act on the request. The controller shall bear the burden of demonstrating the manifestly unfounded or excessive character of the request.\n6.Without prejudice to Article 11, where the controller has reasonable doubts concerning the identity of the natural person making the request referred to in Articles 15 to 21, the controller may request the provision of additional information necessary to confirm the identity of the data subject.\n7.The information to be provided to data subjects pursuant to Articles 13 and 14 may be provided in combination with standardised icons in order to give in an easily visible, intelligible and clearly legible manner a meaningful overview of the intended processing. 
Where the icons are presented electronically they shall be machine-readable.\n8.The Commission shall be empowered to adopt delegated acts in accordance with Article 92 for the purpose of determining the information to be presented by the icons and the procedures for providing standardised icons. Section 2 Information and access to personal data',
|
| 1158 |
+
'Regulation (EC) No 45/2001 of the European Parliament and of the Council (2) applies to the processing of personal data by the Union institutions, bodies, offices and agencies. Regulation (EC) No 45/2001 and other Union legal acts applicable to such processing of personal data should be adapted to the principles and rules established in this Regulation and applied in the light of this Regulation. In order to provide a strong and coherent data protection framework in the Union, the necessary adaptations of Regulation (EC) No 45/2001 should follow after the adoption of this Regulation, in order to allow application at the same time as this Regulation.',
|
| 1159 |
+
]
|
| 1160 |
+
embeddings = model.encode(sentences)
|
| 1161 |
+
print(embeddings.shape)
|
| 1162 |
+
# (3, 1024)
|
| 1163 |
+
|
| 1164 |
+
# Get the similarity scores for the embeddings
|
| 1165 |
+
similarities = model.similarity(embeddings, embeddings)
|
| 1166 |
+
print(similarities)
|
| 1167 |
+
# tensor([[1.0000, 0.5502, 0.2948],
|
| 1168 |
+
# [0.5502, 1.0000, 0.2162],
|
| 1169 |
+
# [0.2948, 0.2162, 1.0000]])
|
| 1170 |
+
```
|
| 1171 |
+
|
| 1172 |
+
<!--
|
| 1173 |
+
### Direct Usage (Transformers)
|
| 1174 |
+
|
| 1175 |
+
<details><summary>Click to see the direct usage in Transformers</summary>
|
| 1176 |
+
|
| 1177 |
+
</details>
|
| 1178 |
+
-->
|
| 1179 |
+
|
| 1180 |
+
<!--
|
| 1181 |
+
### Downstream Usage (Sentence Transformers)
|
| 1182 |
+
|
| 1183 |
+
You can finetune this model on your own dataset.
|
| 1184 |
+
|
| 1185 |
+
<details><summary>Click to expand</summary>
|
| 1186 |
+
|
| 1187 |
+
</details>
|
| 1188 |
+
-->
|
| 1189 |
+
|
| 1190 |
+
<!--
|
| 1191 |
+
### Out-of-Scope Use
|
| 1192 |
+
|
| 1193 |
+
*List how the model may foreseeably be misused and address what users ought not to do with the model.*
|
| 1194 |
+
-->
|
| 1195 |
+
|
| 1196 |
+
## Evaluation
|
| 1197 |
+
|
| 1198 |
+
### Metrics
|
| 1199 |
+
|
| 1200 |
+
#### Information Retrieval
|
| 1201 |
+
|
| 1202 |
+
* Dataset: `dim_1024`
|
| 1203 |
+
* Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
|
| 1204 |
+
```json
|
| 1205 |
+
{
|
| 1206 |
+
"truncate_dim": 1024
|
| 1207 |
+
}
|
| 1208 |
+
```
|
| 1209 |
+
|
| 1210 |
+
| Metric | Value |
|
| 1211 |
+
|:--------------------|:-----------|
|
| 1212 |
+
| cosine_accuracy@1 | 0.3995 |
|
| 1213 |
+
| cosine_accuracy@3 | 0.4097 |
|
| 1214 |
+
| cosine_accuracy@5 | 0.4424 |
|
| 1215 |
+
| cosine_accuracy@10 | 0.4814 |
|
| 1216 |
+
| cosine_precision@1 | 0.3995 |
|
| 1217 |
+
| cosine_precision@3 | 0.3995 |
|
| 1218 |
+
| cosine_precision@5 | 0.3898 |
|
| 1219 |
+
| cosine_precision@10 | 0.3562 |
|
| 1220 |
+
| cosine_recall@1 | 0.0464 |
|
| 1221 |
+
| cosine_recall@3 | 0.1358 |
|
| 1222 |
+
| cosine_recall@5 | 0.2038 |
|
| 1223 |
+
| cosine_recall@10 | 0.3016 |
|
| 1224 |
+
| **cosine_ndcg@10** | **0.4282** |
|
| 1225 |
+
| cosine_mrr@10 | 0.4141 |
|
| 1226 |
+
| cosine_map@100 | 0.496 |
|
| 1227 |
+
|
| 1228 |
+
#### Information Retrieval
|
| 1229 |
+
|
| 1230 |
+
* Dataset: `dim_768`
|
| 1231 |
+
* Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
|
| 1232 |
+
```json
|
| 1233 |
+
{
|
| 1234 |
+
"truncate_dim": 768
|
| 1235 |
+
}
|
| 1236 |
+
```
|
| 1237 |
+
|
| 1238 |
+
| Metric | Value |
|
| 1239 |
+
|:--------------------|:-----------|
|
| 1240 |
+
| cosine_accuracy@1 | 0.3892 |
|
| 1241 |
+
| cosine_accuracy@3 | 0.3995 |
|
| 1242 |
+
| cosine_accuracy@5 | 0.4366 |
|
| 1243 |
+
| cosine_accuracy@10 | 0.4782 |
|
| 1244 |
+
| cosine_precision@1 | 0.3892 |
|
| 1245 |
+
| cosine_precision@3 | 0.3899 |
|
| 1246 |
+
| cosine_precision@5 | 0.3816 |
|
| 1247 |
+
| cosine_precision@10 | 0.3515 |
|
| 1248 |
+
| cosine_recall@1 | 0.0451 |
|
| 1249 |
+
| cosine_recall@3 | 0.1322 |
|
| 1250 |
+
| cosine_recall@5 | 0.1988 |
|
| 1251 |
+
| cosine_recall@10 | 0.2973 |
|
| 1252 |
+
| **cosine_ndcg@10** | **0.4211** |
|
| 1253 |
+
| cosine_mrr@10 | 0.4051 |
|
| 1254 |
+
| cosine_map@100 | 0.488 |
|
| 1255 |
+
|
| 1256 |
+
#### Information Retrieval
|
| 1257 |
+
|
| 1258 |
+
* Dataset: `dim_512`
|
| 1259 |
+
* Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
|
| 1260 |
+
```json
|
| 1261 |
+
{
|
| 1262 |
+
"truncate_dim": 512
|
| 1263 |
+
}
|
| 1264 |
+
```
|
| 1265 |
+
|
| 1266 |
+
| Metric | Value |
|
| 1267 |
+
|:--------------------|:----------|
|
| 1268 |
+
| cosine_accuracy@1 | 0.3944 |
|
| 1269 |
+
| cosine_accuracy@3 | 0.4033 |
|
| 1270 |
+
| cosine_accuracy@5 | 0.4328 |
|
| 1271 |
+
| cosine_accuracy@10 | 0.4712 |
|
| 1272 |
+
| cosine_precision@1 | 0.3944 |
|
| 1273 |
+
| cosine_precision@3 | 0.3944 |
|
| 1274 |
+
| cosine_precision@5 | 0.3837 |
|
| 1275 |
+
| cosine_precision@10 | 0.3487 |
|
| 1276 |
+
| cosine_recall@1 | 0.046 |
|
| 1277 |
+
| cosine_recall@3 | 0.1343 |
|
| 1278 |
+
| cosine_recall@5 | 0.2006 |
|
| 1279 |
+
| cosine_recall@10 | 0.2941 |
|
| 1280 |
+
| **cosine_ndcg@10** | **0.421** |
|
| 1281 |
+
| cosine_mrr@10 | 0.4078 |
|
| 1282 |
+
| cosine_map@100 | 0.4838 |
|
| 1283 |
+
|
| 1284 |
+
#### Information Retrieval
|
| 1285 |
+
|
| 1286 |
+
* Dataset: `dim_256`
|
| 1287 |
+
* Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
|
| 1288 |
+
```json
|
| 1289 |
+
{
|
| 1290 |
+
"truncate_dim": 256
|
| 1291 |
+
}
|
| 1292 |
+
```
|
| 1293 |
+
|
| 1294 |
+
| Metric | Value |
|
| 1295 |
+
|:--------------------|:-----------|
|
| 1296 |
+
| cosine_accuracy@1 | 0.3764 |
|
| 1297 |
+
| cosine_accuracy@3 | 0.3822 |
|
| 1298 |
+
| cosine_accuracy@5 | 0.4104 |
|
| 1299 |
+
| cosine_accuracy@10 | 0.4533 |
|
| 1300 |
+
| cosine_precision@1 | 0.3764 |
|
| 1301 |
+
| cosine_precision@3 | 0.3758 |
|
| 1302 |
+
| cosine_precision@5 | 0.365 |
|
| 1303 |
+
| cosine_precision@10 | 0.3326 |
|
| 1304 |
+
| cosine_recall@1 | 0.0435 |
|
| 1305 |
+
| cosine_recall@3 | 0.1274 |
|
| 1306 |
+
| cosine_recall@5 | 0.1911 |
|
| 1307 |
+
| cosine_recall@10 | 0.2827 |
|
| 1308 |
+
| **cosine_ndcg@10** | **0.4016** |
|
| 1309 |
+
| cosine_mrr@10 | 0.3892 |
|
| 1310 |
+
| cosine_map@100 | 0.465 |
|
| 1311 |
+
|
| 1312 |
+
#### Information Retrieval
|
| 1313 |
+
|
| 1314 |
+
* Dataset: `dim_128`
|
| 1315 |
+
* Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
|
| 1316 |
+
```json
|
| 1317 |
+
{
|
| 1318 |
+
"truncate_dim": 128
|
| 1319 |
+
}
|
| 1320 |
+
```
|
| 1321 |
+
|
| 1322 |
+
| Metric | Value |
|
| 1323 |
+
|:--------------------|:-----------|
|
| 1324 |
+
| cosine_accuracy@1 | 0.347 |
|
| 1325 |
+
| cosine_accuracy@3 | 0.3496 |
|
| 1326 |
+
| cosine_accuracy@5 | 0.379 |
|
| 1327 |
+
| cosine_accuracy@10 | 0.4161 |
|
| 1328 |
+
| cosine_precision@1 | 0.347 |
|
| 1329 |
+
| cosine_precision@3 | 0.3453 |
|
| 1330 |
+
| cosine_precision@5 | 0.3353 |
|
| 1331 |
+
| cosine_precision@10 | 0.3055 |
|
| 1332 |
+
| cosine_recall@1 | 0.0402 |
|
| 1333 |
+
| cosine_recall@3 | 0.1171 |
|
| 1334 |
+
| cosine_recall@5 | 0.1755 |
|
| 1335 |
+
| cosine_recall@10 | 0.2604 |
|
| 1336 |
+
| **cosine_ndcg@10** | **0.3697** |
|
| 1337 |
+
| cosine_mrr@10 | 0.3582 |
|
| 1338 |
+
| cosine_map@100 | 0.4291 |
|
| 1339 |
+
|
| 1340 |
+
#### Information Retrieval
|
| 1341 |
+
|
| 1342 |
+
* Dataset: `dim_64`
|
| 1343 |
+
* Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
|
| 1344 |
+
```json
|
| 1345 |
+
{
|
| 1346 |
+
"truncate_dim": 64
|
| 1347 |
+
}
|
| 1348 |
+
```
|
| 1349 |
+
|
| 1350 |
+
| Metric | Value |
|
| 1351 |
+
|:--------------------|:-----------|
|
| 1352 |
+
| cosine_accuracy@1 | 0.2939 |
|
| 1353 |
+
| cosine_accuracy@3 | 0.3015 |
|
| 1354 |
+
| cosine_accuracy@5 | 0.3271 |
|
| 1355 |
+
| cosine_accuracy@10 | 0.3592 |
|
| 1356 |
+
| cosine_precision@1 | 0.2939 |
|
| 1357 |
+
| cosine_precision@3 | 0.2945 |
|
| 1358 |
+
| cosine_precision@5 | 0.2883 |
|
| 1359 |
+
| cosine_precision@10 | 0.2681 |
|
| 1360 |
+
| cosine_recall@1 | 0.0321 |
|
| 1361 |
+
| cosine_recall@3 | 0.0945 |
|
| 1362 |
+
| cosine_recall@5 | 0.1431 |
|
| 1363 |
+
| cosine_recall@10 | 0.2217 |
|
| 1364 |
+
| **cosine_ndcg@10** | **0.3185** |
|
| 1365 |
+
| cosine_mrr@10 | 0.3054 |
|
| 1366 |
+
| cosine_map@100 | 0.3744 |
|
| 1367 |
+
|
| 1368 |
+
<!--
|
| 1369 |
+
## Bias, Risks and Limitations
|
| 1370 |
+
|
| 1371 |
+
*What are the known or foreseeable issues stemming from this model? You could also flag here known failure cases or weaknesses of the model.*
|
| 1372 |
+
-->
|
| 1373 |
+
|
| 1374 |
+
<!--
|
| 1375 |
+
### Recommendations
|
| 1376 |
+
|
| 1377 |
+
*What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
|
| 1378 |
+
-->
|
| 1379 |
+
|
| 1380 |
+
## Training Details
|
| 1381 |
+
|
| 1382 |
+
### Training Dataset
|
| 1383 |
+
|
| 1384 |
+
#### Unnamed Dataset
|
| 1385 |
+
|
| 1386 |
+
* Size: 391 training samples
|
| 1387 |
+
* Columns: <code>anchor</code> and <code>positive</code>
|
| 1388 |
+
* Approximate statistics based on the first 391 samples:
|
| 1389 |
+
| | anchor | positive |
|
| 1390 |
+
|:--------|:----------------------------------------------------------------------------------|:-------------------------------------------------------------------------------------|
|
| 1391 |
+
| type | string | string |
|
| 1392 |
+
| details | <ul><li>min: 8 tokens</li><li>mean: 17.16 tokens</li><li>max: 32 tokens</li></ul> | <ul><li>min: 27 tokens</li><li>mean: 377.93 tokens</li><li>max: 512 tokens</li></ul> |
|
| 1393 |
+
* Samples:
|
| 1394 |
+
| anchor | positive |
|
| 1395 |
+
|:-------------------------------------------------------------------------------------------------------------------------------|:---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|
|
| 1396 |
+
| <code>What measures must be taken according to Article 32?</code> | <code>1.Where processing is to be carried out on behalf of a controller, the controller shall use only processors providing sufficient guarantees to implement appropriate technical and organisational measures in such a manner that processing will meet the requirements of this Regulation and ensure the protection of the rights of the data subject.<br>2.The processor shall not engage another processor without prior specific or general written authorisation of the controller. In the case of general written authorisation, the processor shall inform the controller of any intended changes concerning the addition or replacement of other processors, thereby giving the controller the opportunity to object to such changes.<br>3.Processing by a processor shall be governed by a contract or other legal act under Union or Member State law, that is binding on the processor with regard to the controller and that sets out the subject-matter and duration of the processing, the nature and purpose of the processing, ...</code> |
|
| 1397 |
+
| <code>What is the responsibility of assisting and advising the data subjects in exercising their rights?</code> | <code>1.A transfer of personal data to a third country or an international organisation may take place where the Commission has decided that the third country, a territory or one or more specified sectors within that third country, or the international organisation in question ensures an adequate level of protection. Such a transfer shall not require any specific authorisation.<br>2.When assessing the adequacy of the level of protection, the Commission shall, in particular, take account of the following elements: (a) the rule of law, respect for human rights and fundamental freedoms, relevant legislation, both general and sectoral, including concerning public security, defence, national security and criminal law and the access of public authorities to personal data, as well as the implementation of such legislation, data protection rules, professional rules and security measures, including rules for the onward transfer of personal data to another third country or international organisation whi...</code> |
|
| 1398 |
+
| <code>What should Member States be authorized to provide for regarding personal data processing for archiving purposes?</code> | <code>Where personal data are processed for archiving purposes, this Regulation should also apply to that processing, bearing in mind that this Regulation should not apply to deceased persons. Public authorities or public or private bodies that hold records of public interest should be services which, pursuant to Union or Member State law, have a legal obligation to acquire, preserve, appraise, arrange, describe, communicate, promote, disseminate and provide access to records of enduring value for general public interest. Member States should also be authorised to provide for the further processing of personal data for archiving purposes, for example with a view to providing specific information related to the political behaviour under former totalitarian state regimes, genocide, crimes against humanity, in particular the Holocaust, or war crimes. 4.5.2016 L 119/29 Official Journal of the European Union EN</code> |
|
| 1399 |
+
* Loss: [<code>MatryoshkaLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#matryoshkaloss) with these parameters:
|
| 1400 |
+
```json
|
| 1401 |
+
{
|
| 1402 |
+
"loss": "MultipleNegativesRankingLoss",
|
| 1403 |
+
"matryoshka_dims": [
|
| 1404 |
+
1024,
|
| 1405 |
+
768,
|
| 1406 |
+
512,
|
| 1407 |
+
256,
|
| 1408 |
+
128,
|
| 1409 |
+
64
|
| 1410 |
+
],
|
| 1411 |
+
"matryoshka_weights": [
|
| 1412 |
+
1,
|
| 1413 |
+
1,
|
| 1414 |
+
1,
|
| 1415 |
+
1,
|
| 1416 |
+
1,
|
| 1417 |
+
1
|
| 1418 |
+
],
|
| 1419 |
+
"n_dims_per_step": -1
|
| 1420 |
+
}
|
| 1421 |
+
```
|
| 1422 |
+
|
| 1423 |
+
### Training Hyperparameters
|
| 1424 |
+
#### Non-Default Hyperparameters
|
| 1425 |
+
|
| 1426 |
+
- `eval_strategy`: epoch
|
| 1427 |
+
- `per_device_eval_batch_size`: 16
|
| 1428 |
+
- `gradient_accumulation_steps`: 4
|
| 1429 |
+
- `learning_rate`: 2e-05
|
| 1430 |
+
- `num_train_epochs`: 20
|
| 1431 |
+
- `lr_scheduler_type`: cosine
|
| 1432 |
+
- `warmup_ratio`: 0.1
|
| 1433 |
+
- `bf16`: True
|
| 1434 |
+
- `load_best_model_at_end`: True
|
| 1435 |
+
- `optim`: adamw_torch_fused
|
| 1436 |
+
- `batch_sampler`: no_duplicates
|
| 1437 |
+
|
| 1438 |
+
#### All Hyperparameters
|
| 1439 |
+
<details><summary>Click to expand</summary>
|
| 1440 |
+
|
| 1441 |
+
- `overwrite_output_dir`: False
|
| 1442 |
+
- `do_predict`: False
|
| 1443 |
+
- `eval_strategy`: epoch
|
| 1444 |
+
- `prediction_loss_only`: True
|
| 1445 |
+
- `per_device_train_batch_size`: 8
|
| 1446 |
+
- `per_device_eval_batch_size`: 16
|
| 1447 |
+
- `per_gpu_train_batch_size`: None
|
| 1448 |
+
- `per_gpu_eval_batch_size`: None
|
| 1449 |
+
- `gradient_accumulation_steps`: 4
|
| 1450 |
+
- `eval_accumulation_steps`: None
|
| 1451 |
+
- `torch_empty_cache_steps`: None
|
| 1452 |
+
- `learning_rate`: 2e-05
|
| 1453 |
+
- `weight_decay`: 0.0
|
| 1454 |
+
- `adam_beta1`: 0.9
|
| 1455 |
+
- `adam_beta2`: 0.999
|
| 1456 |
+
- `adam_epsilon`: 1e-08
|
| 1457 |
+
- `max_grad_norm`: 1.0
|
| 1458 |
+
- `num_train_epochs`: 20
|
| 1459 |
+
- `max_steps`: -1
|
| 1460 |
+
- `lr_scheduler_type`: cosine
|
| 1461 |
+
- `lr_scheduler_kwargs`: {}
|
| 1462 |
+
- `warmup_ratio`: 0.1
|
| 1463 |
+
- `warmup_steps`: 0
|
| 1464 |
+
- `log_level`: passive
|
| 1465 |
+
- `log_level_replica`: warning
|
| 1466 |
+
- `log_on_each_node`: True
|
| 1467 |
+
- `logging_nan_inf_filter`: True
|
| 1468 |
+
- `save_safetensors`: True
|
| 1469 |
+
- `save_on_each_node`: False
|
| 1470 |
+
- `save_only_model`: False
|
| 1471 |
+
- `restore_callback_states_from_checkpoint`: False
|
| 1472 |
+
- `no_cuda`: False
|
| 1473 |
+
- `use_cpu`: False
|
| 1474 |
+
- `use_mps_device`: False
|
| 1475 |
+
- `seed`: 42
|
| 1476 |
+
- `data_seed`: None
|
| 1477 |
+
- `jit_mode_eval`: False
|
| 1478 |
+
- `use_ipex`: False
|
| 1479 |
+
- `bf16`: True
|
| 1480 |
+
- `fp16`: False
|
| 1481 |
+
- `fp16_opt_level`: O1
|
| 1482 |
+
- `half_precision_backend`: auto
|
| 1483 |
+
- `bf16_full_eval`: False
|
| 1484 |
+
- `fp16_full_eval`: False
|
| 1485 |
+
- `tf32`: None
|
| 1486 |
+
- `local_rank`: 0
|
| 1487 |
+
- `ddp_backend`: None
|
| 1488 |
+
- `tpu_num_cores`: None
|
| 1489 |
+
- `tpu_metrics_debug`: False
|
| 1490 |
+
- `debug`: []
|
| 1491 |
+
- `dataloader_drop_last`: False
|
| 1492 |
+
- `dataloader_num_workers`: 0
|
| 1493 |
+
- `dataloader_prefetch_factor`: None
|
| 1494 |
+
- `past_index`: -1
|
| 1495 |
+
- `disable_tqdm`: False
|
| 1496 |
+
- `remove_unused_columns`: True
|
| 1497 |
+
- `label_names`: None
|
| 1498 |
+
- `load_best_model_at_end`: True
|
| 1499 |
+
- `ignore_data_skip`: False
|
| 1500 |
+
- `fsdp`: []
|
| 1501 |
+
- `fsdp_min_num_params`: 0
|
| 1502 |
+
- `fsdp_config`: {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}
|
| 1503 |
+
- `tp_size`: 0
|
| 1504 |
+
- `fsdp_transformer_layer_cls_to_wrap`: None
|
| 1505 |
+
- `accelerator_config`: {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}
|
| 1506 |
+
- `deepspeed`: None
|
| 1507 |
+
- `label_smoothing_factor`: 0.0
|
| 1508 |
+
- `optim`: adamw_torch_fused
|
| 1509 |
+
- `optim_args`: None
|
| 1510 |
+
- `adafactor`: False
|
| 1511 |
+
- `group_by_length`: False
|
| 1512 |
+
- `length_column_name`: length
|
| 1513 |
+
- `ddp_find_unused_parameters`: None
|
| 1514 |
+
- `ddp_bucket_cap_mb`: None
|
| 1515 |
+
- `ddp_broadcast_buffers`: False
|
| 1516 |
+
- `dataloader_pin_memory`: True
|
| 1517 |
+
- `dataloader_persistent_workers`: False
|
| 1518 |
+
- `skip_memory_metrics`: True
|
| 1519 |
+
- `use_legacy_prediction_loop`: False
|
| 1520 |
+
- `push_to_hub`: False
|
| 1521 |
+
- `resume_from_checkpoint`: None
|
| 1522 |
+
- `hub_model_id`: None
|
| 1523 |
+
- `hub_strategy`: every_save
|
| 1524 |
+
- `hub_private_repo`: None
|
| 1525 |
+
- `hub_always_push`: False
|
| 1526 |
+
- `gradient_checkpointing`: False
|
| 1527 |
+
- `gradient_checkpointing_kwargs`: None
|
| 1528 |
+
- `include_inputs_for_metrics`: False
|
| 1529 |
+
- `include_for_metrics`: []
|
| 1530 |
+
- `eval_do_concat_batches`: True
|
| 1531 |
+
- `fp16_backend`: auto
|
| 1532 |
+
- `push_to_hub_model_id`: None
|
| 1533 |
+
- `push_to_hub_organization`: None
|
| 1534 |
+
- `mp_parameters`:
|
| 1535 |
+
- `auto_find_batch_size`: False
|
| 1536 |
+
- `full_determinism`: False
|
| 1537 |
+
- `torchdynamo`: None
|
| 1538 |
+
- `ray_scope`: last
|
| 1539 |
+
- `ddp_timeout`: 1800
|
| 1540 |
+
- `torch_compile`: False
|
| 1541 |
+
- `torch_compile_backend`: None
|
| 1542 |
+
- `torch_compile_mode`: None
|
| 1543 |
+
- `include_tokens_per_second`: False
|
| 1544 |
+
- `include_num_input_tokens_seen`: False
|
| 1545 |
+
- `neftune_noise_alpha`: None
|
| 1546 |
+
- `optim_target_modules`: None
|
| 1547 |
+
- `batch_eval_metrics`: False
|
| 1548 |
+
- `eval_on_start`: False
|
| 1549 |
+
- `use_liger_kernel`: False
|
| 1550 |
+
- `eval_use_gather_object`: False
|
| 1551 |
+
- `average_tokens_across_devices`: False
|
| 1552 |
+
- `prompts`: None
|
| 1553 |
+
- `batch_sampler`: no_duplicates
|
| 1554 |
+
- `multi_dataset_batch_sampler`: proportional
|
| 1555 |
+
- `router_mapping`: {}
|
| 1556 |
+
- `learning_rate_mapping`: {}
|
| 1557 |
+
|
| 1558 |
+
</details>
|
| 1559 |
+
|
| 1560 |
+
### Training Logs
|
| 1561 |
+
| Epoch | Step | Training Loss | dim_1024_cosine_ndcg@10 | dim_768_cosine_ndcg@10 | dim_512_cosine_ndcg@10 | dim_256_cosine_ndcg@10 | dim_128_cosine_ndcg@10 | dim_64_cosine_ndcg@10 |
|
| 1562 |
+
|:------:|:----:|:-------------:|:-----------------------:|:----------------------:|:----------------------:|:----------------------:|:----------------------:|:---------------------:|
|
| 1563 |
+
| 0.8163 | 10 | 31.5155 | - | - | - | - | - | - |
|
| 1564 |
+
| 1.0 | 13 | - | 0.4494 | 0.4446 | 0.4364 | 0.3947 | 0.3362 | 0.2621 |
|
| 1565 |
+
| 1.5714 | 20 | 19.0409 | - | - | - | - | - | - |
|
| 1566 |
+
| 2.0 | 26 | - | 0.4065 | 0.4004 | 0.4013 | 0.3692 | 0.3418 | 0.2882 |
|
| 1567 |
+
| 2.3265 | 30 | 14.5314 | - | - | - | - | - | - |
|
| 1568 |
+
| 3.0 | 39 | - | 0.4418 | 0.4350 | 0.4329 | 0.4087 | 0.3714 | 0.3372 |
|
| 1569 |
+
| 3.0816 | 40 | 8.6778 | - | - | - | - | - | - |
|
| 1570 |
+
| 3.8980 | 50 | 6.0257 | - | - | - | - | - | - |
|
| 1571 |
+
| 4.0 | 52 | - | 0.4291 | 0.4244 | 0.4282 | 0.3980 | 0.3677 | 0.3275 |
|
| 1572 |
+
| 4.6531 | 60 | 3.3524 | - | - | - | - | - | - |
|
| 1573 |
+
| 5.0 | 65 | - | 0.4282 | 0.4211 | 0.4210 | 0.4016 | 0.3697 | 0.3185 |
|
| 1574 |
+
|
| 1575 |
+
|
| 1576 |
+
### Framework Versions
|
| 1577 |
+
- Python: 3.12.11
|
| 1578 |
+
- Sentence Transformers: 5.1.0
|
| 1579 |
+
- Transformers: 4.51.3
|
| 1580 |
+
- PyTorch: 2.8.0+cu126
|
| 1581 |
+
- Accelerate: 1.10.1
|
| 1582 |
+
- Datasets: 4.0.0
|
| 1583 |
+
- Tokenizers: 0.21.4
|
| 1584 |
+
|
| 1585 |
+
## Citation
|
| 1586 |
+
|
| 1587 |
+
### BibTeX
|
| 1588 |
+
|
| 1589 |
+
#### Sentence Transformers
|
| 1590 |
+
```bibtex
|
| 1591 |
+
@inproceedings{reimers-2019-sentence-bert,
|
| 1592 |
+
title = "Sentence-BERT: Sentence Embeddings using Siamese BERT-Networks",
|
| 1593 |
+
author = "Reimers, Nils and Gurevych, Iryna",
|
| 1594 |
+
booktitle = "Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing",
|
| 1595 |
+
month = "11",
|
| 1596 |
+
year = "2019",
|
| 1597 |
+
publisher = "Association for Computational Linguistics",
|
| 1598 |
+
url = "https://arxiv.org/abs/1908.10084",
|
| 1599 |
+
}
|
| 1600 |
+
```
|
| 1601 |
+
|
| 1602 |
+
#### MatryoshkaLoss
|
| 1603 |
+
```bibtex
|
| 1604 |
+
@misc{kusupati2024matryoshka,
|
| 1605 |
+
title={Matryoshka Representation Learning},
|
| 1606 |
+
author={Aditya Kusupati and Gantavya Bhatt and Aniket Rege and Matthew Wallingford and Aditya Sinha and Vivek Ramanujan and William Howard-Snyder and Kaifeng Chen and Sham Kakade and Prateek Jain and Ali Farhadi},
|
| 1607 |
+
year={2024},
|
| 1608 |
+
eprint={2205.13147},
|
| 1609 |
+
archivePrefix={arXiv},
|
| 1610 |
+
primaryClass={cs.LG}
|
| 1611 |
+
}
|
| 1612 |
+
```
|
| 1613 |
+
|
| 1614 |
+
#### MultipleNegativesRankingLoss
|
| 1615 |
+
```bibtex
|
| 1616 |
+
@misc{henderson2017efficient,
|
| 1617 |
+
title={Efficient Natural Language Response Suggestion for Smart Reply},
|
| 1618 |
+
author={Matthew Henderson and Rami Al-Rfou and Brian Strope and Yun-hsuan Sung and Laszlo Lukacs and Ruiqi Guo and Sanjiv Kumar and Balint Miklos and Ray Kurzweil},
|
| 1619 |
+
year={2017},
|
| 1620 |
+
eprint={1705.00652},
|
| 1621 |
+
archivePrefix={arXiv},
|
| 1622 |
+
primaryClass={cs.CL}
|
| 1623 |
+
}
|
| 1624 |
+
```
|
| 1625 |
+
|
| 1626 |
+
<!--
|
| 1627 |
+
## Glossary
|
| 1628 |
+
|
| 1629 |
+
*Clearly define terms in order to be accessible across audiences.*
|
| 1630 |
+
-->
|
| 1631 |
+
|
| 1632 |
+
<!--
|
| 1633 |
+
## Model Card Authors
|
| 1634 |
+
|
| 1635 |
+
*Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
|
| 1636 |
+
-->
|
| 1637 |
+
|
| 1638 |
+
<!--
|
| 1639 |
+
## Model Card Contact
|
| 1640 |
+
|
| 1641 |
+
*Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
|
| 1642 |
+
-->
|
checkpoint-65/config.json
ADDED
|
@@ -0,0 +1,27 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architectures": [
|
| 3 |
+
"XLMRobertaModel"
|
| 4 |
+
],
|
| 5 |
+
"attention_probs_dropout_prob": 0.1,
|
| 6 |
+
"bos_token_id": 0,
|
| 7 |
+
"classifier_dropout": null,
|
| 8 |
+
"eos_token_id": 2,
|
| 9 |
+
"hidden_act": "gelu",
|
| 10 |
+
"hidden_dropout_prob": 0.1,
|
| 11 |
+
"hidden_size": 1024,
|
| 12 |
+
"initializer_range": 0.02,
|
| 13 |
+
"intermediate_size": 4096,
|
| 14 |
+
"layer_norm_eps": 1e-05,
|
| 15 |
+
"max_position_embeddings": 514,
|
| 16 |
+
"model_type": "xlm-roberta",
|
| 17 |
+
"num_attention_heads": 16,
|
| 18 |
+
"num_hidden_layers": 24,
|
| 19 |
+
"output_past": true,
|
| 20 |
+
"pad_token_id": 1,
|
| 21 |
+
"position_embedding_type": "absolute",
|
| 22 |
+
"torch_dtype": "float32",
|
| 23 |
+
"transformers_version": "4.51.3",
|
| 24 |
+
"type_vocab_size": 1,
|
| 25 |
+
"use_cache": true,
|
| 26 |
+
"vocab_size": 250002
|
| 27 |
+
}
|
checkpoint-65/config_sentence_transformers.json
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"model_type": "SentenceTransformer",
|
| 3 |
+
"__version__": {
|
| 4 |
+
"sentence_transformers": "5.1.0",
|
| 5 |
+
"transformers": "4.51.3",
|
| 6 |
+
"pytorch": "2.8.0+cu126"
|
| 7 |
+
},
|
| 8 |
+
"prompts": {
|
| 9 |
+
"query": "",
|
| 10 |
+
"document": ""
|
| 11 |
+
},
|
| 12 |
+
"default_prompt_name": null,
|
| 13 |
+
"similarity_fn_name": "cosine"
|
| 14 |
+
}
|
checkpoint-65/model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9e170532ef3cecf660eb98f4bc34e8207df70da0a192758efcd848948ff933df
|
| 3 |
+
size 2239607176
|
checkpoint-65/modules.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"idx": 0,
|
| 4 |
+
"name": "0",
|
| 5 |
+
"path": "",
|
| 6 |
+
"type": "sentence_transformers.models.Transformer"
|
| 7 |
+
},
|
| 8 |
+
{
|
| 9 |
+
"idx": 1,
|
| 10 |
+
"name": "1",
|
| 11 |
+
"path": "1_Pooling",
|
| 12 |
+
"type": "sentence_transformers.models.Pooling"
|
| 13 |
+
},
|
| 14 |
+
{
|
| 15 |
+
"idx": 2,
|
| 16 |
+
"name": "2",
|
| 17 |
+
"path": "2_Normalize",
|
| 18 |
+
"type": "sentence_transformers.models.Normalize"
|
| 19 |
+
}
|
| 20 |
+
]
|
checkpoint-65/optimizer.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c7dffac8a08fff2e6cb35978f0a34cfe908c3cc4bad0a978bff7eb74ebbde769
|
| 3 |
+
size 4471067142
|
checkpoint-65/rng_state.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:26eefef1027f0f7e30b8f30bcbc2af10d09f3fd1f25108c7d6c3ba95b4ac3eb4
|
| 3 |
+
size 14645
|
checkpoint-65/scheduler.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6ea60534e714390f38db0d7748b2fa3b78ae93b7334ba633bbe797337eca2eae
|
| 3 |
+
size 1465
|
checkpoint-65/sentence_bert_config.json
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"max_seq_length": 512,
|
| 3 |
+
"do_lower_case": false
|
| 4 |
+
}
|
checkpoint-65/sentencepiece.bpe.model
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865
|
| 3 |
+
size 5069051
|
checkpoint-65/special_tokens_map.json
ADDED
|
@@ -0,0 +1,51 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"bos_token": {
|
| 3 |
+
"content": "<s>",
|
| 4 |
+
"lstrip": false,
|
| 5 |
+
"normalized": false,
|
| 6 |
+
"rstrip": false,
|
| 7 |
+
"single_word": false
|
| 8 |
+
},
|
| 9 |
+
"cls_token": {
|
| 10 |
+
"content": "<s>",
|
| 11 |
+
"lstrip": false,
|
| 12 |
+
"normalized": false,
|
| 13 |
+
"rstrip": false,
|
| 14 |
+
"single_word": false
|
| 15 |
+
},
|
| 16 |
+
"eos_token": {
|
| 17 |
+
"content": "</s>",
|
| 18 |
+
"lstrip": false,
|
| 19 |
+
"normalized": false,
|
| 20 |
+
"rstrip": false,
|
| 21 |
+
"single_word": false
|
| 22 |
+
},
|
| 23 |
+
"mask_token": {
|
| 24 |
+
"content": "<mask>",
|
| 25 |
+
"lstrip": true,
|
| 26 |
+
"normalized": false,
|
| 27 |
+
"rstrip": false,
|
| 28 |
+
"single_word": false
|
| 29 |
+
},
|
| 30 |
+
"pad_token": {
|
| 31 |
+
"content": "<pad>",
|
| 32 |
+
"lstrip": false,
|
| 33 |
+
"normalized": false,
|
| 34 |
+
"rstrip": false,
|
| 35 |
+
"single_word": false
|
| 36 |
+
},
|
| 37 |
+
"sep_token": {
|
| 38 |
+
"content": "</s>",
|
| 39 |
+
"lstrip": false,
|
| 40 |
+
"normalized": false,
|
| 41 |
+
"rstrip": false,
|
| 42 |
+
"single_word": false
|
| 43 |
+
},
|
| 44 |
+
"unk_token": {
|
| 45 |
+
"content": "<unk>",
|
| 46 |
+
"lstrip": false,
|
| 47 |
+
"normalized": false,
|
| 48 |
+
"rstrip": false,
|
| 49 |
+
"single_word": false
|
| 50 |
+
}
|
| 51 |
+
}
|
checkpoint-65/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:883b037111086fd4dfebbbc9b7cee11e1517b5e0c0514879478661440f137085
|
| 3 |
+
size 17082987
|
checkpoint-65/tokenizer_config.json
ADDED
|
@@ -0,0 +1,55 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"added_tokens_decoder": {
|
| 3 |
+
"0": {
|
| 4 |
+
"content": "<s>",
|
| 5 |
+
"lstrip": false,
|
| 6 |
+
"normalized": false,
|
| 7 |
+
"rstrip": false,
|
| 8 |
+
"single_word": false,
|
| 9 |
+
"special": true
|
| 10 |
+
},
|
| 11 |
+
"1": {
|
| 12 |
+
"content": "<pad>",
|
| 13 |
+
"lstrip": false,
|
| 14 |
+
"normalized": false,
|
| 15 |
+
"rstrip": false,
|
| 16 |
+
"single_word": false,
|
| 17 |
+
"special": true
|
| 18 |
+
},
|
| 19 |
+
"2": {
|
| 20 |
+
"content": "</s>",
|
| 21 |
+
"lstrip": false,
|
| 22 |
+
"normalized": false,
|
| 23 |
+
"rstrip": false,
|
| 24 |
+
"single_word": false,
|
| 25 |
+
"special": true
|
| 26 |
+
},
|
| 27 |
+
"3": {
|
| 28 |
+
"content": "<unk>",
|
| 29 |
+
"lstrip": false,
|
| 30 |
+
"normalized": false,
|
| 31 |
+
"rstrip": false,
|
| 32 |
+
"single_word": false,
|
| 33 |
+
"special": true
|
| 34 |
+
},
|
| 35 |
+
"250001": {
|
| 36 |
+
"content": "<mask>",
|
| 37 |
+
"lstrip": true,
|
| 38 |
+
"normalized": false,
|
| 39 |
+
"rstrip": false,
|
| 40 |
+
"single_word": false,
|
| 41 |
+
"special": true
|
| 42 |
+
}
|
| 43 |
+
},
|
| 44 |
+
"bos_token": "<s>",
|
| 45 |
+
"clean_up_tokenization_spaces": true,
|
| 46 |
+
"cls_token": "<s>",
|
| 47 |
+
"eos_token": "</s>",
|
| 48 |
+
"extra_special_tokens": {},
|
| 49 |
+
"mask_token": "<mask>",
|
| 50 |
+
"model_max_length": 512,
|
| 51 |
+
"pad_token": "<pad>",
|
| 52 |
+
"sep_token": "</s>",
|
| 53 |
+
"tokenizer_class": "XLMRobertaTokenizer",
|
| 54 |
+
"unk_token": "<unk>"
|
| 55 |
+
}
|
checkpoint-65/trainer_state.json
ADDED
|
@@ -0,0 +1,575 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"best_global_step": 39,
|
| 3 |
+
"best_metric": 0.37139192897263235,
|
| 4 |
+
"best_model_checkpoint": "intfloat/multilingual-e5-large/checkpoint-39",
|
| 5 |
+
"epoch": 5.0,
|
| 6 |
+
"eval_steps": 500,
|
| 7 |
+
"global_step": 65,
|
| 8 |
+
"is_hyper_param_search": false,
|
| 9 |
+
"is_local_process_zero": true,
|
| 10 |
+
"is_world_process_zero": true,
|
| 11 |
+
"log_history": [
|
| 12 |
+
{
|
| 13 |
+
"epoch": 0.8163265306122449,
|
| 14 |
+
"grad_norm": 307.08624267578125,
|
| 15 |
+
"learning_rate": 7.500000000000001e-06,
|
| 16 |
+
"loss": 31.5155,
|
| 17 |
+
"step": 10
|
| 18 |
+
},
|
| 19 |
+
{
|
| 20 |
+
"epoch": 1.0,
|
| 21 |
+
"eval_dim_1024_cosine_accuracy@1": 0.42509603072983354,
|
| 22 |
+
"eval_dim_1024_cosine_accuracy@10": 0.49295774647887325,
|
| 23 |
+
"eval_dim_1024_cosine_accuracy@3": 0.43085787451984636,
|
| 24 |
+
"eval_dim_1024_cosine_accuracy@5": 0.46030729833546735,
|
| 25 |
+
"eval_dim_1024_cosine_map@100": 0.508986346237021,
|
| 26 |
+
"eval_dim_1024_cosine_mrr@10": 0.4369535394183281,
|
| 27 |
+
"eval_dim_1024_cosine_ndcg@10": 0.4493804868009024,
|
| 28 |
+
"eval_dim_1024_cosine_precision@1": 0.42509603072983354,
|
| 29 |
+
"eval_dim_1024_cosine_precision@10": 0.376056338028169,
|
| 30 |
+
"eval_dim_1024_cosine_precision@3": 0.42402902262057185,
|
| 31 |
+
"eval_dim_1024_cosine_precision@5": 0.4133162612035851,
|
| 32 |
+
"eval_dim_1024_cosine_recall@1": 0.04813624827530403,
|
| 33 |
+
"eval_dim_1024_cosine_recall@10": 0.3150476790176975,
|
| 34 |
+
"eval_dim_1024_cosine_recall@3": 0.1404092551990217,
|
| 35 |
+
"eval_dim_1024_cosine_recall@5": 0.21147403835662126,
|
| 36 |
+
"eval_dim_128_cosine_accuracy@1": 0.31370038412291934,
|
| 37 |
+
"eval_dim_128_cosine_accuracy@10": 0.38156209987195905,
|
| 38 |
+
"eval_dim_128_cosine_accuracy@3": 0.31946222791293216,
|
| 39 |
+
"eval_dim_128_cosine_accuracy@5": 0.34571062740076824,
|
| 40 |
+
"eval_dim_128_cosine_map@100": 0.3991669558616212,
|
| 41 |
+
"eval_dim_128_cosine_mrr@10": 0.32517427799117904,
|
| 42 |
+
"eval_dim_128_cosine_ndcg@10": 0.33618283481296385,
|
| 43 |
+
"eval_dim_128_cosine_precision@1": 0.31370038412291934,
|
| 44 |
+
"eval_dim_128_cosine_precision@10": 0.2764404609475032,
|
| 45 |
+
"eval_dim_128_cosine_precision@3": 0.31284677763551,
|
| 46 |
+
"eval_dim_128_cosine_precision@5": 0.30422535211267604,
|
| 47 |
+
"eval_dim_128_cosine_recall@1": 0.037933385936292925,
|
| 48 |
+
"eval_dim_128_cosine_recall@10": 0.24798465115464788,
|
| 49 |
+
"eval_dim_128_cosine_recall@3": 0.11100168654049715,
|
| 50 |
+
"eval_dim_128_cosine_recall@5": 0.1670926413559068,
|
| 51 |
+
"eval_dim_256_cosine_accuracy@1": 0.36427656850192064,
|
| 52 |
+
"eval_dim_256_cosine_accuracy@10": 0.44814340588988477,
|
| 53 |
+
"eval_dim_256_cosine_accuracy@3": 0.36939820742637647,
|
| 54 |
+
"eval_dim_256_cosine_accuracy@5": 0.4090909090909091,
|
| 55 |
+
"eval_dim_256_cosine_map@100": 0.45841270037343096,
|
| 56 |
+
"eval_dim_256_cosine_mrr@10": 0.37879397597707415,
|
| 57 |
+
"eval_dim_256_cosine_ndcg@10": 0.3947006636735062,
|
| 58 |
+
"eval_dim_256_cosine_precision@1": 0.36427656850192064,
|
| 59 |
+
"eval_dim_256_cosine_precision@10": 0.3289372599231754,
|
| 60 |
+
"eval_dim_256_cosine_precision@3": 0.36363636363636365,
|
| 61 |
+
"eval_dim_256_cosine_precision@5": 0.3560819462227913,
|
| 62 |
+
"eval_dim_256_cosine_recall@1": 0.04277277943657814,
|
| 63 |
+
"eval_dim_256_cosine_recall@10": 0.28617844199333936,
|
| 64 |
+
"eval_dim_256_cosine_recall@3": 0.1253991943934714,
|
| 65 |
+
"eval_dim_256_cosine_recall@5": 0.18947388504512186,
|
| 66 |
+
"eval_dim_512_cosine_accuracy@1": 0.4084507042253521,
|
| 67 |
+
"eval_dim_512_cosine_accuracy@10": 0.4871959026888604,
|
| 68 |
+
"eval_dim_512_cosine_accuracy@3": 0.41357234314980795,
|
| 69 |
+
"eval_dim_512_cosine_accuracy@5": 0.4519846350832266,
|
| 70 |
+
"eval_dim_512_cosine_map@100": 0.495554245202425,
|
| 71 |
+
"eval_dim_512_cosine_mrr@10": 0.42213127248338495,
|
| 72 |
+
"eval_dim_512_cosine_ndcg@10": 0.43644305450989757,
|
| 73 |
+
"eval_dim_512_cosine_precision@1": 0.4084507042253521,
|
| 74 |
+
"eval_dim_512_cosine_precision@10": 0.36606914212548014,
|
| 75 |
+
"eval_dim_512_cosine_precision@3": 0.40738369611609043,
|
| 76 |
+
"eval_dim_512_cosine_precision@5": 0.39846350832266325,
|
| 77 |
+
"eval_dim_512_cosine_recall@1": 0.04628035514721453,
|
| 78 |
+
"eval_dim_512_cosine_recall@10": 0.30419701916496145,
|
| 79 |
+
"eval_dim_512_cosine_recall@3": 0.13522898183596205,
|
| 80 |
+
"eval_dim_512_cosine_recall@5": 0.20394662187726964,
|
| 81 |
+
"eval_dim_64_cosine_accuracy@1": 0.24199743918053776,
|
| 82 |
+
"eval_dim_64_cosine_accuracy@10": 0.29641485275288093,
|
| 83 |
+
"eval_dim_64_cosine_accuracy@3": 0.24775928297055058,
|
| 84 |
+
"eval_dim_64_cosine_accuracy@5": 0.26952624839948786,
|
| 85 |
+
"eval_dim_64_cosine_map@100": 0.31803601064541553,
|
| 86 |
+
"eval_dim_64_cosine_mrr@10": 0.25159771761884414,
|
| 87 |
+
"eval_dim_64_cosine_ndcg@10": 0.2620553065689597,
|
| 88 |
+
"eval_dim_64_cosine_precision@1": 0.24199743918053776,
|
| 89 |
+
"eval_dim_64_cosine_precision@10": 0.21568501920614594,
|
| 90 |
+
"eval_dim_64_cosine_precision@3": 0.24199743918053776,
|
| 91 |
+
"eval_dim_64_cosine_precision@5": 0.23649167733674775,
|
| 92 |
+
"eval_dim_64_cosine_recall@1": 0.029110868794154622,
|
| 93 |
+
"eval_dim_64_cosine_recall@10": 0.19521971714475267,
|
| 94 |
+
"eval_dim_64_cosine_recall@3": 0.08524734139651896,
|
| 95 |
+
"eval_dim_64_cosine_recall@5": 0.12921904680249943,
|
| 96 |
+
"eval_dim_768_cosine_accuracy@1": 0.4193341869398207,
|
| 97 |
+
"eval_dim_768_cosine_accuracy@10": 0.4910371318822023,
|
| 98 |
+
"eval_dim_768_cosine_accuracy@3": 0.4238156209987196,
|
| 99 |
+
"eval_dim_768_cosine_accuracy@5": 0.4551856594110115,
|
| 100 |
+
"eval_dim_768_cosine_map@100": 0.5037778776293926,
|
| 101 |
+
"eval_dim_768_cosine_mrr@10": 0.4315339003719285,
|
| 102 |
+
"eval_dim_768_cosine_ndcg@10": 0.44456410503401034,
|
| 103 |
+
"eval_dim_768_cosine_precision@1": 0.4193341869398207,
|
| 104 |
+
"eval_dim_768_cosine_precision@10": 0.37272727272727274,
|
| 105 |
+
"eval_dim_768_cosine_precision@3": 0.4180537772087068,
|
| 106 |
+
"eval_dim_768_cosine_precision@5": 0.4076824583866837,
|
| 107 |
+
"eval_dim_768_cosine_recall@1": 0.04699592881851732,
|
| 108 |
+
"eval_dim_768_cosine_recall@10": 0.3107289399017082,
|
| 109 |
+
"eval_dim_768_cosine_recall@3": 0.13721565163348118,
|
| 110 |
+
"eval_dim_768_cosine_recall@5": 0.20710427114944024,
|
| 111 |
+
"eval_runtime": 98.6525,
|
| 112 |
+
"eval_samples_per_second": 0.0,
|
| 113 |
+
"eval_sequential_score": 0.2620553065689597,
|
| 114 |
+
"eval_steps_per_second": 0.0,
|
| 115 |
+
"step": 13
|
| 116 |
+
},
|
| 117 |
+
{
|
| 118 |
+
"epoch": 1.5714285714285714,
|
| 119 |
+
"grad_norm": 280.07818603515625,
|
| 120 |
+
"learning_rate": 1.5833333333333333e-05,
|
| 121 |
+
"loss": 19.0409,
|
| 122 |
+
"step": 20
|
| 123 |
+
},
|
| 124 |
+
{
|
| 125 |
+
"epoch": 2.0,
|
| 126 |
+
"eval_dim_1024_cosine_accuracy@1": 0.3854033290653009,
|
| 127 |
+
"eval_dim_1024_cosine_accuracy@10": 0.45454545454545453,
|
| 128 |
+
"eval_dim_1024_cosine_accuracy@3": 0.3886043533930858,
|
| 129 |
+
"eval_dim_1024_cosine_accuracy@5": 0.41101152368758004,
|
| 130 |
+
"eval_dim_1024_cosine_map@100": 0.47259820099791205,
|
| 131 |
+
"eval_dim_1024_cosine_mrr@10": 0.39624870434729537,
|
| 132 |
+
"eval_dim_1024_cosine_ndcg@10": 0.4065329035406967,
|
| 133 |
+
"eval_dim_1024_cosine_precision@1": 0.3854033290653009,
|
| 134 |
+
"eval_dim_1024_cosine_precision@10": 0.3357874519846351,
|
| 135 |
+
"eval_dim_1024_cosine_precision@3": 0.3839095177123346,
|
| 136 |
+
"eval_dim_1024_cosine_precision@5": 0.3713188220230474,
|
| 137 |
+
"eval_dim_1024_cosine_recall@1": 0.0451686782205082,
|
| 138 |
+
"eval_dim_1024_cosine_recall@10": 0.2918225395020212,
|
| 139 |
+
"eval_dim_1024_cosine_recall@3": 0.13200270380544088,
|
| 140 |
+
"eval_dim_1024_cosine_recall@5": 0.19735476247586825,
|
| 141 |
+
"eval_dim_128_cosine_accuracy@1": 0.31562099871959026,
|
| 142 |
+
"eval_dim_128_cosine_accuracy@10": 0.39180537772087065,
|
| 143 |
+
"eval_dim_128_cosine_accuracy@3": 0.3207426376440461,
|
| 144 |
+
"eval_dim_128_cosine_accuracy@5": 0.352112676056338,
|
| 145 |
+
"eval_dim_128_cosine_map@100": 0.40471008477532144,
|
| 146 |
+
"eval_dim_128_cosine_mrr@10": 0.32839105339105285,
|
| 147 |
+
"eval_dim_128_cosine_ndcg@10": 0.34177784905202935,
|
| 148 |
+
"eval_dim_128_cosine_precision@1": 0.31562099871959026,
|
| 149 |
+
"eval_dim_128_cosine_precision@10": 0.280729833546735,
|
| 150 |
+
"eval_dim_128_cosine_precision@3": 0.31455399061032857,
|
| 151 |
+
"eval_dim_128_cosine_precision@5": 0.30640204865556975,
|
| 152 |
+
"eval_dim_128_cosine_recall@1": 0.03888088094516579,
|
| 153 |
+
"eval_dim_128_cosine_recall@10": 0.2550464126190524,
|
| 154 |
+
"eval_dim_128_cosine_recall@3": 0.11341113256173359,
|
| 155 |
+
"eval_dim_128_cosine_recall@5": 0.17046484922169536,
|
| 156 |
+
"eval_dim_256_cosine_accuracy@1": 0.3418693982074264,
|
| 157 |
+
"eval_dim_256_cosine_accuracy@10": 0.4238156209987196,
|
| 158 |
+
"eval_dim_256_cosine_accuracy@3": 0.34763124199743917,
|
| 159 |
+
"eval_dim_256_cosine_accuracy@5": 0.38092189500640206,
|
| 160 |
+
"eval_dim_256_cosine_map@100": 0.43770217754051305,
|
| 161 |
+
"eval_dim_256_cosine_mrr@10": 0.35596482938032165,
|
| 162 |
+
"eval_dim_256_cosine_ndcg@10": 0.36923043791328775,
|
| 163 |
+
"eval_dim_256_cosine_precision@1": 0.3418693982074264,
|
| 164 |
+
"eval_dim_256_cosine_precision@10": 0.30441741357234314,
|
| 165 |
+
"eval_dim_256_cosine_precision@3": 0.34165599658557405,
|
| 166 |
+
"eval_dim_256_cosine_precision@5": 0.3322663252240717,
|
| 167 |
+
"eval_dim_256_cosine_recall@1": 0.041410929155814194,
|
| 168 |
+
"eval_dim_256_cosine_recall@10": 0.2705196189189818,
|
| 169 |
+
"eval_dim_256_cosine_recall@3": 0.1212642412965687,
|
| 170 |
+
"eval_dim_256_cosine_recall@5": 0.18173918651563936,
|
| 171 |
+
"eval_dim_512_cosine_accuracy@1": 0.37708066581306016,
|
| 172 |
+
"eval_dim_512_cosine_accuracy@10": 0.4532650448143406,
|
| 173 |
+
"eval_dim_512_cosine_accuracy@3": 0.38092189500640206,
|
| 174 |
+
"eval_dim_512_cosine_accuracy@5": 0.4084507042253521,
|
| 175 |
+
"eval_dim_512_cosine_map@100": 0.4678017780580059,
|
| 176 |
+
"eval_dim_512_cosine_mrr@10": 0.3893670101416575,
|
| 177 |
+
"eval_dim_512_cosine_ndcg@10": 0.40127522003513455,
|
| 178 |
+
"eval_dim_512_cosine_precision@1": 0.37708066581306016,
|
| 179 |
+
"eval_dim_512_cosine_precision@10": 0.33156209987195906,
|
| 180 |
+
"eval_dim_512_cosine_precision@3": 0.37537345283824153,
|
| 181 |
+
"eval_dim_512_cosine_precision@5": 0.36402048655569774,
|
| 182 |
+
"eval_dim_512_cosine_recall@1": 0.04457309853297402,
|
| 183 |
+
"eval_dim_512_cosine_recall@10": 0.2883968018428671,
|
| 184 |
+
"eval_dim_512_cosine_recall@3": 0.13007205872054822,
|
| 185 |
+
"eval_dim_512_cosine_recall@5": 0.19449520589871025,
|
| 186 |
+
"eval_dim_64_cosine_accuracy@1": 0.26696542893725994,
|
| 187 |
+
"eval_dim_64_cosine_accuracy@10": 0.33098591549295775,
|
| 188 |
+
"eval_dim_64_cosine_accuracy@3": 0.27208706786171577,
|
| 189 |
+
"eval_dim_64_cosine_accuracy@5": 0.293213828425096,
|
| 190 |
+
"eval_dim_64_cosine_map@100": 0.34719730722747555,
|
| 191 |
+
"eval_dim_64_cosine_mrr@10": 0.2776957197731842,
|
| 192 |
+
"eval_dim_64_cosine_ndcg@10": 0.2881905192612941,
|
| 193 |
+
"eval_dim_64_cosine_precision@1": 0.26696542893725994,
|
| 194 |
+
"eval_dim_64_cosine_precision@10": 0.237708066581306,
|
| 195 |
+
"eval_dim_64_cosine_precision@3": 0.26717883055911223,
|
| 196 |
+
"eval_dim_64_cosine_precision@5": 0.2596670934699104,
|
| 197 |
+
"eval_dim_64_cosine_recall@1": 0.031692344067516816,
|
| 198 |
+
"eval_dim_64_cosine_recall@10": 0.21473974122936995,
|
| 199 |
+
"eval_dim_64_cosine_recall@3": 0.09327455064654774,
|
| 200 |
+
"eval_dim_64_cosine_recall@5": 0.14131510912407144,
|
| 201 |
+
"eval_dim_768_cosine_accuracy@1": 0.37451984635083224,
|
| 202 |
+
"eval_dim_768_cosine_accuracy@10": 0.4539052496798976,
|
| 203 |
+
"eval_dim_768_cosine_accuracy@3": 0.37900128040973113,
|
| 204 |
+
"eval_dim_768_cosine_accuracy@5": 0.40973111395646605,
|
| 205 |
+
"eval_dim_768_cosine_map@100": 0.4672061011440217,
|
| 206 |
+
"eval_dim_768_cosine_mrr@10": 0.38746671950897227,
|
| 207 |
+
"eval_dim_768_cosine_ndcg@10": 0.4004027303245026,
|
| 208 |
+
"eval_dim_768_cosine_precision@1": 0.37451984635083224,
|
| 209 |
+
"eval_dim_768_cosine_precision@10": 0.3318181818181818,
|
| 210 |
+
"eval_dim_768_cosine_precision@3": 0.3734528382415706,
|
| 211 |
+
"eval_dim_768_cosine_precision@5": 0.3632522407170295,
|
| 212 |
+
"eval_dim_768_cosine_recall@1": 0.04413921317349132,
|
| 213 |
+
"eval_dim_768_cosine_recall@10": 0.28955317519546525,
|
| 214 |
+
"eval_dim_768_cosine_recall@3": 0.12896663310051748,
|
| 215 |
+
"eval_dim_768_cosine_recall@5": 0.19376203165061448,
|
| 216 |
+
"eval_runtime": 98.4244,
|
| 217 |
+
"eval_samples_per_second": 0.0,
|
| 218 |
+
"eval_sequential_score": 0.2881905192612941,
|
| 219 |
+
"eval_steps_per_second": 0.0,
|
| 220 |
+
"step": 26
|
| 221 |
+
},
|
| 222 |
+
{
|
| 223 |
+
"epoch": 2.326530612244898,
|
| 224 |
+
"grad_norm": 305.66259765625,
|
| 225 |
+
"learning_rate": 1.9973569167005725e-05,
|
| 226 |
+
"loss": 14.5314,
|
| 227 |
+
"step": 30
|
| 228 |
+
},
|
| 229 |
+
{
|
| 230 |
+
"epoch": 3.0,
|
| 231 |
+
"eval_dim_1024_cosine_accuracy@1": 0.4180537772087068,
|
| 232 |
+
"eval_dim_1024_cosine_accuracy@10": 0.49039692701664533,
|
| 233 |
+
"eval_dim_1024_cosine_accuracy@3": 0.42189500640204863,
|
| 234 |
+
"eval_dim_1024_cosine_accuracy@5": 0.4500640204865557,
|
| 235 |
+
"eval_dim_1024_cosine_map@100": 0.506794523350519,
|
| 236 |
+
"eval_dim_1024_cosine_mrr@10": 0.42985717334308843,
|
| 237 |
+
"eval_dim_1024_cosine_ndcg@10": 0.44178501209869797,
|
| 238 |
+
"eval_dim_1024_cosine_precision@1": 0.4180537772087068,
|
| 239 |
+
"eval_dim_1024_cosine_precision@10": 0.36869398207426374,
|
| 240 |
+
"eval_dim_1024_cosine_precision@3": 0.4163465642338881,
|
| 241 |
+
"eval_dim_1024_cosine_precision@5": 0.4043533930857874,
|
| 242 |
+
"eval_dim_1024_cosine_recall@1": 0.04734422767263886,
|
| 243 |
+
"eval_dim_1024_cosine_recall@10": 0.308531274625124,
|
| 244 |
+
"eval_dim_1024_cosine_recall@3": 0.138064233626932,
|
| 245 |
+
"eval_dim_1024_cosine_recall@5": 0.2069980430010945,
|
| 246 |
+
"eval_dim_128_cosine_accuracy@1": 0.34699103713188223,
|
| 247 |
+
"eval_dim_128_cosine_accuracy@10": 0.4212548015364917,
|
| 248 |
+
"eval_dim_128_cosine_accuracy@3": 0.35147247119078107,
|
| 249 |
+
"eval_dim_128_cosine_accuracy@5": 0.37900128040973113,
|
| 250 |
+
"eval_dim_128_cosine_map@100": 0.4338211299784659,
|
| 251 |
+
"eval_dim_128_cosine_mrr@10": 0.35916305916305874,
|
| 252 |
+
"eval_dim_128_cosine_ndcg@10": 0.37139192897263235,
|
| 253 |
+
"eval_dim_128_cosine_precision@1": 0.34699103713188223,
|
| 254 |
+
"eval_dim_128_cosine_precision@10": 0.3042893725992318,
|
| 255 |
+
"eval_dim_128_cosine_precision@3": 0.34571062740076824,
|
| 256 |
+
"eval_dim_128_cosine_precision@5": 0.3352112676056338,
|
| 257 |
+
"eval_dim_128_cosine_recall@1": 0.04217848526747235,
|
| 258 |
+
"eval_dim_128_cosine_recall@10": 0.2706183968947745,
|
| 259 |
+
"eval_dim_128_cosine_recall@3": 0.12288848071178002,
|
| 260 |
+
"eval_dim_128_cosine_recall@5": 0.18344012521240954,
|
| 261 |
+
"eval_dim_256_cosine_accuracy@1": 0.38348271446862997,
|
| 262 |
+
"eval_dim_256_cosine_accuracy@10": 0.4551856594110115,
|
| 263 |
+
"eval_dim_256_cosine_accuracy@3": 0.3886043533930858,
|
| 264 |
+
"eval_dim_256_cosine_accuracy@5": 0.4206145966709347,
|
| 265 |
+
"eval_dim_256_cosine_map@100": 0.4709582085612654,
|
| 266 |
+
"eval_dim_256_cosine_mrr@10": 0.3957850639188662,
|
| 267 |
+
"eval_dim_256_cosine_ndcg@10": 0.4087462230477571,
|
| 268 |
+
"eval_dim_256_cosine_precision@1": 0.38348271446862997,
|
| 269 |
+
"eval_dim_256_cosine_precision@10": 0.33886043533930854,
|
| 270 |
+
"eval_dim_256_cosine_precision@3": 0.382202304737516,
|
| 271 |
+
"eval_dim_256_cosine_precision@5": 0.3718309859154929,
|
| 272 |
+
"eval_dim_256_cosine_recall@1": 0.04466034705404223,
|
| 273 |
+
"eval_dim_256_cosine_recall@10": 0.2892016292717267,
|
| 274 |
+
"eval_dim_256_cosine_recall@3": 0.1301795023253766,
|
| 275 |
+
"eval_dim_256_cosine_recall@5": 0.19500340584044382,
|
| 276 |
+
"eval_dim_512_cosine_accuracy@1": 0.4065300896286812,
|
| 277 |
+
"eval_dim_512_cosine_accuracy@10": 0.4814340588988476,
|
| 278 |
+
"eval_dim_512_cosine_accuracy@3": 0.41229193341869397,
|
| 279 |
+
"eval_dim_512_cosine_accuracy@5": 0.44494238156209986,
|
| 280 |
+
"eval_dim_512_cosine_map@100": 0.49555759572196095,
|
| 281 |
+
"eval_dim_512_cosine_mrr@10": 0.41950236774180394,
|
| 282 |
+
"eval_dim_512_cosine_ndcg@10": 0.4329095460408428,
|
| 283 |
+
"eval_dim_512_cosine_precision@1": 0.4065300896286812,
|
| 284 |
+
"eval_dim_512_cosine_precision@10": 0.3596030729833547,
|
| 285 |
+
"eval_dim_512_cosine_precision@3": 0.4054630815194195,
|
| 286 |
+
"eval_dim_512_cosine_precision@5": 0.3947503201024327,
|
| 287 |
+
"eval_dim_512_cosine_recall@1": 0.047372341735862133,
|
| 288 |
+
"eval_dim_512_cosine_recall@10": 0.3071623578952262,
|
| 289 |
+
"eval_dim_512_cosine_recall@3": 0.1383106496582531,
|
| 290 |
+
"eval_dim_512_cosine_recall@5": 0.20757258542171747,
|
| 291 |
+
"eval_dim_64_cosine_accuracy@1": 0.3207426376440461,
|
| 292 |
+
"eval_dim_64_cosine_accuracy@10": 0.3725992317541613,
|
| 293 |
+
"eval_dim_64_cosine_accuracy@3": 0.322663252240717,
|
| 294 |
+
"eval_dim_64_cosine_accuracy@5": 0.3405889884763124,
|
| 295 |
+
"eval_dim_64_cosine_map@100": 0.3933467041096336,
|
| 296 |
+
"eval_dim_64_cosine_mrr@10": 0.32884732638253733,
|
| 297 |
+
"eval_dim_64_cosine_ndcg@10": 0.3371953828075091,
|
| 298 |
+
"eval_dim_64_cosine_precision@1": 0.3207426376440461,
|
| 299 |
+
"eval_dim_64_cosine_precision@10": 0.2797055057618438,
|
| 300 |
+
"eval_dim_64_cosine_precision@3": 0.3188220230473751,
|
| 301 |
+
"eval_dim_64_cosine_precision@5": 0.3088348271446863,
|
| 302 |
+
"eval_dim_64_cosine_recall@1": 0.036318765090758674,
|
| 303 |
+
"eval_dim_64_cosine_recall@10": 0.23840960718091392,
|
| 304 |
+
"eval_dim_64_cosine_recall@3": 0.10562189493083342,
|
| 305 |
+
"eval_dim_64_cosine_recall@5": 0.15867125525021739,
|
| 306 |
+
"eval_dim_768_cosine_accuracy@1": 0.41037131882202305,
|
| 307 |
+
"eval_dim_768_cosine_accuracy@10": 0.4833546734955186,
|
| 308 |
+
"eval_dim_768_cosine_accuracy@3": 0.4142125480153649,
|
| 309 |
+
"eval_dim_768_cosine_accuracy@5": 0.44430217669654287,
|
| 310 |
+
"eval_dim_768_cosine_map@100": 0.500478306774528,
|
| 311 |
+
"eval_dim_768_cosine_mrr@10": 0.4224889742495374,
|
| 312 |
+
"eval_dim_768_cosine_ndcg@10": 0.4349862241563486,
|
| 313 |
+
"eval_dim_768_cosine_precision@1": 0.41037131882202305,
|
| 314 |
+
"eval_dim_768_cosine_precision@10": 0.36165172855313704,
|
| 315 |
+
"eval_dim_768_cosine_precision@3": 0.4086641058472044,
|
| 316 |
+
"eval_dim_768_cosine_precision@5": 0.3969270166453265,
|
| 317 |
+
"eval_dim_768_cosine_recall@1": 0.047186779325657804,
|
| 318 |
+
"eval_dim_768_cosine_recall@10": 0.30540044861465576,
|
| 319 |
+
"eval_dim_768_cosine_recall@3": 0.1375709294981283,
|
| 320 |
+
"eval_dim_768_cosine_recall@5": 0.20603724780478358,
|
| 321 |
+
"eval_runtime": 98.5908,
|
| 322 |
+
"eval_samples_per_second": 0.0,
|
| 323 |
+
"eval_sequential_score": 0.3371953828075091,
|
| 324 |
+
"eval_steps_per_second": 0.0,
|
| 325 |
+
"step": 39
|
| 326 |
+
},
|
| 327 |
+
{
|
| 328 |
+
"epoch": 3.0816326530612246,
|
| 329 |
+
"grad_norm": 255.65982055664062,
|
| 330 |
+
"learning_rate": 1.9762960071199334e-05,
|
| 331 |
+
"loss": 8.6778,
|
| 332 |
+
"step": 40
|
| 333 |
+
},
|
| 334 |
+
{
|
| 335 |
+
"epoch": 3.8979591836734695,
|
| 336 |
+
"grad_norm": 470.4803771972656,
|
| 337 |
+
"learning_rate": 1.9346189253489888e-05,
|
| 338 |
+
"loss": 6.0257,
|
| 339 |
+
"step": 50
|
| 340 |
+
},
|
| 341 |
+
{
|
| 342 |
+
"epoch": 4.0,
|
| 343 |
+
"eval_dim_1024_cosine_accuracy@1": 0.4046094750320102,
|
| 344 |
+
"eval_dim_1024_cosine_accuracy@10": 0.47823303457106275,
|
| 345 |
+
"eval_dim_1024_cosine_accuracy@3": 0.4090909090909091,
|
| 346 |
+
"eval_dim_1024_cosine_accuracy@5": 0.43918053777208704,
|
| 347 |
+
"eval_dim_1024_cosine_map@100": 0.490599623630225,
|
| 348 |
+
"eval_dim_1024_cosine_mrr@10": 0.4168417068064951,
|
| 349 |
+
"eval_dim_1024_cosine_ndcg@10": 0.42913551824501384,
|
| 350 |
+
"eval_dim_1024_cosine_precision@1": 0.4046094750320102,
|
| 351 |
+
"eval_dim_1024_cosine_precision@10": 0.3565941101152369,
|
| 352 |
+
"eval_dim_1024_cosine_precision@3": 0.40311566367904395,
|
| 353 |
+
"eval_dim_1024_cosine_precision@5": 0.39180537772087065,
|
| 354 |
+
"eval_dim_1024_cosine_recall@1": 0.04660606778759063,
|
| 355 |
+
"eval_dim_1024_cosine_recall@10": 0.3014663479400921,
|
| 356 |
+
"eval_dim_1024_cosine_recall@3": 0.13592596883673455,
|
| 357 |
+
"eval_dim_1024_cosine_recall@5": 0.20379253880710943,
|
| 358 |
+
"eval_dim_128_cosine_accuracy@1": 0.34314980793854033,
|
| 359 |
+
"eval_dim_128_cosine_accuracy@10": 0.4148527528809219,
|
| 360 |
+
"eval_dim_128_cosine_accuracy@3": 0.34763124199743917,
|
| 361 |
+
"eval_dim_128_cosine_accuracy@5": 0.37708066581306016,
|
| 362 |
+
"eval_dim_128_cosine_map@100": 0.4276696379169563,
|
| 363 |
+
"eval_dim_128_cosine_mrr@10": 0.35513180090644836,
|
| 364 |
+
"eval_dim_128_cosine_ndcg@10": 0.36765573601526275,
|
| 365 |
+
"eval_dim_128_cosine_precision@1": 0.34314980793854033,
|
| 366 |
+
"eval_dim_128_cosine_precision@10": 0.302752880921895,
|
| 367 |
+
"eval_dim_128_cosine_precision@3": 0.3418693982074264,
|
| 368 |
+
"eval_dim_128_cosine_precision@5": 0.3322663252240717,
|
| 369 |
+
"eval_dim_128_cosine_recall@1": 0.040652627677675406,
|
| 370 |
+
"eval_dim_128_cosine_recall@10": 0.26330336421247125,
|
| 371 |
+
"eval_dim_128_cosine_recall@3": 0.1184519992454523,
|
| 372 |
+
"eval_dim_128_cosine_recall@5": 0.1774839552040709,
|
| 373 |
+
"eval_dim_256_cosine_accuracy@1": 0.3738796414852753,
|
| 374 |
+
"eval_dim_256_cosine_accuracy@10": 0.44558258642765686,
|
| 375 |
+
"eval_dim_256_cosine_accuracy@3": 0.37772087067861715,
|
| 376 |
+
"eval_dim_256_cosine_accuracy@5": 0.40717029449423814,
|
| 377 |
+
"eval_dim_256_cosine_map@100": 0.45855798848430374,
|
| 378 |
+
"eval_dim_256_cosine_mrr@10": 0.38572571794402755,
|
| 379 |
+
"eval_dim_256_cosine_ndcg@10": 0.3980442434686935,
|
| 380 |
+
"eval_dim_256_cosine_precision@1": 0.3738796414852753,
|
| 381 |
+
"eval_dim_256_cosine_precision@10": 0.3297695262483995,
|
| 382 |
+
"eval_dim_256_cosine_precision@3": 0.37238583013230897,
|
| 383 |
+
"eval_dim_256_cosine_precision@5": 0.3615877080665813,
|
| 384 |
+
"eval_dim_256_cosine_recall@1": 0.043086085492826574,
|
| 385 |
+
"eval_dim_256_cosine_recall@10": 0.2792649180924836,
|
| 386 |
+
"eval_dim_256_cosine_recall@3": 0.125747799799009,
|
| 387 |
+
"eval_dim_256_cosine_recall@5": 0.18837022600852496,
|
| 388 |
+
"eval_dim_512_cosine_accuracy@1": 0.39884763124199746,
|
| 389 |
+
"eval_dim_512_cosine_accuracy@10": 0.47823303457106275,
|
| 390 |
+
"eval_dim_512_cosine_accuracy@3": 0.4052496798975672,
|
| 391 |
+
"eval_dim_512_cosine_accuracy@5": 0.44558258642765686,
|
| 392 |
+
"eval_dim_512_cosine_map@100": 0.4876319198894288,
|
| 393 |
+
"eval_dim_512_cosine_mrr@10": 0.41307745462675005,
|
| 394 |
+
"eval_dim_512_cosine_ndcg@10": 0.42824151108259556,
|
| 395 |
+
"eval_dim_512_cosine_precision@1": 0.39884763124199746,
|
| 396 |
+
"eval_dim_512_cosine_precision@10": 0.35793854033290645,
|
| 397 |
+
"eval_dim_512_cosine_precision@3": 0.3975672215108835,
|
| 398 |
+
"eval_dim_512_cosine_precision@5": 0.3888604353393086,
|
| 399 |
+
"eval_dim_512_cosine_recall@1": 0.04570727180608771,
|
| 400 |
+
"eval_dim_512_cosine_recall@10": 0.2993652309972795,
|
| 401 |
+
"eval_dim_512_cosine_recall@3": 0.13329368345632836,
|
| 402 |
+
"eval_dim_512_cosine_recall@5": 0.2006035854063678,
|
| 403 |
+
"eval_dim_64_cosine_accuracy@1": 0.3079385403329065,
|
| 404 |
+
"eval_dim_64_cosine_accuracy@10": 0.36555697823303457,
|
| 405 |
+
"eval_dim_64_cosine_accuracy@3": 0.31241997439180536,
|
| 406 |
+
"eval_dim_64_cosine_accuracy@5": 0.33290653008962867,
|
| 407 |
+
"eval_dim_64_cosine_map@100": 0.38184314430829974,
|
| 408 |
+
"eval_dim_64_cosine_mrr@10": 0.31748394406845065,
|
| 409 |
+
"eval_dim_64_cosine_ndcg@10": 0.3275369456141822,
|
| 410 |
+
"eval_dim_64_cosine_precision@1": 0.3079385403329065,
|
| 411 |
+
"eval_dim_64_cosine_precision@10": 0.27215108834827145,
|
| 412 |
+
"eval_dim_64_cosine_precision@3": 0.3070849338454972,
|
| 413 |
+
"eval_dim_64_cosine_precision@5": 0.29820742637644043,
|
| 414 |
+
"eval_dim_64_cosine_recall@1": 0.03504677697523653,
|
| 415 |
+
"eval_dim_64_cosine_recall@10": 0.23026653514933906,
|
| 416 |
+
"eval_dim_64_cosine_recall@3": 0.10211269541567973,
|
| 417 |
+
"eval_dim_64_cosine_recall@5": 0.15297976910096123,
|
| 418 |
+
"eval_dim_768_cosine_accuracy@1": 0.3994878361075544,
|
| 419 |
+
"eval_dim_768_cosine_accuracy@10": 0.4737516005121639,
|
| 420 |
+
"eval_dim_768_cosine_accuracy@3": 0.4046094750320102,
|
| 421 |
+
"eval_dim_768_cosine_accuracy@5": 0.4359795134443022,
|
| 422 |
+
"eval_dim_768_cosine_map@100": 0.48680507317454147,
|
| 423 |
+
"eval_dim_768_cosine_mrr@10": 0.41201019246793846,
|
| 424 |
+
"eval_dim_768_cosine_ndcg@10": 0.4244383191680289,
|
| 425 |
+
"eval_dim_768_cosine_precision@1": 0.3994878361075544,
|
| 426 |
+
"eval_dim_768_cosine_precision@10": 0.352752880921895,
|
| 427 |
+
"eval_dim_768_cosine_precision@3": 0.39820742637644047,
|
| 428 |
+
"eval_dim_768_cosine_precision@5": 0.3868117797695263,
|
| 429 |
+
"eval_dim_768_cosine_recall@1": 0.046132270416131195,
|
| 430 |
+
"eval_dim_768_cosine_recall@10": 0.29681183299989666,
|
| 431 |
+
"eval_dim_768_cosine_recall@3": 0.13453018491697852,
|
| 432 |
+
"eval_dim_768_cosine_recall@5": 0.20078864250336506,
|
| 433 |
+
"eval_runtime": 98.6751,
|
| 434 |
+
"eval_samples_per_second": 0.0,
|
| 435 |
+
"eval_sequential_score": 0.3275369456141822,
|
| 436 |
+
"eval_steps_per_second": 0.0,
|
| 437 |
+
"step": 52
|
| 438 |
+
},
|
| 439 |
+
{
|
| 440 |
+
"epoch": 4.653061224489796,
|
| 441 |
+
"grad_norm": 311.2161865234375,
|
| 442 |
+
"learning_rate": 1.8732057547721962e-05,
|
| 443 |
+
"loss": 3.3524,
|
| 444 |
+
"step": 60
|
| 445 |
+
},
|
| 446 |
+
{
|
| 447 |
+
"epoch": 5.0,
|
| 448 |
+
"eval_dim_1024_cosine_accuracy@1": 0.3994878361075544,
|
| 449 |
+
"eval_dim_1024_cosine_accuracy@10": 0.4814340588988476,
|
| 450 |
+
"eval_dim_1024_cosine_accuracy@3": 0.40973111395646605,
|
| 451 |
+
"eval_dim_1024_cosine_accuracy@5": 0.44238156209987195,
|
| 452 |
+
"eval_dim_1024_cosine_map@100": 0.4960353530991054,
|
| 453 |
+
"eval_dim_1024_cosine_mrr@10": 0.41413607910086736,
|
| 454 |
+
"eval_dim_1024_cosine_ndcg@10": 0.42824330702763147,
|
| 455 |
+
"eval_dim_1024_cosine_precision@1": 0.3994878361075544,
|
| 456 |
+
"eval_dim_1024_cosine_precision@10": 0.3562099871959027,
|
| 457 |
+
"eval_dim_1024_cosine_precision@3": 0.3994878361075544,
|
| 458 |
+
"eval_dim_1024_cosine_precision@5": 0.3897567221510884,
|
| 459 |
+
"eval_dim_1024_cosine_recall@1": 0.046427253250942845,
|
| 460 |
+
"eval_dim_1024_cosine_recall@10": 0.30156152834977973,
|
| 461 |
+
"eval_dim_1024_cosine_recall@3": 0.1357642561296911,
|
| 462 |
+
"eval_dim_1024_cosine_recall@5": 0.20380194680388578,
|
| 463 |
+
"eval_dim_128_cosine_accuracy@1": 0.34699103713188223,
|
| 464 |
+
"eval_dim_128_cosine_accuracy@10": 0.41613316261203587,
|
| 465 |
+
"eval_dim_128_cosine_accuracy@3": 0.3495518565941101,
|
| 466 |
+
"eval_dim_128_cosine_accuracy@5": 0.37900128040973113,
|
| 467 |
+
"eval_dim_128_cosine_map@100": 0.4291315309956839,
|
| 468 |
+
"eval_dim_128_cosine_mrr@10": 0.35818293599983697,
|
| 469 |
+
"eval_dim_128_cosine_ndcg@10": 0.36965214083548276,
|
| 470 |
+
"eval_dim_128_cosine_precision@1": 0.34699103713188223,
|
| 471 |
+
"eval_dim_128_cosine_precision@10": 0.30550576184379,
|
| 472 |
+
"eval_dim_128_cosine_precision@3": 0.34528382415706355,
|
| 473 |
+
"eval_dim_128_cosine_precision@5": 0.33533930857874517,
|
| 474 |
+
"eval_dim_128_cosine_recall@1": 0.04023580723646711,
|
| 475 |
+
"eval_dim_128_cosine_recall@10": 0.2604238007608957,
|
| 476 |
+
"eval_dim_128_cosine_recall@3": 0.11713599313797275,
|
| 477 |
+
"eval_dim_128_cosine_recall@5": 0.17553870970060761,
|
| 478 |
+
"eval_dim_256_cosine_accuracy@1": 0.3764404609475032,
|
| 479 |
+
"eval_dim_256_cosine_accuracy@10": 0.4532650448143406,
|
| 480 |
+
"eval_dim_256_cosine_accuracy@3": 0.382202304737516,
|
| 481 |
+
"eval_dim_256_cosine_accuracy@5": 0.41037131882202305,
|
| 482 |
+
"eval_dim_256_cosine_map@100": 0.46504361814337597,
|
| 483 |
+
"eval_dim_256_cosine_mrr@10": 0.3891762189297396,
|
| 484 |
+
"eval_dim_256_cosine_ndcg@10": 0.40161260018012396,
|
| 485 |
+
"eval_dim_256_cosine_precision@1": 0.3764404609475032,
|
| 486 |
+
"eval_dim_256_cosine_precision@10": 0.3325864276568502,
|
| 487 |
+
"eval_dim_256_cosine_precision@3": 0.3758002560819462,
|
| 488 |
+
"eval_dim_256_cosine_precision@5": 0.365044814340589,
|
| 489 |
+
"eval_dim_256_cosine_recall@1": 0.04345597060609991,
|
| 490 |
+
"eval_dim_256_cosine_recall@10": 0.28270389457679657,
|
| 491 |
+
"eval_dim_256_cosine_recall@3": 0.12739095919345977,
|
| 492 |
+
"eval_dim_256_cosine_recall@5": 0.19108724610052447,
|
| 493 |
+
"eval_dim_512_cosine_accuracy@1": 0.39436619718309857,
|
| 494 |
+
"eval_dim_512_cosine_accuracy@10": 0.471190781049936,
|
| 495 |
+
"eval_dim_512_cosine_accuracy@3": 0.4033290653008963,
|
| 496 |
+
"eval_dim_512_cosine_accuracy@5": 0.4327784891165173,
|
| 497 |
+
"eval_dim_512_cosine_map@100": 0.48375387985213597,
|
| 498 |
+
"eval_dim_512_cosine_mrr@10": 0.4078435258012718,
|
| 499 |
+
"eval_dim_512_cosine_ndcg@10": 0.4209567413561994,
|
| 500 |
+
"eval_dim_512_cosine_precision@1": 0.39436619718309857,
|
| 501 |
+
"eval_dim_512_cosine_precision@10": 0.348719590268886,
|
| 502 |
+
"eval_dim_512_cosine_precision@3": 0.39436619718309857,
|
| 503 |
+
"eval_dim_512_cosine_precision@5": 0.38373879641485276,
|
| 504 |
+
"eval_dim_512_cosine_recall@1": 0.046001271870766657,
|
| 505 |
+
"eval_dim_512_cosine_recall@10": 0.29407016086576515,
|
| 506 |
+
"eval_dim_512_cosine_recall@3": 0.13434589294029278,
|
| 507 |
+
"eval_dim_512_cosine_recall@5": 0.2006372923557733,
|
| 508 |
+
"eval_dim_64_cosine_accuracy@1": 0.293854033290653,
|
| 509 |
+
"eval_dim_64_cosine_accuracy@10": 0.3591549295774648,
|
| 510 |
+
"eval_dim_64_cosine_accuracy@3": 0.30153649167733676,
|
| 511 |
+
"eval_dim_64_cosine_accuracy@5": 0.32714468629961585,
|
| 512 |
+
"eval_dim_64_cosine_map@100": 0.3744361264744976,
|
| 513 |
+
"eval_dim_64_cosine_mrr@10": 0.30537518037517997,
|
| 514 |
+
"eval_dim_64_cosine_ndcg@10": 0.3185372635267884,
|
| 515 |
+
"eval_dim_64_cosine_precision@1": 0.293854033290653,
|
| 516 |
+
"eval_dim_64_cosine_precision@10": 0.2681177976952625,
|
| 517 |
+
"eval_dim_64_cosine_precision@3": 0.29449423815621,
|
| 518 |
+
"eval_dim_64_cosine_precision@5": 0.288348271446863,
|
| 519 |
+
"eval_dim_64_cosine_recall@1": 0.03212717718240556,
|
| 520 |
+
"eval_dim_64_cosine_recall@10": 0.221706864386852,
|
| 521 |
+
"eval_dim_64_cosine_recall@3": 0.0944529143897263,
|
| 522 |
+
"eval_dim_64_cosine_recall@5": 0.14311801944731944,
|
| 523 |
+
"eval_dim_768_cosine_accuracy@1": 0.3892445582586428,
|
| 524 |
+
"eval_dim_768_cosine_accuracy@10": 0.47823303457106275,
|
| 525 |
+
"eval_dim_768_cosine_accuracy@3": 0.3994878361075544,
|
| 526 |
+
"eval_dim_768_cosine_accuracy@5": 0.43661971830985913,
|
| 527 |
+
"eval_dim_768_cosine_map@100": 0.48796722771226453,
|
| 528 |
+
"eval_dim_768_cosine_mrr@10": 0.4050812450460335,
|
| 529 |
+
"eval_dim_768_cosine_ndcg@10": 0.4211330537467249,
|
| 530 |
+
"eval_dim_768_cosine_precision@1": 0.3892445582586428,
|
| 531 |
+
"eval_dim_768_cosine_precision@10": 0.35147247119078107,
|
| 532 |
+
"eval_dim_768_cosine_precision@3": 0.38988476312419973,
|
| 533 |
+
"eval_dim_768_cosine_precision@5": 0.38156209987195905,
|
| 534 |
+
"eval_dim_768_cosine_recall@1": 0.045140545184589424,
|
| 535 |
+
"eval_dim_768_cosine_recall@10": 0.29727932103829957,
|
| 536 |
+
"eval_dim_768_cosine_recall@3": 0.13218231618768836,
|
| 537 |
+
"eval_dim_768_cosine_recall@5": 0.19882192649305613,
|
| 538 |
+
"eval_runtime": 98.5973,
|
| 539 |
+
"eval_samples_per_second": 0.0,
|
| 540 |
+
"eval_sequential_score": 0.3185372635267884,
|
| 541 |
+
"eval_steps_per_second": 0.0,
|
| 542 |
+
"step": 65
|
| 543 |
+
}
|
| 544 |
+
],
|
| 545 |
+
"logging_steps": 10,
|
| 546 |
+
"max_steps": 240,
|
| 547 |
+
"num_input_tokens_seen": 0,
|
| 548 |
+
"num_train_epochs": 20,
|
| 549 |
+
"save_steps": 500,
|
| 550 |
+
"stateful_callbacks": {
|
| 551 |
+
"EarlyStoppingCallback": {
|
| 552 |
+
"args": {
|
| 553 |
+
"early_stopping_patience": 2,
|
| 554 |
+
"early_stopping_threshold": 0.0
|
| 555 |
+
},
|
| 556 |
+
"attributes": {
|
| 557 |
+
"early_stopping_patience_counter": 2
|
| 558 |
+
}
|
| 559 |
+
},
|
| 560 |
+
"TrainerControl": {
|
| 561 |
+
"args": {
|
| 562 |
+
"should_epoch_stop": false,
|
| 563 |
+
"should_evaluate": false,
|
| 564 |
+
"should_log": false,
|
| 565 |
+
"should_save": true,
|
| 566 |
+
"should_training_stop": true
|
| 567 |
+
},
|
| 568 |
+
"attributes": {}
|
| 569 |
+
}
|
| 570 |
+
},
|
| 571 |
+
"total_flos": 0.0,
|
| 572 |
+
"train_batch_size": 8,
|
| 573 |
+
"trial_name": null,
|
| 574 |
+
"trial_params": null
|
| 575 |
+
}
|
checkpoint-65/training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dd906d94b017c1a7fa871b608776d19ecf4218c10c253401fe78ba8ce84435be
|
| 3 |
+
size 6097
|
eval/Information-Retrieval_evaluation_dim_1024_results.csv
CHANGED
|
@@ -1,7 +1,6 @@
|
|
| 1 |
epoch,steps,cosine-Accuracy@1,cosine-Accuracy@3,cosine-Accuracy@5,cosine-Accuracy@10,cosine-Precision@1,cosine-Recall@1,cosine-Precision@3,cosine-Recall@3,cosine-Precision@5,cosine-Recall@5,cosine-Precision@10,cosine-Recall@10,cosine-MRR@10,cosine-NDCG@10,cosine-MAP@100
|
| 2 |
-
1.0,
|
| 3 |
-
2.0,
|
| 4 |
-
3.0,
|
| 5 |
-
|
| 6 |
-
|
| 7 |
-
3.0,294,0.3053777208706786,0.31434058898847633,0.34635083226632524,0.3854033290653009,0.3053777208706786,0.03802085156159601,0.30644472897994024,0.11197884027712995,0.2998719590268886,0.16921874866295042,0.27516005121638926,0.2530788160980187,0.31961389549417674,0.3342308256907798,0.3945564342654779
|
|
|
|
| 1 |
epoch,steps,cosine-Accuracy@1,cosine-Accuracy@3,cosine-Accuracy@5,cosine-Accuracy@10,cosine-Precision@1,cosine-Recall@1,cosine-Precision@3,cosine-Recall@3,cosine-Precision@5,cosine-Recall@5,cosine-Precision@10,cosine-Recall@10,cosine-MRR@10,cosine-NDCG@10,cosine-MAP@100
|
| 2 |
+
1.0,13,0.42509603072983354,0.43085787451984636,0.46030729833546735,0.49295774647887325,0.42509603072983354,0.04813624827530403,0.42402902262057185,0.1404092551990217,0.4133162612035851,0.21147403835662126,0.376056338028169,0.3150476790176975,0.4369535394183281,0.4493804868009024,0.508986346237021
|
| 3 |
+
2.0,26,0.3854033290653009,0.3886043533930858,0.41101152368758004,0.45454545454545453,0.3854033290653009,0.0451686782205082,0.3839095177123346,0.13200270380544088,0.3713188220230474,0.19735476247586825,0.3357874519846351,0.2918225395020212,0.39624870434729537,0.4065329035406967,0.47259820099791205
|
| 4 |
+
3.0,39,0.4180537772087068,0.42189500640204863,0.4500640204865557,0.49039692701664533,0.4180537772087068,0.04734422767263886,0.4163465642338881,0.138064233626932,0.4043533930857874,0.2069980430010945,0.36869398207426374,0.308531274625124,0.42985717334308843,0.44178501209869797,0.506794523350519
|
| 5 |
+
4.0,52,0.4046094750320102,0.4090909090909091,0.43918053777208704,0.47823303457106275,0.4046094750320102,0.04660606778759063,0.40311566367904395,0.13592596883673455,0.39180537772087065,0.20379253880710943,0.3565941101152369,0.3014663479400921,0.4168417068064951,0.42913551824501384,0.490599623630225
|
| 6 |
+
5.0,65,0.3994878361075544,0.40973111395646605,0.44238156209987195,0.4814340588988476,0.3994878361075544,0.046427253250942845,0.3994878361075544,0.1357642561296911,0.3897567221510884,0.20380194680388578,0.3562099871959027,0.30156152834977973,0.41413607910086736,0.42824330702763147,0.4960353530991054
|
|
|