IoannisKat1 committed on
Commit
42557c6
·
verified ·
1 Parent(s): 807a21f

Add finetuned model

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +3 -0
  2. checkpoint-39/1_Pooling/config.json +10 -0
  3. checkpoint-39/README.md +1637 -0
  4. checkpoint-39/config.json +27 -0
  5. checkpoint-39/config_sentence_transformers.json +14 -0
  6. checkpoint-39/model.safetensors +3 -0
  7. checkpoint-39/modules.json +20 -0
  8. checkpoint-39/optimizer.pt +3 -0
  9. checkpoint-39/rng_state.pth +3 -0
  10. checkpoint-39/scheduler.pt +3 -0
  11. checkpoint-39/sentence_bert_config.json +4 -0
  12. checkpoint-39/sentencepiece.bpe.model +3 -0
  13. checkpoint-39/special_tokens_map.json +51 -0
  14. checkpoint-39/tokenizer.json +3 -0
  15. checkpoint-39/tokenizer_config.json +55 -0
  16. checkpoint-39/trainer_state.json +358 -0
  17. checkpoint-39/training_args.bin +3 -0
  18. checkpoint-52/1_Pooling/config.json +10 -0
  19. checkpoint-52/README.md +1640 -0
  20. checkpoint-52/config.json +27 -0
  21. checkpoint-52/config_sentence_transformers.json +14 -0
  22. checkpoint-52/model.safetensors +3 -0
  23. checkpoint-52/modules.json +20 -0
  24. checkpoint-52/optimizer.pt +3 -0
  25. checkpoint-52/rng_state.pth +3 -0
  26. checkpoint-52/scheduler.pt +3 -0
  27. checkpoint-52/sentence_bert_config.json +4 -0
  28. checkpoint-52/sentencepiece.bpe.model +3 -0
  29. checkpoint-52/special_tokens_map.json +51 -0
  30. checkpoint-52/tokenizer.json +3 -0
  31. checkpoint-52/tokenizer_config.json +55 -0
  32. checkpoint-52/trainer_state.json +470 -0
  33. checkpoint-52/training_args.bin +3 -0
  34. checkpoint-65/1_Pooling/config.json +10 -0
  35. checkpoint-65/README.md +1642 -0
  36. checkpoint-65/config.json +27 -0
  37. checkpoint-65/config_sentence_transformers.json +14 -0
  38. checkpoint-65/model.safetensors +3 -0
  39. checkpoint-65/modules.json +20 -0
  40. checkpoint-65/optimizer.pt +3 -0
  41. checkpoint-65/rng_state.pth +3 -0
  42. checkpoint-65/scheduler.pt +3 -0
  43. checkpoint-65/sentence_bert_config.json +4 -0
  44. checkpoint-65/sentencepiece.bpe.model +3 -0
  45. checkpoint-65/special_tokens_map.json +51 -0
  46. checkpoint-65/tokenizer.json +3 -0
  47. checkpoint-65/tokenizer_config.json +55 -0
  48. checkpoint-65/trainer_state.json +575 -0
  49. checkpoint-65/training_args.bin +3 -0
  50. eval/Information-Retrieval_evaluation_dim_1024_results.csv +5 -6
.gitattributes CHANGED
@@ -37,3 +37,6 @@ checkpoint-196/tokenizer.json filter=lfs diff=lfs merge=lfs -text
37
  checkpoint-294/tokenizer.json filter=lfs diff=lfs merge=lfs -text
38
  checkpoint-98/tokenizer.json filter=lfs diff=lfs merge=lfs -text
39
  tokenizer.json filter=lfs diff=lfs merge=lfs -text
 
 
 
 
37
  checkpoint-294/tokenizer.json filter=lfs diff=lfs merge=lfs -text
38
  checkpoint-98/tokenizer.json filter=lfs diff=lfs merge=lfs -text
39
  tokenizer.json filter=lfs diff=lfs merge=lfs -text
40
+ checkpoint-39/tokenizer.json filter=lfs diff=lfs merge=lfs -text
41
+ checkpoint-52/tokenizer.json filter=lfs diff=lfs merge=lfs -text
42
+ checkpoint-65/tokenizer.json filter=lfs diff=lfs merge=lfs -text
checkpoint-39/1_Pooling/config.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "word_embedding_dimension": 1024,
3
+ "pooling_mode_cls_token": false,
4
+ "pooling_mode_mean_tokens": true,
5
+ "pooling_mode_max_tokens": false,
6
+ "pooling_mode_mean_sqrt_len_tokens": false,
7
+ "pooling_mode_weightedmean_tokens": false,
8
+ "pooling_mode_lasttoken": false,
9
+ "include_prompt": true
10
+ }
checkpoint-39/README.md ADDED
@@ -0,0 +1,1637 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ language:
3
+ - en
4
+ license: apache-2.0
5
+ tags:
6
+ - sentence-transformers
7
+ - sentence-similarity
8
+ - feature-extraction
9
+ - dense
10
+ - generated_from_trainer
11
+ - dataset_size:391
12
+ - loss:MatryoshkaLoss
13
+ - loss:MultipleNegativesRankingLoss
14
+ base_model: intfloat/multilingual-e5-large
15
+ widget:
16
+ - source_sentence: What is the responsibility of assisting and advising the data subjects
17
+ in exercising their rights?
18
+ sentences:
19
+ - '1.Personal data shall be: (a) processed lawfully, fairly and in a transparent
20
+ manner in relation to the data subject (‘lawfulness, fairness and transparency’);
21
+ (b) collected for specified, explicit and legitimate purposes and not further
22
+ processed in a manner that is incompatible with those purposes; further processing
23
+ for archiving purposes in the public interest, scientific or historical research
24
+ purposes or statistical purposes shall, in accordance with Article 89(1), not
25
+ be considered to be incompatible with the initial purposes (‘purpose limitation’);
26
+ (c) adequate, relevant and limited to what is necessary in relation to the purposes
27
+ for which they are processed (‘data minimisation’); (d) accurate and, where necessary,
28
+ kept up to date; every reasonable step must be taken to ensure that personal data
29
+ that are inaccurate, having regard to the purposes for which they are processed,
30
+ are erased or rectified without delay (‘accuracy’); 4.5.2016 L 119/35 (1) Directive
31
+ (EU) 2015/1535 of the European Parliament and of the Council of 9 September 2015
32
+ laying down a procedure for the provision of information in the field of technical
33
+ regulations and of rules on Information Society services (OJ L 241, 17.9.2015,
34
+ p. 1). (e) kept in a form which permits identification of data subjects for no
35
+ longer than is necessary for the purposes for which the personal data are processed;
36
+ personal data may be stored for longer periods insofar as the personal data will
37
+ be processed solely for archiving purposes in the public interest, scientific
38
+ or historical research purposes or statistical purposes in accordance with Article
39
+ 89(1) subject to implementation of the appropriate technical and organisational
40
+ measures required by this Regulation in order to safeguard the rights and freedoms
41
+ of the data subject (‘storage limitation’); (f) processed in a manner that ensures
42
+ appropriate security of the personal data, including protection against unauthorised
43
+ or unlawful processing and against accidental loss, destruction or damage, using
44
+ appropriate technical or organisational measures (‘integrity and confidentiality’).
45
+
46
+ 2.The controller shall be responsible for, and be able to demonstrate compliance
47
+ with, paragraph 1 (‘accountability’).'
48
+ - '1.A transfer of personal data to a third country or an international organisation
49
+ may take place where the Commission has decided that the third country, a territory
50
+ or one or more specified sectors within that third country, or the international
51
+ organisation in question ensures an adequate level of protection. Such a transfer
52
+ shall not require any specific authorisation.
53
+
54
+ 2.When assessing the adequacy of the level of protection, the Commission shall,
55
+ in particular, take account of the following elements: (a) the rule of law, respect
56
+ for human rights and fundamental freedoms, relevant legislation, both general
57
+ and sectoral, including concerning public security, defence, national security
58
+ and criminal law and the access of public authorities to personal data, as well
59
+ as the implementation of such legislation, data protection rules, professional
60
+ rules and security measures, including rules for the onward transfer of personal
61
+ data to another third country or international organisation which are complied
62
+ with in that country or international organisation, case-law, as well as effective
63
+ and enforceable data subject rights and effective administrative and judicial
64
+ redress for the data subjects whose personal data are being transferred; (b) the
65
+ existence and effective functioning of one or more independent supervisory authorities
66
+ in the third country or to which an international organisation is subject, with
67
+ responsibility for ensuring and enforcing compliance with the data protection
68
+ rules, including adequate enforcement powers, for assisting and advising the data
69
+ subjects in exercising their rights and for cooperation with the supervisory authorities
70
+ of the Member States; and (c) the international commitments the third country
71
+ or international organisation concerned has entered into, or other obligations
72
+ arising from legally binding conventions or instruments as well as from its participation
73
+ in multilateral or regional systems, in particular in relation to the protection
74
+ of personal data.
75
+
76
+ 3.The Commission, after assessing the adequacy of the level of protection, may
77
+ decide, by means of implementing act, that a third country, a territory or one
78
+ or more specified sectors within a third country, or an international organisation
79
+ ensures an adequate level of protection within the meaning of paragraph 2 of this
80
+ Article. The implementing act shall provide for a mechanism for a periodic review,
81
+ at least every four years, which shall take into account all relevant developments
82
+ in the third country or international organisation. The implementing act shall
83
+ specify its territorial and sectoral application and, where applicable, identify
84
+ the supervisory authority or authorities referred to in point (b) of paragraph
85
+ 2 of this Article. The implementing act shall be adopted in accordance with the
86
+ examination procedure referred to in Article 93(2).
87
+
88
+ 4.The Commission shall, on an ongoing basis, monitor developments in third countries
89
+ and international organisations that could affect the functioning of decisions
90
+ adopted pursuant to paragraph 3 of this Article and decisions adopted on the basis
91
+ of Article 25(6) of Directive 95/46/EC.
92
+
93
+ 5.The Commission shall, where available information reveals, in particular following
94
+ the review referred to in paragraph 3 of this Article, that a third country, a
95
+ territory or one or more specified sectors within a third country, or an international
96
+ organisation no longer ensures an adequate level of protection within the meaning
97
+ of paragraph 2 of this Article, to the extent necessary, repeal, amend or suspend
98
+ the decision referred to in paragraph 3 of this Article by means of implementing
99
+ acts without retro-active effect. Those implementing acts shall be adopted in
100
+ accordance with the examination procedure referred to in Article 93(2). On duly
101
+ justified imperative grounds of urgency, the Commission shall adopt immediately
102
+ applicable implementing acts in accordance with the procedure referred to in Article
103
+ 93(3).
104
+
105
+ 6.The Commission shall enter into consultations with the third country or international
106
+ organisation with a view to remedying the situation giving rise to the decision
107
+ made pursuant to paragraph 5.
108
+
109
+ 7.A decision pursuant to paragraph 5 of this Article is without prejudice to transfers
110
+ of personal data to the third country, a territory or one or more specified sectors
111
+ within that third country, or the international organisation in question pursuant
112
+ to Articles 46 to 49.
113
+
114
+ 8.The Commission shall publish in the Official Journal of the European Union and
115
+ on its website a list of the third countries, territories and specified sectors
116
+ within a third country and international organisations for which it has decided
117
+ that an adequate level of protection is or is no longer ensured.
118
+
119
+ 9.Decisions adopted by the Commission on the basis of Article 25(6) of Directive
120
+ 95/46/EC shall remain in force until amended, replaced or repealed by a Commission
121
+ Decision adopted in accordance with paragraph 3 or 5 of this Article.'
122
+ - The legal systems of Denmark and Estonia do not allow for administrative fines
123
+ as set out in this Regulation. The rules on administrative fines may be applied
124
+ in such a manner that in Denmark the fine is imposed by competent national courts
125
+ as a criminal penalty and in Estonia the fine is imposed by the supervisory authority
126
+ in the framework of a misdemeanour procedure, provided that such an application
127
+ of the rules in those Member States has an equivalent effect to administrative
128
+ fines imposed by supervisory authorities. Therefore the competent national courts
129
+ should take into account the recommendation by the supervisory authority initiating
130
+ the fine. In any event, the fines imposed should be effective, proportionate and
131
+ dissuasive.
132
+ - source_sentence: Is the fine mandatory for the described offense?
133
+ sentences:
134
+ - "1.Each supervisory authority shall ensure that the imposition of administrative\
135
+ \ fines pursuant to this Article in respect of infringements of this Regulation\
136
+ \ referred to in paragraphs 4, 5 and 6 shall in each individual case be effective,\
137
+ \ proportionate and dissuasive.\n2.Administrative fines shall, depending on the\
138
+ \ circumstances of each individual case, be imposed in addition to, or instead\
139
+ \ of, measures referred to in points (a) to (h) and (j) of Article 58(2). When\
140
+ \ deciding whether to impose an administrative fine and deciding on the amount\
141
+ \ of the administrative fine in each individual case due regard shall be given\
142
+ \ to the following: (a) the nature, gravity and duration of the infringement\
143
+ \ taking into account the nature scope or purpose of the processing concerned\
144
+ \ as well as the number of data subjects affected and the level of damage suffered\
145
+ \ by them; (b) the intentional or negligent character of the infringement; (c)\
146
+ \ any action taken by the controller or processor to mitigate the damage suffered\
147
+ \ by data subjects; (d) the degree of responsibility of the controller or processor\
148
+ \ taking into account technical and organisational measures implemented by them\
149
+ \ pursuant to Articles 25 and 32; (e) any relevant previous infringements by\
150
+ \ the controller or processor; (f) the degree of cooperation with the supervisory\
151
+ \ authority, in order to remedy the infringement and mitigate the possible adverse\
152
+ \ effects of the infringement; (g) the categories of personal data affected by\
153
+ \ the infringement; (h) the manner in which the infringement became known to\
154
+ \ the supervisory authority, in particular whether, and if so to what extent,\
155
+ \ the controller or processor notified the infringement; (i) where measures referred\
156
+ \ to in Article 58(2) have previously been ordered against the controller or processor\
157
+ \ concerned with regard to the same subject-matter, compliance with those measures;\
158
+ \ (j) adherence to approved codes of conduct pursuant to Article 40 or approved\
159
+ \ certification mechanisms pursuant to Article 42; and (k) any other aggravating\
160
+ \ or mitigating factor applicable to the circumstances of the case, such as financial\
161
+ \ benefits gained, or losses avoided, directly or indirectly, from the infringement.\n\
162
+ 3.If a controller or processor intentionally or negligently, for the same or linked\
163
+ \ processing operations, infringes several provisions of this Regulation, the\
164
+ \ total amount of the administrative fine shall not exceed the amount specified\
165
+ \ for the gravest infringement.\n4.Infringements of the following provisions shall,\
166
+ \ in accordance with paragraph 2, be subject to administrative fines up to 10\
167
+ \ 000 000 EUR, or in the case of an undertaking, up to 2 % of the total worldwide\
168
+ \ annual turnover of the preceding financial year, whichever is higher: (a) the\
169
+ \ obligations of the controller and the processor pursuant to Articles 8, 11,\
170
+ \ 25 to 39 and 42 and 43; (b) the obligations of the certification body pursuant\
171
+ \ to Articles 42 and 43; (c) the obligations of the monitoring body pursuant\
172
+ \ to Article 41(4). 4.5.2016 L 119/82 \n5.Infringements of the following provisions\
173
+ \ shall, in accordance with paragraph 2, be subject to administrative fines up\
174
+ \ to 20 000 000 EUR, or in the case of an undertaking, up to 4 % of the total\
175
+ \ worldwide annual turnover of the preceding financial year, whichever is higher:\
176
+ \ (a) the basic principles for processing, including conditions for consent,\
177
+ \ pursuant to Articles 5, 6, 7 and 9; (b) the data subjects' rights pursuant\
178
+ \ to Articles 12 to 22; (c) the transfers of personal data to a recipient in\
179
+ \ a third country or an international organisation pursuant to Articles 44 to\
180
+ \ 49; (d) any obligations pursuant to Member State law adopted under Chapter\
181
+ \ IX; (e) non-compliance with an order or a temporary or definitive limitation\
182
+ \ on processing or the suspension of data flows by the supervisory authority pursuant\
183
+ \ to Article 58(2) or failure to provide access in violation of Article 58(1).\n\
184
+ 6.Non-compliance with an order by the supervisory authority as referred to in\
185
+ \ Article 58(2) shall, in accordance with paragraph 2 of this Article, be subject\
186
+ \ to administrative fines up to 20 000 000 EUR, or in the case of an undertaking,\
187
+ \ up to 4 % of the total worldwide annual turnover of the preceding financial\
188
+ \ year, whichever is higher.\n7.Without prejudice to the corrective powers of\
189
+ \ supervisory authorities pursuant to Article 58(2), each Member State may lay\
190
+ \ down the rules on whether and to what extent administrative fines may be imposed\
191
+ \ on public authorities and bodies established in that Member State.\n8.The exercise\
192
+ \ by the supervisory authority of its powers under this Article shall be subject\
193
+ \ to appropriate procedural safeguards in accordance with Union and Member State\
194
+ \ law, including effective judicial remedy and due process.\n9.Where the legal\
195
+ \ system of the Member State does not provide for administrative fines, this Article\
196
+ \ may be applied in such a manner that the fine is initiated by the competent\
197
+ \ supervisory authority and imposed by competent national courts, while ensuring\
198
+ \ that those legal remedies are effective and have an equivalent effect to the\
199
+ \ administrative fines imposed by supervisory authorities. In any event, the fines\
200
+ \ imposed shall be effective, proportionate and dissuasive. Those Member States\
201
+ \ shall notify to the Commission the provisions of their laws which they adopt\
202
+ \ pursuant to this paragraph by 25 May 2018 and, without delay, any subsequent\
203
+ \ amendment law or amendment affecting them."
204
+ - "Court (Civil/Criminal): Criminal \nProvisions: Article 386 of the Penal Code\
205
+ \ \nTime of commission of the act: \nResult (innocent, guilty): \nReasoning:\
206
+ \ Conviction for computer fraud committed repeatedly and professionally with a\
207
+ \ total benefit and damage exceeding €30,000. According to the majority opinion,\
208
+ \ the charge is substantiated in both its objective and subjective aspects, and\
209
+ \ the defendant must be declared guilty of the aforementioned criminal acts of\
210
+ \ fraud by means of a computer, committed repeatedly by a perpetrator acting professionally,\
211
+ \ where the total financial benefit and corresponding damage exceed the amount\
212
+ \ of €30,000, as well as for repeated embezzlement.\n\nFacts: The defendant accessed\
213
+ \ a website using a computer, employing, without the knowledge and consent of\
214
+ \ the complainants, the access codes for the electronic management system of the\
215
+ \ bank accounts held by the complainants at a Bank, and transferred money through\
216
+ \ electronically transmitted orders from the complainants' accounts to her own\
217
+ \ account. Specifically, during the period from June 2007 to June 2008, after\
218
+ \ unlawfully acquiring the aforementioned STICK containing the access codes, she\
219
+ \ accessed a website maintained by ..., using, without the complainants' knowledge\
220
+ \ (without their consent or approval), the access codes for the electronic management\
221
+ \ system of the bank accounts held at the aforementioned Bank, transferring through\
222
+ \ electronically transmitted orders to the joint account number ... of the complainants\
223
+ \ from bank accounts numbered ..., ..., and ..., the total amount of €55,710,\
224
+ \ as detailed in the orders, and subsequently, using an ATM card, she gradually\
225
+ \ withdrew from the aforementioned account number ..., the total amount of €55,710,\
226
+ \ making 84 individual withdrawals from automatic teller machines. In addition,\
227
+ \ the defendant, during the period from June 2008 to November 2008, in the same\
228
+ \ exact manner (through the electronic management system of the bank accounts),\
229
+ \ transferred through electronically transmitted orders to account number ...,\
230
+ \ which she had opened at ..., from the complainants' bank accounts numbered ...,\
231
+ \ ..., ..., ..., and ..., the total amount of €73,942, as detailed in the orders\
232
+ \ regarding the transfers of these amounts. Furthermore, during the period from\
233
+ \ February 2008 to November 2008, through multiple acts constituting a continuation\
234
+ \ of the crime, although she had received from the first complainant ... the amounts\
235
+ \ of €695.04, €695.04, and €845.04, in order to pay his insurance contributions\
236
+ \ to O.A.E.E. for the periods of January-February 2008, May-June 2008, and September-October\
237
+ \ 2008, as well as the amounts of €250 and €280, in order to settle credit card\
238
+ \ bills for \"...\", respectively, and from the second complainant ... she received\
239
+ \ the amounts of €283.64, €419.26, and €385.38, to pay the latter's insurance\
240
+ \ contributions to O.A.E.E. for the periods of July-August 2007, May-June 2008,\
241
+ \ September-October 2008, and November-December 2008, as well as the amount of\
242
+ \ €1,888.03 for the settlement of VAT, she never paid the above amounts to settle\
243
+ \ the aforementioned obligations, nor did she return them to the complainants,\
244
+ \ despite being urged to do so, but incorporated them into her assets and wrongfully\
245
+ \ appropriated them. The defendant denies the charges against her and claims that\
246
+ \ the withdrawals were made by the second complainant and that all the amounts\
247
+ \ transferred to her account were transferred to cover the company's expenses\
248
+ \ and their personal expenses, due to her cohabitation with the second complainant\
249
+ \ and with his knowledge, with whom she intended to marry. However, this claim\
250
+ \ is not supported by any evidence; on the contrary, it emerged that she conducted\
251
+ \ the transfers of the money and withdrawals without the complainants' knowledge,\
252
+ \ and when she learned that they had been informed about the account movements\
253
+ \ and met at the Bank, her behavior and demeanor indicated guilt, according to\
254
+ \ the testimony of the prosecution witness ..., an employee of the Pangrati branch\
255
+ \ of ..., who saw her on the same day at the aforementioned Bank when she met\
256
+ \ with the complainants. The ongoing act of fraud using a computer was committed\
257
+ \ by the defendant professionally, as evidenced by her repeated commission of\
258
+ \ the act, as well as the infrastructure she had established with the intent of\
259
+ \ repeated commission, based on a specific plan and methodology (transferring\
260
+ \ smaller amounts to a joint account of the complainants from the remaining accounts\
261
+ \ of the latter, and then withdrawing the transferred amounts with an ATM card,\
262
+ \ as well as directly transferring smaller amounts from the complainants' accounts\
263
+ \ to her personal account she had opened at the same bank), indicating her purpose\
264
+ \ to generate income, with the financial benefit she gained, corresponding to\
265
+ \ the complainants' damage, exceeding a total of €30,000."
266
+ - 'Any person who intentionally, through the technology of information and communication,
267
+ suggests an encounter between an adult and a minor under the age of fifteen, aiming
268
+ at the commitment of the crimes described in par. 1 and 2 of art. 339 and 348Α,
269
+ is sentenced to an imprisonment of at least two years and a fine of fifty to two
270
+ hundred thousand Euros, when the proposal is followed by further actions which
271
+ lead in the commitment of such crimes.
272
+
273
+ '
274
+ - source_sentence: Who should provide authorisation when safeguards are detailed in
275
+ non-legally binding administrative arrangements?
276
+ sentences:
277
+ - In the absence of an adequacy decision, the controller or processor should take
278
+ measures to compensate for the lack of data protection in a third country by way
279
+ of appropriate safeguards for the data subject. Such appropriate safeguards may
280
+ consist of making use of binding corporate rules, standard data protection clauses
281
+ adopted by the Commission, standard data protection clauses adopted by a supervisory
282
+ authority or contractual clauses authorised by a supervisory authority. Those
283
+ safeguards should ensure compliance with data protection requirements and the
284
+ rights of the data subjects appropriate to processing within the Union, including
285
+ the availability of enforceable data subject rights and of effective legal remedies,
286
+ including to obtain effective administrative or judicial redress and to claim
287
+ compensation, in the Union or in a third country. They should relate in particular
288
+ to compliance with the general principles relating to personal data processing,
289
+ the principles of data protection by design and by default. Transfers may also
290
+ be carried out by public authorities or bodies with public authorities or bodies
291
+ in third countries or with international organisations with corresponding duties
292
+ or functions, including on the basis of provisions to be inserted into administrative
293
+ arrangements, such as a memorandum of understanding, providing for enforceable
294
+ and effective rights for data subjects. Authorisation by the competent supervisory
295
+ authority should be obtained when the safeguards are provided for in administrative
296
+ arrangements that are not legally binding.
297
+ - '**Court (Civil/Criminal): Civil**
298
+
299
+
300
+ **Provisions:**
301
+
302
+
303
+ **Time of commission of the act:**
304
+
305
+
306
+ **Outcome (not guilty, guilty):**
307
+
308
+
309
+ **Rationale:**
310
+
311
+
312
+ **Facts:**
313
+
314
+ The plaintiff holds credit card number ............ with the defendant banking
315
+ corporation. Based on the application for alternative networks dated 19/7/2015
316
+ with number ......... submitted at a branch of the defendant, he was granted access
317
+ to the electronic banking service (e-banking) to conduct banking transactions
318
+ (debit, credit, updates, payments) remotely. On 30/11/2020, the plaintiff fell
319
+ victim to electronic fraud through the "phishing" method, whereby an unknown perpetrator
320
+ managed to withdraw a total amount of €3,121.75 from the aforementioned credit
321
+ card. Specifically, the plaintiff received an email at 1:35 PM on 29/11/2020 from
322
+ sender ...... with address ........, informing him that due to an impending system
323
+ change, he needed to verify the mobile phone number linked to the credit card,
324
+ urging him to complete the verification process within the next 24 hours by following
325
+ a link titled ........; otherwise, his account would be locked for security reasons.
326
+ The plaintiff read this email on the afternoon of 30 November 2020 and, believing
327
+ it was from the defendant, followed the instructions and proceeded via the provided
328
+ link to a website that was identical (a clone) to that of the defendant. On this
329
+ page, he was asked to enter the six-digit security code (.........) that had just
330
+ been sent to his mobile phone by the defendant at 3:41 PM, with the note that
331
+ it was an activation code for his ........ card at ........., which he entered.
332
+
333
+
334
+ Subsequently, the plaintiff received, according to his statements, a new email
335
+ (not submitted), which requested him to enter the details of the aforementioned
336
+ credit card, specifically the name of the cardholder and the card number, not
337
+ the PIN, which he also entered, convinced that he was within the online environment
338
+ of the defendant. Then, at 3:47 PM, he received a message on his mobile phone
339
+ from the defendant containing the exact same content as the one he received at
340
+ 3:41 PM, while at 3:50 PM he received a message stating that the activation of
341
+ his ......... card at ....... had been completed. Once the plaintiff read this,
342
+ he became concerned that something was not right, and immediately called (at 4:41
343
+ PM) the defendant''s call center to inform them. There, the employees, with whom
344
+ he finally connected at 5:04 PM due to high call center volume, advised him to
345
+ delete the relevant emails, cancel his credit card, change his access passwords
346
+ for the service, and submit a dispute request regarding the conducted transactions.
347
+ The plaintiff electronically sent this request to the defendant, disputing the
348
+ detailed transactions amounting to €3,121.75, which were conducted on 30/11/2020
349
+ during the time frame of 4:37:45-4:43:34 PM, arguing that he had neither performed
350
+ them himself nor authorized anyone else to do so. The plaintiff specifically disputed
351
+ the following transactions, as evidenced by the account activity of the disputed
352
+ credit card during the aforementioned timeframe: a) transaction number .........
353
+ amounting to €150.62 conducted on 30/11/2020 at 4:43:34 PM, b) transaction number
354
+ ........ amounting to €293.20 conducted on 30/11/2020 at 4:42:40 PM, c) transaction
355
+ number ............ amounting to €295.21 conducted on 30/11/2020 at 4:42:10 PM,
356
+ d) transaction number .......... amounting to €299.22 conducted on 30/11/2020
357
+ at 4:41:31 PM, e) transaction number ........ amounting to €297.21 conducted on
358
+ 30/11/2020 at 4:41:01 PM, f) transaction number ........ amounting to €299.22
359
+ conducted on 30/11/2020 at 4:40:27 PM, g) transaction number ....... amounting
360
+ to €299.22 conducted on 30/11/2020 at 4:39:55 PM, h) transaction number ......
361
+ amounting to €299.22 conducted on 30/11/2020 at 4:39:22 PM, i) transaction number
362
+ ......... amounting to €297.22 conducted on 30/11/2020 at 4:38:52 PM, j) transaction
363
+ number ......... amounting to €295.21 conducted on 30/11/2020 at 4:38:17 PM, and
364
+ k) transaction number ......... amounting to €296.21 conducted on 30/11/2020 at
365
+ 4:37:45 PM. In its response letter dated 21/12/2020, the defendant denied responsibility
366
+ for the costs of the aforementioned transactions, placing the entire blame on
367
+ the plaintiff for the leak of his card details and security code to the fraudulent
368
+ page. The plaintiff, completely denying any fault for the conducted transactions,
369
+ repeatedly contacted the defendant, both by phone and via email (see emails dated
370
+ 15/1/2021 and 11/2/2021), while on 2/3/2021, he electronically sent a report dated
371
+ 1/03/2021 to the Consumer Advocate’s email address, recounting the events and
372
+ requesting that the aforementioned Independent Authority intervene to have the
373
+ disputed debt canceled. In its letter with reference number ...../27.04.2021,
374
+ the aforementioned Independent Authority informed the plaintiff that the case
375
+ was outside its mediating role and was therefore archived. Subsequently, the plaintiff
376
+ sent the defendant on 5/3/2021 his extrajudicial statement dated 4/3/2021, calling
377
+ upon it to fully cancel the debt of €3,121.75 that had been unjustly incurred
378
+ against him within two days and to immediately instruct the representatives of
379
+ the collection agency working with it to cease contacting him regarding the disputed
380
+ case. The defendant sent the plaintiff a message on his mobile phone on 20/04/2021
381
+ informing him that his case was still being processed due to lengthy operational
382
+ requirements, while on 23/04/2021, via email, it informed him that considering
383
+ their good cooperation and his efforts to keep them updated, it had reviewed his
384
+ case and decided to refund him the amounts of the transactions that were conducted
385
+ after his contact with their representatives on 30/11/2020 at 4:41 PM, totaling
386
+ €1,038.25, specifically the following: a) transaction of €150.62 conducted on
387
+ 30/11/2020 at 4:43 PM, b) transaction of €295.21 conducted on 30/11/2020 at 4:42
388
+ PM, c) transaction of €293.20 conducted on 30/11/2020 at 4:42 PM, and d) transaction
389
+ of €299.22 conducted on 30/11/2020 at 4:41 PM. Beyond this, the defendant refused
390
+ to refund the plaintiff the amount of the remaining transactions conducted on
391
+ 30/11/2020, totaling €2,376.08 (and not €2,376.48 as incorrectly stated by the
392
+ plaintiff in his lawsuit), which the plaintiff ultimately fully paid, transferring
393
+ €2,342.77 to the defendant on 7/06/2021 and €33.31 on 15/06/2021 (see related
394
+ deposit receipts).'
395
+ - "Court (Civil/Criminal): Civil \nProvisions: \nTime of commission: July 21,\
396
+ \ 2020 \nOutcome (innocent, guilty): Partially accepts the lawsuit against the\
397
+ \ Bank. \nReasoning: Alongside the bank's responsibility for the ineffective\
398
+ \ protection of its systems against the continually changing and evolving methods\
399
+ \ of deception that affect them, leading to financial damage for its clients who\
400
+ \ entrusted it, which constitutes a breach of its contractual obligations and\
401
+ \ generates contractual liability, there is also the personal responsibility of\
402
+ \ the plaintiff, who did not safeguard, as required, his sensitive banking information\
403
+ \ and disclosed it when he should not have, even though the message that misled\
404
+ \ him came from the context of an SMS conversation with the defendant, even if\
405
+ \ he was directed through the link to a website resembling that of the defendant,\
406
+ \ because he overlooked the relevant instructions and strict recommendations of\
407
+ \ the bank, violating his duty to safeguard them. Therefore, in light of the above,\
408
+ \ the court must partially accept the lawsuit regarding its substance, and with\
409
+ \ the defendant's objection regarding the plaintiff's fault being accepted at\
410
+ \ a rate of 1/6 of the damage suffered, it must be acknowledged – following the\
411
+ \ admissible and lawful modification of the lawsuit's request from a dismissive\
412
+ \ to a declaratory nature as proposed – the defendant's obligation to pay him\
413
+ \ the amount of €2,500, with legal interest, as specified in the operative part.\
414
+ \ Regarding the request to recognize the defendant's obligation to pay him €1,000\
415
+ \ as compensation for the moral damage he suffered from the fraud committed against\
416
+ \ him, this is deemed dismissible as unfounded, because the defendant's liability\
417
+ \ is contractual and not tortious, and there are no special conditions justifying\
418
+ \ the treatment of this specific non-contractual behavior as tortious, making\
419
+ \ it possible to attribute moral damage to the plaintiff from the defendant. \
420
+ \ \nFacts: The plaintiff maintained a joint bank account with his wife and had\
421
+ \ access to the defendant bank's e-banking. On July 21, 2020, following successful\
422
+ \ identification via the agreed-upon credentials (userID, password, OTP), a request\
423
+ \ was made to change the mobile phone number for receiving OTPs, which was completed\
424
+ \ through the bank's platform. However, this change was not made by the plaintiff\
425
+ \ himself, but by a third party who had previously deceived him using the phishing\
426
+ \ method, obtaining his banking details through a misleading SMS. Following the\
427
+ \ phone number change, on July 31, 2020, a transfer of €3,000 was made to a third\
428
+ \ party's account. The transaction was conducted using the necessary credentials\
429
+ \ and OTP sent to the new mobile phone, resulting in the bank considering the\
430
+ \ order valid and executing it. Once the plaintiff realized the transfer, he immediately\
431
+ \ contacted the bank and informed them that he had not given such an order himself.\
432
+ \ Despite the initial assurance that the funds could be recovered, they were ultimately\
433
+ \ not returned, as they had been transferred to a third party's account, and the\
434
+ \ bank denied any responsibility for the loss."
435
+ - source_sentence: When will the periodic review mechanism be conducted?
436
+ sentences:
437
+ - The Commission should monitor the functioning of decisions on the level of protection
438
+ in a third country, a territory or specified sector within a third country, or
439
+ an international organisation, and monitor the functioning of decisions adopted
440
+ on the basis of Article 25(6) or Article 26(4) of Directive 95/46/EC. In its adequacy
441
+ decisions, the Commission should provide for a periodic review mechanism of their
442
+ functioning. That periodic review should be conducted in consultation with the
443
+ third country or international organisation in question and take into account
444
+ all relevant developments in the third country or international organisation.
445
+ For the purposes of monitoring and of carrying out the periodic reviews, the Commission
446
+ should take into consideration the views and findings of the European Parliament
447
+ and of the Council as well as of other relevant bodies and sources. The Commission
448
+ should evaluate, within a reasonable time, the functioning of the latter decisions
449
+ and report any relevant findings to the Committee within the meaning of Regulation
450
+ (EU) No 182/2011 of the European Parliament and of the Council (1) as established
451
+ under this Regulation, to the European Parliament and to the Council.
452
+ - "**Court (Civil/Criminal): Civil** \n**Provisions:** \n**Time of commission\
453
+ \ of the act:** \n**Outcome (not guilty, guilty):** \n**Reasoning:** Partially\
454
+ \ accepts the lawsuit. \n**Facts:** The plaintiff, who works as a lawyer, maintains\
455
+ \ a savings account with the defendant banking corporation under account number\
456
+ \ GR.............. Pursuant to a contract dated June 11, 2010, established in\
457
+ \ Thessaloniki between the defendant and the plaintiff, the plaintiff was granted\
458
+ \ access to the electronic banking system (e-banking) to conduct banking transactions\
459
+ \ remotely. On October 10, 2020, the plaintiff fell victim to electronic fraud\
460
+ \ through the \"phishing\" method, whereby an unknown perpetrator managed to extract\
461
+ \ and transfer €3,000.00 from the plaintiff’s account to another account of the\
462
+ \ same bank. Specifically, on that day at 6:51 a.m., the plaintiff received an\
463
+ \ email from the sender \".........\", with the address ..........., informing\
464
+ \ him that his debit card had been suspended and that online payments and cash\
465
+ \ withdrawals could not be made until the issue was resolved. The email urged\
466
+ \ him to confirm his details within the next 72 hours by following a link titled\
467
+ \ \"card activation.\" \nThe plaintiff read the above email on his mobile phone\
468
+ \ around 8:00 a.m., and believing it came from the defendant, he followed the\
469
+ \ instructions and accessed a website that was identical (a clone) to that of\
470
+ \ the defendant. On this page, he was asked to enter his login credentials to\
471
+ \ connect to the service, which he did, and he was subsequently asked to input\
472
+ \ his debit card details for the alleged activation, which he also provided. Then,\
473
+ \ to complete the process, a number was sent to his mobile phone at 8:07 a.m.\
474
+ \ from the sender ........, which he entered, and two minutes later he received\
475
+ \ a message from the same sender in English stating that the quick access code\
476
+ \ had been activated on his mobile. A few minutes later, at 8:18 a.m., he received\
477
+ \ an email from the defendant informing him of the transfer of €3,000.00 from\
478
+ \ his account to account number GR ........... held at the same bank, with the\
479
+ \ beneficiary's details being .......... As soon as the plaintiff read this, he\
480
+ \ immediately called the defendant's call center and canceled his debit card,\
481
+ \ the access codes for the service ......., and locked the application ..........\
482
+ \ At the same time, he verbally submitted a request to dispute and cancel the\
483
+ \ contested transaction, and in a subsequent phone call, he also canceled his\
484
+ \ credit card. On the same day, he also sent an email to the defendant informing\
485
+ \ them in writing of the above and requesting the cancellation of the transaction\
486
+ \ and the return of the amount of €3,000.00 to his account, as this transfer was\
487
+ \ not made by him but by an unknown perpetrator through electronic fraud and was\
488
+ \ not approved by him. It should also be noted that the plaintiff, as the sole\
489
+ \ beneficiary according to the aforementioned contract for using the defendant's\
490
+ \ Internet Banking service, never received any update via SMS or the VIBER application\
491
+ \ from the bank regarding the transaction details before its completion, nor did\
492
+ \ he receive a one-time code (OTP) to approve the contested transaction. He subsequently\
493
+ \ filed a complaint against unknown persons at the Cyber Crime Division for the\
494
+ \ crime of fraud. The defendant sent an email to the plaintiff on October 16,\
495
+ \ 2020, informing him that his request had been forwarded to the appropriate department\
496
+ \ of the bank for investigation, stating that the bank would never send him an\
497
+ \ email or SMS asking him to enter his personal data and that as of October 7,\
498
+ \ 2020, there was a notice posted for its customers regarding malicious attempts\
499
+ \ to steal personal data in the \"Our News\" section on ....... A month after\
500
+ \ the disputed incident, on November 10, 2020, an amount of €2,296.82 was transferred\
501
+ \ to the plaintiff's account from the account to which the fraudulent credit had\
502
+ \ been made. The plaintiff immediately sent an email to the defendant asking to\
503
+ \ be informed whether this transfer was a return of part of the amount that had\
504
+ \ been illegally withdrawn from his account and requested the return of the remaining\
505
+ \ amount of €703.18. In its response dated January 13, 2021, the defendant confirmed\
506
+ \ that the aforementioned amount indeed came from the account to which the fraudulent\
507
+ \ credit had been made, following a freeze of that account initiated by the defendant\
508
+ \ during the investigation of the incident, but refused to return the remaining\
509
+ \ amount, claiming it bore no responsibility for the leak of the personal codes\
510
+ \ to third parties, according to the terms of the service contract established\
511
+ \ between them. \nFrom the entirety of the evidence presented to the court, there\
512
+ \ is no indication of the authenticity of the contested transaction, as the plaintiff\
513
+ \ did not give his consent for the execution of the transfer of the amount of\
514
+ \ €3,000.00, especially in light of the provision in Article 72 paragraph 2 of\
515
+ \ Law 4537/2018 stating that the mere use of the Internet Banking service by the\
516
+ \ plaintiff does not necessarily constitute sufficient evidence that the payer\
517
+ \ approved the payment action. Specifically, it was proven that the contested\
518
+ \ transaction was not carried out following a strong identification of the plaintiff\
519
+ \ – the sole beneficiary of the account – and his approval, as the latter may\
520
+ \ have entered his personal codes on the counterfeit website; however, he was\
521
+ \ never informed, before the completion of the contested transaction, of the amount\
522
+ \ that would be transferred from his account to a third-party account, nor did\
523
+ \ he receive on his mobile phone, either via SMS or through the VIBER application\
524
+ \ or any other means, the one-time code - extra PIN for its completion, which\
525
+ \ he was required to enter to approve the contested transaction (payment action)\
526
+ \ and thus complete his identification, a fact that was not countered by any evidence\
527
+ \ from the defendant. Furthermore, it is noted that the defendant's claims that\
528
+ \ it bears no responsibility under the terms of the banking services contract,\
529
+ \ whereby it is not liable for any damage to its customer in cases of unauthorized\
530
+ \ use of their personal access codes to the Internet Banking service, are to be\
531
+ \ rejected as fundamentally unfounded. This is because the aforementioned contractual\
532
+ \ terms are invalid according to the provision of Article 103 of Law 4537/2018,\
533
+ \ as they contradict the provisions of Articles 71, 73, and 92 of the same Law,\
534
+ \ which provide for the provider's universal liability and its exemption only\
535
+ \ for unusual and unforeseen circumstances that are beyond the control of the\
536
+ \ party invoking them and whose consequences could not have been avoided despite\
537
+ \ all efforts to the contrary; these provisions establish mandatory law in favor\
538
+ \ of users, as according to Article 103 of Law 4537/2018, payment service providers\
539
+ \ are prohibited from deviating from the provisions to the detriment of payment\
540
+ \ service users, unless the possibility of deviation is explicitly provided and\
541
+ \ they can decide to offer only more favorable terms to payment service users;\
542
+ \ the aforementioned contractual terms do not constitute more favorable terms\
543
+ \ but rather disadvantageous terms for the payment service user. In this case,\
544
+ \ however, the defendant did not prove the authenticity of the transaction and\
545
+ \ its approval by the plaintiff and did not invoke, nor did any unusual and unforeseen\
546
+ \ circumstances beyond its control, the consequences of which could not have been\
547
+ \ avoided despite all efforts to the contrary, come to light. Therefore, the contested\
548
+ \ transaction transferring the amount of €3,000.00 is considered, in the absence\
549
+ \ of demonstrable consent from the plaintiff, unapproved according to the provisions\
550
+ \ of Article 64 of Law 4537/2018, and the defendant's contrary claims are rejected,\
551
+ \ especially since the plaintiff proceeded, according to Article 71 paragraph\
552
+ \ 1 of Law 4537/2018, without undue delay to notify the defendant regarding the\
553
+ \ contested unapproved payment action. Consequently, the defendant is liable for\
554
+ \ compensating the plaintiff for the positive damage he suffered under Article\
555
+ \ 73 of Law 4537/2018 and is obliged to pay him the requested amount of €703.18,\
556
+ \ while the plaintiff’s fault in the occurrence of this damage cannot be established,\
557
+ \ as he entered his personal details in an online environment that was a faithful\
558
+ \ imitation of that of the defendant, as evidenced by the comparison of the screenshots\
559
+ \ of the fake website and the real website provided by the plaintiff, a fact that\
560
+ \ he could not have known while being fully convinced that he was transacting\
561
+ \ with the defendant. Furthermore, the defendant’s liability to compensate the\
562
+ \ plaintiff is based on the provision of Article 8 of Law 2251/1994, which applies\
563
+ \ in this case, as the plaintiff's damage resulted from inadequate fulfillment\
564
+ \ of its obligations in the context of providing its services, but also on the\
565
+ \ provision of Article 914 of the Civil Code in the sense of omission on its part\
566
+ \ of unlawfully and culpably imposed actions. In this case, given that during\
567
+ \ the relevant period there had been a multitude of similar incidents of fraud\
568
+ \ against the defendant's customers, the latter, as a service provider to the\
569
+ \ consumer public and bearing transactional obligations of care and security towards\
570
+ \ them, displayed gross negligence regarding the security provided for electronic\
571
+ \ transaction services, which was compromised by the fraudulent theft of funds,\
572
+ \ as it did not comply with all required high-security measures for executing\
573
+ \ the contested transaction, failing to implement the strict customer identification\
574
+ \ verification process and to check the authenticity of the account to which the\
575
+ \ funds were sent, thus not assuming the suspicious nature of the transaction,\
576
+ \ did not adopt comprehensive and improved protective measures to fully protect\
577
+ \ its customers against malicious attacks and online fraud and to prevent the\
578
+ \ infiltration of unauthorized third parties, nor did it fulfill its obligations\
579
+ \ to inform, accurately inform, and warn its consumers - customers, as it failed\
580
+ \ to adequately inform them of attempts to steal their personal data through the\
581
+ \ sending of informative emails or SMS, while merely posting in a section rather\
582
+ \ than on a central banner (as it later did) does not constitute adequate information\
583
+ \ such that it meets the requirement of protecting its customers and the increased\
584
+ \ safeguarding of their interests. Although the plaintiff acted promptly and informed\
585
+ \ the defendant on the same day about the contested incident, the defendant did\
586
+ \ not act as promptly regarding the investigation of the incident and the freezing\
587
+ \ of the account that held the fraudulent credit to prevent the plaintiff's loss,\
588
+ \ but only returned part of the funds to the plaintiff a month later. This behavior,\
589
+ \ beyond being culpable due to gross negligence, was also unlawful, as it would\
590
+ \ have been illegal even without the contractual relationship, as contrary to\
591
+ \ the provisions of Law 4537/2018 and Law 2251/1994, regarding the lack of security\
592
+ \ of the services that the consumer is legitimately entitled to expect, as well\
593
+ \ as the building of trust that is essential in banking transactions, elements\
594
+ \ that it was obligated to provide within the sphere of the services offered,\
595
+ \ and contrary to the principles of good faith and commercial ethics, as crystallized\
596
+ \ in the provision of Article 288 of the Civil Code, as well as the general duty\
597
+ \ imposed by Article 914 of the Civil Code not to cause harm to another culpably.\
598
+ \ This resulted not only in positive damage to the plaintiff but also in causing\
599
+ \ him moral harm consisting of his mental distress and the disruption, agitation,\
600
+ \ and sorrow he experienced, for which he must be awarded financial compensation.\
601
+ \ Taking into account all the general circumstances of the case, the extent of\
602
+ \ the plaintiff's damage, the severity of the defendant's fault, the mental distress\
603
+ \ suffered by the plaintiff, the insecurity he felt regarding his deposits, the\
604
+ \ sorrow he experienced, and the stress caused by his financial loss, which occurred\
605
+ \ during the pandemic period when his earnings from his professional activity\
606
+ \ had significantly decreased, as well as the financial and social situation of\
607
+ \ the parties, it is the court's opinion that he should be granted, as financial\
608
+ \ compensation for his moral harm, an amount of €250.00, which is deemed reasonable\
609
+ \ and fair. Therefore, the total monetary amount that the plaintiff is entitled\
610
+ \ to for his positive damage and financial compensation for the moral harm suffered\
611
+ \ amounts to a total of (€703.18 + €250.00) = €953.18."
612
+ - 'Failure to notify the Authority of file establishment or permit changes is punished
613
+ by up to three years’ imprisonment and a fine of one to five million Drachmas.
614
+
615
+ Maintaining a file without a permit or violating permit terms is punished by at
616
+ least one year’s imprisonment and a fine of one to five million Drachmas.
617
+
618
+ File interconnection that is unauthorized or carried out without a permit is punished by up to three
619
+ years’ imprisonment and a fine of one to five million Drachmas.
620
+
621
+ Unlawful interference with personal data is punished by imprisonment and a fine;
622
+ for sensitive data, at least one year’s imprisonment and a fine of one to ten
623
+ million Drachmas.
624
+
625
+ Controllers who fail to comply with Authority decisions or violate data transfer
626
+ rules face at least two years’ imprisonment and a fine of one to five million
627
+ Drachmas.
628
+
629
+ If acts were committed for unlawful benefit or to cause harm, punishment is up
630
+ to ten years’ imprisonment and a fine of two to ten million Drachmas.
631
+
632
+ If acts jeopardize democratic governance or national security, punishment is confinement
633
+ in a penitentiary and a fine of five to ten million Drachmas.
634
+
635
+ Acts committed due to negligence result in at least three months’ imprisonment
636
+ and a fine.
637
+
638
+ If the Controller is not a natural person, the responsible party is the representative
639
+ or head of the organization with administrative or managerial duties.
640
+
641
+ Authorized members of the Authority may carry out preliminary investigations even
642
+ without Prosecutor’s order for certain offenses.
643
+
644
+ The Authority''s President must notify the Public Prosecutor of any offenses under
645
+ investigation, forwarding all relevant evidence.
646
+
647
+ Preliminary investigations must conclude within two months of charges, and trial
648
+ must begin within three months of completion.
649
+
650
+ Continuation of proceedings is allowed only once and for extremely important reasons,
651
+ with adjournment not exceeding two months.
652
+
653
+ Felonies under this law fall under the jurisdiction of the Court of Appeal.
654
+
655
+ '
656
+ - source_sentence: Who must facilitate the exercise of data subject rights?
657
+ sentences:
658
+ - '1.Processing of personal data revealing racial or ethnic origin, political opinions,
659
+ religious or philosophical beliefs, or trade union membership, and the processing
660
+ of genetic data, biometric data for the purpose of uniquely identifying a natural
661
+ person, data concerning health or data concerning a natural person''s sex life
662
+ or sexual orientation shall be prohibited.
663
+
664
+ 2.Paragraph 1 shall not apply if one of the following applies: (a) the data subject
665
+ has given explicit consent to the processing of those personal data for one or
666
+ more specified purposes, except where Union or Member State law provide that the
667
+ prohibition referred to in paragraph 1 may not be lifted by the data subject;
668
+ (b) processing is necessary for the purposes of carrying out the obligations
669
+ and exercising specific rights of the controller or of the data subject in the
670
+ field of employment and social security and social protection law in so far as
671
+ it is authorised by Union or Member State law or a collective agreement pursuant
672
+ to Member State law providing for appropriate safeguards for the fundamental rights
673
+ and the interests of the data subject; (c) processing is necessary to protect
674
+ the vital interests of the data subject or of another natural person where the
675
+ data subject is physically or legally incapable of giving consent; (d) processing
676
+ is carried out in the course of its legitimate activities with appropriate safeguards
677
+ by a foundation, association or any other not-for-profit body with a political,
678
+ philosophical, religious or trade union aim and on condition that the processing
679
+ relates solely to the members or to former members of the body or to persons who
680
+ have regular contact with it in connection with its purposes and that the personal
681
+ data are not disclosed outside that body without the consent of the data subjects;
682
+ (e) processing relates to personal data which are manifestly made public by the
683
+ data subject; (f) processing is necessary for the establishment, exercise or
684
+ defence of legal claims or whenever courts are acting in their judicial capacity;
685
+ (g) processing is necessary for reasons of substantial public interest, on the
686
+ basis of Union or Member State law which shall be proportionate to the aim pursued,
687
+ respect the essence of the right to data protection and provide for suitable and
688
+ specific measures to safeguard the fundamental rights and the interests of the
689
+ data subject; (h) processing is necessary for the purposes of preventive or occupational
690
+ medicine, for the assessment of the working capacity of the employee, medical
691
+ diagnosis, the provision of health or social care or treatment or the management
692
+ of health or social care systems and services on the basis of Union or Member
693
+ State law or pursuant to contract with a health professional and subject to the
694
+ conditions and safeguards referred to in paragraph 3; (i) processing is necessary
695
+ for reasons of public interest in the area of public health, such as protecting
696
+ against serious cross-border threats to health or ensuring high standards of quality
697
+ and safety of health care and of medicinal products or medical devices, on the
698
+ basis of Union or Member State law which provides for suitable and specific measures
699
+ to safeguard the rights and freedoms of the data subject, in particular professional
700
+ secrecy; (j) processing is necessary for archiving purposes
701
+ in the public interest, scientific or historical research purposes or statistical
702
+ purposes in accordance with Article 89(1) based on Union or Member State law which
703
+ shall be proportionate to the aim pursued, respect the essence of the right to
704
+ data protection and provide for suitable and specific measures to safeguard the
705
+ fundamental rights and the interests of the data subject.
706
+
707
+ 3.Personal data referred to in paragraph 1 may be processed for the purposes referred
708
+ to in point (h) of paragraph 2 when those data are processed by or under the responsibility
709
+ of a professional subject to the obligation of professional secrecy under Union
710
+ or Member State law or rules established by national competent bodies or by another
711
+ person also subject to an obligation of secrecy under Union or Member State law
712
+ or rules established by national competent bodies.
713
+
714
+ 4.Member States may maintain or introduce further conditions, including limitations,
715
+ with regard to the processing of genetic data, biometric data or data concerning
716
+ health.'
717
+ - Regulation (EC) No 45/2001 of the European Parliament and of the Council (2) applies
718
+ to the processing of personal data by the Union institutions, bodies, offices
719
+ and agencies. Regulation (EC) No 45/2001 and other Union legal acts applicable
720
+ to such processing of personal data should be adapted to the principles and rules
721
+ established in this Regulation and applied in the light of this Regulation. In
722
+ order to provide a strong and coherent data protection framework in the Union,
723
+ the necessary adaptations of Regulation (EC) No 45/2001 should follow after the
724
+ adoption of this Regulation, in order to allow application at the same time as
725
+ this Regulation.
726
+ - "1.The controller shall take appropriate measures to provide any information referred\
727
+ \ to in Articles 13 and 14 and any communication under Articles 15 to 22 and 34\
728
+ \ relating to processing to the data subject in a concise, transparent, intelligible\
729
+ \ and easily accessible form, using clear and plain language, in particular for\
730
+ \ any information addressed specifically to a child. The information shall be\
731
+ \ provided in writing, or by other means, including, where appropriate, by electronic\
732
+ \ means. When requested by the data subject, the information may be provided orally,\
733
+ \ provided that the identity of the data subject is proven by other means. 4.5.2016\
734
+ \ L 119/39 \n2.The controller shall facilitate the exercise of data subject rights\
735
+ \ under Articles 15 to 22. In the cases referred to in Article 11(2), the controller\
736
+ \ shall not refuse to act on the request of the data subject for exercising his\
737
+ \ or her rights under Articles 15 to 22, unless the controller demonstrates that\
738
+ \ it is not in a position to identify the data subject.\n3.The controller shall\
739
+ \ provide information on action taken on a request under Articles 15 to 22 to\
740
+ \ the data subject without undue delay and in any event within one month of receipt\
741
+ \ of the request. That period may be extended by two further months where necessary,\
742
+ \ taking into account the complexity and number of the requests. The controller\
743
+ \ shall inform the data subject of any such extension within one month of receipt\
744
+ \ of the request, together with the reasons for the delay. Where the data subject\
745
+ \ makes the request by electronic form means, the information shall be provided\
746
+ \ by electronic means where possible, unless otherwise requested by the data subject.\n\
747
+ 4.If the controller does not take action on the request of the data subject, the\
748
+ \ controller shall inform the data subject without delay and at the latest within\
749
+ \ one month of receipt of the request of the reasons for not taking action and\
750
+ \ on the possibility of lodging a complaint with a supervisory authority and seeking\
751
+ \ a judicial remedy.\n5.Information provided under Articles 13 and 14 and any\
752
+ \ communication and any actions taken under Articles 15 to 22 and 34 shall be\
753
+ \ provided free of charge. Where requests from a data subject are manifestly unfounded\
754
+ \ or excessive, in particular because of their repetitive character, the controller\
755
+ \ may either: (a) charge a reasonable fee taking into account the administrative\
756
+ \ costs of providing the information or communication or taking the action requested;\
757
+ \ or (b) refuse to act on the request. The controller shall bear the burden of\
758
+ \ demonstrating the manifestly unfounded or excessive character of the request.\n\
759
+ 6.Without prejudice to Article 11, where the controller has reasonable doubts\
760
+ \ concerning the identity of the natural person making the request referred to\
761
+ \ in Articles 15 to 21, the controller may request the provision of additional\
762
+ \ information necessary to confirm the identity of the data subject.\n7.The information\
763
+ \ to be provided to data subjects pursuant to Articles 13 and 14 may be provided\
764
+ \ in combination with standardised icons in order to give in an easily visible,\
765
+ \ intelligible and clearly legible manner a meaningful overview of the intended\
766
+ \ processing. Where the icons are presented electronically they shall be machine-readable.\n\
767
+ 8.The Commission shall be empowered to adopt delegated acts in accordance with\
768
+ \ Article 92 for the purpose of determining the information to be presented by\
769
+ \ the icons and the procedures for providing standardised icons. Section 2 Information\
770
+ \ and access to personal data"
771
+ pipeline_tag: sentence-similarity
772
+ library_name: sentence-transformers
773
+ metrics:
774
+ - cosine_accuracy@1
775
+ - cosine_accuracy@3
776
+ - cosine_accuracy@5
777
+ - cosine_accuracy@10
778
+ - cosine_precision@1
779
+ - cosine_precision@3
780
+ - cosine_precision@5
781
+ - cosine_precision@10
782
+ - cosine_recall@1
783
+ - cosine_recall@3
784
+ - cosine_recall@5
785
+ - cosine_recall@10
786
+ - cosine_ndcg@10
787
+ - cosine_mrr@10
788
+ - cosine_map@100
789
+ model-index:
790
+ - name: multilingual-e5-large
791
+ results:
792
+ - task:
793
+ type: information-retrieval
794
+ name: Information Retrieval
795
+ dataset:
796
+ name: dim 1024
797
+ type: dim_1024
798
+ metrics:
799
+ - type: cosine_accuracy@1
800
+ value: 0.4180537772087068
801
+ name: Cosine Accuracy@1
802
+ - type: cosine_accuracy@3
803
+ value: 0.42189500640204863
804
+ name: Cosine Accuracy@3
805
+ - type: cosine_accuracy@5
806
+ value: 0.4500640204865557
807
+ name: Cosine Accuracy@5
808
+ - type: cosine_accuracy@10
809
+ value: 0.49039692701664533
810
+ name: Cosine Accuracy@10
811
+ - type: cosine_precision@1
812
+ value: 0.4180537772087068
813
+ name: Cosine Precision@1
814
+ - type: cosine_precision@3
815
+ value: 0.4163465642338881
816
+ name: Cosine Precision@3
817
+ - type: cosine_precision@5
818
+ value: 0.4043533930857874
819
+ name: Cosine Precision@5
820
+ - type: cosine_precision@10
821
+ value: 0.36869398207426374
822
+ name: Cosine Precision@10
823
+ - type: cosine_recall@1
824
+ value: 0.04734422767263886
825
+ name: Cosine Recall@1
826
+ - type: cosine_recall@3
827
+ value: 0.138064233626932
828
+ name: Cosine Recall@3
829
+ - type: cosine_recall@5
830
+ value: 0.2069980430010945
831
+ name: Cosine Recall@5
832
+ - type: cosine_recall@10
833
+ value: 0.308531274625124
834
+ name: Cosine Recall@10
835
+ - type: cosine_ndcg@10
836
+ value: 0.44178501209869797
837
+ name: Cosine Ndcg@10
838
+ - type: cosine_mrr@10
839
+ value: 0.42985717334308843
840
+ name: Cosine Mrr@10
841
+ - type: cosine_map@100
842
+ value: 0.506794523350519
843
+ name: Cosine Map@100
844
+ - task:
845
+ type: information-retrieval
846
+ name: Information Retrieval
847
+ dataset:
848
+ name: dim 768
849
+ type: dim_768
850
+ metrics:
851
+ - type: cosine_accuracy@1
852
+ value: 0.41037131882202305
853
+ name: Cosine Accuracy@1
854
+ - type: cosine_accuracy@3
855
+ value: 0.4142125480153649
856
+ name: Cosine Accuracy@3
857
+ - type: cosine_accuracy@5
858
+ value: 0.44430217669654287
859
+ name: Cosine Accuracy@5
860
+ - type: cosine_accuracy@10
861
+ value: 0.4833546734955186
862
+ name: Cosine Accuracy@10
863
+ - type: cosine_precision@1
864
+ value: 0.41037131882202305
865
+ name: Cosine Precision@1
866
+ - type: cosine_precision@3
867
+ value: 0.4086641058472044
868
+ name: Cosine Precision@3
869
+ - type: cosine_precision@5
870
+ value: 0.3969270166453265
871
+ name: Cosine Precision@5
872
+ - type: cosine_precision@10
873
+ value: 0.36165172855313704
874
+ name: Cosine Precision@10
875
+ - type: cosine_recall@1
876
+ value: 0.047186779325657804
877
+ name: Cosine Recall@1
878
+ - type: cosine_recall@3
879
+ value: 0.1375709294981283
880
+ name: Cosine Recall@3
881
+ - type: cosine_recall@5
882
+ value: 0.20603724780478358
883
+ name: Cosine Recall@5
884
+ - type: cosine_recall@10
885
+ value: 0.30540044861465576
886
+ name: Cosine Recall@10
887
+ - type: cosine_ndcg@10
888
+ value: 0.4349862241563486
889
+ name: Cosine Ndcg@10
890
+ - type: cosine_mrr@10
891
+ value: 0.4224889742495374
892
+ name: Cosine Mrr@10
893
+ - type: cosine_map@100
894
+ value: 0.500478306774528
895
+ name: Cosine Map@100
896
+ - task:
897
+ type: information-retrieval
898
+ name: Information Retrieval
899
+ dataset:
900
+ name: dim 512
901
+ type: dim_512
902
+ metrics:
903
+ - type: cosine_accuracy@1
904
+ value: 0.4065300896286812
905
+ name: Cosine Accuracy@1
906
+ - type: cosine_accuracy@3
907
+ value: 0.41229193341869397
908
+ name: Cosine Accuracy@3
909
+ - type: cosine_accuracy@5
910
+ value: 0.44494238156209986
911
+ name: Cosine Accuracy@5
912
+ - type: cosine_accuracy@10
913
+ value: 0.4814340588988476
914
+ name: Cosine Accuracy@10
915
+ - type: cosine_precision@1
916
+ value: 0.4065300896286812
917
+ name: Cosine Precision@1
918
+ - type: cosine_precision@3
919
+ value: 0.4054630815194195
920
+ name: Cosine Precision@3
921
+ - type: cosine_precision@5
922
+ value: 0.3947503201024327
923
+ name: Cosine Precision@5
924
+ - type: cosine_precision@10
925
+ value: 0.3596030729833547
926
+ name: Cosine Precision@10
927
+ - type: cosine_recall@1
928
+ value: 0.047372341735862133
929
+ name: Cosine Recall@1
930
+ - type: cosine_recall@3
931
+ value: 0.1383106496582531
932
+ name: Cosine Recall@3
933
+ - type: cosine_recall@5
934
+ value: 0.20757258542171747
935
+ name: Cosine Recall@5
936
+ - type: cosine_recall@10
937
+ value: 0.3071623578952262
938
+ name: Cosine Recall@10
939
+ - type: cosine_ndcg@10
940
+ value: 0.4329095460408428
941
+ name: Cosine Ndcg@10
942
+ - type: cosine_mrr@10
943
+ value: 0.41950236774180394
944
+ name: Cosine Mrr@10
945
+ - type: cosine_map@100
946
+ value: 0.49555759572196095
947
+ name: Cosine Map@100
948
+ - task:
949
+ type: information-retrieval
950
+ name: Information Retrieval
951
+ dataset:
952
+ name: dim 256
953
+ type: dim_256
954
+ metrics:
955
+ - type: cosine_accuracy@1
956
+ value: 0.38348271446862997
957
+ name: Cosine Accuracy@1
958
+ - type: cosine_accuracy@3
959
+ value: 0.3886043533930858
960
+ name: Cosine Accuracy@3
961
+ - type: cosine_accuracy@5
962
+ value: 0.4206145966709347
963
+ name: Cosine Accuracy@5
964
+ - type: cosine_accuracy@10
965
+ value: 0.4551856594110115
966
+ name: Cosine Accuracy@10
967
+ - type: cosine_precision@1
968
+ value: 0.38348271446862997
969
+ name: Cosine Precision@1
970
+ - type: cosine_precision@3
971
+ value: 0.382202304737516
972
+ name: Cosine Precision@3
973
+ - type: cosine_precision@5
974
+ value: 0.3718309859154929
975
+ name: Cosine Precision@5
976
+ - type: cosine_precision@10
977
+ value: 0.33886043533930854
978
+ name: Cosine Precision@10
979
+ - type: cosine_recall@1
980
+ value: 0.04466034705404223
981
+ name: Cosine Recall@1
982
+ - type: cosine_recall@3
983
+ value: 0.1301795023253766
984
+ name: Cosine Recall@3
985
+ - type: cosine_recall@5
986
+ value: 0.19500340584044382
987
+ name: Cosine Recall@5
988
+ - type: cosine_recall@10
989
+ value: 0.2892016292717267
990
+ name: Cosine Recall@10
991
+ - type: cosine_ndcg@10
992
+ value: 0.4087462230477571
993
+ name: Cosine Ndcg@10
994
+ - type: cosine_mrr@10
995
+ value: 0.3957850639188662
996
+ name: Cosine Mrr@10
997
+ - type: cosine_map@100
998
+ value: 0.4709582085612654
999
+ name: Cosine Map@100
1000
+ - task:
1001
+ type: information-retrieval
1002
+ name: Information Retrieval
1003
+ dataset:
1004
+ name: dim 128
1005
+ type: dim_128
1006
+ metrics:
1007
+ - type: cosine_accuracy@1
1008
+ value: 0.34699103713188223
1009
+ name: Cosine Accuracy@1
1010
+ - type: cosine_accuracy@3
1011
+ value: 0.35147247119078107
1012
+ name: Cosine Accuracy@3
1013
+ - type: cosine_accuracy@5
1014
+ value: 0.37900128040973113
1015
+ name: Cosine Accuracy@5
1016
+ - type: cosine_accuracy@10
1017
+ value: 0.4212548015364917
1018
+ name: Cosine Accuracy@10
1019
+ - type: cosine_precision@1
1020
+ value: 0.34699103713188223
1021
+ name: Cosine Precision@1
1022
+ - type: cosine_precision@3
1023
+ value: 0.34571062740076824
1024
+ name: Cosine Precision@3
1025
+ - type: cosine_precision@5
1026
+ value: 0.3352112676056338
1027
+ name: Cosine Precision@5
1028
+ - type: cosine_precision@10
1029
+ value: 0.3042893725992318
1030
+ name: Cosine Precision@10
1031
+ - type: cosine_recall@1
1032
+ value: 0.04217848526747235
1033
+ name: Cosine Recall@1
1034
+ - type: cosine_recall@3
1035
+ value: 0.12288848071178002
1036
+ name: Cosine Recall@3
1037
+ - type: cosine_recall@5
1038
+ value: 0.18344012521240954
1039
+ name: Cosine Recall@5
1040
+ - type: cosine_recall@10
1041
+ value: 0.2706183968947745
1042
+ name: Cosine Recall@10
1043
+ - type: cosine_ndcg@10
1044
+ value: 0.37139192897263235
1045
+ name: Cosine Ndcg@10
1046
+ - type: cosine_mrr@10
1047
+ value: 0.35916305916305874
1048
+ name: Cosine Mrr@10
1049
+ - type: cosine_map@100
1050
+ value: 0.4338211299784659
1051
+ name: Cosine Map@100
1052
+ - task:
1053
+ type: information-retrieval
1054
+ name: Information Retrieval
1055
+ dataset:
1056
+ name: dim 64
1057
+ type: dim_64
1058
+ metrics:
1059
+ - type: cosine_accuracy@1
1060
+ value: 0.3207426376440461
1061
+ name: Cosine Accuracy@1
1062
+ - type: cosine_accuracy@3
1063
+ value: 0.322663252240717
1064
+ name: Cosine Accuracy@3
1065
+ - type: cosine_accuracy@5
1066
+ value: 0.3405889884763124
1067
+ name: Cosine Accuracy@5
1068
+ - type: cosine_accuracy@10
1069
+ value: 0.3725992317541613
1070
+ name: Cosine Accuracy@10
1071
+ - type: cosine_precision@1
1072
+ value: 0.3207426376440461
1073
+ name: Cosine Precision@1
1074
+ - type: cosine_precision@3
1075
+ value: 0.3188220230473751
1076
+ name: Cosine Precision@3
1077
+ - type: cosine_precision@5
1078
+ value: 0.3088348271446863
1079
+ name: Cosine Precision@5
1080
+ - type: cosine_precision@10
1081
+ value: 0.2797055057618438
1082
+ name: Cosine Precision@10
1083
+ - type: cosine_recall@1
1084
+ value: 0.036318765090758674
1085
+ name: Cosine Recall@1
1086
+ - type: cosine_recall@3
1087
+ value: 0.10562189493083342
1088
+ name: Cosine Recall@3
1089
+ - type: cosine_recall@5
1090
+ value: 0.15867125525021739
1091
+ name: Cosine Recall@5
1092
+ - type: cosine_recall@10
1093
+ value: 0.23840960718091392
1094
+ name: Cosine Recall@10
1095
+ - type: cosine_ndcg@10
1096
+ value: 0.3371953828075091
1097
+ name: Cosine Ndcg@10
1098
+ - type: cosine_mrr@10
1099
+ value: 0.32884732638253733
1100
+ name: Cosine Mrr@10
1101
+ - type: cosine_map@100
1102
+ value: 0.3933467041096336
1103
+ name: Cosine Map@100
1104
+ ---
1105
+
1106
+ # multilingual-e5-large
1107
+
1108
+ This is a [sentence-transformers](https://www.SBERT.net) model finetuned from [intfloat/multilingual-e5-large](https://huggingface.co/intfloat/multilingual-e5-large). It maps sentences & paragraphs to a 1024-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
1109
+
1110
+ ## Model Details
1111
+
1112
+ ### Model Description
1113
+ - **Model Type:** Sentence Transformer
1114
+ - **Base model:** [intfloat/multilingual-e5-large](https://huggingface.co/intfloat/multilingual-e5-large) <!-- at revision 0dc5580a448e4284468b8909bae50fa925907bc5 -->
1115
+ - **Maximum Sequence Length:** 512 tokens
1116
+ - **Output Dimensionality:** 1024 dimensions
1117
+ - **Similarity Function:** Cosine Similarity
1118
+ <!-- - **Training Dataset:** Unknown -->
1119
+ - **Language:** en
1120
+ - **License:** apache-2.0
1121
+
1122
+ ### Model Sources
1123
+
1124
+ - **Documentation:** [Sentence Transformers Documentation](https://sbert.net)
1125
+ - **Repository:** [Sentence Transformers on GitHub](https://github.com/UKPLab/sentence-transformers)
1126
+ - **Hugging Face:** [Sentence Transformers on Hugging Face](https://huggingface.co/models?library=sentence-transformers)
1127
+
1128
+ ### Full Model Architecture
1129
+
1130
+ ```
1131
+ SentenceTransformer(
1132
+ (0): Transformer({'max_seq_length': 512, 'do_lower_case': False, 'architecture': 'XLMRobertaModel'})
1133
+ (1): Pooling({'word_embedding_dimension': 1024, 'pooling_mode_cls_token': False, 'pooling_mode_mean_tokens': True, 'pooling_mode_max_tokens': False, 'pooling_mode_mean_sqrt_len_tokens': False, 'pooling_mode_weightedmean_tokens': False, 'pooling_mode_lasttoken': False, 'include_prompt': True})
1134
+ (2): Normalize()
1135
+ )
1136
+ ```
1137
+
1138
+ ## Usage
1139
+
1140
+ ### Direct Usage (Sentence Transformers)
1141
+
1142
+ First install the Sentence Transformers library:
1143
+
1144
+ ```bash
1145
+ pip install -U sentence-transformers
1146
+ ```
1147
+
1148
+ Then you can load this model and run inference.
1149
+ ```python
1150
+ from sentence_transformers import SentenceTransformer
1151
+
1152
+ # Download from the 🤗 Hub (replace the placeholder ID below with this model's repository ID)
1153
+ model = SentenceTransformer("sentence_transformers_model_id")
1154
+ # Run inference
1155
+ sentences = [
1156
+ 'Who must facilitate the exercise of data subject rights?',
1157
+ '1.The controller shall take appropriate measures to provide any information referred to in Articles 13 and 14 and any communication under Articles 15 to 22 and 34 relating to processing to the data subject in a concise, transparent, intelligible and easily accessible form, using clear and plain language, in particular for any information addressed specifically to a child. The information shall be provided in writing, or by other means, including, where appropriate, by electronic means. When requested by the data subject, the information may be provided orally, provided that the identity of the data subject is proven by other means. 4.5.2016 L 119/39 \n2.The controller shall facilitate the exercise of data subject rights under Articles 15 to 22. In the cases referred to in Article 11(2), the controller shall not refuse to act on the request of the data subject for exercising his or her rights under Articles 15 to 22, unless the controller demonstrates that it is not in a position to identify the data subject.\n3.The controller shall provide information on action taken on a request under Articles 15 to 22 to the data subject without undue delay and in any event within one month of receipt of the request. That period may be extended by two further months where necessary, taking into account the complexity and number of the requests. The controller shall inform the data subject of any such extension within one month of receipt of the request, together with the reasons for the delay. 
Where the data subject makes the request by electronic form means, the information shall be provided by electronic means where possible, unless otherwise requested by the data subject.\n4.If the controller does not take action on the request of the data subject, the controller shall inform the data subject without delay and at the latest within one month of receipt of the request of the reasons for not taking action and on the possibility of lodging a complaint with a supervisory authority and seeking a judicial remedy.\n5.Information provided under Articles 13 and 14 and any communication and any actions taken under Articles 15 to 22 and 34 shall be provided free of charge. Where requests from a data subject are manifestly unfounded or excessive, in particular because of their repetitive character, the controller may either: (a) charge a reasonable fee taking into account the administrative costs of providing the information or communication or taking the action requested; or (b) refuse to act on the request. The controller shall bear the burden of demonstrating the manifestly unfounded or excessive character of the request.\n6.Without prejudice to Article 11, where the controller has reasonable doubts concerning the identity of the natural person making the request referred to in Articles 15 to 21, the controller may request the provision of additional information necessary to confirm the identity of the data subject.\n7.The information to be provided to data subjects pursuant to Articles 13 and 14 may be provided in combination with standardised icons in order to give in an easily visible, intelligible and clearly legible manner a meaningful overview of the intended processing. 
Where the icons are presented electronically they shall be machine-readable.\n8.The Commission shall be empowered to adopt delegated acts in accordance with Article 92 for the purpose of determining the information to be presented by the icons and the procedures for providing standardised icons. Section 2 Information and access to personal data',
1158
+ 'Regulation (EC) No 45/2001 of the European Parliament and of the Council (2) applies to the processing of personal data by the Union institutions, bodies, offices and agencies. Regulation (EC) No 45/2001 and other Union legal acts applicable to such processing of personal data should be adapted to the principles and rules established in this Regulation and applied in the light of this Regulation. In order to provide a strong and coherent data protection framework in the Union, the necessary adaptations of Regulation (EC) No 45/2001 should follow after the adoption of this Regulation, in order to allow application at the same time as this Regulation.',
1159
+ ]
1160
+ embeddings = model.encode(sentences)
1161
+ print(embeddings.shape)
1162
+ # (3, 1024)
1163
+
1164
+ # Get the similarity scores for the embeddings
1165
+ similarities = model.similarity(embeddings, embeddings)
1166
+ print(similarities)
1167
+ # tensor([[1.0000, 0.5748, 0.4790],
1168
+ # [0.5748, 1.0000, 0.3993],
1169
+ # [0.4790, 0.3993, 1.0000]])
1170
+ ```
1171
+
1172
+ <!--
1173
+ ### Direct Usage (Transformers)
1174
+
1175
+ <details><summary>Click to see the direct usage in Transformers</summary>
1176
+
1177
+ </details>
1178
+ -->
1179
+
1180
+ <!--
1181
+ ### Downstream Usage (Sentence Transformers)
1182
+
1183
+ You can finetune this model on your own dataset.
1184
+
1185
+ <details><summary>Click to expand</summary>
1186
+
1187
+ </details>
1188
+ -->
1189
+
1190
+ <!--
1191
+ ### Out-of-Scope Use
1192
+
1193
+ *List how the model may foreseeably be misused and address what users ought not to do with the model.*
1194
+ -->
1195
+
1196
+ ## Evaluation
1197
+
1198
+ ### Metrics
1199
+
1200
+ #### Information Retrieval
1201
+
1202
+ * Dataset: `dim_1024`
1203
+ * Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
1204
+ ```json
1205
+ {
1206
+ "truncate_dim": 1024
1207
+ }
1208
+ ```
1209
+
1210
+ | Metric | Value |
1211
+ |:--------------------|:-----------|
1212
+ | cosine_accuracy@1 | 0.4181 |
1213
+ | cosine_accuracy@3 | 0.4219 |
1214
+ | cosine_accuracy@5 | 0.4501 |
1215
+ | cosine_accuracy@10 | 0.4904 |
1216
+ | cosine_precision@1 | 0.4181 |
1217
+ | cosine_precision@3 | 0.4163 |
1218
+ | cosine_precision@5 | 0.4044 |
1219
+ | cosine_precision@10 | 0.3687 |
1220
+ | cosine_recall@1 | 0.0473 |
1221
+ | cosine_recall@3 | 0.1381 |
1222
+ | cosine_recall@5 | 0.207 |
1223
+ | cosine_recall@10 | 0.3085 |
1224
+ | **cosine_ndcg@10** | **0.4418** |
1225
+ | cosine_mrr@10 | 0.4299 |
1226
+ | cosine_map@100 | 0.5068 |
1227
+
1228
+ #### Information Retrieval
1229
+
1230
+ * Dataset: `dim_768`
1231
+ * Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
1232
+ ```json
1233
+ {
1234
+ "truncate_dim": 768
1235
+ }
1236
+ ```
1237
+
1238
+ | Metric | Value |
1239
+ |:--------------------|:----------|
1240
+ | cosine_accuracy@1 | 0.4104 |
1241
+ | cosine_accuracy@3 | 0.4142 |
1242
+ | cosine_accuracy@5 | 0.4443 |
1243
+ | cosine_accuracy@10 | 0.4834 |
1244
+ | cosine_precision@1 | 0.4104 |
1245
+ | cosine_precision@3 | 0.4087 |
1246
+ | cosine_precision@5 | 0.3969 |
1247
+ | cosine_precision@10 | 0.3617 |
1248
+ | cosine_recall@1 | 0.0472 |
1249
+ | cosine_recall@3 | 0.1376 |
1250
+ | cosine_recall@5 | 0.206 |
1251
+ | cosine_recall@10 | 0.3054 |
1252
+ | **cosine_ndcg@10** | **0.435** |
1253
+ | cosine_mrr@10 | 0.4225 |
1254
+ | cosine_map@100 | 0.5005 |
1255
+
1256
+ #### Information Retrieval
1257
+
1258
+ * Dataset: `dim_512`
1259
+ * Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
1260
+ ```json
1261
+ {
1262
+ "truncate_dim": 512
1263
+ }
1264
+ ```
1265
+
1266
+ | Metric | Value |
1267
+ |:--------------------|:-----------|
1268
+ | cosine_accuracy@1 | 0.4065 |
1269
+ | cosine_accuracy@3 | 0.4123 |
1270
+ | cosine_accuracy@5 | 0.4449 |
1271
+ | cosine_accuracy@10 | 0.4814 |
1272
+ | cosine_precision@1 | 0.4065 |
1273
+ | cosine_precision@3 | 0.4055 |
1274
+ | cosine_precision@5 | 0.3948 |
1275
+ | cosine_precision@10 | 0.3596 |
1276
+ | cosine_recall@1 | 0.0474 |
1277
+ | cosine_recall@3 | 0.1383 |
1278
+ | cosine_recall@5 | 0.2076 |
1279
+ | cosine_recall@10 | 0.3072 |
1280
+ | **cosine_ndcg@10** | **0.4329** |
1281
+ | cosine_mrr@10 | 0.4195 |
1282
+ | cosine_map@100 | 0.4956 |
1283
+
1284
+ #### Information Retrieval
1285
+
1286
+ * Dataset: `dim_256`
1287
+ * Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
1288
+ ```json
1289
+ {
1290
+ "truncate_dim": 256
1291
+ }
1292
+ ```
1293
+
1294
+ | Metric | Value |
1295
+ |:--------------------|:-----------|
1296
+ | cosine_accuracy@1 | 0.3835 |
1297
+ | cosine_accuracy@3 | 0.3886 |
1298
+ | cosine_accuracy@5 | 0.4206 |
1299
+ | cosine_accuracy@10 | 0.4552 |
1300
+ | cosine_precision@1 | 0.3835 |
1301
+ | cosine_precision@3 | 0.3822 |
1302
+ | cosine_precision@5 | 0.3718 |
1303
+ | cosine_precision@10 | 0.3389 |
1304
+ | cosine_recall@1 | 0.0447 |
1305
+ | cosine_recall@3 | 0.1302 |
1306
+ | cosine_recall@5 | 0.195 |
1307
+ | cosine_recall@10 | 0.2892 |
1308
+ | **cosine_ndcg@10** | **0.4087** |
1309
+ | cosine_mrr@10 | 0.3958 |
1310
+ | cosine_map@100 | 0.471 |
1311
+
1312
+ #### Information Retrieval
1313
+
1314
+ * Dataset: `dim_128`
1315
+ * Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
1316
+ ```json
1317
+ {
1318
+ "truncate_dim": 128
1319
+ }
1320
+ ```
1321
+
1322
+ | Metric | Value |
1323
+ |:--------------------|:-----------|
1324
+ | cosine_accuracy@1 | 0.347 |
1325
+ | cosine_accuracy@3 | 0.3515 |
1326
+ | cosine_accuracy@5 | 0.379 |
1327
+ | cosine_accuracy@10 | 0.4213 |
1328
+ | cosine_precision@1 | 0.347 |
1329
+ | cosine_precision@3 | 0.3457 |
1330
+ | cosine_precision@5 | 0.3352 |
1331
+ | cosine_precision@10 | 0.3043 |
1332
+ | cosine_recall@1 | 0.0422 |
1333
+ | cosine_recall@3 | 0.1229 |
1334
+ | cosine_recall@5 | 0.1834 |
1335
+ | cosine_recall@10 | 0.2706 |
1336
+ | **cosine_ndcg@10** | **0.3714** |
1337
+ | cosine_mrr@10 | 0.3592 |
1338
+ | cosine_map@100 | 0.4338 |
1339
+
1340
+ #### Information Retrieval
1341
+
1342
+ * Dataset: `dim_64`
1343
+ * Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
1344
+ ```json
1345
+ {
1346
+ "truncate_dim": 64
1347
+ }
1348
+ ```
1349
+
1350
+ | Metric | Value |
1351
+ |:--------------------|:-----------|
1352
+ | cosine_accuracy@1 | 0.3207 |
1353
+ | cosine_accuracy@3 | 0.3227 |
1354
+ | cosine_accuracy@5 | 0.3406 |
1355
+ | cosine_accuracy@10 | 0.3726 |
1356
+ | cosine_precision@1 | 0.3207 |
1357
+ | cosine_precision@3 | 0.3188 |
1358
+ | cosine_precision@5 | 0.3088 |
1359
+ | cosine_precision@10 | 0.2797 |
1360
+ | cosine_recall@1 | 0.0363 |
1361
+ | cosine_recall@3 | 0.1056 |
1362
+ | cosine_recall@5 | 0.1587 |
1363
+ | cosine_recall@10 | 0.2384 |
1364
+ | **cosine_ndcg@10** | **0.3372** |
1365
+ | cosine_mrr@10 | 0.3288 |
1366
+ | cosine_map@100 | 0.3933 |
1367
+
1368
+ <!--
1369
+ ## Bias, Risks and Limitations
1370
+
1371
+ *What are the known or foreseeable issues stemming from this model? You could also flag here known failure cases or weaknesses of the model.*
1372
+ -->
1373
+
1374
+ <!--
1375
+ ### Recommendations
1376
+
1377
+ *What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
1378
+ -->
1379
+
1380
+ ## Training Details
1381
+
1382
+ ### Training Dataset
1383
+
1384
+ #### Unnamed Dataset
1385
+
1386
+ * Size: 391 training samples
1387
+ * Columns: <code>anchor</code> and <code>positive</code>
1388
+ * Approximate statistics based on the first 391 samples:
1389
+ | | anchor | positive |
1390
+ |:--------|:----------------------------------------------------------------------------------|:-------------------------------------------------------------------------------------|
1391
+ | type | string | string |
1392
+ | details | <ul><li>min: 8 tokens</li><li>mean: 17.16 tokens</li><li>max: 32 tokens</li></ul> | <ul><li>min: 27 tokens</li><li>mean: 377.93 tokens</li><li>max: 512 tokens</li></ul> |
1393
+ * Samples:
1394
+ | anchor | positive |
1395
+ |:-------------------------------------------------------------------------------------------------------------------------------|:---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|
1396
+ | <code>What measures must be taken according to Article 32?</code> | <code>1.Where processing is to be carried out on behalf of a controller, the controller shall use only processors providing sufficient guarantees to implement appropriate technical and organisational measures in such a manner that processing will meet the requirements of this Regulation and ensure the protection of the rights of the data subject.<br>2.The processor shall not engage another processor without prior specific or general written authorisation of the controller. In the case of general written authorisation, the processor shall inform the controller of any intended changes concerning the addition or replacement of other processors, thereby giving the controller the opportunity to object to such changes.<br>3.Processing by a processor shall be governed by a contract or other legal act under Union or Member State law, that is binding on the processor with regard to the controller and that sets out the subject-matter and duration of the processing, the nature and purpose of the processing, ...</code> |
1397
+ | <code>What is the responsibility of assisting and advising the data subjects in exercising their rights?</code> | <code>1.A transfer of personal data to a third country or an international organisation may take place where the Commission has decided that the third country, a territory or one or more specified sectors within that third country, or the international organisation in question ensures an adequate level of protection. Such a transfer shall not require any specific authorisation.<br>2.When assessing the adequacy of the level of protection, the Commission shall, in particular, take account of the following elements: (a) the rule of law, respect for human rights and fundamental freedoms, relevant legislation, both general and sectoral, including concerning public security, defence, national security and criminal law and the access of public authorities to personal data, as well as the implementation of such legislation, data protection rules, professional rules and security measures, including rules for the onward transfer of personal data to another third country or international organisation whi...</code> |
1398
+ | <code>What should Member States be authorized to provide for regarding personal data processing for archiving purposes?</code> | <code>Where personal data are processed for archiving purposes, this Regulation should also apply to that processing, bearing in mind that this Regulation should not apply to deceased persons. Public authorities or public or private bodies that hold records of public interest should be services which, pursuant to Union or Member State law, have a legal obligation to acquire, preserve, appraise, arrange, describe, communicate, promote, disseminate and provide access to records of enduring value for general public interest. Member States should also be authorised to provide for the further processing of personal data for archiving purposes, for example with a view to providing specific information related to the political behaviour under former totalitarian state regimes, genocide, crimes against humanity, in particular the Holocaust, or war crimes. 4.5.2016 L 119/29 Official Journal of the European Union EN</code> |
1399
+ * Loss: [<code>MatryoshkaLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#matryoshkaloss) with these parameters:
1400
+ ```json
1401
+ {
1402
+ "loss": "MultipleNegativesRankingLoss",
1403
+ "matryoshka_dims": [
1404
+ 1024,
1405
+ 768,
1406
+ 512,
1407
+ 256,
1408
+ 128,
1409
+ 64
1410
+ ],
1411
+ "matryoshka_weights": [
1412
+ 1,
1413
+ 1,
1414
+ 1,
1415
+ 1,
1416
+ 1,
1417
+ 1
1418
+ ],
1419
+ "n_dims_per_step": -1
1420
+ }
1421
+ ```
1422
+
1423
+ ### Training Hyperparameters
1424
+ #### Non-Default Hyperparameters
1425
+
1426
+ - `eval_strategy`: epoch
1427
+ - `per_device_eval_batch_size`: 16
1428
+ - `gradient_accumulation_steps`: 4
1429
+ - `learning_rate`: 2e-05
1430
+ - `num_train_epochs`: 20
1431
+ - `lr_scheduler_type`: cosine
1432
+ - `warmup_ratio`: 0.1
1433
+ - `bf16`: True
1434
+ - `load_best_model_at_end`: True
1435
+ - `optim`: adamw_torch_fused
1436
+ - `batch_sampler`: no_duplicates
1437
+
1438
+ #### All Hyperparameters
1439
+ <details><summary>Click to expand</summary>
1440
+
1441
+ - `overwrite_output_dir`: False
1442
+ - `do_predict`: False
1443
+ - `eval_strategy`: epoch
1444
+ - `prediction_loss_only`: True
1445
+ - `per_device_train_batch_size`: 8
1446
+ - `per_device_eval_batch_size`: 16
1447
+ - `per_gpu_train_batch_size`: None
1448
+ - `per_gpu_eval_batch_size`: None
1449
+ - `gradient_accumulation_steps`: 4
1450
+ - `eval_accumulation_steps`: None
1451
+ - `torch_empty_cache_steps`: None
1452
+ - `learning_rate`: 2e-05
1453
+ - `weight_decay`: 0.0
1454
+ - `adam_beta1`: 0.9
1455
+ - `adam_beta2`: 0.999
1456
+ - `adam_epsilon`: 1e-08
1457
+ - `max_grad_norm`: 1.0
1458
+ - `num_train_epochs`: 20
1459
+ - `max_steps`: -1
1460
+ - `lr_scheduler_type`: cosine
1461
+ - `lr_scheduler_kwargs`: {}
1462
+ - `warmup_ratio`: 0.1
1463
+ - `warmup_steps`: 0
1464
+ - `log_level`: passive
1465
+ - `log_level_replica`: warning
1466
+ - `log_on_each_node`: True
1467
+ - `logging_nan_inf_filter`: True
1468
+ - `save_safetensors`: True
1469
+ - `save_on_each_node`: False
1470
+ - `save_only_model`: False
1471
+ - `restore_callback_states_from_checkpoint`: False
1472
+ - `no_cuda`: False
1473
+ - `use_cpu`: False
1474
+ - `use_mps_device`: False
1475
+ - `seed`: 42
1476
+ - `data_seed`: None
1477
+ - `jit_mode_eval`: False
1478
+ - `use_ipex`: False
1479
+ - `bf16`: True
1480
+ - `fp16`: False
1481
+ - `fp16_opt_level`: O1
1482
+ - `half_precision_backend`: auto
1483
+ - `bf16_full_eval`: False
1484
+ - `fp16_full_eval`: False
1485
+ - `tf32`: None
1486
+ - `local_rank`: 0
1487
+ - `ddp_backend`: None
1488
+ - `tpu_num_cores`: None
1489
+ - `tpu_metrics_debug`: False
1490
+ - `debug`: []
1491
+ - `dataloader_drop_last`: False
1492
+ - `dataloader_num_workers`: 0
1493
+ - `dataloader_prefetch_factor`: None
1494
+ - `past_index`: -1
1495
+ - `disable_tqdm`: False
1496
+ - `remove_unused_columns`: True
1497
+ - `label_names`: None
1498
+ - `load_best_model_at_end`: True
1499
+ - `ignore_data_skip`: False
1500
+ - `fsdp`: []
1501
+ - `fsdp_min_num_params`: 0
1502
+ - `fsdp_config`: {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}
1503
+ - `tp_size`: 0
1504
+ - `fsdp_transformer_layer_cls_to_wrap`: None
1505
+ - `accelerator_config`: {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}
1506
+ - `deepspeed`: None
1507
+ - `label_smoothing_factor`: 0.0
1508
+ - `optim`: adamw_torch_fused
1509
+ - `optim_args`: None
1510
+ - `adafactor`: False
1511
+ - `group_by_length`: False
1512
+ - `length_column_name`: length
1513
+ - `ddp_find_unused_parameters`: None
1514
+ - `ddp_bucket_cap_mb`: None
1515
+ - `ddp_broadcast_buffers`: False
1516
+ - `dataloader_pin_memory`: True
1517
+ - `dataloader_persistent_workers`: False
1518
+ - `skip_memory_metrics`: True
1519
+ - `use_legacy_prediction_loop`: False
1520
+ - `push_to_hub`: False
1521
+ - `resume_from_checkpoint`: None
1522
+ - `hub_model_id`: None
1523
+ - `hub_strategy`: every_save
1524
+ - `hub_private_repo`: None
1525
+ - `hub_always_push`: False
1526
+ - `gradient_checkpointing`: False
1527
+ - `gradient_checkpointing_kwargs`: None
1528
+ - `include_inputs_for_metrics`: False
1529
+ - `include_for_metrics`: []
1530
+ - `eval_do_concat_batches`: True
1531
+ - `fp16_backend`: auto
1532
+ - `push_to_hub_model_id`: None
1533
+ - `push_to_hub_organization`: None
1534
+ - `mp_parameters`:
1535
+ - `auto_find_batch_size`: False
1536
+ - `full_determinism`: False
1537
+ - `torchdynamo`: None
1538
+ - `ray_scope`: last
1539
+ - `ddp_timeout`: 1800
1540
+ - `torch_compile`: False
1541
+ - `torch_compile_backend`: None
1542
+ - `torch_compile_mode`: None
1543
+ - `include_tokens_per_second`: False
1544
+ - `include_num_input_tokens_seen`: False
1545
+ - `neftune_noise_alpha`: None
1546
+ - `optim_target_modules`: None
1547
+ - `batch_eval_metrics`: False
1548
+ - `eval_on_start`: False
1549
+ - `use_liger_kernel`: False
1550
+ - `eval_use_gather_object`: False
1551
+ - `average_tokens_across_devices`: False
1552
+ - `prompts`: None
1553
+ - `batch_sampler`: no_duplicates
1554
+ - `multi_dataset_batch_sampler`: proportional
1555
+ - `router_mapping`: {}
1556
+ - `learning_rate_mapping`: {}
1557
+
1558
+ </details>
1559
+
1560
+ ### Training Logs
1561
+ | Epoch | Step | Training Loss | dim_1024_cosine_ndcg@10 | dim_768_cosine_ndcg@10 | dim_512_cosine_ndcg@10 | dim_256_cosine_ndcg@10 | dim_128_cosine_ndcg@10 | dim_64_cosine_ndcg@10 |
1562
+ |:------:|:----:|:-------------:|:-----------------------:|:----------------------:|:----------------------:|:----------------------:|:----------------------:|:---------------------:|
1563
+ | 0.8163 | 10 | 31.5155 | - | - | - | - | - | - |
1564
+ | 1.0 | 13 | - | 0.4494 | 0.4446 | 0.4364 | 0.3947 | 0.3362 | 0.2621 |
1565
+ | 1.5714 | 20 | 19.0409 | - | - | - | - | - | - |
1566
+ | 2.0 | 26 | - | 0.4065 | 0.4004 | 0.4013 | 0.3692 | 0.3418 | 0.2882 |
1567
+ | 2.3265 | 30 | 14.5314 | - | - | - | - | - | - |
1568
+ | 3.0 | 39 | - | 0.4418 | 0.4350 | 0.4329 | 0.4087 | 0.3714 | 0.3372 |
1569
+
1570
+
1571
+ ### Framework Versions
1572
+ - Python: 3.12.11
1573
+ - Sentence Transformers: 5.1.0
1574
+ - Transformers: 4.51.3
1575
+ - PyTorch: 2.8.0+cu126
1576
+ - Accelerate: 1.10.1
1577
+ - Datasets: 4.0.0
1578
+ - Tokenizers: 0.21.4
1579
+
1580
+ ## Citation
1581
+
1582
+ ### BibTeX
1583
+
1584
+ #### Sentence Transformers
1585
+ ```bibtex
1586
+ @inproceedings{reimers-2019-sentence-bert,
1587
+ title = "Sentence-BERT: Sentence Embeddings using Siamese BERT-Networks",
1588
+ author = "Reimers, Nils and Gurevych, Iryna",
1589
+ booktitle = "Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing",
1590
+ month = "11",
1591
+ year = "2019",
1592
+ publisher = "Association for Computational Linguistics",
1593
+ url = "https://arxiv.org/abs/1908.10084",
1594
+ }
1595
+ ```
1596
+
1597
+ #### MatryoshkaLoss
1598
+ ```bibtex
1599
+ @misc{kusupati2024matryoshka,
1600
+ title={Matryoshka Representation Learning},
1601
+ author={Aditya Kusupati and Gantavya Bhatt and Aniket Rege and Matthew Wallingford and Aditya Sinha and Vivek Ramanujan and William Howard-Snyder and Kaifeng Chen and Sham Kakade and Prateek Jain and Ali Farhadi},
1602
+ year={2024},
1603
+ eprint={2205.13147},
1604
+ archivePrefix={arXiv},
1605
+ primaryClass={cs.LG}
1606
+ }
1607
+ ```
1608
+
1609
+ #### MultipleNegativesRankingLoss
1610
+ ```bibtex
1611
+ @misc{henderson2017efficient,
1612
+ title={Efficient Natural Language Response Suggestion for Smart Reply},
1613
+ author={Matthew Henderson and Rami Al-Rfou and Brian Strope and Yun-hsuan Sung and Laszlo Lukacs and Ruiqi Guo and Sanjiv Kumar and Balint Miklos and Ray Kurzweil},
1614
+ year={2017},
1615
+ eprint={1705.00652},
1616
+ archivePrefix={arXiv},
1617
+ primaryClass={cs.CL}
1618
+ }
1619
+ ```
1620
+
1621
+ <!--
1622
+ ## Glossary
1623
+
1624
+ *Clearly define terms in order to be accessible across audiences.*
1625
+ -->
1626
+
1627
+ <!--
1628
+ ## Model Card Authors
1629
+
1630
+ *Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
1631
+ -->
1632
+
1633
+ <!--
1634
+ ## Model Card Contact
1635
+
1636
+ *Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
1637
+ -->
checkpoint-39/config.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "XLMRobertaModel"
4
+ ],
5
+ "attention_probs_dropout_prob": 0.1,
6
+ "bos_token_id": 0,
7
+ "classifier_dropout": null,
8
+ "eos_token_id": 2,
9
+ "hidden_act": "gelu",
10
+ "hidden_dropout_prob": 0.1,
11
+ "hidden_size": 1024,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 4096,
14
+ "layer_norm_eps": 1e-05,
15
+ "max_position_embeddings": 514,
16
+ "model_type": "xlm-roberta",
17
+ "num_attention_heads": 16,
18
+ "num_hidden_layers": 24,
19
+ "output_past": true,
20
+ "pad_token_id": 1,
21
+ "position_embedding_type": "absolute",
22
+ "torch_dtype": "float32",
23
+ "transformers_version": "4.51.3",
24
+ "type_vocab_size": 1,
25
+ "use_cache": true,
26
+ "vocab_size": 250002
27
+ }
checkpoint-39/config_sentence_transformers.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_type": "SentenceTransformer",
3
+ "__version__": {
4
+ "sentence_transformers": "5.1.0",
5
+ "transformers": "4.51.3",
6
+ "pytorch": "2.8.0+cu126"
7
+ },
8
+ "prompts": {
9
+ "query": "",
10
+ "document": ""
11
+ },
12
+ "default_prompt_name": null,
13
+ "similarity_fn_name": "cosine"
14
+ }
checkpoint-39/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:606517f0bbfd9d0965e1f76f2da0525a6ed6a2c70afc1966a9b0134b9474e775
3
+ size 2239607176
checkpoint-39/modules.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "idx": 0,
4
+ "name": "0",
5
+ "path": "",
6
+ "type": "sentence_transformers.models.Transformer"
7
+ },
8
+ {
9
+ "idx": 1,
10
+ "name": "1",
11
+ "path": "1_Pooling",
12
+ "type": "sentence_transformers.models.Pooling"
13
+ },
14
+ {
15
+ "idx": 2,
16
+ "name": "2",
17
+ "path": "2_Normalize",
18
+ "type": "sentence_transformers.models.Normalize"
19
+ }
20
+ ]
checkpoint-39/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9c909a2d90a6be41dec525d4f69773b1b7ef98feaaad0925b99faff29a123cb
3
+ size 4471067142
checkpoint-39/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b43253bbaef563ee65793ca453e451021b8a647dbc8d80b82193bbfb19542943
3
+ size 14645
checkpoint-39/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bbe9b9462c0e6409f0e0b402c3d44d048e656208116af5441a4baa2dfc585878
3
+ size 1465
checkpoint-39/sentence_bert_config.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "max_seq_length": 512,
3
+ "do_lower_case": false
4
+ }
checkpoint-39/sentencepiece.bpe.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865
3
+ size 5069051
checkpoint-39/special_tokens_map.json ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<s>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "cls_token": {
10
+ "content": "<s>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "eos_token": {
17
+ "content": "</s>",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "mask_token": {
24
+ "content": "<mask>",
25
+ "lstrip": true,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ },
30
+ "pad_token": {
31
+ "content": "<pad>",
32
+ "lstrip": false,
33
+ "normalized": false,
34
+ "rstrip": false,
35
+ "single_word": false
36
+ },
37
+ "sep_token": {
38
+ "content": "</s>",
39
+ "lstrip": false,
40
+ "normalized": false,
41
+ "rstrip": false,
42
+ "single_word": false
43
+ },
44
+ "unk_token": {
45
+ "content": "<unk>",
46
+ "lstrip": false,
47
+ "normalized": false,
48
+ "rstrip": false,
49
+ "single_word": false
50
+ }
51
+ }
checkpoint-39/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:883b037111086fd4dfebbbc9b7cee11e1517b5e0c0514879478661440f137085
3
+ size 17082987
checkpoint-39/tokenizer_config.json ADDED
@@ -0,0 +1,55 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "<s>",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "1": {
12
+ "content": "<pad>",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "2": {
20
+ "content": "</s>",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "3": {
28
+ "content": "<unk>",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "250001": {
36
+ "content": "<mask>",
37
+ "lstrip": true,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ }
43
+ },
44
+ "bos_token": "<s>",
45
+ "clean_up_tokenization_spaces": true,
46
+ "cls_token": "<s>",
47
+ "eos_token": "</s>",
48
+ "extra_special_tokens": {},
49
+ "mask_token": "<mask>",
50
+ "model_max_length": 512,
51
+ "pad_token": "<pad>",
52
+ "sep_token": "</s>",
53
+ "tokenizer_class": "XLMRobertaTokenizer",
54
+ "unk_token": "<unk>"
55
+ }
checkpoint-39/trainer_state.json ADDED
@@ -0,0 +1,358 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_global_step": 39,
3
+ "best_metric": 0.37139192897263235,
4
+ "best_model_checkpoint": "intfloat/multilingual-e5-large/checkpoint-39",
5
+ "epoch": 3.0,
6
+ "eval_steps": 500,
7
+ "global_step": 39,
8
+ "is_hyper_param_search": false,
9
+ "is_local_process_zero": true,
10
+ "is_world_process_zero": true,
11
+ "log_history": [
12
+ {
13
+ "epoch": 0.8163265306122449,
14
+ "grad_norm": 307.08624267578125,
15
+ "learning_rate": 7.500000000000001e-06,
16
+ "loss": 31.5155,
17
+ "step": 10
18
+ },
19
+ {
20
+ "epoch": 1.0,
21
+ "eval_dim_1024_cosine_accuracy@1": 0.42509603072983354,
22
+ "eval_dim_1024_cosine_accuracy@10": 0.49295774647887325,
23
+ "eval_dim_1024_cosine_accuracy@3": 0.43085787451984636,
24
+ "eval_dim_1024_cosine_accuracy@5": 0.46030729833546735,
25
+ "eval_dim_1024_cosine_map@100": 0.508986346237021,
26
+ "eval_dim_1024_cosine_mrr@10": 0.4369535394183281,
27
+ "eval_dim_1024_cosine_ndcg@10": 0.4493804868009024,
28
+ "eval_dim_1024_cosine_precision@1": 0.42509603072983354,
29
+ "eval_dim_1024_cosine_precision@10": 0.376056338028169,
30
+ "eval_dim_1024_cosine_precision@3": 0.42402902262057185,
31
+ "eval_dim_1024_cosine_precision@5": 0.4133162612035851,
32
+ "eval_dim_1024_cosine_recall@1": 0.04813624827530403,
33
+ "eval_dim_1024_cosine_recall@10": 0.3150476790176975,
34
+ "eval_dim_1024_cosine_recall@3": 0.1404092551990217,
35
+ "eval_dim_1024_cosine_recall@5": 0.21147403835662126,
36
+ "eval_dim_128_cosine_accuracy@1": 0.31370038412291934,
37
+ "eval_dim_128_cosine_accuracy@10": 0.38156209987195905,
38
+ "eval_dim_128_cosine_accuracy@3": 0.31946222791293216,
39
+ "eval_dim_128_cosine_accuracy@5": 0.34571062740076824,
40
+ "eval_dim_128_cosine_map@100": 0.3991669558616212,
41
+ "eval_dim_128_cosine_mrr@10": 0.32517427799117904,
42
+ "eval_dim_128_cosine_ndcg@10": 0.33618283481296385,
43
+ "eval_dim_128_cosine_precision@1": 0.31370038412291934,
44
+ "eval_dim_128_cosine_precision@10": 0.2764404609475032,
45
+ "eval_dim_128_cosine_precision@3": 0.31284677763551,
46
+ "eval_dim_128_cosine_precision@5": 0.30422535211267604,
47
+ "eval_dim_128_cosine_recall@1": 0.037933385936292925,
48
+ "eval_dim_128_cosine_recall@10": 0.24798465115464788,
49
+ "eval_dim_128_cosine_recall@3": 0.11100168654049715,
50
+ "eval_dim_128_cosine_recall@5": 0.1670926413559068,
51
+ "eval_dim_256_cosine_accuracy@1": 0.36427656850192064,
52
+ "eval_dim_256_cosine_accuracy@10": 0.44814340588988477,
53
+ "eval_dim_256_cosine_accuracy@3": 0.36939820742637647,
54
+ "eval_dim_256_cosine_accuracy@5": 0.4090909090909091,
55
+ "eval_dim_256_cosine_map@100": 0.45841270037343096,
56
+ "eval_dim_256_cosine_mrr@10": 0.37879397597707415,
57
+ "eval_dim_256_cosine_ndcg@10": 0.3947006636735062,
58
+ "eval_dim_256_cosine_precision@1": 0.36427656850192064,
59
+ "eval_dim_256_cosine_precision@10": 0.3289372599231754,
60
+ "eval_dim_256_cosine_precision@3": 0.36363636363636365,
61
+ "eval_dim_256_cosine_precision@5": 0.3560819462227913,
62
+ "eval_dim_256_cosine_recall@1": 0.04277277943657814,
63
+ "eval_dim_256_cosine_recall@10": 0.28617844199333936,
64
+ "eval_dim_256_cosine_recall@3": 0.1253991943934714,
65
+ "eval_dim_256_cosine_recall@5": 0.18947388504512186,
66
+ "eval_dim_512_cosine_accuracy@1": 0.4084507042253521,
67
+ "eval_dim_512_cosine_accuracy@10": 0.4871959026888604,
68
+ "eval_dim_512_cosine_accuracy@3": 0.41357234314980795,
69
+ "eval_dim_512_cosine_accuracy@5": 0.4519846350832266,
70
+ "eval_dim_512_cosine_map@100": 0.495554245202425,
71
+ "eval_dim_512_cosine_mrr@10": 0.42213127248338495,
72
+ "eval_dim_512_cosine_ndcg@10": 0.43644305450989757,
73
+ "eval_dim_512_cosine_precision@1": 0.4084507042253521,
74
+ "eval_dim_512_cosine_precision@10": 0.36606914212548014,
75
+ "eval_dim_512_cosine_precision@3": 0.40738369611609043,
76
+ "eval_dim_512_cosine_precision@5": 0.39846350832266325,
77
+ "eval_dim_512_cosine_recall@1": 0.04628035514721453,
78
+ "eval_dim_512_cosine_recall@10": 0.30419701916496145,
79
+ "eval_dim_512_cosine_recall@3": 0.13522898183596205,
80
+ "eval_dim_512_cosine_recall@5": 0.20394662187726964,
81
+ "eval_dim_64_cosine_accuracy@1": 0.24199743918053776,
82
+ "eval_dim_64_cosine_accuracy@10": 0.29641485275288093,
83
+ "eval_dim_64_cosine_accuracy@3": 0.24775928297055058,
84
+ "eval_dim_64_cosine_accuracy@5": 0.26952624839948786,
85
+ "eval_dim_64_cosine_map@100": 0.31803601064541553,
86
+ "eval_dim_64_cosine_mrr@10": 0.25159771761884414,
87
+ "eval_dim_64_cosine_ndcg@10": 0.2620553065689597,
88
+ "eval_dim_64_cosine_precision@1": 0.24199743918053776,
89
+ "eval_dim_64_cosine_precision@10": 0.21568501920614594,
90
+ "eval_dim_64_cosine_precision@3": 0.24199743918053776,
91
+ "eval_dim_64_cosine_precision@5": 0.23649167733674775,
92
+ "eval_dim_64_cosine_recall@1": 0.029110868794154622,
93
+ "eval_dim_64_cosine_recall@10": 0.19521971714475267,
94
+ "eval_dim_64_cosine_recall@3": 0.08524734139651896,
95
+ "eval_dim_64_cosine_recall@5": 0.12921904680249943,
96
+ "eval_dim_768_cosine_accuracy@1": 0.4193341869398207,
97
+ "eval_dim_768_cosine_accuracy@10": 0.4910371318822023,
98
+ "eval_dim_768_cosine_accuracy@3": 0.4238156209987196,
99
+ "eval_dim_768_cosine_accuracy@5": 0.4551856594110115,
100
+ "eval_dim_768_cosine_map@100": 0.5037778776293926,
101
+ "eval_dim_768_cosine_mrr@10": 0.4315339003719285,
102
+ "eval_dim_768_cosine_ndcg@10": 0.44456410503401034,
103
+ "eval_dim_768_cosine_precision@1": 0.4193341869398207,
104
+ "eval_dim_768_cosine_precision@10": 0.37272727272727274,
105
+ "eval_dim_768_cosine_precision@3": 0.4180537772087068,
106
+ "eval_dim_768_cosine_precision@5": 0.4076824583866837,
107
+ "eval_dim_768_cosine_recall@1": 0.04699592881851732,
108
+ "eval_dim_768_cosine_recall@10": 0.3107289399017082,
109
+ "eval_dim_768_cosine_recall@3": 0.13721565163348118,
110
+ "eval_dim_768_cosine_recall@5": 0.20710427114944024,
111
+ "eval_runtime": 98.6525,
112
+ "eval_samples_per_second": 0.0,
113
+ "eval_sequential_score": 0.2620553065689597,
114
+ "eval_steps_per_second": 0.0,
115
+ "step": 13
116
+ },
117
+ {
118
+ "epoch": 1.5714285714285714,
119
+ "grad_norm": 280.07818603515625,
120
+ "learning_rate": 1.5833333333333333e-05,
121
+ "loss": 19.0409,
122
+ "step": 20
123
+ },
124
+ {
125
+ "epoch": 2.0,
126
+ "eval_dim_1024_cosine_accuracy@1": 0.3854033290653009,
127
+ "eval_dim_1024_cosine_accuracy@10": 0.45454545454545453,
128
+ "eval_dim_1024_cosine_accuracy@3": 0.3886043533930858,
129
+ "eval_dim_1024_cosine_accuracy@5": 0.41101152368758004,
130
+ "eval_dim_1024_cosine_map@100": 0.47259820099791205,
131
+ "eval_dim_1024_cosine_mrr@10": 0.39624870434729537,
132
+ "eval_dim_1024_cosine_ndcg@10": 0.4065329035406967,
133
+ "eval_dim_1024_cosine_precision@1": 0.3854033290653009,
134
+ "eval_dim_1024_cosine_precision@10": 0.3357874519846351,
135
+ "eval_dim_1024_cosine_precision@3": 0.3839095177123346,
136
+ "eval_dim_1024_cosine_precision@5": 0.3713188220230474,
137
+ "eval_dim_1024_cosine_recall@1": 0.0451686782205082,
138
+ "eval_dim_1024_cosine_recall@10": 0.2918225395020212,
139
+ "eval_dim_1024_cosine_recall@3": 0.13200270380544088,
140
+ "eval_dim_1024_cosine_recall@5": 0.19735476247586825,
141
+ "eval_dim_128_cosine_accuracy@1": 0.31562099871959026,
142
+ "eval_dim_128_cosine_accuracy@10": 0.39180537772087065,
143
+ "eval_dim_128_cosine_accuracy@3": 0.3207426376440461,
144
+ "eval_dim_128_cosine_accuracy@5": 0.352112676056338,
145
+ "eval_dim_128_cosine_map@100": 0.40471008477532144,
146
+ "eval_dim_128_cosine_mrr@10": 0.32839105339105285,
147
+ "eval_dim_128_cosine_ndcg@10": 0.34177784905202935,
148
+ "eval_dim_128_cosine_precision@1": 0.31562099871959026,
149
+ "eval_dim_128_cosine_precision@10": 0.280729833546735,
150
+ "eval_dim_128_cosine_precision@3": 0.31455399061032857,
151
+ "eval_dim_128_cosine_precision@5": 0.30640204865556975,
152
+ "eval_dim_128_cosine_recall@1": 0.03888088094516579,
153
+ "eval_dim_128_cosine_recall@10": 0.2550464126190524,
154
+ "eval_dim_128_cosine_recall@3": 0.11341113256173359,
155
+ "eval_dim_128_cosine_recall@5": 0.17046484922169536,
156
+ "eval_dim_256_cosine_accuracy@1": 0.3418693982074264,
157
+ "eval_dim_256_cosine_accuracy@10": 0.4238156209987196,
158
+ "eval_dim_256_cosine_accuracy@3": 0.34763124199743917,
159
+ "eval_dim_256_cosine_accuracy@5": 0.38092189500640206,
160
+ "eval_dim_256_cosine_map@100": 0.43770217754051305,
161
+ "eval_dim_256_cosine_mrr@10": 0.35596482938032165,
162
+ "eval_dim_256_cosine_ndcg@10": 0.36923043791328775,
163
+ "eval_dim_256_cosine_precision@1": 0.3418693982074264,
164
+ "eval_dim_256_cosine_precision@10": 0.30441741357234314,
165
+ "eval_dim_256_cosine_precision@3": 0.34165599658557405,
166
+ "eval_dim_256_cosine_precision@5": 0.3322663252240717,
167
+ "eval_dim_256_cosine_recall@1": 0.041410929155814194,
168
+ "eval_dim_256_cosine_recall@10": 0.2705196189189818,
169
+ "eval_dim_256_cosine_recall@3": 0.1212642412965687,
170
+ "eval_dim_256_cosine_recall@5": 0.18173918651563936,
171
+ "eval_dim_512_cosine_accuracy@1": 0.37708066581306016,
172
+ "eval_dim_512_cosine_accuracy@10": 0.4532650448143406,
173
+ "eval_dim_512_cosine_accuracy@3": 0.38092189500640206,
174
+ "eval_dim_512_cosine_accuracy@5": 0.4084507042253521,
175
+ "eval_dim_512_cosine_map@100": 0.4678017780580059,
176
+ "eval_dim_512_cosine_mrr@10": 0.3893670101416575,
177
+ "eval_dim_512_cosine_ndcg@10": 0.40127522003513455,
178
+ "eval_dim_512_cosine_precision@1": 0.37708066581306016,
179
+ "eval_dim_512_cosine_precision@10": 0.33156209987195906,
180
+ "eval_dim_512_cosine_precision@3": 0.37537345283824153,
181
+ "eval_dim_512_cosine_precision@5": 0.36402048655569774,
182
+ "eval_dim_512_cosine_recall@1": 0.04457309853297402,
183
+ "eval_dim_512_cosine_recall@10": 0.2883968018428671,
184
+ "eval_dim_512_cosine_recall@3": 0.13007205872054822,
185
+ "eval_dim_512_cosine_recall@5": 0.19449520589871025,
186
+ "eval_dim_64_cosine_accuracy@1": 0.26696542893725994,
187
+ "eval_dim_64_cosine_accuracy@10": 0.33098591549295775,
188
+ "eval_dim_64_cosine_accuracy@3": 0.27208706786171577,
189
+ "eval_dim_64_cosine_accuracy@5": 0.293213828425096,
190
+ "eval_dim_64_cosine_map@100": 0.34719730722747555,
191
+ "eval_dim_64_cosine_mrr@10": 0.2776957197731842,
192
+ "eval_dim_64_cosine_ndcg@10": 0.2881905192612941,
193
+ "eval_dim_64_cosine_precision@1": 0.26696542893725994,
194
+ "eval_dim_64_cosine_precision@10": 0.237708066581306,
195
+ "eval_dim_64_cosine_precision@3": 0.26717883055911223,
196
+ "eval_dim_64_cosine_precision@5": 0.2596670934699104,
197
+ "eval_dim_64_cosine_recall@1": 0.031692344067516816,
198
+ "eval_dim_64_cosine_recall@10": 0.21473974122936995,
199
+ "eval_dim_64_cosine_recall@3": 0.09327455064654774,
200
+ "eval_dim_64_cosine_recall@5": 0.14131510912407144,
201
+ "eval_dim_768_cosine_accuracy@1": 0.37451984635083224,
202
+ "eval_dim_768_cosine_accuracy@10": 0.4539052496798976,
203
+ "eval_dim_768_cosine_accuracy@3": 0.37900128040973113,
204
+ "eval_dim_768_cosine_accuracy@5": 0.40973111395646605,
205
+ "eval_dim_768_cosine_map@100": 0.4672061011440217,
206
+ "eval_dim_768_cosine_mrr@10": 0.38746671950897227,
207
+ "eval_dim_768_cosine_ndcg@10": 0.4004027303245026,
208
+ "eval_dim_768_cosine_precision@1": 0.37451984635083224,
209
+ "eval_dim_768_cosine_precision@10": 0.3318181818181818,
210
+ "eval_dim_768_cosine_precision@3": 0.3734528382415706,
211
+ "eval_dim_768_cosine_precision@5": 0.3632522407170295,
212
+ "eval_dim_768_cosine_recall@1": 0.04413921317349132,
213
+ "eval_dim_768_cosine_recall@10": 0.28955317519546525,
214
+ "eval_dim_768_cosine_recall@3": 0.12896663310051748,
215
+ "eval_dim_768_cosine_recall@5": 0.19376203165061448,
216
+ "eval_runtime": 98.4244,
217
+ "eval_samples_per_second": 0.0,
218
+ "eval_sequential_score": 0.2881905192612941,
219
+ "eval_steps_per_second": 0.0,
220
+ "step": 26
221
+ },
222
+ {
223
+ "epoch": 2.326530612244898,
224
+ "grad_norm": 305.66259765625,
225
+ "learning_rate": 1.9973569167005725e-05,
226
+ "loss": 14.5314,
227
+ "step": 30
228
+ },
229
+ {
230
+ "epoch": 3.0,
231
+ "eval_dim_1024_cosine_accuracy@1": 0.4180537772087068,
232
+ "eval_dim_1024_cosine_accuracy@10": 0.49039692701664533,
233
+ "eval_dim_1024_cosine_accuracy@3": 0.42189500640204863,
234
+ "eval_dim_1024_cosine_accuracy@5": 0.4500640204865557,
235
+ "eval_dim_1024_cosine_map@100": 0.506794523350519,
236
+ "eval_dim_1024_cosine_mrr@10": 0.42985717334308843,
237
+ "eval_dim_1024_cosine_ndcg@10": 0.44178501209869797,
238
+ "eval_dim_1024_cosine_precision@1": 0.4180537772087068,
239
+ "eval_dim_1024_cosine_precision@10": 0.36869398207426374,
240
+ "eval_dim_1024_cosine_precision@3": 0.4163465642338881,
241
+ "eval_dim_1024_cosine_precision@5": 0.4043533930857874,
242
+ "eval_dim_1024_cosine_recall@1": 0.04734422767263886,
243
+ "eval_dim_1024_cosine_recall@10": 0.308531274625124,
244
+ "eval_dim_1024_cosine_recall@3": 0.138064233626932,
245
+ "eval_dim_1024_cosine_recall@5": 0.2069980430010945,
246
+ "eval_dim_128_cosine_accuracy@1": 0.34699103713188223,
247
+ "eval_dim_128_cosine_accuracy@10": 0.4212548015364917,
248
+ "eval_dim_128_cosine_accuracy@3": 0.35147247119078107,
249
+ "eval_dim_128_cosine_accuracy@5": 0.37900128040973113,
250
+ "eval_dim_128_cosine_map@100": 0.4338211299784659,
251
+ "eval_dim_128_cosine_mrr@10": 0.35916305916305874,
252
+ "eval_dim_128_cosine_ndcg@10": 0.37139192897263235,
253
+ "eval_dim_128_cosine_precision@1": 0.34699103713188223,
254
+ "eval_dim_128_cosine_precision@10": 0.3042893725992318,
255
+ "eval_dim_128_cosine_precision@3": 0.34571062740076824,
256
+ "eval_dim_128_cosine_precision@5": 0.3352112676056338,
257
+ "eval_dim_128_cosine_recall@1": 0.04217848526747235,
258
+ "eval_dim_128_cosine_recall@10": 0.2706183968947745,
259
+ "eval_dim_128_cosine_recall@3": 0.12288848071178002,
260
+ "eval_dim_128_cosine_recall@5": 0.18344012521240954,
261
+ "eval_dim_256_cosine_accuracy@1": 0.38348271446862997,
262
+ "eval_dim_256_cosine_accuracy@10": 0.4551856594110115,
263
+ "eval_dim_256_cosine_accuracy@3": 0.3886043533930858,
264
+ "eval_dim_256_cosine_accuracy@5": 0.4206145966709347,
265
+ "eval_dim_256_cosine_map@100": 0.4709582085612654,
266
+ "eval_dim_256_cosine_mrr@10": 0.3957850639188662,
267
+ "eval_dim_256_cosine_ndcg@10": 0.4087462230477571,
268
+ "eval_dim_256_cosine_precision@1": 0.38348271446862997,
269
+ "eval_dim_256_cosine_precision@10": 0.33886043533930854,
270
+ "eval_dim_256_cosine_precision@3": 0.382202304737516,
271
+ "eval_dim_256_cosine_precision@5": 0.3718309859154929,
272
+ "eval_dim_256_cosine_recall@1": 0.04466034705404223,
273
+ "eval_dim_256_cosine_recall@10": 0.2892016292717267,
274
+ "eval_dim_256_cosine_recall@3": 0.1301795023253766,
275
+ "eval_dim_256_cosine_recall@5": 0.19500340584044382,
276
+ "eval_dim_512_cosine_accuracy@1": 0.4065300896286812,
277
+ "eval_dim_512_cosine_accuracy@10": 0.4814340588988476,
278
+ "eval_dim_512_cosine_accuracy@3": 0.41229193341869397,
279
+ "eval_dim_512_cosine_accuracy@5": 0.44494238156209986,
280
+ "eval_dim_512_cosine_map@100": 0.49555759572196095,
281
+ "eval_dim_512_cosine_mrr@10": 0.41950236774180394,
282
+ "eval_dim_512_cosine_ndcg@10": 0.4329095460408428,
283
+ "eval_dim_512_cosine_precision@1": 0.4065300896286812,
284
+ "eval_dim_512_cosine_precision@10": 0.3596030729833547,
285
+ "eval_dim_512_cosine_precision@3": 0.4054630815194195,
286
+ "eval_dim_512_cosine_precision@5": 0.3947503201024327,
287
+ "eval_dim_512_cosine_recall@1": 0.047372341735862133,
288
+ "eval_dim_512_cosine_recall@10": 0.3071623578952262,
289
+ "eval_dim_512_cosine_recall@3": 0.1383106496582531,
290
+ "eval_dim_512_cosine_recall@5": 0.20757258542171747,
291
+ "eval_dim_64_cosine_accuracy@1": 0.3207426376440461,
292
+ "eval_dim_64_cosine_accuracy@10": 0.3725992317541613,
293
+ "eval_dim_64_cosine_accuracy@3": 0.322663252240717,
294
+ "eval_dim_64_cosine_accuracy@5": 0.3405889884763124,
295
+ "eval_dim_64_cosine_map@100": 0.3933467041096336,
296
+ "eval_dim_64_cosine_mrr@10": 0.32884732638253733,
297
+ "eval_dim_64_cosine_ndcg@10": 0.3371953828075091,
298
+ "eval_dim_64_cosine_precision@1": 0.3207426376440461,
299
+ "eval_dim_64_cosine_precision@10": 0.2797055057618438,
300
+ "eval_dim_64_cosine_precision@3": 0.3188220230473751,
301
+ "eval_dim_64_cosine_precision@5": 0.3088348271446863,
302
+ "eval_dim_64_cosine_recall@1": 0.036318765090758674,
303
+ "eval_dim_64_cosine_recall@10": 0.23840960718091392,
304
+ "eval_dim_64_cosine_recall@3": 0.10562189493083342,
305
+ "eval_dim_64_cosine_recall@5": 0.15867125525021739,
306
+ "eval_dim_768_cosine_accuracy@1": 0.41037131882202305,
307
+ "eval_dim_768_cosine_accuracy@10": 0.4833546734955186,
308
+ "eval_dim_768_cosine_accuracy@3": 0.4142125480153649,
309
+ "eval_dim_768_cosine_accuracy@5": 0.44430217669654287,
310
+ "eval_dim_768_cosine_map@100": 0.500478306774528,
311
+ "eval_dim_768_cosine_mrr@10": 0.4224889742495374,
312
+ "eval_dim_768_cosine_ndcg@10": 0.4349862241563486,
313
+ "eval_dim_768_cosine_precision@1": 0.41037131882202305,
314
+ "eval_dim_768_cosine_precision@10": 0.36165172855313704,
315
+ "eval_dim_768_cosine_precision@3": 0.4086641058472044,
316
+ "eval_dim_768_cosine_precision@5": 0.3969270166453265,
317
+ "eval_dim_768_cosine_recall@1": 0.047186779325657804,
318
+ "eval_dim_768_cosine_recall@10": 0.30540044861465576,
319
+ "eval_dim_768_cosine_recall@3": 0.1375709294981283,
320
+ "eval_dim_768_cosine_recall@5": 0.20603724780478358,
321
+ "eval_runtime": 98.5908,
322
+ "eval_samples_per_second": 0.0,
323
+ "eval_sequential_score": 0.3371953828075091,
324
+ "eval_steps_per_second": 0.0,
325
+ "step": 39
326
+ }
327
+ ],
328
+ "logging_steps": 10,
329
+ "max_steps": 240,
330
+ "num_input_tokens_seen": 0,
331
+ "num_train_epochs": 20,
332
+ "save_steps": 500,
333
+ "stateful_callbacks": {
334
+ "EarlyStoppingCallback": {
335
+ "args": {
336
+ "early_stopping_patience": 2,
337
+ "early_stopping_threshold": 0.0
338
+ },
339
+ "attributes": {
340
+ "early_stopping_patience_counter": 0
341
+ }
342
+ },
343
+ "TrainerControl": {
344
+ "args": {
345
+ "should_epoch_stop": false,
346
+ "should_evaluate": false,
347
+ "should_log": false,
348
+ "should_save": true,
349
+ "should_training_stop": false
350
+ },
351
+ "attributes": {}
352
+ }
353
+ },
354
+ "total_flos": 0.0,
355
+ "train_batch_size": 8,
356
+ "trial_name": null,
357
+ "trial_params": null
358
+ }
checkpoint-39/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd906d94b017c1a7fa871b608776d19ecf4218c10c253401fe78ba8ce84435be
3
+ size 6097
checkpoint-52/1_Pooling/config.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "word_embedding_dimension": 1024,
3
+ "pooling_mode_cls_token": false,
4
+ "pooling_mode_mean_tokens": true,
5
+ "pooling_mode_max_tokens": false,
6
+ "pooling_mode_mean_sqrt_len_tokens": false,
7
+ "pooling_mode_weightedmean_tokens": false,
8
+ "pooling_mode_lasttoken": false,
9
+ "include_prompt": true
10
+ }
checkpoint-52/README.md ADDED
@@ -0,0 +1,1640 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ language:
3
+ - en
4
+ license: apache-2.0
5
+ tags:
6
+ - sentence-transformers
7
+ - sentence-similarity
8
+ - feature-extraction
9
+ - dense
10
+ - generated_from_trainer
11
+ - dataset_size:391
12
+ - loss:MatryoshkaLoss
13
+ - loss:MultipleNegativesRankingLoss
14
+ base_model: intfloat/multilingual-e5-large
15
+ widget:
16
+ - source_sentence: What is the responsibility of assisting and advising the data subjects
17
+ in exercising their rights?
18
+ sentences:
19
+ - '1.Personal data shall be: (a) processed lawfully, fairly and in a transparent
20
+ manner in relation to the data subject (‘lawfulness, fairness and transparency’);
21
+ (b) collected for specified, explicit and legitimate purposes and not further
22
+ processed in a manner that is incompatible with those purposes; further processing
23
+ for archiving purposes in the public interest, scientific or historical research
24
+ purposes or statistical purposes shall, in accordance with Article 89(1), not
25
+ be considered to be incompatible with the initial purposes (‘purpose limitation’);
26
+ (c) adequate, relevant and limited to what is necessary in relation to the purposes
27
+ for which they are processed (‘data minimisation’); (d) accurate and, where necessary,
28
+ kept up to date; every reasonable step must be taken to ensure that personal data
29
+ that are inaccurate, having regard to the purposes for which they are processed,
30
+ are erased or rectified without delay (‘accuracy’); 4.5.2016 L 119/35 (1) Directive
31
+ (EU) 2015/1535 of the European Parliament and of the Council of 9 September 2015
32
+ laying down a procedure for the provision of information in the field of technical
33
+ regulations and of rules on Information Society services (OJ L 241, 17.9.2015,
34
+ p. 1). (e) kept in a form which permits identification of data subjects for no
35
+ longer than is necessary for the purposes for which the personal data are processed;
36
+ personal data may be stored for longer periods insofar as the personal data will
37
+ be processed solely for archiving purposes in the public interest, scientific
38
+ or historical research purposes or statistical purposes in accordance with Article
39
+ 89(1) subject to implementation of the appropriate technical and organisational
40
+ measures required by this Regulation in order to safeguard the rights and freedoms
41
+ of the data subject (‘storage limitation’); (f) processed in a manner that ensures
42
+ appropriate security of the personal data, including protection against unauthorised
43
+ or unlawful processing and against accidental loss, destruction or damage, using
44
+ appropriate technical or organisational measures (‘integrity and confidentiality’).
45
+
46
+ 2.The controller shall be responsible for, and be able to demonstrate compliance
47
+ with, paragraph 1 (‘accountability’).'
48
+ - '1.A transfer of personal data to a third country or an international organisation
49
+ may take place where the Commission has decided that the third country, a territory
50
+ or one or more specified sectors within that third country, or the international
51
+ organisation in question ensures an adequate level of protection. Such a transfer
52
+ shall not require any specific authorisation.
53
+
54
+ 2.When assessing the adequacy of the level of protection, the Commission shall,
55
+ in particular, take account of the following elements: (a) the rule of law, respect
56
+ for human rights and fundamental freedoms, relevant legislation, both general
57
+ and sectoral, including concerning public security, defence, national security
58
+ and criminal law and the access of public authorities to personal data, as well
59
+ as the implementation of such legislation, data protection rules, professional
60
+ rules and security measures, including rules for the onward transfer of personal
61
+ data to another third country or international organisation which are complied
62
+ with in that country or international organisation, case-law, as well as effective
63
+ and enforceable data subject rights and effective administrative and judicial
64
+ redress for the data subjects whose personal data are being transferred; (b) the
65
+ existence and effective functioning of one or more independent supervisory authorities
66
+ in the third country or to which an international organisation is subject, with
67
+ responsibility for ensuring and enforcing compliance with the data protection
68
+ rules, including adequate enforcement powers, for assisting and advising the data
69
+ subjects in exercising their rights and for cooperation with the supervisory authorities
70
+ of the Member States; and (c) the international commitments the third country
71
+ or international organisation concerned has entered into, or other obligations
72
+ arising from legally binding conventions or instruments as well as from its participation
73
+ in multilateral or regional systems, in particular in relation to the protection
74
+ of personal data.
75
+
76
+ 3.The Commission, after assessing the adequacy of the level of protection, may
77
+ decide, by means of implementing act, that a third country, a territory or one
78
+ or more specified sectors within a third country, or an international organisation
79
+ ensures an adequate level of protection within the meaning of paragraph 2 of this
80
+ Article. The implementing act shall provide for a mechanism for a periodic review,
81
+ at least every four years, which shall take into account all relevant developments
82
+ in the third country or international organisation. The implementing act shall
83
+ specify its territorial and sectoral application and, where applicable, identify
84
+ the supervisory authority or authorities referred to in point (b) of paragraph
85
+ 2 of this Article. The implementing act shall be adopted in accordance with the
86
+ examination procedure referred to in Article 93(2).
87
+
88
+ 4.The Commission shall, on an ongoing basis, monitor developments in third countries
89
+ and international organisations that could affect the functioning of decisions
90
+ adopted pursuant to paragraph 3 of this Article and decisions adopted on the basis
91
+ of Article 25(6) of Directive 95/46/EC.
92
+
93
+ 5.The Commission shall, where available information reveals, in particular following
94
+ the review referred to in paragraph 3 of this Article, that a third country, a
95
+ territory or one or more specified sectors within a third country, or an international
96
+ organisation no longer ensures an adequate level of protection within the meaning
97
+ of paragraph 2 of this Article, to the extent necessary, repeal, amend or suspend
98
+ the decision referred to in paragraph 3 of this Article by means of implementing
99
+ acts without retro-active effect. Those implementing acts shall be adopted in
100
+ accordance with the examination procedure referred to in Article 93(2). On duly
101
+ justified imperative grounds of urgency, the Commission shall adopt immediately
102
+ applicable implementing acts in accordance with the procedure referred to in Article
103
+ 93(3).
104
+
105
+ 6.The Commission shall enter into consultations with the third country or international
106
+ organisation with a view to remedying the situation giving rise to the decision
107
+ made pursuant to paragraph 5
108
+
109
+ 7.A decision pursuant to paragraph 5 of this Article is without prejudice to transfers
110
+ of personal data to the third country, a territory or one or more specified sectors
111
+ within that third country, or the international organisation in question pursuant
112
+ to Articles 46 to 49
113
+
114
+ 8.The Commission shall publish in the Official Journal of the European Union and
115
+ on its website a list of the third countries, territories and specified sectors
116
+ within a third country and international organisations for which it has decided
117
+ that an adequate level of protection is or is no longer ensured.
118
+
119
+ 9.Decisions adopted by the Commission on the basis of Article 25(6) of Directive
120
+ 95/46/EC shall remain in force until amended, replaced or repealed by a Commission
121
+ Decision adopted in accordance with paragraph 3 or 5 of this Article.'
122
+ - The legal systems of Denmark and Estonia do not allow for administrative fines
123
+ as set out in this Regulation. The rules on administrative fines may be applied
124
+ in such a manner that in Denmark the fine is imposed by competent national courts
125
+ as a criminal penalty and in Estonia the fine is imposed by the supervisory authority
126
+ in the framework of a misdemeanour procedure, provided that such an application
127
+ of the rules in those Member States has an equivalent effect to administrative
128
+ fines imposed by supervisory authorities. Therefore the competent national courts
129
+ should take into account the recommendation by the supervisory authority initiating
130
+ the fine. In any event, the fines imposed should be effective, proportionate and
131
+ dissuasive.
132
+ - source_sentence: Is the fine mandatory for the described offense?
133
+ sentences:
134
+ - "1.Each supervisory authority shall ensure that the imposition of administrative\
135
+ \ fines pursuant to this Article in respect of infringements of this Regulation\
136
+ \ referred to in paragraphs 4, 5 and 6 shall in each individual case be effective,\
137
+ \ proportionate and dissuasive.\n2.Administrative fines shall, depending on the\
138
+ \ circumstances of each individual case, be imposed in addition to, or instead\
139
+ \ of, measures referred to in points (a) to (h) and (j) of Article 58(2). When\
140
+ \ deciding whether to impose an administrative fine and deciding on the amount\
141
+ \ of the administrative fine in each individual case due regard shall be given\
142
+ \ to the following: (a) the nature, gravity and duration of the infringement\
143
+ \ taking into account the nature scope or purpose of the processing concerned\
144
+ \ as well as the number of data subjects affected and the level of damage suffered\
145
+ \ by them; (b) the intentional or negligent character of the infringement; (c)\
146
+ \ any action taken by the controller or processor to mitigate the damage suffered\
147
+ \ by data subjects; (d) the degree of responsibility of the controller or processor\
148
+ \ taking into account technical and organisational measures implemented by them\
149
+ \ pursuant to Articles 25 and 32; (e) any relevant previous infringements by\
150
+ \ the controller or processor; (f) the degree of cooperation with the supervisory\
151
+ \ authority, in order to remedy the infringement and mitigate the possible adverse\
152
+ \ effects of the infringement; (g) the categories of personal data affected by\
153
+ \ the infringement; (h) the manner in which the infringement became known to\
154
+ \ the supervisory authority, in particular whether, and if so to what extent,\
155
+ \ the controller or processor notified the infringement; (i) where measures referred\
156
+ \ to in Article 58(2) have previously been ordered against the controller or processor\
157
+ \ concerned with regard to the same subject-matter, compliance with those measures;\
158
+ \ (j) adherence to approved codes of conduct pursuant to Article 40 or approved\
159
+ \ certification mechanisms pursuant to Article 42; and (k) any other aggravating\
160
+ \ or mitigating factor applicable to the circumstances of the case, such as financial\
161
+ \ benefits gained, or losses avoided, directly or indirectly, from the infringement.\n\
162
+ 3.If a controller or processor intentionally or negligently, for the same or linked\
163
+ \ processing operations, infringes several provisions of this Regulation, the\
164
+ \ total amount of the administrative fine shall not exceed the amount specified\
165
+ \ for the gravest infringement.\n4.Infringements of the following provisions shall,\
166
+ \ in accordance with paragraph 2, be subject to administrative fines up to 10\
167
+ \ 000 000 EUR, or in the case of an undertaking, up to 2 % of the total worldwide\
168
+ \ annual turnover of the preceding financial year, whichever is higher: (a) the\
169
+ \ obligations of the controller and the processor pursuant to Articles 8, 11,\
170
+ \ 25 to 39 and 42 and 43; (b) the obligations of the certification body pursuant\
171
+ \ to Articles 42 and 43; (c) the obligations of the monitoring body pursuant\
172
+ \ to Article 41(4). 4.5.2016 L 119/82 \n5.Infringements of the following provisions\
173
+ \ shall, in accordance with paragraph 2, be subject to administrative fines up\
174
+ \ to 20 000 000 EUR, or in the case of an undertaking, up to 4 % of the total\
175
+ \ worldwide annual turnover of the preceding financial year, whichever is higher:\
176
+ \ (a) the basic principles for processing, including conditions for consent,\
177
+ \ pursuant to Articles 5, 6, 7 and 9; (b) the data subjects' rights pursuant\
178
+ \ to Articles 12 to 22; (c) the transfers of personal data to a recipient in\
179
+ \ a third country or an international organisation pursuant to Articles 44 to\
180
+ \ 49; (d) any obligations pursuant to Member State law adopted under Chapter\
181
+ \ IX; (e) non-compliance with an order or a temporary or definitive limitation\
182
+ \ on processing or the suspension of data flows by the supervisory authority pursuant\
183
+ \ to Article 58(2) or failure to provide access in violation of Article 58(1).\n\
184
+ 6.Non-compliance with an order by the supervisory authority as referred to in\
185
+ \ Article 58(2) shall, in accordance with paragraph 2 of this Article, be subject\
186
+ \ to administrative fines up to 20 000 000 EUR, or in the case of an undertaking,\
187
+ \ up to 4 % of the total worldwide annual turnover of the preceding financial\
188
+ \ year, whichever is higher.\n7.Without prejudice to the corrective powers of\
189
+ \ supervisory authorities pursuant to Article 58(2), each Member State may lay\
190
+ \ down the rules on whether and to what extent administrative fines may be imposed\
191
+ \ on public authorities and bodies established in that Member State.\n8.The exercise\
192
+ \ by the supervisory authority of its powers under this Article shall be subject\
193
+ \ to appropriate procedural safeguards in accordance with Union and Member State\
194
+ \ law, including effective judicial remedy and due process.\n9.Where the legal\
195
+ \ system of the Member State does not provide for administrative fines, this Article\
196
+ \ may be applied in such a manner that the fine is initiated by the competent\
197
+ \ supervisory authority and imposed by competent national courts, while ensuring\
198
+ \ that those legal remedies are effective and have an equivalent effect to the\
199
+ \ administrative fines imposed by supervisory authorities. In any event, the fines\
200
+ \ imposed shall be effective, proportionate and dissuasive. Those Member States\
201
+ \ shall notify to the Commission the provisions of their laws which they adopt\
202
+ \ pursuant to this paragraph by 25 May 2018 and, without delay, any subsequent\
203
+ \ amendment law or amendment affecting them."
204
+ - "Court (Civil/Criminal): Criminal \nProvisions: Article 386 of the Penal Code\
205
+ \ \nTime of commission of the act: \nResult (innocent, guilty): \nReasoning:\
206
+ \ Conviction for computer fraud committed repeatedly and professionally with a\
207
+ \ total benefit and damage exceeding €30,000. According to the majority opinion,\
208
+ \ the charge is substantiated in both its objective and subjective aspects, and\
209
+ \ the defendant must be declared guilty of the aforementioned criminal acts of\
210
+ \ fraud by means of a computer, committed repeatedly by a perpetrator acting professionally,\
211
+ \ where the total financial benefit and corresponding damage exceed the amount\
212
+ \ of €30,000, as well as for repeated embezzlement.\n\nFacts: The defendant accessed\
213
+ \ a website using a computer, employing, without the knowledge and consent of\
214
+ \ the complainants, the access codes for the electronic management system of the\
215
+ \ bank accounts held by the complainants at a Bank, and transferred money through\
216
+ \ electronically transmitted orders from the complainants' accounts to her own\
217
+ \ account. Specifically, during the period from June 2007 to June 2008, after\
218
+ \ unlawfully acquiring the aforementioned STICK containing the access codes, she\
219
+ \ accessed a website maintained by ..., using, without the complainants' knowledge\
220
+ \ (without their consent or approval), the access codes for the electronic management\
221
+ \ system of the bank accounts held at the aforementioned Bank, transferring through\
222
+ \ electronically transmitted orders to the joint account number ... of the complainants\
223
+ \ from bank accounts numbered ..., ..., and ..., the total amount of €55,710,\
224
+ \ as detailed in the orders, and subsequently, using an ATM card, she gradually\
225
+ \ withdrew from the aforementioned account number ..., the total amount of €55,710,\
226
+ \ making 84 individual withdrawals from automatic teller machines. In addition,\
227
+ \ the defendant, during the period from June 2008 to November 2008, in the same\
228
+ \ exact manner (through the electronic management system of the bank accounts),\
229
+ \ transferred through electronically transmitted orders to account number ...,\
230
+ \ which she had opened at ..., from the complainants' bank accounts numbered ...,\
231
+ \ ..., ..., ..., and ..., the total amount of €73,942, as detailed in the orders\
232
+ \ regarding the transfers of these amounts. Furthermore, during the period from\
233
+ \ February 2008 to November 2008, through multiple acts constituting a continuation\
234
+ \ of the crime, although she had received from the first complainant ... the amounts\
235
+ \ of €695.04, €695.04, and €845.04, in order to pay his insurance contributions\
236
+ \ to O.A.E.E. for the periods of January-February 2008, May-June 2008, and September-October\
237
+ \ 2008, as well as the amounts of €250 and €280, in order to settle credit card\
238
+ \ bills for \"...\", respectively, and from the second complainant ... she received\
239
+ \ the amounts of €283.64, €419.26, and €385.38, to pay the latter's insurance\
240
+ \ contributions to O.A.E.E. for the periods of July-August 2007, May-June 2008,\
241
+ \ September-October 2008, and November-December 2008, as well as the amount of\
242
+ \ €1,888.03 for the settlement of VAT, she never paid the above amounts to settle\
243
+ \ the aforementioned obligations, nor did she return them to the complainants,\
244
+ \ despite being urged to do so, but incorporated them into her assets and wrongfully\
245
+ \ appropriated them. The defendant denies the charges against her and claims that\
246
+ \ the withdrawals were made by the second complainant and that all the amounts\
247
+ \ transferred to her account were transferred to cover the company's expenses\
248
+ \ and their personal expenses, due to her cohabitation with the second complainant\
249
+ \ and with his knowledge, with whom she intended to marry. However, this claim\
250
+ \ is not supported by any evidence; on the contrary, it emerged that she conducted\
251
+ \ the transfers of the money and withdrawals without the complainants' knowledge,\
252
+ \ and when she learned that they had been informed about the account movements\
253
+ \ and met at the Bank, her behavior and demeanor indicated guilt, according to\
254
+ \ the testimony of the prosecution witness ..., an employee of the Pangrati branch\
255
+ \ of ..., who saw her on the same day at the aforementioned Bank when she met\
256
+ \ with the complainants. The ongoing act of fraud using a computer was committed\
257
+ \ by the defendant professionally, as evidenced by her repeated commission of\
258
+ \ the act, as well as the infrastructure she had established with the intent of\
259
+ \ repeated commission, based on a specific plan and methodology (transferring\
260
+ \ smaller amounts to a joint account of the complainants from the remaining accounts\
261
+ \ of the latter, and then withdrawing the transferred amounts with an ATM card,\
262
+ \ as well as directly transferring smaller amounts from the complainants' accounts\
263
+ \ to her personal account she had opened at the same bank), indicating her purpose\
264
+ \ to generate income, with the financial benefit she gained, corresponding to\
265
+ \ the complainants' damage, exceeding a total of €30,000."
266
+ - 'Any person who intentionally, through the technology of information and communication,
267
+ suggests an encounter between an adult and a minor under the age of fifteen, aiming
268
+ at the commitment of the crimes described in par. 1 and 2 of art. 339 and 348Α,
269
+ is sentenced to an imprisonment of at least two years and a fine of fifty to two
270
+ hundred thousand Euros, when the proposal is followed by further actions which
271
+ lead in the commitment of such crimes.
272
+
273
+ '
274
+ - source_sentence: Who should provide authorisation when safeguards are detailed in
275
+ non-legally binding administrative arrangements?
276
+ sentences:
277
+ - In the absence of an adequacy decision, the controller or processor should take
278
+ measures to compensate for the lack of data protection in a third country by way
279
+ of appropriate safeguards for the data subject. Such appropriate safeguards may
280
+ consist of making use of binding corporate rules, standard data protection clauses
281
+ adopted by the Commission, standard data protection clauses adopted by a supervisory
282
+ authority or contractual clauses authorised by a supervisory authority. Those
283
+ safeguards should ensure compliance with data protection requirements and the
284
+ rights of the data subjects appropriate to processing within the Union, including
285
+ the availability of enforceable data subject rights and of effective legal remedies,
286
+ including to obtain effective administrative or judicial redress and to claim
287
+ compensation, in the Union or in a third country. They should relate in particular
288
+ to compliance with the general principles relating to personal data processing,
289
+ the principles of data protection by design and by default. Transfers may also
290
+ be carried out by public authorities or bodies with public authorities or bodies
291
+ in third countries or with international organisations with corresponding duties
292
+ or functions, including on the basis of provisions to be inserted into administrative
293
+ arrangements, such as a memorandum of understanding, providing for enforceable
294
+ and effective rights for data subjects. Authorisation by the competent supervisory
295
+ authority should be obtained when the safeguards are provided for in administrative
296
+ arrangements that are not legally binding.
297
+ - '**Court (Civil/Criminal): Civil**
298
+
299
+
300
+ **Provisions:**
301
+
302
+
303
+ **Time of commission of the act:**
304
+
305
+
306
+ **Outcome (not guilty, guilty):**
307
+
308
+
309
+ **Rationale:**
310
+
311
+
312
+ **Facts:**
313
+
314
+ The plaintiff holds credit card number ............ with the defendant banking
315
+ corporation. Based on the application for alternative networks dated 19/7/2015
316
+ with number ......... submitted at a branch of the defendant, he was granted access
317
+ to the electronic banking service (e-banking) to conduct banking transactions
318
+ (debit, credit, updates, payments) remotely. On 30/11/2020, the plaintiff fell
319
+ victim to electronic fraud through the "phishing" method, whereby an unknown perpetrator
320
+ managed to withdraw a total amount of €3,121.75 from the aforementioned credit
321
+ card. Specifically, the plaintiff received an email at 1:35 PM on 29/11/2020 from
322
+ sender ...... with address ........, informing him that due to an impending system
323
+ change, he needed to verify the mobile phone number linked to the credit card,
324
+ urging him to complete the verification process within the next 24 hours by following
325
+ a link titled ........; otherwise, his account would be locked for security reasons.
326
+ The plaintiff read this email on the afternoon of 30 November 2020 and, believing
327
+ it was from the defendant, followed the instructions and proceeded via the provided
328
+ link to a website that was identical (a clone) to that of the defendant. On this
329
+ page, he was asked to enter the six-digit security code (.........) that had just
330
+ been sent to his mobile phone by the defendant at 3:41 PM, with the note that
331
+ it was an activation code for his ........ card at ........., which he entered.
332
+
333
+
334
+ Subsequently, the plaintiff received, according to his statements, a new email
335
+ (not submitted), which requested him to enter the details of the aforementioned
336
+ credit card, specifically the name of the cardholder and the card number, not
337
+ the PIN, which he also entered, convinced that he was within the online environment
338
+ of the defendant. Then, at 3:47 PM, he received a message on his mobile phone
339
+ from the defendant containing the exact same content as the one he received at
340
+ 3:41 PM, while at 3:50 PM he received a message stating that the activation of
341
+ his ......... card at ....... had been completed. Once the plaintiff read this,
342
+ he became concerned that something was not right, and immediately called (at 4:41
343
+ PM) the defendant''s call center to inform them. There, the employees, with whom
344
+ he finally connected at 5:04 PM due to high call center volume, advised him to
345
+ delete the relevant emails, cancel his credit card, change his access passwords
346
+ for the service, and submit a dispute request regarding the conducted transactions.
347
+ The plaintiff electronically sent this request to the defendant, disputing the
348
+ detailed transactions amounting to €3,121.75, which were conducted on 30/11/2020
349
+ during the time frame of 16:37:45-16:43:34 PM, arguing that he had neither performed
350
+ them himself nor authorized anyone else to do so. The plaintiff specifically disputed
351
+ the following transactions, as evidenced by the account activity of the disputed
352
+ credit card during the aforementioned timeframe: a) transaction number .........
353
+ amounting to €150.62 conducted on 30/11/2020 at 4:43:34 PM, b) transaction number
354
+ ........ amounting to €293.20 conducted on 30/11/2020 at 4:42:40 PM, c) transaction
355
+ number ............ amounting to €295.21 conducted on 30/11/2020 at 4:42:10 PM,
356
+ d) transaction number .......... amounting to €299.22 conducted on 30/11/2020
357
+ at 4:41:31 PM, e) transaction number ........ amounting to €297.21 conducted on
358
+ 30/11/2020 at 4:41:01 PM, f) transaction number ........ amounting to €299.22
359
+ conducted on 30/11/2020 at 4:40:27 PM, g) transaction number ....... amounting
360
+ to €299.22 conducted on 30/11/2020 at 4:39:55 PM, h) transaction number ......
361
+ amounting to €299.22 conducted on 30/11/2020 at 4:39:22 PM, i) transaction number
362
+ ......... amounting to €297.22 conducted on 30/11/2020 at 4:38:52 PM, j) transaction
363
+ number ......... amounting to €295.21 conducted on 30/11/2020 at 4:38:17 PM, and
364
+ k) transaction number ......... amounting to €296.21 conducted on 30/11/2020 at
365
+ 4:37:45 PM. In its response letter dated 21/12/2020, the defendant denied responsibility
366
+ for the costs of the aforementioned transactions, placing the entire blame on
367
+ the plaintiff for the leak of his card details and security code to the fraudulent
368
+ page. The plaintiff, completely denying any fault for the conducted transactions,
369
+ repeatedly contacted the defendant, both by phone and via email (see emails dated
370
+ 15/1/2021 and 11/2/2021), while on 2/3/2021, he electronically sent a report dated
371
+ 1/03/2021 to the Consumer Advocate’s email address, recounting the events and
372
+ requesting that the aforementioned Independent Authority intervene to have the
373
+ disputed debt canceled. In its letter with reference number ...../27.04.2021,
374
+ the aforementioned Independent Authority informed the plaintiff that the case
375
+ was outside its mediating role and was therefore archived. Subsequently, the plaintiff
376
+ sent the defendant on 5/3/2021 his extrajudicial statement dated 4/3/2021, calling
377
+ upon it to fully cancel the debt of €3,121.75 that had been unjustly incurred
378
+ against him within two days and to immediately instruct the representatives of
379
+ the collection agency working with it to cease contacting him regarding the disputed
380
+ case. The defendant sent the plaintiff a message on his mobile phone on 20/04/2021
381
+ informing him that his case was still being processed due to lengthy operational
382
+ requirements, while on 23/04/2021, via email, it informed him that considering
383
+ their good cooperation and his efforts to keep them updated, it had reviewed his
384
+ case and decided to refund him the amounts of the transactions that were conducted
385
+ after his contact with their representatives on 30/11/2020 at 4:41 PM, totaling
386
+ €1,038.25, specifically the following: a) transaction of €150.62 conducted on
387
+ 30/11/2020 at 4:43 PM, b) transaction of €295.21 conducted on 30/11/2020 at 4:42
388
+ PM, c) transaction of €293.20 conducted on 30/11/2020 at 4:42 PM, and d) transaction
389
+ of €299.22 conducted on 30/11/2020 at 4:41 PM. Beyond this, the defendant refused
390
+ to refund the plaintiff the amount of the remaining transactions conducted on
391
+ 30/11/2020, totaling €2,376.08 (and not €2,376.48 as incorrectly stated by the
392
+ plaintiff in his lawsuit), which the plaintiff ultimately fully paid, transferring
393
+ €2,342.77 to the defendant on 7/06/2021 and €33.31 on 15/06/2021 (see related
394
+ deposit receipts).'
395
+ - "Court (Civil/Criminal): Civil \nProvisions: \nTime of commission: July 21,\
396
+ \ 2020 \nOutcome (innocent, guilty): Partially accepts the lawsuit against the\
397
+ \ Bank. \nReasoning: Alongside the bank's responsibility for the ineffective\
398
+ \ protection of its systems against the continually changing and evolving methods\
399
+ \ of deception that affect them, leading to financial damage for its clients who\
400
+ \ entrusted it, which constitutes a breach of its contractual obligations and\
401
+ \ generates contractual liability, there is also the personal responsibility of\
402
+ \ the plaintiff, who did not safeguard, as required, his sensitive banking information\
403
+ \ and disclosed it when he should not have, even though the message that misled\
404
+ \ him came from the context of an SMS conversation with the defendant, even if\
405
+ \ he was directed through the link to a website resembling that of the defendant,\
406
+ \ because he overlooked the relevant instructions and strict recommendations of\
407
+ \ the bank, violating his duty to safeguard them. Therefore, in light of the above,\
408
+ \ the court must partially accept the lawsuit regarding its substance, and with\
409
+ \ the defendant's objection regarding the plaintiff's fault being accepted at\
410
+ \ a rate of 1/6 of the damage suffered, it must be acknowledged – following the\
411
+ \ admissible and lawful modification of the lawsuit's request from a dismissive\
412
+ \ to a declaratory nature as proposed – the defendant's obligation to pay him\
413
+ \ the amount of €2,500, with legal interest, as specified in the operative part.\
414
+ \ Regarding the request to recognize the defendant's obligation to pay him €1,000\
415
+ \ as compensation for the moral damage he suffered from the fraud committed against\
416
+ \ him, this is deemed dismissible as unfounded, because the defendant's liability\
417
+ \ is contractual and not tortious, and there are no special conditions justifying\
418
+ \ the treatment of this specific non-contractual behavior as tortious, which\
419
+ \ would make it possible to attribute moral damage to the plaintiff from the defendant. \
420
+ \ \nFacts: The plaintiff maintained a joint bank account with his wife and had\
421
+ \ access to the defendant bank's e-banking. On July 21, 2020, following successful\
422
+ \ identification via the agreed-upon credentials (userID, password, OTP), a request\
423
+ \ was made to change the mobile phone number for receiving OTPs, which was completed\
424
+ \ through the bank's platform. However, this change was not made by the plaintiff\
425
+ \ himself, but by a third party who had previously deceived him using the phishing\
426
+ \ method, obtaining his banking details through a misleading SMS. Following the\
427
+ \ phone number change, on July 31, 2020, a transfer of €3,000 was made to a third\
428
+ \ party's account. The transaction was conducted using the necessary credentials\
429
+ \ and OTP sent to the new mobile phone, resulting in the bank considering the\
430
+ \ order valid and executing it. Once the plaintiff realized the transfer, he immediately\
431
+ \ contacted the bank and informed them that he had not given such an order himself.\
432
+ \ Despite the initial assurance that the funds could be recovered, they were ultimately\
433
+ \ not returned, as they had been transferred to a third party's account, and the\
434
+ \ bank denied any responsibility for the loss."
435
+ - source_sentence: When will the periodic review mechanism be conducted?
436
+ sentences:
437
+ - The Commission should monitor the functioning of decisions on the level of protection
438
+ in a third country, a territory or specified sector within a third country, or
439
+ an international organisation, and monitor the functioning of decisions adopted
440
+ on the basis of Article 25(6) or Article 26(4) of Directive 95/46/EC. In its adequacy
441
+ decisions, the Commission should provide for a periodic review mechanism of their
442
+ functioning. That periodic review should be conducted in consultation with the
443
+ third country or international organisation in question and take into account
444
+ all relevant developments in the third country or international organisation.
445
+ For the purposes of monitoring and of carrying out the periodic reviews, the Commission
446
+ should take into consideration the views and findings of the European Parliament
447
+ and of the Council as well as of other relevant bodies and sources. The Commission
448
+ should evaluate, within a reasonable time, the functioning of the latter decisions
449
+ and report any relevant findings to the Committee within the meaning of Regulation
450
+ (EU) No 182/2011 of the European Parliament and of the Council (1) as established
451
+ under this Regulation, to the European Parliament and to the Council.
452
+ - "**Court (Civil/Criminal): Civil** \n**Provisions:** \n**Time of commission\
453
+ \ of the act:** \n**Outcome (not guilty, guilty):** \n**Reasoning:** Partially\
454
+ \ accepts the lawsuit. \n**Facts:** The plaintiff, who works as a lawyer, maintains\
455
+ \ a savings account with the defendant banking corporation under account number\
456
+ \ GR.............. Pursuant to a contract dated June 11, 2010, established in\
457
+ \ Thessaloniki between the defendant and the plaintiff, the plaintiff was granted\
458
+ \ access to the electronic banking system (e-banking) to conduct banking transactions\
459
+ \ remotely. On October 10, 2020, the plaintiff fell victim to electronic fraud\
460
+ \ through the \"phishing\" method, whereby an unknown perpetrator managed to extract\
461
+ \ and transfer €3,000.00 from the plaintiff’s account to another account of the\
462
+ \ same bank. Specifically, on that day at 6:51 a.m., the plaintiff received an\
463
+ \ email from the sender \".........\", with the address ..........., informing\
464
+ \ him that his debit card had been suspended and that online payments and cash\
465
+ \ withdrawals could not be made until the issue was resolved. The email urged\
466
+ \ him to confirm his details within the next 72 hours by following a link titled\
467
+ \ \"card activation.\" \nThe plaintiff read the above email on his mobile phone\
468
+ \ around 8:00 a.m., and believing it came from the defendant, he followed the\
469
+ \ instructions and accessed a website that was identical (a clone) to that of\
470
+ \ the defendant. On this page, he was asked to enter his login credentials to\
471
+ \ connect to the service, which he did, and he was subsequently asked to input\
472
+ \ his debit card details for the alleged activation, which he also provided. Then,\
473
+ \ to complete the process, a number was sent to his mobile phone at 8:07 a.m.\
474
+ \ from the sender ........, which he entered, and two minutes later he received\
475
+ \ a message from the same sender in English stating that the quick access code\
476
+ \ had been activated on his mobile. A few minutes later, at 8:18 a.m., he received\
477
+ \ an email from the defendant informing him of the transfer of €3,000.00 from\
478
+ \ his account to account number GR ........... held at the same bank, with the\
479
+ \ beneficiary's details being .......... As soon as the plaintiff read this, he\
480
+ \ immediately called the defendant's call center and canceled his debit card,\
481
+ \ the access codes for the service ......., and locked the application ..........\
482
+ \ At the same time, he verbally submitted a request to dispute and cancel the\
483
+ \ contested transaction, and in a subsequent phone call, he also canceled his\
484
+ \ credit card. On the same day, he also sent an email to the defendant informing\
485
+ \ them in writing of the above and requesting the cancellation of the transaction\
486
+ \ and the return of the amount of €3,000.00 to his account, as this transfer was\
487
+ \ not made by him but by an unknown perpetrator through electronic fraud and was\
488
+ \ not approved by him. It should also be noted that the plaintiff, as the sole\
489
+ \ beneficiary according to the aforementioned contract for using the defendant's\
490
+ \ Internet Banking service, never received any update via SMS or the VIBER application\
491
+ \ from the bank regarding the transaction details before its completion, nor did\
492
+ \ he receive a one-time code (OTP) to approve the contested transaction. He subsequently\
493
+ \ filed a complaint against unknown persons at the Cyber Crime Division for the\
494
+ \ crime of fraud. The defendant sent an email to the plaintiff on October 16,\
495
+ \ 2020, informing him that his request had been forwarded to the appropriate department\
496
+ \ of the bank for investigation, stating that the bank would never send him an\
497
+ \ email or SMS asking him to enter his personal data and that as of October 7,\
498
+ \ 2020, there was a notice posted for its customers regarding malicious attempts\
499
+ \ to steal personal data in the \"Our News\" section on ....... A month after\
500
+ \ the disputed incident, on November 10, 2020, an amount of €2,296.82 was transferred\
501
+ \ to the plaintiff's account from the account to which the fraudulent credit had\
502
+ \ been made. The plaintiff immediately sent an email to the defendant asking to\
503
+ \ be informed whether this transfer was a return of part of the amount that had\
504
+ \ been illegally withdrawn from his account and requested the return of the remaining\
505
+ \ amount of €703.18. In its response dated January 13, 2021, the defendant confirmed\
506
+ \ that the aforementioned amount indeed came from the account to which the fraudulent\
507
+ \ credit had been made, following a freeze of that account initiated by the defendant\
508
+ \ during the investigation of the incident, but refused to return the remaining\
509
+ \ amount, claiming it bore no responsibility for the leak of the personal codes\
510
+ \ to third parties, according to the terms of the service contract established\
511
+ \ between them. \nFrom the entirety of the evidence presented to the court, there\
512
+ \ is no indication of the authenticity of the contested transaction, as the plaintiff\
513
+ \ did not give his consent for the execution of the transfer of the amount of\
514
+ \ €3,000.00, especially in light of the provision in Article 72 paragraph 2 of\
515
+ \ Law 4537/2018 stating that the mere use of the Internet Banking service by the\
516
+ \ plaintiff does not necessarily constitute sufficient evidence that the payer\
517
+ \ approved the payment action. Specifically, it was proven that the contested\
518
+ \ transaction was not carried out following a strong identification of the plaintiff\
519
+ \ – the sole beneficiary of the account – and his approval, as the latter may\
520
+ \ have entered his personal codes on the counterfeit website; however, he was\
521
+ \ never informed, before the completion of the contested transaction, of the amount\
522
+ \ that would be transferred from his account to a third-party account, nor did\
523
+ \ he receive on his mobile phone, either via SMS or through the VIBER application\
524
+ \ or any other means, the one-time code - extra PIN for its completion, which\
525
+ \ he was required to enter to approve the contested transaction (payment action)\
526
+ \ and thus complete his identification, a fact that was not countered by any evidence\
527
+ \ from the defendant. Furthermore, it is noted that the defendant's claims that\
528
+ \ it bears no responsibility under the terms of the banking services contract,\
529
+ \ whereby it is not liable for any damage to its customer in cases of unauthorized\
530
+ \ use of their personal access codes to the Internet Banking service, are to be\
531
+ \ rejected as fundamentally unfounded. This is because the aforementioned contractual\
532
+ \ terms are invalid according to the provision of Article 103 of Law 4537/2018,\
533
+ \ as they contradict the provisions of Articles 71, 73, and 92 of the same Law,\
534
+ \ which provide for the provider's universal liability and its exemption only\
535
+ \ for unusual and unforeseen circumstances that are beyond the control of the\
536
+ \ party invoking them and whose consequences could not have been avoided despite\
537
+ \ all efforts to the contrary; these provisions establish mandatory law in favor\
538
+ \ of users, as according to Article 103 of Law 4537/2018, payment service providers\
539
+ \ are prohibited from deviating from the provisions to the detriment of payment\
540
+ \ service users, unless the possibility of deviation is explicitly provided and\
541
+ \ they can decide to offer only more favorable terms to payment service users;\
542
+ \ the aforementioned contractual terms do not constitute more favorable terms\
543
+ \ but rather disadvantageous terms for the payment service user. In this case,\
544
+ \ however, the defendant did not prove the authenticity of the transaction and\
545
+ \ its approval by the plaintiff and did not invoke, nor did any unusual and unforeseen\
546
+ \ circumstances beyond its control, the consequences of which could not have been\
547
+ \ avoided despite all efforts to the contrary, come to light. Therefore, the contested\
548
+ \ transaction transferring the amount of €3,000.00 is considered, in the absence\
549
+ \ of demonstrable consent from the plaintiff, unapproved according to the provisions\
550
+ \ of Article 64 of Law 4537/2018, and the defendant's contrary claims are rejected,\
551
+ \ especially since the plaintiff proceeded, according to Article 71 paragraph\
552
+ \ 1 of Law 4537/2018, without undue delay to notify the defendant regarding the\
553
+ \ contested unapproved payment action. Consequently, the defendant is liable for\
554
+ \ compensating the plaintiff for the positive damage he suffered under Article\
555
+ \ 73 of Law 4537/2018 and is obliged to pay him the requested amount of €703.18,\
556
+ \ while the plaintiff’s fault in the occurrence of this damage cannot be established,\
557
+ \ as he entered his personal details in an online environment that was a faithful\
558
+ \ imitation of that of the defendant, as evidenced by the comparison of the screenshots\
559
+ \ of the fake website and the real website provided by the plaintiff, a fact that\
560
+ \ he could not have known while being fully convinced that he was transacting\
561
+ \ with the defendant. Furthermore, the defendant’s liability to compensate the\
562
+ \ plaintiff is based on the provision of Article 8 of Law 2251/1994, which applies\
563
+ \ in this case, as the plaintiff's damage resulted from inadequate fulfillment\
564
+ \ of its obligations in the context of providing its services, but also on the\
565
+ \ provision of Article 914 of the Civil Code in the sense of omission on its part\
566
+ \ of unlawfully and culpably imposed actions. In this case, given that during\
567
+ \ the relevant period there had been a multitude of similar incidents of fraud\
568
+ \ against the defendant's customers, the latter, as a service provider to the\
569
+ \ consumer public and bearing transactional obligations of care and security towards\
570
+ \ them, displayed gross negligence regarding the security provided for electronic\
571
+ \ transaction services, which was compromised by the fraudulent theft of funds,\
572
+ \ as it did not comply with all required high-security measures for executing\
573
+ \ the contested transaction, failing to implement the strict customer identification\
574
+ \ verification process and to check the authenticity of the account to which the\
575
+ \ funds were sent, thus not assuming the suspicious nature of the transaction,\
576
+ \ did not adopt comprehensive and improved protective measures to fully protect\
577
+ \ its customers against malicious attacks and online fraud and to prevent the\
578
+ \ infiltration of unauthorized third parties, nor did it fulfill its obligations\
579
+ \ to inform, accurately inform, and warn its consumers - customers, as it failed\
580
+ \ to adequately inform them of attempts to steal their personal data through the\
581
+ \ sending of informative emails or SMS, while merely posting in a section rather\
582
+ \ than on a central banner (as it later did) does not constitute adequate information\
583
+ \ such that it meets the requirement of protecting its customers and the increased\
584
+ \ safeguarding of their interests. Although the plaintiff acted promptly and informed\
585
+ \ the defendant on the same day about the contested incident, the defendant did\
586
+ \ not act as promptly regarding the investigation of the incident and the freezing\
587
+ \ of the account that held the fraudulent credit to prevent the plaintiff's loss,\
588
+ \ but only returned part of the funds to the plaintiff a month later. This behavior,\
589
+ \ beyond being culpable due to gross negligence, was also unlawful, as it would\
590
+ \ have been illegal even without the contractual relationship, as contrary to\
591
+ \ the provisions of Law 4537/2018 and Law 2251/1994, regarding the lack of security\
592
+ \ of the services that the consumer is legitimately entitled to expect, as well\
593
+ \ as the building of trust that is essential in banking transactions, elements\
594
+ \ that it was obligated to provide within the sphere of the services offered,\
595
+ \ and contrary to the principles of good faith and commercial ethics, as crystallized\
596
+ \ in the provision of Article 288 of the Civil Code, as well as the general duty\
597
+ \ imposed by Article 914 of the Civil Code not to cause harm to another culpably.\
598
+ \ This resulted not only in positive damage to the plaintiff but also in causing\
599
+ \ him moral harm consisting of his mental distress and the disruption, agitation,\
600
+ \ and sorrow he experienced, for which he must be awarded financial compensation.\
601
+ \ Taking into account all the general circumstances of the case, the extent of\
602
+ \ the plaintiff's damage, the severity of the defendant's fault, the mental distress\
603
+ \ suffered by the plaintiff, the insecurity he felt regarding his deposits, the\
604
+ \ sorrow he experienced, and the stress caused by his financial loss, which occurred\
605
+ \ during the pandemic period when his earnings from his professional activity\
606
+ \ had significantly decreased, as well as the financial and social situation of\
607
+ \ the parties, it is the court's opinion that he should be granted, as financial\
608
+ \ compensation for his moral harm, an amount of €250.00, which is deemed reasonable\
609
+ \ and fair. Therefore, the total monetary amount that the plaintiff is entitled\
610
+ \ to for his positive damage and financial compensation for the moral harm suffered\
611
+ \ amounts to a total of (€703.18 + €250.00) = €953.18."
612
+ - 'Failure to notify the Authority of file establishment or permit changes is punished
613
+ by up to three years’ imprisonment and a fine of one to five million Drachmas.
614
+
615
+ Maintaining a file without a permit or violating permit terms is punished by at
616
+ least one year’s imprisonment and a fine of one to five million Drachmas.
617
+
618
+ Unauthorized file interconnection or without permit is punished by up to three
619
+ years’ imprisonment and a fine of one to five million Drachmas.
620
+
621
+ Unlawful interference with personal data is punished by imprisonment and a fine;
622
+ for sensitive data, at least one year’s imprisonment and a fine of one to ten
623
+ million Drachmas.
624
+
625
+ Controllers who fail to comply with Authority decisions or violate data transfer
626
+ rules face at least two years’ imprisonment and a fine of one to five million
627
+ Drachmas.
628
+
629
+ If acts were committed for unlawful benefit or to cause harm, punishment is up
630
+ to ten years’ imprisonment and a fine of two to ten million Drachmas.
631
+
632
+ If acts jeopardize democratic governance or national security, punishment is confinement
633
+ in a penitentiary and a fine of five to ten million Drachmas.
634
+
635
+ Acts committed due to negligence result in at least three months’ imprisonment
636
+ and a fine.
637
+
638
+ If the Controller is not a natural person, the responsible party is the representative
639
+ or head of the organization with administrative or managerial duties.
640
+
641
+ Authorized members of the Authority may carry out preliminary investigations even
642
+ without Prosecutor’s order for certain offenses.
643
+
644
+ The Authority''s President must notify the Public Prosecutor of any offenses under
645
+ investigation, forwarding all relevant evidence.
646
+
647
+ Preliminary investigations must conclude within two months of charges, and trial
648
+ must begin within three months of completion.
649
+
650
+ Continuation of proceedings is allowed only once and for extremely important reasons,
651
+ with adjournment not exceeding two months.
652
+
653
+ Felonies under this law fall under the jurisdiction of the Court of Appeal.
654
+
655
+ '
656
+ - source_sentence: Who must facilitate the exercise of data subject rights?
657
+ sentences:
658
+ - '1.Processing of personal data revealing racial or ethnic origin, political opinions,
659
+ religious or philosophical beliefs, or trade union membership, and the processing
660
+ of genetic data, biometric data for the purpose of uniquely identifying a natural
661
+ person, data concerning health or data concerning a natural person''s sex life
662
+ or sexual orientation shall be prohibited.
663
+
664
+ 2.Paragraph 1 shall not apply if one of the following applies: (a) the data subject
665
+ has given explicit consent to the processing of those personal data for one or
666
+ more specified purposes, except where Union or Member State law provide that the
667
+ prohibition referred to in paragraph 1 may not be lifted by the data subject;
668
+ (b) processing is necessary for the purposes of carrying out the obligations
669
+ and exercising specific rights of the controller or of the data subject in the
670
+ field of employment and social security and social protection law in so far as
671
+ it is authorised by Union or Member State law or a collective agreement pursuant
672
+ to Member State law providing for appropriate safeguards for the fundamental rights
673
+ and the interests of the data subject; (c) processing is necessary to protect
674
+ the vital interests of the data subject or of another natural person where the
675
+ data subject is physically or legally incapable of giving consent; (d) processing
676
+ is carried out in the course of its legitimate activities with appropriate safeguards
677
+ by a foundation, association or any other not-for-profit body with a political,
678
+ philosophical, religious or trade union aim and on condition that the processing
679
+ relates solely to the members or to former members of the body or to persons who
680
+ have regular contact with it in connection with its purposes and that the personal
681
+ data are not disclosed outside that body without the consent of the data subjects;
682
+ (e) processing relates to personal data which are manifestly made public by the
683
+ data subject; (f) processing is necessary for the establishment, exercise or
684
+ defence of legal claims or whenever courts are acting in their judicial capacity;
685
+ (g) processing is necessary for reasons of substantial public interest, on the
686
+ basis of Union or Member State law which shall be proportionate to the aim pursued,
687
+ respect the essence of the right to data protection and provide for suitable and
688
+ specific measures to safeguard the fundamental rights and the interests of the
689
+ data subject; (h) processing is necessary for the purposes of preventive or occupational
690
+ medicine, for the assessment of the working capacity of the employee, medical
691
+ diagnosis, the provision of health or social care or treatment or the management
692
+ of health or social care systems and services on the basis of Union or Member
693
+ State law or pursuant to contract with a health professional and subject to the
694
+ conditions and safeguards referred to in paragraph 3; (i) processing is necessary
695
+ for reasons of public interest in the area of public health, such as protecting
696
+ against serious cross-border threats to health or ensuring high standards of quality
697
+ and safety of health care and of medicinal products or medical devices, on the
698
+ basis of Union or Member State law which provides for suitable and specific measures
699
+ to safeguard the rights and freedoms of the data subject, in particular professional
700
+ secrecy; (j) processing is necessary for archiving purposes
701
+ in the public interest, scientific or historical research purposes or statistical
702
+ purposes in accordance with Article 89(1) based on Union or Member State law which
703
+ shall be proportionate to the aim pursued, respect the essence of the right to
704
+ data protection and provide for suitable and specific measures to safeguard the
705
+ fundamental rights and the interests of the data subject.
706
+
707
+ 3.Personal data referred to in paragraph 1 may be processed for the purposes referred
708
+ to in point (h) of paragraph 2 when those data are processed by or under the responsibility
709
+ of a professional subject to the obligation of professional secrecy under Union
710
+ or Member State law or rules established by national competent bodies or by another
711
+ person also subject to an obligation of secrecy under Union or Member State law
712
+ or rules established by national competent bodies.
713
+
714
+ 4.Member States may maintain or introduce further conditions, including limitations,
715
+ with regard to the processing of genetic data, biometric data or data concerning
716
+ health.'
717
+ - Regulation (EC) No 45/2001 of the European Parliament and of the Council (2) applies
718
+ to the processing of personal data by the Union institutions, bodies, offices
719
+ and agencies. Regulation (EC) No 45/2001 and other Union legal acts applicable
720
+ to such processing of personal data should be adapted to the principles and rules
721
+ established in this Regulation and applied in the light of this Regulation. In
722
+ order to provide a strong and coherent data protection framework in the Union,
723
+ the necessary adaptations of Regulation (EC) No 45/2001 should follow after the
724
+ adoption of this Regulation, in order to allow application at the same time as
725
+ this Regulation.
726
+ - "1.The controller shall take appropriate measures to provide any information referred\
727
+ \ to in Articles 13 and 14 and any communication under Articles 15 to 22 and 34\
728
+ \ relating to processing to the data subject in a concise, transparent, intelligible\
729
+ \ and easily accessible form, using clear and plain language, in particular for\
730
+ \ any information addressed specifically to a child. The information shall be\
731
+ \ provided in writing, or by other means, including, where appropriate, by electronic\
732
+ \ means. When requested by the data subject, the information may be provided orally,\
733
+ \ provided that the identity of the data subject is proven by other means.\
734
+ \ \n2.The controller shall facilitate the exercise of data subject rights\
735
+ \ under Articles 15 to 22. In the cases referred to in Article 11(2), the controller\
736
+ \ shall not refuse to act on the request of the data subject for exercising his\
737
+ \ or her rights under Articles 15 to 22, unless the controller demonstrates that\
738
+ \ it is not in a position to identify the data subject.\n3.The controller shall\
739
+ \ provide information on action taken on a request under Articles 15 to 22 to\
740
+ \ the data subject without undue delay and in any event within one month of receipt\
741
+ \ of the request. That period may be extended by two further months where necessary,\
742
+ \ taking into account the complexity and number of the requests. The controller\
743
+ \ shall inform the data subject of any such extension within one month of receipt\
744
+ \ of the request, together with the reasons for the delay. Where the data subject\
745
+ \ makes the request by electronic form means, the information shall be provided\
746
+ \ by electronic means where possible, unless otherwise requested by the data subject.\n\
747
+ 4.If the controller does not take action on the request of the data subject, the\
748
+ \ controller shall inform the data subject without delay and at the latest within\
749
+ \ one month of receipt of the request of the reasons for not taking action and\
750
+ \ on the possibility of lodging a complaint with a supervisory authority and seeking\
751
+ \ a judicial remedy.\n5.Information provided under Articles 13 and 14 and any\
752
+ \ communication and any actions taken under Articles 15 to 22 and 34 shall be\
753
+ \ provided free of charge. Where requests from a data subject are manifestly unfounded\
754
+ \ or excessive, in particular because of their repetitive character, the controller\
755
+ \ may either: (a) charge a reasonable fee taking into account the administrative\
756
+ \ costs of providing the information or communication or taking the action requested;\
757
+ \ or (b) refuse to act on the request. The controller shall bear the burden of\
758
+ \ demonstrating the manifestly unfounded or excessive character of the request.\n\
759
+ 6.Without prejudice to Article 11, where the controller has reasonable doubts\
760
+ \ concerning the identity of the natural person making the request referred to\
761
+ \ in Articles 15 to 21, the controller may request the provision of additional\
762
+ \ information necessary to confirm the identity of the data subject.\n7.The information\
763
+ \ to be provided to data subjects pursuant to Articles 13 and 14 may be provided\
764
+ \ in combination with standardised icons in order to give in an easily visible,\
765
+ \ intelligible and clearly legible manner a meaningful overview of the intended\
766
+ \ processing. Where the icons are presented electronically they shall be machine-readable.\n\
767
+ 8.The Commission shall be empowered to adopt delegated acts in accordance with\
768
+ \ Article 92 for the purpose of determining the information to be presented by\
769
+ \ the icons and the procedures for providing standardised icons. Section 2 Information\
770
+ \ and access to personal data"
771
+ pipeline_tag: sentence-similarity
772
+ library_name: sentence-transformers
773
+ metrics:
774
+ - cosine_accuracy@1
775
+ - cosine_accuracy@3
776
+ - cosine_accuracy@5
777
+ - cosine_accuracy@10
778
+ - cosine_precision@1
779
+ - cosine_precision@3
780
+ - cosine_precision@5
781
+ - cosine_precision@10
782
+ - cosine_recall@1
783
+ - cosine_recall@3
784
+ - cosine_recall@5
785
+ - cosine_recall@10
786
+ - cosine_ndcg@10
787
+ - cosine_mrr@10
788
+ - cosine_map@100
789
+ model-index:
790
+ - name: multilingual-e5-large
791
+ results:
792
+ - task:
793
+ type: information-retrieval
794
+ name: Information Retrieval
795
+ dataset:
796
+ name: dim 1024
797
+ type: dim_1024
798
+ metrics:
799
+ - type: cosine_accuracy@1
800
+ value: 0.4046094750320102
801
+ name: Cosine Accuracy@1
802
+ - type: cosine_accuracy@3
803
+ value: 0.4090909090909091
804
+ name: Cosine Accuracy@3
805
+ - type: cosine_accuracy@5
806
+ value: 0.43918053777208704
807
+ name: Cosine Accuracy@5
808
+ - type: cosine_accuracy@10
809
+ value: 0.47823303457106275
810
+ name: Cosine Accuracy@10
811
+ - type: cosine_precision@1
812
+ value: 0.4046094750320102
813
+ name: Cosine Precision@1
814
+ - type: cosine_precision@3
815
+ value: 0.40311566367904395
816
+ name: Cosine Precision@3
817
+ - type: cosine_precision@5
818
+ value: 0.39180537772087065
819
+ name: Cosine Precision@5
820
+ - type: cosine_precision@10
821
+ value: 0.3565941101152369
822
+ name: Cosine Precision@10
823
+ - type: cosine_recall@1
824
+ value: 0.04660606778759063
825
+ name: Cosine Recall@1
826
+ - type: cosine_recall@3
827
+ value: 0.13592596883673455
828
+ name: Cosine Recall@3
829
+ - type: cosine_recall@5
830
+ value: 0.20379253880710943
831
+ name: Cosine Recall@5
832
+ - type: cosine_recall@10
833
+ value: 0.3014663479400921
834
+ name: Cosine Recall@10
835
+ - type: cosine_ndcg@10
836
+ value: 0.42913551824501384
837
+ name: Cosine Ndcg@10
838
+ - type: cosine_mrr@10
839
+ value: 0.4168417068064951
840
+ name: Cosine Mrr@10
841
+ - type: cosine_map@100
842
+ value: 0.490599623630225
843
+ name: Cosine Map@100
844
+ - task:
845
+ type: information-retrieval
846
+ name: Information Retrieval
847
+ dataset:
848
+ name: dim 768
849
+ type: dim_768
850
+ metrics:
851
+ - type: cosine_accuracy@1
852
+ value: 0.3994878361075544
853
+ name: Cosine Accuracy@1
854
+ - type: cosine_accuracy@3
855
+ value: 0.4046094750320102
856
+ name: Cosine Accuracy@3
857
+ - type: cosine_accuracy@5
858
+ value: 0.4359795134443022
859
+ name: Cosine Accuracy@5
860
+ - type: cosine_accuracy@10
861
+ value: 0.4737516005121639
862
+ name: Cosine Accuracy@10
863
+ - type: cosine_precision@1
864
+ value: 0.3994878361075544
865
+ name: Cosine Precision@1
866
+ - type: cosine_precision@3
867
+ value: 0.39820742637644047
868
+ name: Cosine Precision@3
869
+ - type: cosine_precision@5
870
+ value: 0.3868117797695263
871
+ name: Cosine Precision@5
872
+ - type: cosine_precision@10
873
+ value: 0.352752880921895
874
+ name: Cosine Precision@10
875
+ - type: cosine_recall@1
876
+ value: 0.046132270416131195
877
+ name: Cosine Recall@1
878
+ - type: cosine_recall@3
879
+ value: 0.13453018491697852
880
+ name: Cosine Recall@3
881
+ - type: cosine_recall@5
882
+ value: 0.20078864250336506
883
+ name: Cosine Recall@5
884
+ - type: cosine_recall@10
885
+ value: 0.29681183299989666
886
+ name: Cosine Recall@10
887
+ - type: cosine_ndcg@10
888
+ value: 0.4244383191680289
889
+ name: Cosine Ndcg@10
890
+ - type: cosine_mrr@10
891
+ value: 0.41201019246793846
892
+ name: Cosine Mrr@10
893
+ - type: cosine_map@100
894
+ value: 0.48680507317454147
895
+ name: Cosine Map@100
896
+ - task:
897
+ type: information-retrieval
898
+ name: Information Retrieval
899
+ dataset:
900
+ name: dim 512
901
+ type: dim_512
902
+ metrics:
903
+ - type: cosine_accuracy@1
904
+ value: 0.39884763124199746
905
+ name: Cosine Accuracy@1
906
+ - type: cosine_accuracy@3
907
+ value: 0.4052496798975672
908
+ name: Cosine Accuracy@3
909
+ - type: cosine_accuracy@5
910
+ value: 0.44558258642765686
911
+ name: Cosine Accuracy@5
912
+ - type: cosine_accuracy@10
913
+ value: 0.47823303457106275
914
+ name: Cosine Accuracy@10
915
+ - type: cosine_precision@1
916
+ value: 0.39884763124199746
917
+ name: Cosine Precision@1
918
+ - type: cosine_precision@3
919
+ value: 0.3975672215108835
920
+ name: Cosine Precision@3
921
+ - type: cosine_precision@5
922
+ value: 0.3888604353393086
923
+ name: Cosine Precision@5
924
+ - type: cosine_precision@10
925
+ value: 0.35793854033290645
926
+ name: Cosine Precision@10
927
+ - type: cosine_recall@1
928
+ value: 0.04570727180608771
929
+ name: Cosine Recall@1
930
+ - type: cosine_recall@3
931
+ value: 0.13329368345632836
932
+ name: Cosine Recall@3
933
+ - type: cosine_recall@5
934
+ value: 0.2006035854063678
935
+ name: Cosine Recall@5
936
+ - type: cosine_recall@10
937
+ value: 0.2993652309972795
938
+ name: Cosine Recall@10
939
+ - type: cosine_ndcg@10
940
+ value: 0.42824151108259556
941
+ name: Cosine Ndcg@10
942
+ - type: cosine_mrr@10
943
+ value: 0.41307745462675005
944
+ name: Cosine Mrr@10
945
+ - type: cosine_map@100
946
+ value: 0.4876319198894288
947
+ name: Cosine Map@100
948
+ - task:
949
+ type: information-retrieval
950
+ name: Information Retrieval
951
+ dataset:
952
+ name: dim 256
953
+ type: dim_256
954
+ metrics:
955
+ - type: cosine_accuracy@1
956
+ value: 0.3738796414852753
957
+ name: Cosine Accuracy@1
958
+ - type: cosine_accuracy@3
959
+ value: 0.37772087067861715
960
+ name: Cosine Accuracy@3
961
+ - type: cosine_accuracy@5
962
+ value: 0.40717029449423814
963
+ name: Cosine Accuracy@5
964
+ - type: cosine_accuracy@10
965
+ value: 0.44558258642765686
966
+ name: Cosine Accuracy@10
967
+ - type: cosine_precision@1
968
+ value: 0.3738796414852753
969
+ name: Cosine Precision@1
970
+ - type: cosine_precision@3
971
+ value: 0.37238583013230897
972
+ name: Cosine Precision@3
973
+ - type: cosine_precision@5
974
+ value: 0.3615877080665813
975
+ name: Cosine Precision@5
976
+ - type: cosine_precision@10
977
+ value: 0.3297695262483995
978
+ name: Cosine Precision@10
979
+ - type: cosine_recall@1
980
+ value: 0.043086085492826574
981
+ name: Cosine Recall@1
982
+ - type: cosine_recall@3
983
+ value: 0.125747799799009
984
+ name: Cosine Recall@3
985
+ - type: cosine_recall@5
986
+ value: 0.18837022600852496
987
+ name: Cosine Recall@5
988
+ - type: cosine_recall@10
989
+ value: 0.2792649180924836
990
+ name: Cosine Recall@10
991
+ - type: cosine_ndcg@10
992
+ value: 0.3980442434686935
993
+ name: Cosine Ndcg@10
994
+ - type: cosine_mrr@10
995
+ value: 0.38572571794402755
996
+ name: Cosine Mrr@10
997
+ - type: cosine_map@100
998
+ value: 0.45855798848430374
999
+ name: Cosine Map@100
1000
+ - task:
1001
+ type: information-retrieval
1002
+ name: Information Retrieval
1003
+ dataset:
1004
+ name: dim 128
1005
+ type: dim_128
1006
+ metrics:
1007
+ - type: cosine_accuracy@1
1008
+ value: 0.34314980793854033
1009
+ name: Cosine Accuracy@1
1010
+ - type: cosine_accuracy@3
1011
+ value: 0.34763124199743917
1012
+ name: Cosine Accuracy@3
1013
+ - type: cosine_accuracy@5
1014
+ value: 0.37708066581306016
1015
+ name: Cosine Accuracy@5
1016
+ - type: cosine_accuracy@10
1017
+ value: 0.4148527528809219
1018
+ name: Cosine Accuracy@10
1019
+ - type: cosine_precision@1
1020
+ value: 0.34314980793854033
1021
+ name: Cosine Precision@1
1022
+ - type: cosine_precision@3
1023
+ value: 0.3418693982074264
1024
+ name: Cosine Precision@3
1025
+ - type: cosine_precision@5
1026
+ value: 0.3322663252240717
1027
+ name: Cosine Precision@5
1028
+ - type: cosine_precision@10
1029
+ value: 0.302752880921895
1030
+ name: Cosine Precision@10
1031
+ - type: cosine_recall@1
1032
+ value: 0.040652627677675406
1033
+ name: Cosine Recall@1
1034
+ - type: cosine_recall@3
1035
+ value: 0.1184519992454523
1036
+ name: Cosine Recall@3
1037
+ - type: cosine_recall@5
1038
+ value: 0.1774839552040709
1039
+ name: Cosine Recall@5
1040
+ - type: cosine_recall@10
1041
+ value: 0.26330336421247125
1042
+ name: Cosine Recall@10
1043
+ - type: cosine_ndcg@10
1044
+ value: 0.36765573601526275
1045
+ name: Cosine Ndcg@10
1046
+ - type: cosine_mrr@10
1047
+ value: 0.35513180090644836
1048
+ name: Cosine Mrr@10
1049
+ - type: cosine_map@100
1050
+ value: 0.4276696379169563
1051
+ name: Cosine Map@100
1052
+ - task:
1053
+ type: information-retrieval
1054
+ name: Information Retrieval
1055
+ dataset:
1056
+ name: dim 64
1057
+ type: dim_64
1058
+ metrics:
1059
+ - type: cosine_accuracy@1
1060
+ value: 0.3079385403329065
1061
+ name: Cosine Accuracy@1
1062
+ - type: cosine_accuracy@3
1063
+ value: 0.31241997439180536
1064
+ name: Cosine Accuracy@3
1065
+ - type: cosine_accuracy@5
1066
+ value: 0.33290653008962867
1067
+ name: Cosine Accuracy@5
1068
+ - type: cosine_accuracy@10
1069
+ value: 0.36555697823303457
1070
+ name: Cosine Accuracy@10
1071
+ - type: cosine_precision@1
1072
+ value: 0.3079385403329065
1073
+ name: Cosine Precision@1
1074
+ - type: cosine_precision@3
1075
+ value: 0.3070849338454972
1076
+ name: Cosine Precision@3
1077
+ - type: cosine_precision@5
1078
+ value: 0.29820742637644043
1079
+ name: Cosine Precision@5
1080
+ - type: cosine_precision@10
1081
+ value: 0.27215108834827145
1082
+ name: Cosine Precision@10
1083
+ - type: cosine_recall@1
1084
+ value: 0.03504677697523653
1085
+ name: Cosine Recall@1
1086
+ - type: cosine_recall@3
1087
+ value: 0.10211269541567973
1088
+ name: Cosine Recall@3
1089
+ - type: cosine_recall@5
1090
+ value: 0.15297976910096123
1091
+ name: Cosine Recall@5
1092
+ - type: cosine_recall@10
1093
+ value: 0.23026653514933906
1094
+ name: Cosine Recall@10
1095
+ - type: cosine_ndcg@10
1096
+ value: 0.3275369456141822
1097
+ name: Cosine Ndcg@10
1098
+ - type: cosine_mrr@10
1099
+ value: 0.31748394406845065
1100
+ name: Cosine Mrr@10
1101
+ - type: cosine_map@100
1102
+ value: 0.38184314430829974
1103
+ name: Cosine Map@100
1104
+ ---
1105
+
1106
+ # multilingual-e5-large
1107
+
1108
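+ This is a [sentence-transformers](https://www.SBERT.net) model finetuned from [intfloat/multilingual-e5-large](https://huggingface.co/intfloat/multilingual-e5-large). It maps sentences & paragraphs to a 1024-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more. It was trained with MatryoshkaLoss, so embeddings can also be truncated to 768, 512, 256, 128 or 64 dimensions; the Evaluation section reports retrieval metrics at each of these sizes.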
1109
+
1110
+ ## Model Details
1111
+
1112
+ ### Model Description
1113
+ - **Model Type:** Sentence Transformer
1114
+ - **Base model:** [intfloat/multilingual-e5-large](https://huggingface.co/intfloat/multilingual-e5-large) <!-- at revision 0dc5580a448e4284468b8909bae50fa925907bc5 -->
1115
+ - **Maximum Sequence Length:** 512 tokens
1116
+ - **Output Dimensionality:** 1024 dimensions
1117
+ - **Similarity Function:** Cosine Similarity
1118
+ <!-- - **Training Dataset:** Unknown -->
1119
+ - **Language:** en
1120
+ - **License:** apache-2.0
1121
+
1122
+ ### Model Sources
1123
+
1124
+ - **Documentation:** [Sentence Transformers Documentation](https://sbert.net)
1125
+ - **Repository:** [Sentence Transformers on GitHub](https://github.com/UKPLab/sentence-transformers)
1126
+ - **Hugging Face:** [Sentence Transformers on Hugging Face](https://huggingface.co/models?library=sentence-transformers)
1127
+
1128
+ ### Full Model Architecture
1129
+
1130
+ ```
1131
+ SentenceTransformer(
1132
+ (0): Transformer({'max_seq_length': 512, 'do_lower_case': False, 'architecture': 'XLMRobertaModel'})
1133
+ (1): Pooling({'word_embedding_dimension': 1024, 'pooling_mode_cls_token': False, 'pooling_mode_mean_tokens': True, 'pooling_mode_max_tokens': False, 'pooling_mode_mean_sqrt_len_tokens': False, 'pooling_mode_weightedmean_tokens': False, 'pooling_mode_lasttoken': False, 'include_prompt': True})
1134
+ (2): Normalize()
1135
+ )
1136
+ ```
1137
+
1138
+ ## Usage
1139
+
1140
+ ### Direct Usage (Sentence Transformers)
1141
+
1142
+ First install the Sentence Transformers library:
1143
+
1144
+ ```bash
1145
+ pip install -U sentence-transformers
1146
+ ```
1147
+
1148
+ Then you can load this model and run inference.
1149
+ ```python
1150
+ from sentence_transformers import SentenceTransformer
1151
+
1152
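+ # Download from the 🤗 Hub ("sentence_transformers_model_id" below is a placeholder; replace it with this model's Hub repo id or a local checkpoint path)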
1153
+ model = SentenceTransformer("sentence_transformers_model_id")
1154
+ # Run inference
1155
+ sentences = [
1156
+ 'Who must facilitate the exercise of data subject rights?',
1157
+ '1.The controller shall take appropriate measures to provide any information referred to in Articles 13 and 14 and any communication under Articles 15 to 22 and 34 relating to processing to the data subject in a concise, transparent, intelligible and easily accessible form, using clear and plain language, in particular for any information addressed specifically to a child. The information shall be provided in writing, or by other means, including, where appropriate, by electronic means. When requested by the data subject, the information may be provided orally, provided that the identity of the data subject is proven by other means. 4.5.2016 L 119/39 \n2.The controller shall facilitate the exercise of data subject rights under Articles 15 to 22. In the cases referred to in Article 11(2), the controller shall not refuse to act on the request of the data subject for exercising his or her rights under Articles 15 to 22, unless the controller demonstrates that it is not in a position to identify the data subject.\n3.The controller shall provide information on action taken on a request under Articles 15 to 22 to the data subject without undue delay and in any event within one month of receipt of the request. That period may be extended by two further months where necessary, taking into account the complexity and number of the requests. The controller shall inform the data subject of any such extension within one month of receipt of the request, together with the reasons for the delay. 
Where the data subject makes the request by electronic form means, the information shall be provided by electronic means where possible, unless otherwise requested by the data subject.\n4.If the controller does not take action on the request of the data subject, the controller shall inform the data subject without delay and at the latest within one month of receipt of the request of the reasons for not taking action and on the possibility of lodging a complaint with a supervisory authority and seeking a judicial remedy.\n5.Information provided under Articles 13 and 14 and any communication and any actions taken under Articles 15 to 22 and 34 shall be provided free of charge. Where requests from a data subject are manifestly unfounded or excessive, in particular because of their repetitive character, the controller may either: (a) charge a reasonable fee taking into account the administrative costs of providing the information or communication or taking the action requested; or (b) refuse to act on the request. The controller shall bear the burden of demonstrating the manifestly unfounded or excessive character of the request.\n6.Without prejudice to Article 11, where the controller has reasonable doubts concerning the identity of the natural person making the request referred to in Articles 15 to 21, the controller may request the provision of additional information necessary to confirm the identity of the data subject.\n7.The information to be provided to data subjects pursuant to Articles 13 and 14 may be provided in combination with standardised icons in order to give in an easily visible, intelligible and clearly legible manner a meaningful overview of the intended processing. 
Where the icons are presented electronically they shall be machine-readable.\n8.The Commission shall be empowered to adopt delegated acts in accordance with Article 92 for the purpose of determining the information to be presented by the icons and the procedures for providing standardised icons. Section 2 Information and access to personal data',
1158
+ 'Regulation (EC) No 45/2001 of the European Parliament and of the Council (2) applies to the processing of personal data by the Union institutions, bodies, offices and agencies. Regulation (EC) No 45/2001 and other Union legal acts applicable to such processing of personal data should be adapted to the principles and rules established in this Regulation and applied in the light of this Regulation. In order to provide a strong and coherent data protection framework in the Union, the necessary adaptations of Regulation (EC) No 45/2001 should follow after the adoption of this Regulation, in order to allow application at the same time as this Regulation.',
1159
+ ]
1160
+ embeddings = model.encode(sentences)
1161
+ print(embeddings.shape)
1162
+ # (3, 1024)
1163
+
1164
+ # Get the similarity scores for the embeddings
1165
+ similarities = model.similarity(embeddings, embeddings)
1166
+ print(similarities)
1167
+ # tensor([[1.0000, 0.6418, 0.3512],
1168
+ # [0.6418, 1.0000, 0.3027],
1169
+ # [0.3512, 0.3027, 1.0000]])
1170
+ ```
1171
+
1172
+ <!--
1173
+ ### Direct Usage (Transformers)
1174
+
1175
+ <details><summary>Click to see the direct usage in Transformers</summary>
1176
+
1177
+ </details>
1178
+ -->
1179
+
1180
+ <!--
1181
+ ### Downstream Usage (Sentence Transformers)
1182
+
1183
+ You can finetune this model on your own dataset.
1184
+
1185
+ <details><summary>Click to expand</summary>
1186
+
1187
+ </details>
1188
+ -->
1189
+
1190
+ <!--
1191
+ ### Out-of-Scope Use
1192
+
1193
+ *List how the model may foreseeably be misused and address what users ought not to do with the model.*
1194
+ -->
1195
+
1196
+ ## Evaluation
1197
+
1198
+ ### Metrics
1199
+
1200
+ #### Information Retrieval
1201
+
1202
+ * Dataset: `dim_1024`
1203
+ * Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
1204
+ ```json
1205
+ {
1206
+ "truncate_dim": 1024
1207
+ }
1208
+ ```
1209
+
1210
+ | Metric | Value |
1211
+ |:--------------------|:-----------|
1212
+ | cosine_accuracy@1 | 0.4046 |
1213
+ | cosine_accuracy@3 | 0.4091 |
1214
+ | cosine_accuracy@5 | 0.4392 |
1215
+ | cosine_accuracy@10 | 0.4782 |
1216
+ | cosine_precision@1 | 0.4046 |
1217
+ | cosine_precision@3 | 0.4031 |
1218
+ | cosine_precision@5 | 0.3918 |
1219
+ | cosine_precision@10 | 0.3566 |
1220
+ | cosine_recall@1 | 0.0466 |
1221
+ | cosine_recall@3 | 0.1359 |
1222
+ | cosine_recall@5 | 0.2038 |
1223
+ | cosine_recall@10 | 0.3015 |
1224
+ | **cosine_ndcg@10** | **0.4291** |
1225
+ | cosine_mrr@10 | 0.4168 |
1226
+ | cosine_map@100 | 0.4906 |
1227
+
1228
+ #### Information Retrieval
1229
+
1230
+ * Dataset: `dim_768`
1231
+ * Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
1232
+ ```json
1233
+ {
1234
+ "truncate_dim": 768
1235
+ }
1236
+ ```
1237
+
1238
+ | Metric | Value |
1239
+ |:--------------------|:-----------|
1240
+ | cosine_accuracy@1 | 0.3995 |
1241
+ | cosine_accuracy@3 | 0.4046 |
1242
+ | cosine_accuracy@5 | 0.436 |
1243
+ | cosine_accuracy@10 | 0.4738 |
1244
+ | cosine_precision@1 | 0.3995 |
1245
+ | cosine_precision@3 | 0.3982 |
1246
+ | cosine_precision@5 | 0.3868 |
1247
+ | cosine_precision@10 | 0.3528 |
1248
+ | cosine_recall@1 | 0.0461 |
1249
+ | cosine_recall@3 | 0.1345 |
1250
+ | cosine_recall@5 | 0.2008 |
1251
+ | cosine_recall@10 | 0.2968 |
1252
+ | **cosine_ndcg@10** | **0.4244** |
1253
+ | cosine_mrr@10 | 0.412 |
1254
+ | cosine_map@100 | 0.4868 |
1255
+
1256
+ #### Information Retrieval
1257
+
1258
+ * Dataset: `dim_512`
1259
+ * Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
1260
+ ```json
1261
+ {
1262
+ "truncate_dim": 512
1263
+ }
1264
+ ```
1265
+
1266
+ | Metric | Value |
1267
+ |:--------------------|:-----------|
1268
+ | cosine_accuracy@1 | 0.3988 |
1269
+ | cosine_accuracy@3 | 0.4052 |
1270
+ | cosine_accuracy@5 | 0.4456 |
1271
+ | cosine_accuracy@10 | 0.4782 |
1272
+ | cosine_precision@1 | 0.3988 |
1273
+ | cosine_precision@3 | 0.3976 |
1274
+ | cosine_precision@5 | 0.3889 |
1275
+ | cosine_precision@10 | 0.3579 |
1276
+ | cosine_recall@1 | 0.0457 |
1277
+ | cosine_recall@3 | 0.1333 |
1278
+ | cosine_recall@5 | 0.2006 |
1279
+ | cosine_recall@10 | 0.2994 |
1280
+ | **cosine_ndcg@10** | **0.4282** |
1281
+ | cosine_mrr@10 | 0.4131 |
1282
+ | cosine_map@100 | 0.4876 |
1283
+
1284
+ #### Information Retrieval
1285
+
1286
+ * Dataset: `dim_256`
1287
+ * Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
1288
+ ```json
1289
+ {
1290
+ "truncate_dim": 256
1291
+ }
1292
+ ```
1293
+
1294
+ | Metric | Value |
1295
+ |:--------------------|:----------|
1296
+ | cosine_accuracy@1 | 0.3739 |
1297
+ | cosine_accuracy@3 | 0.3777 |
1298
+ | cosine_accuracy@5 | 0.4072 |
1299
+ | cosine_accuracy@10 | 0.4456 |
1300
+ | cosine_precision@1 | 0.3739 |
1301
+ | cosine_precision@3 | 0.3724 |
1302
+ | cosine_precision@5 | 0.3616 |
1303
+ | cosine_precision@10 | 0.3298 |
1304
+ | cosine_recall@1 | 0.0431 |
1305
+ | cosine_recall@3 | 0.1257 |
1306
+ | cosine_recall@5 | 0.1884 |
1307
+ | cosine_recall@10 | 0.2793 |
1308
+ | **cosine_ndcg@10** | **0.398** |
1309
+ | cosine_mrr@10 | 0.3857 |
1310
+ | cosine_map@100 | 0.4586 |
1311
+
1312
+ #### Information Retrieval
1313
+
1314
+ * Dataset: `dim_128`
1315
+ * Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
1316
+ ```json
1317
+ {
1318
+ "truncate_dim": 128
1319
+ }
1320
+ ```
1321
+
1322
+ | Metric | Value |
1323
+ |:--------------------|:-----------|
1324
+ | cosine_accuracy@1 | 0.3431 |
1325
+ | cosine_accuracy@3 | 0.3476 |
1326
+ | cosine_accuracy@5 | 0.3771 |
1327
+ | cosine_accuracy@10 | 0.4149 |
1328
+ | cosine_precision@1 | 0.3431 |
1329
+ | cosine_precision@3 | 0.3419 |
1330
+ | cosine_precision@5 | 0.3323 |
1331
+ | cosine_precision@10 | 0.3028 |
1332
+ | cosine_recall@1 | 0.0407 |
1333
+ | cosine_recall@3 | 0.1185 |
1334
+ | cosine_recall@5 | 0.1775 |
1335
+ | cosine_recall@10 | 0.2633 |
1336
+ | **cosine_ndcg@10** | **0.3677** |
1337
+ | cosine_mrr@10 | 0.3551 |
1338
+ | cosine_map@100 | 0.4277 |
1339
+
1340
+ #### Information Retrieval
1341
+
1342
+ * Dataset: `dim_64`
1343
+ * Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
1344
+ ```json
1345
+ {
1346
+ "truncate_dim": 64
1347
+ }
1348
+ ```
1349
+
1350
+ | Metric | Value |
1351
+ |:--------------------|:-----------|
1352
+ | cosine_accuracy@1 | 0.3079 |
1353
+ | cosine_accuracy@3 | 0.3124 |
1354
+ | cosine_accuracy@5 | 0.3329 |
1355
+ | cosine_accuracy@10 | 0.3656 |
1356
+ | cosine_precision@1 | 0.3079 |
1357
+ | cosine_precision@3 | 0.3071 |
1358
+ | cosine_precision@5 | 0.2982 |
1359
+ | cosine_precision@10 | 0.2722 |
1360
+ | cosine_recall@1 | 0.035 |
1361
+ | cosine_recall@3 | 0.1021 |
1362
+ | cosine_recall@5 | 0.153 |
1363
+ | cosine_recall@10 | 0.2303 |
1364
+ | **cosine_ndcg@10** | **0.3275** |
1365
+ | cosine_mrr@10 | 0.3175 |
1366
+ | cosine_map@100 | 0.3818 |
1367
+
1368
+ <!--
1369
+ ## Bias, Risks and Limitations
1370
+
1371
+ *What are the known or foreseeable issues stemming from this model? You could also flag here known failure cases or weaknesses of the model.*
1372
+ -->
1373
+
1374
+ <!--
1375
+ ### Recommendations
1376
+
1377
+ *What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
1378
+ -->
1379
+
1380
+ ## Training Details
1381
+
1382
+ ### Training Dataset
1383
+
1384
+ #### Unnamed Dataset
1385
+
1386
+ * Size: 391 training samples
1387
+ * Columns: <code>anchor</code> and <code>positive</code>
1388
+ * Approximate statistics based on the first 391 samples:
1389
+ | | anchor | positive |
1390
+ |:--------|:----------------------------------------------------------------------------------|:-------------------------------------------------------------------------------------|
1391
+ | type | string | string |
1392
+ | details | <ul><li>min: 8 tokens</li><li>mean: 17.16 tokens</li><li>max: 32 tokens</li></ul> | <ul><li>min: 27 tokens</li><li>mean: 377.93 tokens</li><li>max: 512 tokens</li></ul> |
1393
+ * Samples:
1394
+ | anchor | positive |
1395
+ |:-------------------------------------------------------------------------------------------------------------------------------|:---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|
1396
+ | <code>What measures must be taken according to Article 32?</code> | <code>1.Where processing is to be carried out on behalf of a controller, the controller shall use only processors providing sufficient guarantees to implement appropriate technical and organisational measures in such a manner that processing will meet the requirements of this Regulation and ensure the protection of the rights of the data subject.<br>2.The processor shall not engage another processor without prior specific or general written authorisation of the controller. In the case of general written authorisation, the processor shall inform the controller of any intended changes concerning the addition or replacement of other processors, thereby giving the controller the opportunity to object to such changes.<br>3.Processing by a processor shall be governed by a contract or other legal act under Union or Member State law, that is binding on the processor with regard to the controller and that sets out the subject-matter and duration of the processing, the nature and purpose of the processing, ...</code> |
1397
+ | <code>What is the responsibility of assisting and advising the data subjects in exercising their rights?</code> | <code>1.A transfer of personal data to a third country or an international organisation may take place where the Commission has decided that the third country, a territory or one or more specified sectors within that third country, or the international organisation in question ensures an adequate level of protection. Such a transfer shall not require any specific authorisation.<br>2.When assessing the adequacy of the level of protection, the Commission shall, in particular, take account of the following elements: (a) the rule of law, respect for human rights and fundamental freedoms, relevant legislation, both general and sectoral, including concerning public security, defence, national security and criminal law and the access of public authorities to personal data, as well as the implementation of such legislation, data protection rules, professional rules and security measures, including rules for the onward transfer of personal data to another third country or international organisation whi...</code> |
1398
+ | <code>What should Member States be authorized to provide for regarding personal data processing for archiving purposes?</code> | <code>Where personal data are processed for archiving purposes, this Regulation should also apply to that processing, bearing in mind that this Regulation should not apply to deceased persons. Public authorities or public or private bodies that hold records of public interest should be services which, pursuant to Union or Member State law, have a legal obligation to acquire, preserve, appraise, arrange, describe, communicate, promote, disseminate and provide access to records of enduring value for general public interest. Member States should also be authorised to provide for the further processing of personal data for archiving purposes, for example with a view to providing specific information related to the political behaviour under former totalitarian state regimes, genocide, crimes against humanity, in particular the Holocaust, or war crimes. 4.5.2016 L 119/29 Official Journal of the European Union EN</code> |
1399
+ * Loss: [<code>MatryoshkaLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#matryoshkaloss) with these parameters:
1400
+ ```json
1401
+ {
1402
+ "loss": "MultipleNegativesRankingLoss",
1403
+ "matryoshka_dims": [
1404
+ 1024,
1405
+ 768,
1406
+ 512,
1407
+ 256,
1408
+ 128,
1409
+ 64
1410
+ ],
1411
+ "matryoshka_weights": [
1412
+ 1,
1413
+ 1,
1414
+ 1,
1415
+ 1,
1416
+ 1,
1417
+ 1
1418
+ ],
1419
+ "n_dims_per_step": -1
1420
+ }
1421
+ ```
1422
+
1423
+ ### Training Hyperparameters
1424
+ #### Non-Default Hyperparameters
1425
+
1426
+ - `eval_strategy`: epoch
1427
+ - `per_device_eval_batch_size`: 16
1428
+ - `gradient_accumulation_steps`: 4
1429
+ - `learning_rate`: 2e-05
1430
+ - `num_train_epochs`: 20
1431
+ - `lr_scheduler_type`: cosine
1432
+ - `warmup_ratio`: 0.1
1433
+ - `bf16`: True
1434
+ - `load_best_model_at_end`: True
1435
+ - `optim`: adamw_torch_fused
1436
+ - `batch_sampler`: no_duplicates
1437
+
1438
+ #### All Hyperparameters
1439
+ <details><summary>Click to expand</summary>
1440
+
1441
+ - `overwrite_output_dir`: False
1442
+ - `do_predict`: False
1443
+ - `eval_strategy`: epoch
1444
+ - `prediction_loss_only`: True
1445
+ - `per_device_train_batch_size`: 8
1446
+ - `per_device_eval_batch_size`: 16
1447
+ - `per_gpu_train_batch_size`: None
1448
+ - `per_gpu_eval_batch_size`: None
1449
+ - `gradient_accumulation_steps`: 4
1450
+ - `eval_accumulation_steps`: None
1451
+ - `torch_empty_cache_steps`: None
1452
+ - `learning_rate`: 2e-05
1453
+ - `weight_decay`: 0.0
1454
+ - `adam_beta1`: 0.9
1455
+ - `adam_beta2`: 0.999
1456
+ - `adam_epsilon`: 1e-08
1457
+ - `max_grad_norm`: 1.0
1458
+ - `num_train_epochs`: 20
1459
+ - `max_steps`: -1
1460
+ - `lr_scheduler_type`: cosine
1461
+ - `lr_scheduler_kwargs`: {}
1462
+ - `warmup_ratio`: 0.1
1463
+ - `warmup_steps`: 0
1464
+ - `log_level`: passive
1465
+ - `log_level_replica`: warning
1466
+ - `log_on_each_node`: True
1467
+ - `logging_nan_inf_filter`: True
1468
+ - `save_safetensors`: True
1469
+ - `save_on_each_node`: False
1470
+ - `save_only_model`: False
1471
+ - `restore_callback_states_from_checkpoint`: False
1472
+ - `no_cuda`: False
1473
+ - `use_cpu`: False
1474
+ - `use_mps_device`: False
1475
+ - `seed`: 42
1476
+ - `data_seed`: None
1477
+ - `jit_mode_eval`: False
1478
+ - `use_ipex`: False
1479
+ - `bf16`: True
1480
+ - `fp16`: False
1481
+ - `fp16_opt_level`: O1
1482
+ - `half_precision_backend`: auto
1483
+ - `bf16_full_eval`: False
1484
+ - `fp16_full_eval`: False
1485
+ - `tf32`: None
1486
+ - `local_rank`: 0
1487
+ - `ddp_backend`: None
1488
+ - `tpu_num_cores`: None
1489
+ - `tpu_metrics_debug`: False
1490
+ - `debug`: []
1491
+ - `dataloader_drop_last`: False
1492
+ - `dataloader_num_workers`: 0
1493
+ - `dataloader_prefetch_factor`: None
1494
+ - `past_index`: -1
1495
+ - `disable_tqdm`: False
1496
+ - `remove_unused_columns`: True
1497
+ - `label_names`: None
1498
+ - `load_best_model_at_end`: True
1499
+ - `ignore_data_skip`: False
1500
+ - `fsdp`: []
1501
+ - `fsdp_min_num_params`: 0
1502
+ - `fsdp_config`: {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}
1503
+ - `tp_size`: 0
1504
+ - `fsdp_transformer_layer_cls_to_wrap`: None
1505
+ - `accelerator_config`: {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}
1506
+ - `deepspeed`: None
1507
+ - `label_smoothing_factor`: 0.0
1508
+ - `optim`: adamw_torch_fused
1509
+ - `optim_args`: None
1510
+ - `adafactor`: False
1511
+ - `group_by_length`: False
1512
+ - `length_column_name`: length
1513
+ - `ddp_find_unused_parameters`: None
1514
+ - `ddp_bucket_cap_mb`: None
1515
+ - `ddp_broadcast_buffers`: False
1516
+ - `dataloader_pin_memory`: True
1517
+ - `dataloader_persistent_workers`: False
1518
+ - `skip_memory_metrics`: True
1519
+ - `use_legacy_prediction_loop`: False
1520
+ - `push_to_hub`: False
1521
+ - `resume_from_checkpoint`: None
1522
+ - `hub_model_id`: None
1523
+ - `hub_strategy`: every_save
1524
+ - `hub_private_repo`: None
1525
+ - `hub_always_push`: False
1526
+ - `gradient_checkpointing`: False
1527
+ - `gradient_checkpointing_kwargs`: None
1528
+ - `include_inputs_for_metrics`: False
1529
+ - `include_for_metrics`: []
1530
+ - `eval_do_concat_batches`: True
1531
+ - `fp16_backend`: auto
1532
+ - `push_to_hub_model_id`: None
1533
+ - `push_to_hub_organization`: None
1534
+ - `mp_parameters`:
1535
+ - `auto_find_batch_size`: False
1536
+ - `full_determinism`: False
1537
+ - `torchdynamo`: None
1538
+ - `ray_scope`: last
1539
+ - `ddp_timeout`: 1800
1540
+ - `torch_compile`: False
1541
+ - `torch_compile_backend`: None
1542
+ - `torch_compile_mode`: None
1543
+ - `include_tokens_per_second`: False
1544
+ - `include_num_input_tokens_seen`: False
1545
+ - `neftune_noise_alpha`: None
1546
+ - `optim_target_modules`: None
1547
+ - `batch_eval_metrics`: False
1548
+ - `eval_on_start`: False
1549
+ - `use_liger_kernel`: False
1550
+ - `eval_use_gather_object`: False
1551
+ - `average_tokens_across_devices`: False
1552
+ - `prompts`: None
1553
+ - `batch_sampler`: no_duplicates
1554
+ - `multi_dataset_batch_sampler`: proportional
1555
+ - `router_mapping`: {}
1556
+ - `learning_rate_mapping`: {}
1557
+
1558
+ </details>
1559
+
1560
+ ### Training Logs
1561
+ | Epoch | Step | Training Loss | dim_1024_cosine_ndcg@10 | dim_768_cosine_ndcg@10 | dim_512_cosine_ndcg@10 | dim_256_cosine_ndcg@10 | dim_128_cosine_ndcg@10 | dim_64_cosine_ndcg@10 |
1562
+ |:------:|:----:|:-------------:|:-----------------------:|:----------------------:|:----------------------:|:----------------------:|:----------------------:|:---------------------:|
1563
+ | 0.8163 | 10 | 31.5155 | - | - | - | - | - | - |
1564
+ | 1.0 | 13 | - | 0.4494 | 0.4446 | 0.4364 | 0.3947 | 0.3362 | 0.2621 |
1565
+ | 1.5714 | 20 | 19.0409 | - | - | - | - | - | - |
1566
+ | 2.0 | 26 | - | 0.4065 | 0.4004 | 0.4013 | 0.3692 | 0.3418 | 0.2882 |
1567
+ | 2.3265 | 30 | 14.5314 | - | - | - | - | - | - |
1568
+ | 3.0 | 39 | - | 0.4418 | 0.4350 | 0.4329 | 0.4087 | 0.3714 | 0.3372 |
1569
+ | 3.0816 | 40 | 8.6778 | - | - | - | - | - | - |
1570
+ | 3.8980 | 50 | 6.0257 | - | - | - | - | - | - |
1571
+ | 4.0 | 52 | - | 0.4291 | 0.4244 | 0.4282 | 0.3980 | 0.3677 | 0.3275 |
1572
+
1573
+
1574
+ ### Framework Versions
1575
+ - Python: 3.12.11
1576
+ - Sentence Transformers: 5.1.0
1577
+ - Transformers: 4.51.3
1578
+ - PyTorch: 2.8.0+cu126
1579
+ - Accelerate: 1.10.1
1580
+ - Datasets: 4.0.0
1581
+ - Tokenizers: 0.21.4
1582
+
1583
+ ## Citation
1584
+
1585
+ ### BibTeX
1586
+
1587
+ #### Sentence Transformers
1588
+ ```bibtex
1589
+ @inproceedings{reimers-2019-sentence-bert,
1590
+ title = "Sentence-BERT: Sentence Embeddings using Siamese BERT-Networks",
1591
+ author = "Reimers, Nils and Gurevych, Iryna",
1592
+ booktitle = "Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing",
1593
+ month = "11",
1594
+ year = "2019",
1595
+ publisher = "Association for Computational Linguistics",
1596
+ url = "https://arxiv.org/abs/1908.10084",
1597
+ }
1598
+ ```
1599
+
1600
+ #### MatryoshkaLoss
1601
+ ```bibtex
1602
+ @misc{kusupati2024matryoshka,
1603
+ title={Matryoshka Representation Learning},
1604
+ author={Aditya Kusupati and Gantavya Bhatt and Aniket Rege and Matthew Wallingford and Aditya Sinha and Vivek Ramanujan and William Howard-Snyder and Kaifeng Chen and Sham Kakade and Prateek Jain and Ali Farhadi},
1605
+ year={2024},
1606
+ eprint={2205.13147},
1607
+ archivePrefix={arXiv},
1608
+ primaryClass={cs.LG}
1609
+ }
1610
+ ```
1611
+
1612
+ #### MultipleNegativesRankingLoss
1613
+ ```bibtex
1614
+ @misc{henderson2017efficient,
1615
+ title={Efficient Natural Language Response Suggestion for Smart Reply},
1616
+ author={Matthew Henderson and Rami Al-Rfou and Brian Strope and Yun-hsuan Sung and Laszlo Lukacs and Ruiqi Guo and Sanjiv Kumar and Balint Miklos and Ray Kurzweil},
1617
+ year={2017},
1618
+ eprint={1705.00652},
1619
+ archivePrefix={arXiv},
1620
+ primaryClass={cs.CL}
1621
+ }
1622
+ ```
1623
+
1624
+ <!--
1625
+ ## Glossary
1626
+
1627
+ *Clearly define terms in order to be accessible across audiences.*
1628
+ -->
1629
+
1630
+ <!--
1631
+ ## Model Card Authors
1632
+
1633
+ *Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
1634
+ -->
1635
+
1636
+ <!--
1637
+ ## Model Card Contact
1638
+
1639
+ *Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
1640
+ -->
checkpoint-52/config.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "XLMRobertaModel"
4
+ ],
5
+ "attention_probs_dropout_prob": 0.1,
6
+ "bos_token_id": 0,
7
+ "classifier_dropout": null,
8
+ "eos_token_id": 2,
9
+ "hidden_act": "gelu",
10
+ "hidden_dropout_prob": 0.1,
11
+ "hidden_size": 1024,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 4096,
14
+ "layer_norm_eps": 1e-05,
15
+ "max_position_embeddings": 514,
16
+ "model_type": "xlm-roberta",
17
+ "num_attention_heads": 16,
18
+ "num_hidden_layers": 24,
19
+ "output_past": true,
20
+ "pad_token_id": 1,
21
+ "position_embedding_type": "absolute",
22
+ "torch_dtype": "float32",
23
+ "transformers_version": "4.51.3",
24
+ "type_vocab_size": 1,
25
+ "use_cache": true,
26
+ "vocab_size": 250002
27
+ }
checkpoint-52/config_sentence_transformers.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_type": "SentenceTransformer",
3
+ "__version__": {
4
+ "sentence_transformers": "5.1.0",
5
+ "transformers": "4.51.3",
6
+ "pytorch": "2.8.0+cu126"
7
+ },
8
+ "prompts": {
9
+ "query": "",
10
+ "document": ""
11
+ },
12
+ "default_prompt_name": null,
13
+ "similarity_fn_name": "cosine"
14
+ }
checkpoint-52/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12735f3a106f01897dc07522651bedf61ab577bc550f0ec0823f59ac498655a3
3
+ size 2239607176
checkpoint-52/modules.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "idx": 0,
4
+ "name": "0",
5
+ "path": "",
6
+ "type": "sentence_transformers.models.Transformer"
7
+ },
8
+ {
9
+ "idx": 1,
10
+ "name": "1",
11
+ "path": "1_Pooling",
12
+ "type": "sentence_transformers.models.Pooling"
13
+ },
14
+ {
15
+ "idx": 2,
16
+ "name": "2",
17
+ "path": "2_Normalize",
18
+ "type": "sentence_transformers.models.Normalize"
19
+ }
20
+ ]
checkpoint-52/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e985e11ca6344c991936a462d715ab4737a81f1e7ae1d7b9d5018c4289d6330a
3
+ size 4471067142
checkpoint-52/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97826e6974b5be8ca805050e2834698ca64f84d84dd6dafae567ebf4b5323c64
3
+ size 14645
checkpoint-52/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:124a2148c993404cea26c3ac1105405f4d64009654d6294d1bcc583643552613
3
+ size 1465
checkpoint-52/sentence_bert_config.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "max_seq_length": 512,
3
+ "do_lower_case": false
4
+ }
checkpoint-52/sentencepiece.bpe.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865
3
+ size 5069051
checkpoint-52/special_tokens_map.json ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<s>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "cls_token": {
10
+ "content": "<s>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "eos_token": {
17
+ "content": "</s>",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "mask_token": {
24
+ "content": "<mask>",
25
+ "lstrip": true,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ },
30
+ "pad_token": {
31
+ "content": "<pad>",
32
+ "lstrip": false,
33
+ "normalized": false,
34
+ "rstrip": false,
35
+ "single_word": false
36
+ },
37
+ "sep_token": {
38
+ "content": "</s>",
39
+ "lstrip": false,
40
+ "normalized": false,
41
+ "rstrip": false,
42
+ "single_word": false
43
+ },
44
+ "unk_token": {
45
+ "content": "<unk>",
46
+ "lstrip": false,
47
+ "normalized": false,
48
+ "rstrip": false,
49
+ "single_word": false
50
+ }
51
+ }
checkpoint-52/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:883b037111086fd4dfebbbc9b7cee11e1517b5e0c0514879478661440f137085
3
+ size 17082987
checkpoint-52/tokenizer_config.json ADDED
@@ -0,0 +1,55 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "<s>",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "1": {
12
+ "content": "<pad>",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "2": {
20
+ "content": "</s>",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "3": {
28
+ "content": "<unk>",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "250001": {
36
+ "content": "<mask>",
37
+ "lstrip": true,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ }
43
+ },
44
+ "bos_token": "<s>",
45
+ "clean_up_tokenization_spaces": true,
46
+ "cls_token": "<s>",
47
+ "eos_token": "</s>",
48
+ "extra_special_tokens": {},
49
+ "mask_token": "<mask>",
50
+ "model_max_length": 512,
51
+ "pad_token": "<pad>",
52
+ "sep_token": "</s>",
53
+ "tokenizer_class": "XLMRobertaTokenizer",
54
+ "unk_token": "<unk>"
55
+ }
checkpoint-52/trainer_state.json ADDED
@@ -0,0 +1,470 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_global_step": 39,
3
+ "best_metric": 0.37139192897263235,
4
+ "best_model_checkpoint": "intfloat/multilingual-e5-large/checkpoint-39",
5
+ "epoch": 4.0,
6
+ "eval_steps": 500,
7
+ "global_step": 52,
8
+ "is_hyper_param_search": false,
9
+ "is_local_process_zero": true,
10
+ "is_world_process_zero": true,
11
+ "log_history": [
12
+ {
13
+ "epoch": 0.8163265306122449,
14
+ "grad_norm": 307.08624267578125,
15
+ "learning_rate": 7.500000000000001e-06,
16
+ "loss": 31.5155,
17
+ "step": 10
18
+ },
19
+ {
20
+ "epoch": 1.0,
21
+ "eval_dim_1024_cosine_accuracy@1": 0.42509603072983354,
22
+ "eval_dim_1024_cosine_accuracy@10": 0.49295774647887325,
23
+ "eval_dim_1024_cosine_accuracy@3": 0.43085787451984636,
24
+ "eval_dim_1024_cosine_accuracy@5": 0.46030729833546735,
25
+ "eval_dim_1024_cosine_map@100": 0.508986346237021,
26
+ "eval_dim_1024_cosine_mrr@10": 0.4369535394183281,
27
+ "eval_dim_1024_cosine_ndcg@10": 0.4493804868009024,
28
+ "eval_dim_1024_cosine_precision@1": 0.42509603072983354,
29
+ "eval_dim_1024_cosine_precision@10": 0.376056338028169,
30
+ "eval_dim_1024_cosine_precision@3": 0.42402902262057185,
31
+ "eval_dim_1024_cosine_precision@5": 0.4133162612035851,
32
+ "eval_dim_1024_cosine_recall@1": 0.04813624827530403,
33
+ "eval_dim_1024_cosine_recall@10": 0.3150476790176975,
34
+ "eval_dim_1024_cosine_recall@3": 0.1404092551990217,
35
+ "eval_dim_1024_cosine_recall@5": 0.21147403835662126,
36
+ "eval_dim_128_cosine_accuracy@1": 0.31370038412291934,
37
+ "eval_dim_128_cosine_accuracy@10": 0.38156209987195905,
38
+ "eval_dim_128_cosine_accuracy@3": 0.31946222791293216,
39
+ "eval_dim_128_cosine_accuracy@5": 0.34571062740076824,
40
+ "eval_dim_128_cosine_map@100": 0.3991669558616212,
41
+ "eval_dim_128_cosine_mrr@10": 0.32517427799117904,
42
+ "eval_dim_128_cosine_ndcg@10": 0.33618283481296385,
43
+ "eval_dim_128_cosine_precision@1": 0.31370038412291934,
44
+ "eval_dim_128_cosine_precision@10": 0.2764404609475032,
45
+ "eval_dim_128_cosine_precision@3": 0.31284677763551,
46
+ "eval_dim_128_cosine_precision@5": 0.30422535211267604,
47
+ "eval_dim_128_cosine_recall@1": 0.037933385936292925,
48
+ "eval_dim_128_cosine_recall@10": 0.24798465115464788,
49
+ "eval_dim_128_cosine_recall@3": 0.11100168654049715,
50
+ "eval_dim_128_cosine_recall@5": 0.1670926413559068,
51
+ "eval_dim_256_cosine_accuracy@1": 0.36427656850192064,
52
+ "eval_dim_256_cosine_accuracy@10": 0.44814340588988477,
53
+ "eval_dim_256_cosine_accuracy@3": 0.36939820742637647,
54
+ "eval_dim_256_cosine_accuracy@5": 0.4090909090909091,
55
+ "eval_dim_256_cosine_map@100": 0.45841270037343096,
56
+ "eval_dim_256_cosine_mrr@10": 0.37879397597707415,
57
+ "eval_dim_256_cosine_ndcg@10": 0.3947006636735062,
58
+ "eval_dim_256_cosine_precision@1": 0.36427656850192064,
59
+ "eval_dim_256_cosine_precision@10": 0.3289372599231754,
60
+ "eval_dim_256_cosine_precision@3": 0.36363636363636365,
61
+ "eval_dim_256_cosine_precision@5": 0.3560819462227913,
62
+ "eval_dim_256_cosine_recall@1": 0.04277277943657814,
63
+ "eval_dim_256_cosine_recall@10": 0.28617844199333936,
64
+ "eval_dim_256_cosine_recall@3": 0.1253991943934714,
65
+ "eval_dim_256_cosine_recall@5": 0.18947388504512186,
66
+ "eval_dim_512_cosine_accuracy@1": 0.4084507042253521,
67
+ "eval_dim_512_cosine_accuracy@10": 0.4871959026888604,
68
+ "eval_dim_512_cosine_accuracy@3": 0.41357234314980795,
69
+ "eval_dim_512_cosine_accuracy@5": 0.4519846350832266,
70
+ "eval_dim_512_cosine_map@100": 0.495554245202425,
71
+ "eval_dim_512_cosine_mrr@10": 0.42213127248338495,
72
+ "eval_dim_512_cosine_ndcg@10": 0.43644305450989757,
73
+ "eval_dim_512_cosine_precision@1": 0.4084507042253521,
74
+ "eval_dim_512_cosine_precision@10": 0.36606914212548014,
75
+ "eval_dim_512_cosine_precision@3": 0.40738369611609043,
76
+ "eval_dim_512_cosine_precision@5": 0.39846350832266325,
77
+ "eval_dim_512_cosine_recall@1": 0.04628035514721453,
78
+ "eval_dim_512_cosine_recall@10": 0.30419701916496145,
79
+ "eval_dim_512_cosine_recall@3": 0.13522898183596205,
80
+ "eval_dim_512_cosine_recall@5": 0.20394662187726964,
81
+ "eval_dim_64_cosine_accuracy@1": 0.24199743918053776,
82
+ "eval_dim_64_cosine_accuracy@10": 0.29641485275288093,
83
+ "eval_dim_64_cosine_accuracy@3": 0.24775928297055058,
84
+ "eval_dim_64_cosine_accuracy@5": 0.26952624839948786,
85
+ "eval_dim_64_cosine_map@100": 0.31803601064541553,
86
+ "eval_dim_64_cosine_mrr@10": 0.25159771761884414,
87
+ "eval_dim_64_cosine_ndcg@10": 0.2620553065689597,
88
+ "eval_dim_64_cosine_precision@1": 0.24199743918053776,
89
+ "eval_dim_64_cosine_precision@10": 0.21568501920614594,
90
+ "eval_dim_64_cosine_precision@3": 0.24199743918053776,
91
+ "eval_dim_64_cosine_precision@5": 0.23649167733674775,
92
+ "eval_dim_64_cosine_recall@1": 0.029110868794154622,
93
+ "eval_dim_64_cosine_recall@10": 0.19521971714475267,
94
+ "eval_dim_64_cosine_recall@3": 0.08524734139651896,
95
+ "eval_dim_64_cosine_recall@5": 0.12921904680249943,
96
+ "eval_dim_768_cosine_accuracy@1": 0.4193341869398207,
97
+ "eval_dim_768_cosine_accuracy@10": 0.4910371318822023,
98
+ "eval_dim_768_cosine_accuracy@3": 0.4238156209987196,
99
+ "eval_dim_768_cosine_accuracy@5": 0.4551856594110115,
100
+ "eval_dim_768_cosine_map@100": 0.5037778776293926,
101
+ "eval_dim_768_cosine_mrr@10": 0.4315339003719285,
102
+ "eval_dim_768_cosine_ndcg@10": 0.44456410503401034,
103
+ "eval_dim_768_cosine_precision@1": 0.4193341869398207,
104
+ "eval_dim_768_cosine_precision@10": 0.37272727272727274,
105
+ "eval_dim_768_cosine_precision@3": 0.4180537772087068,
106
+ "eval_dim_768_cosine_precision@5": 0.4076824583866837,
107
+ "eval_dim_768_cosine_recall@1": 0.04699592881851732,
108
+ "eval_dim_768_cosine_recall@10": 0.3107289399017082,
109
+ "eval_dim_768_cosine_recall@3": 0.13721565163348118,
110
+ "eval_dim_768_cosine_recall@5": 0.20710427114944024,
111
+ "eval_runtime": 98.6525,
112
+ "eval_samples_per_second": 0.0,
113
+ "eval_sequential_score": 0.2620553065689597,
114
+ "eval_steps_per_second": 0.0,
115
+ "step": 13
116
+ },
117
+ {
118
+ "epoch": 1.5714285714285714,
119
+ "grad_norm": 280.07818603515625,
120
+ "learning_rate": 1.5833333333333333e-05,
121
+ "loss": 19.0409,
122
+ "step": 20
123
+ },
124
+ {
125
+ "epoch": 2.0,
126
+ "eval_dim_1024_cosine_accuracy@1": 0.3854033290653009,
127
+ "eval_dim_1024_cosine_accuracy@10": 0.45454545454545453,
128
+ "eval_dim_1024_cosine_accuracy@3": 0.3886043533930858,
129
+ "eval_dim_1024_cosine_accuracy@5": 0.41101152368758004,
130
+ "eval_dim_1024_cosine_map@100": 0.47259820099791205,
131
+ "eval_dim_1024_cosine_mrr@10": 0.39624870434729537,
132
+ "eval_dim_1024_cosine_ndcg@10": 0.4065329035406967,
133
+ "eval_dim_1024_cosine_precision@1": 0.3854033290653009,
134
+ "eval_dim_1024_cosine_precision@10": 0.3357874519846351,
135
+ "eval_dim_1024_cosine_precision@3": 0.3839095177123346,
136
+ "eval_dim_1024_cosine_precision@5": 0.3713188220230474,
137
+ "eval_dim_1024_cosine_recall@1": 0.0451686782205082,
138
+ "eval_dim_1024_cosine_recall@10": 0.2918225395020212,
139
+ "eval_dim_1024_cosine_recall@3": 0.13200270380544088,
140
+ "eval_dim_1024_cosine_recall@5": 0.19735476247586825,
141
+ "eval_dim_128_cosine_accuracy@1": 0.31562099871959026,
142
+ "eval_dim_128_cosine_accuracy@10": 0.39180537772087065,
143
+ "eval_dim_128_cosine_accuracy@3": 0.3207426376440461,
144
+ "eval_dim_128_cosine_accuracy@5": 0.352112676056338,
145
+ "eval_dim_128_cosine_map@100": 0.40471008477532144,
146
+ "eval_dim_128_cosine_mrr@10": 0.32839105339105285,
147
+ "eval_dim_128_cosine_ndcg@10": 0.34177784905202935,
148
+ "eval_dim_128_cosine_precision@1": 0.31562099871959026,
149
+ "eval_dim_128_cosine_precision@10": 0.280729833546735,
150
+ "eval_dim_128_cosine_precision@3": 0.31455399061032857,
151
+ "eval_dim_128_cosine_precision@5": 0.30640204865556975,
152
+ "eval_dim_128_cosine_recall@1": 0.03888088094516579,
153
+ "eval_dim_128_cosine_recall@10": 0.2550464126190524,
154
+ "eval_dim_128_cosine_recall@3": 0.11341113256173359,
155
+ "eval_dim_128_cosine_recall@5": 0.17046484922169536,
156
+ "eval_dim_256_cosine_accuracy@1": 0.3418693982074264,
157
+ "eval_dim_256_cosine_accuracy@10": 0.4238156209987196,
158
+ "eval_dim_256_cosine_accuracy@3": 0.34763124199743917,
159
+ "eval_dim_256_cosine_accuracy@5": 0.38092189500640206,
160
+ "eval_dim_256_cosine_map@100": 0.43770217754051305,
161
+ "eval_dim_256_cosine_mrr@10": 0.35596482938032165,
162
+ "eval_dim_256_cosine_ndcg@10": 0.36923043791328775,
163
+ "eval_dim_256_cosine_precision@1": 0.3418693982074264,
164
+ "eval_dim_256_cosine_precision@10": 0.30441741357234314,
165
+ "eval_dim_256_cosine_precision@3": 0.34165599658557405,
166
+ "eval_dim_256_cosine_precision@5": 0.3322663252240717,
167
+ "eval_dim_256_cosine_recall@1": 0.041410929155814194,
168
+ "eval_dim_256_cosine_recall@10": 0.2705196189189818,
169
+ "eval_dim_256_cosine_recall@3": 0.1212642412965687,
170
+ "eval_dim_256_cosine_recall@5": 0.18173918651563936,
171
+ "eval_dim_512_cosine_accuracy@1": 0.37708066581306016,
172
+ "eval_dim_512_cosine_accuracy@10": 0.4532650448143406,
173
+ "eval_dim_512_cosine_accuracy@3": 0.38092189500640206,
174
+ "eval_dim_512_cosine_accuracy@5": 0.4084507042253521,
175
+ "eval_dim_512_cosine_map@100": 0.4678017780580059,
176
+ "eval_dim_512_cosine_mrr@10": 0.3893670101416575,
177
+ "eval_dim_512_cosine_ndcg@10": 0.40127522003513455,
178
+ "eval_dim_512_cosine_precision@1": 0.37708066581306016,
179
+ "eval_dim_512_cosine_precision@10": 0.33156209987195906,
180
+ "eval_dim_512_cosine_precision@3": 0.37537345283824153,
181
+ "eval_dim_512_cosine_precision@5": 0.36402048655569774,
182
+ "eval_dim_512_cosine_recall@1": 0.04457309853297402,
183
+ "eval_dim_512_cosine_recall@10": 0.2883968018428671,
184
+ "eval_dim_512_cosine_recall@3": 0.13007205872054822,
185
+ "eval_dim_512_cosine_recall@5": 0.19449520589871025,
186
+ "eval_dim_64_cosine_accuracy@1": 0.26696542893725994,
187
+ "eval_dim_64_cosine_accuracy@10": 0.33098591549295775,
188
+ "eval_dim_64_cosine_accuracy@3": 0.27208706786171577,
189
+ "eval_dim_64_cosine_accuracy@5": 0.293213828425096,
190
+ "eval_dim_64_cosine_map@100": 0.34719730722747555,
191
+ "eval_dim_64_cosine_mrr@10": 0.2776957197731842,
192
+ "eval_dim_64_cosine_ndcg@10": 0.2881905192612941,
193
+ "eval_dim_64_cosine_precision@1": 0.26696542893725994,
194
+ "eval_dim_64_cosine_precision@10": 0.237708066581306,
195
+ "eval_dim_64_cosine_precision@3": 0.26717883055911223,
196
+ "eval_dim_64_cosine_precision@5": 0.2596670934699104,
197
+ "eval_dim_64_cosine_recall@1": 0.031692344067516816,
198
+ "eval_dim_64_cosine_recall@10": 0.21473974122936995,
199
+ "eval_dim_64_cosine_recall@3": 0.09327455064654774,
200
+ "eval_dim_64_cosine_recall@5": 0.14131510912407144,
201
+ "eval_dim_768_cosine_accuracy@1": 0.37451984635083224,
202
+ "eval_dim_768_cosine_accuracy@10": 0.4539052496798976,
203
+ "eval_dim_768_cosine_accuracy@3": 0.37900128040973113,
204
+ "eval_dim_768_cosine_accuracy@5": 0.40973111395646605,
205
+ "eval_dim_768_cosine_map@100": 0.4672061011440217,
206
+ "eval_dim_768_cosine_mrr@10": 0.38746671950897227,
207
+ "eval_dim_768_cosine_ndcg@10": 0.4004027303245026,
208
+ "eval_dim_768_cosine_precision@1": 0.37451984635083224,
209
+ "eval_dim_768_cosine_precision@10": 0.3318181818181818,
210
+ "eval_dim_768_cosine_precision@3": 0.3734528382415706,
211
+ "eval_dim_768_cosine_precision@5": 0.3632522407170295,
212
+ "eval_dim_768_cosine_recall@1": 0.04413921317349132,
213
+ "eval_dim_768_cosine_recall@10": 0.28955317519546525,
214
+ "eval_dim_768_cosine_recall@3": 0.12896663310051748,
215
+ "eval_dim_768_cosine_recall@5": 0.19376203165061448,
216
+ "eval_runtime": 98.4244,
217
+ "eval_samples_per_second": 0.0,
218
+ "eval_sequential_score": 0.2881905192612941,
219
+ "eval_steps_per_second": 0.0,
220
+ "step": 26
221
+ },
222
+ {
223
+ "epoch": 2.326530612244898,
224
+ "grad_norm": 305.66259765625,
225
+ "learning_rate": 1.9973569167005725e-05,
226
+ "loss": 14.5314,
227
+ "step": 30
228
+ },
229
+ {
230
+ "epoch": 3.0,
231
+ "eval_dim_1024_cosine_accuracy@1": 0.4180537772087068,
232
+ "eval_dim_1024_cosine_accuracy@10": 0.49039692701664533,
233
+ "eval_dim_1024_cosine_accuracy@3": 0.42189500640204863,
234
+ "eval_dim_1024_cosine_accuracy@5": 0.4500640204865557,
235
+ "eval_dim_1024_cosine_map@100": 0.506794523350519,
236
+ "eval_dim_1024_cosine_mrr@10": 0.42985717334308843,
237
+ "eval_dim_1024_cosine_ndcg@10": 0.44178501209869797,
238
+ "eval_dim_1024_cosine_precision@1": 0.4180537772087068,
239
+ "eval_dim_1024_cosine_precision@10": 0.36869398207426374,
240
+ "eval_dim_1024_cosine_precision@3": 0.4163465642338881,
241
+ "eval_dim_1024_cosine_precision@5": 0.4043533930857874,
242
+ "eval_dim_1024_cosine_recall@1": 0.04734422767263886,
243
+ "eval_dim_1024_cosine_recall@10": 0.308531274625124,
244
+ "eval_dim_1024_cosine_recall@3": 0.138064233626932,
245
+ "eval_dim_1024_cosine_recall@5": 0.2069980430010945,
246
+ "eval_dim_128_cosine_accuracy@1": 0.34699103713188223,
247
+ "eval_dim_128_cosine_accuracy@10": 0.4212548015364917,
248
+ "eval_dim_128_cosine_accuracy@3": 0.35147247119078107,
249
+ "eval_dim_128_cosine_accuracy@5": 0.37900128040973113,
250
+ "eval_dim_128_cosine_map@100": 0.4338211299784659,
251
+ "eval_dim_128_cosine_mrr@10": 0.35916305916305874,
252
+ "eval_dim_128_cosine_ndcg@10": 0.37139192897263235,
253
+ "eval_dim_128_cosine_precision@1": 0.34699103713188223,
254
+ "eval_dim_128_cosine_precision@10": 0.3042893725992318,
255
+ "eval_dim_128_cosine_precision@3": 0.34571062740076824,
256
+ "eval_dim_128_cosine_precision@5": 0.3352112676056338,
257
+ "eval_dim_128_cosine_recall@1": 0.04217848526747235,
258
+ "eval_dim_128_cosine_recall@10": 0.2706183968947745,
259
+ "eval_dim_128_cosine_recall@3": 0.12288848071178002,
260
+ "eval_dim_128_cosine_recall@5": 0.18344012521240954,
261
+ "eval_dim_256_cosine_accuracy@1": 0.38348271446862997,
262
+ "eval_dim_256_cosine_accuracy@10": 0.4551856594110115,
263
+ "eval_dim_256_cosine_accuracy@3": 0.3886043533930858,
264
+ "eval_dim_256_cosine_accuracy@5": 0.4206145966709347,
265
+ "eval_dim_256_cosine_map@100": 0.4709582085612654,
266
+ "eval_dim_256_cosine_mrr@10": 0.3957850639188662,
267
+ "eval_dim_256_cosine_ndcg@10": 0.4087462230477571,
268
+ "eval_dim_256_cosine_precision@1": 0.38348271446862997,
269
+ "eval_dim_256_cosine_precision@10": 0.33886043533930854,
270
+ "eval_dim_256_cosine_precision@3": 0.382202304737516,
271
+ "eval_dim_256_cosine_precision@5": 0.3718309859154929,
272
+ "eval_dim_256_cosine_recall@1": 0.04466034705404223,
273
+ "eval_dim_256_cosine_recall@10": 0.2892016292717267,
274
+ "eval_dim_256_cosine_recall@3": 0.1301795023253766,
275
+ "eval_dim_256_cosine_recall@5": 0.19500340584044382,
276
+ "eval_dim_512_cosine_accuracy@1": 0.4065300896286812,
277
+ "eval_dim_512_cosine_accuracy@10": 0.4814340588988476,
278
+ "eval_dim_512_cosine_accuracy@3": 0.41229193341869397,
279
+ "eval_dim_512_cosine_accuracy@5": 0.44494238156209986,
280
+ "eval_dim_512_cosine_map@100": 0.49555759572196095,
281
+ "eval_dim_512_cosine_mrr@10": 0.41950236774180394,
282
+ "eval_dim_512_cosine_ndcg@10": 0.4329095460408428,
283
+ "eval_dim_512_cosine_precision@1": 0.4065300896286812,
284
+ "eval_dim_512_cosine_precision@10": 0.3596030729833547,
285
+ "eval_dim_512_cosine_precision@3": 0.4054630815194195,
286
+ "eval_dim_512_cosine_precision@5": 0.3947503201024327,
287
+ "eval_dim_512_cosine_recall@1": 0.047372341735862133,
288
+ "eval_dim_512_cosine_recall@10": 0.3071623578952262,
289
+ "eval_dim_512_cosine_recall@3": 0.1383106496582531,
290
+ "eval_dim_512_cosine_recall@5": 0.20757258542171747,
291
+ "eval_dim_64_cosine_accuracy@1": 0.3207426376440461,
292
+ "eval_dim_64_cosine_accuracy@10": 0.3725992317541613,
293
+ "eval_dim_64_cosine_accuracy@3": 0.322663252240717,
294
+ "eval_dim_64_cosine_accuracy@5": 0.3405889884763124,
295
+ "eval_dim_64_cosine_map@100": 0.3933467041096336,
296
+ "eval_dim_64_cosine_mrr@10": 0.32884732638253733,
297
+ "eval_dim_64_cosine_ndcg@10": 0.3371953828075091,
298
+ "eval_dim_64_cosine_precision@1": 0.3207426376440461,
299
+ "eval_dim_64_cosine_precision@10": 0.2797055057618438,
300
+ "eval_dim_64_cosine_precision@3": 0.3188220230473751,
301
+ "eval_dim_64_cosine_precision@5": 0.3088348271446863,
302
+ "eval_dim_64_cosine_recall@1": 0.036318765090758674,
303
+ "eval_dim_64_cosine_recall@10": 0.23840960718091392,
304
+ "eval_dim_64_cosine_recall@3": 0.10562189493083342,
305
+ "eval_dim_64_cosine_recall@5": 0.15867125525021739,
306
+ "eval_dim_768_cosine_accuracy@1": 0.41037131882202305,
307
+ "eval_dim_768_cosine_accuracy@10": 0.4833546734955186,
308
+ "eval_dim_768_cosine_accuracy@3": 0.4142125480153649,
309
+ "eval_dim_768_cosine_accuracy@5": 0.44430217669654287,
310
+ "eval_dim_768_cosine_map@100": 0.500478306774528,
311
+ "eval_dim_768_cosine_mrr@10": 0.4224889742495374,
312
+ "eval_dim_768_cosine_ndcg@10": 0.4349862241563486,
313
+ "eval_dim_768_cosine_precision@1": 0.41037131882202305,
314
+ "eval_dim_768_cosine_precision@10": 0.36165172855313704,
315
+ "eval_dim_768_cosine_precision@3": 0.4086641058472044,
316
+ "eval_dim_768_cosine_precision@5": 0.3969270166453265,
317
+ "eval_dim_768_cosine_recall@1": 0.047186779325657804,
318
+ "eval_dim_768_cosine_recall@10": 0.30540044861465576,
319
+ "eval_dim_768_cosine_recall@3": 0.1375709294981283,
320
+ "eval_dim_768_cosine_recall@5": 0.20603724780478358,
321
+ "eval_runtime": 98.5908,
322
+ "eval_samples_per_second": 0.0,
323
+ "eval_sequential_score": 0.3371953828075091,
324
+ "eval_steps_per_second": 0.0,
325
+ "step": 39
326
+ },
327
+ {
328
+ "epoch": 3.0816326530612246,
329
+ "grad_norm": 255.65982055664062,
330
+ "learning_rate": 1.9762960071199334e-05,
331
+ "loss": 8.6778,
332
+ "step": 40
333
+ },
334
+ {
335
+ "epoch": 3.8979591836734695,
336
+ "grad_norm": 470.4803771972656,
337
+ "learning_rate": 1.9346189253489888e-05,
338
+ "loss": 6.0257,
339
+ "step": 50
340
+ },
341
+ {
342
+ "epoch": 4.0,
343
+ "eval_dim_1024_cosine_accuracy@1": 0.4046094750320102,
344
+ "eval_dim_1024_cosine_accuracy@10": 0.47823303457106275,
345
+ "eval_dim_1024_cosine_accuracy@3": 0.4090909090909091,
346
+ "eval_dim_1024_cosine_accuracy@5": 0.43918053777208704,
347
+ "eval_dim_1024_cosine_map@100": 0.490599623630225,
348
+ "eval_dim_1024_cosine_mrr@10": 0.4168417068064951,
349
+ "eval_dim_1024_cosine_ndcg@10": 0.42913551824501384,
350
+ "eval_dim_1024_cosine_precision@1": 0.4046094750320102,
351
+ "eval_dim_1024_cosine_precision@10": 0.3565941101152369,
352
+ "eval_dim_1024_cosine_precision@3": 0.40311566367904395,
353
+ "eval_dim_1024_cosine_precision@5": 0.39180537772087065,
354
+ "eval_dim_1024_cosine_recall@1": 0.04660606778759063,
355
+ "eval_dim_1024_cosine_recall@10": 0.3014663479400921,
356
+ "eval_dim_1024_cosine_recall@3": 0.13592596883673455,
357
+ "eval_dim_1024_cosine_recall@5": 0.20379253880710943,
358
+ "eval_dim_128_cosine_accuracy@1": 0.34314980793854033,
359
+ "eval_dim_128_cosine_accuracy@10": 0.4148527528809219,
360
+ "eval_dim_128_cosine_accuracy@3": 0.34763124199743917,
361
+ "eval_dim_128_cosine_accuracy@5": 0.37708066581306016,
362
+ "eval_dim_128_cosine_map@100": 0.4276696379169563,
363
+ "eval_dim_128_cosine_mrr@10": 0.35513180090644836,
364
+ "eval_dim_128_cosine_ndcg@10": 0.36765573601526275,
365
+ "eval_dim_128_cosine_precision@1": 0.34314980793854033,
366
+ "eval_dim_128_cosine_precision@10": 0.302752880921895,
367
+ "eval_dim_128_cosine_precision@3": 0.3418693982074264,
368
+ "eval_dim_128_cosine_precision@5": 0.3322663252240717,
369
+ "eval_dim_128_cosine_recall@1": 0.040652627677675406,
370
+ "eval_dim_128_cosine_recall@10": 0.26330336421247125,
371
+ "eval_dim_128_cosine_recall@3": 0.1184519992454523,
372
+ "eval_dim_128_cosine_recall@5": 0.1774839552040709,
373
+ "eval_dim_256_cosine_accuracy@1": 0.3738796414852753,
374
+ "eval_dim_256_cosine_accuracy@10": 0.44558258642765686,
375
+ "eval_dim_256_cosine_accuracy@3": 0.37772087067861715,
376
+ "eval_dim_256_cosine_accuracy@5": 0.40717029449423814,
377
+ "eval_dim_256_cosine_map@100": 0.45855798848430374,
378
+ "eval_dim_256_cosine_mrr@10": 0.38572571794402755,
379
+ "eval_dim_256_cosine_ndcg@10": 0.3980442434686935,
380
+ "eval_dim_256_cosine_precision@1": 0.3738796414852753,
381
+ "eval_dim_256_cosine_precision@10": 0.3297695262483995,
382
+ "eval_dim_256_cosine_precision@3": 0.37238583013230897,
383
+ "eval_dim_256_cosine_precision@5": 0.3615877080665813,
384
+ "eval_dim_256_cosine_recall@1": 0.043086085492826574,
385
+ "eval_dim_256_cosine_recall@10": 0.2792649180924836,
386
+ "eval_dim_256_cosine_recall@3": 0.125747799799009,
387
+ "eval_dim_256_cosine_recall@5": 0.18837022600852496,
388
+ "eval_dim_512_cosine_accuracy@1": 0.39884763124199746,
389
+ "eval_dim_512_cosine_accuracy@10": 0.47823303457106275,
390
+ "eval_dim_512_cosine_accuracy@3": 0.4052496798975672,
391
+ "eval_dim_512_cosine_accuracy@5": 0.44558258642765686,
392
+ "eval_dim_512_cosine_map@100": 0.4876319198894288,
393
+ "eval_dim_512_cosine_mrr@10": 0.41307745462675005,
394
+ "eval_dim_512_cosine_ndcg@10": 0.42824151108259556,
395
+ "eval_dim_512_cosine_precision@1": 0.39884763124199746,
396
+ "eval_dim_512_cosine_precision@10": 0.35793854033290645,
397
+ "eval_dim_512_cosine_precision@3": 0.3975672215108835,
398
+ "eval_dim_512_cosine_precision@5": 0.3888604353393086,
399
+ "eval_dim_512_cosine_recall@1": 0.04570727180608771,
400
+ "eval_dim_512_cosine_recall@10": 0.2993652309972795,
401
+ "eval_dim_512_cosine_recall@3": 0.13329368345632836,
402
+ "eval_dim_512_cosine_recall@5": 0.2006035854063678,
403
+ "eval_dim_64_cosine_accuracy@1": 0.3079385403329065,
404
+ "eval_dim_64_cosine_accuracy@10": 0.36555697823303457,
405
+ "eval_dim_64_cosine_accuracy@3": 0.31241997439180536,
406
+ "eval_dim_64_cosine_accuracy@5": 0.33290653008962867,
407
+ "eval_dim_64_cosine_map@100": 0.38184314430829974,
408
+ "eval_dim_64_cosine_mrr@10": 0.31748394406845065,
409
+ "eval_dim_64_cosine_ndcg@10": 0.3275369456141822,
410
+ "eval_dim_64_cosine_precision@1": 0.3079385403329065,
411
+ "eval_dim_64_cosine_precision@10": 0.27215108834827145,
412
+ "eval_dim_64_cosine_precision@3": 0.3070849338454972,
413
+ "eval_dim_64_cosine_precision@5": 0.29820742637644043,
414
+ "eval_dim_64_cosine_recall@1": 0.03504677697523653,
415
+ "eval_dim_64_cosine_recall@10": 0.23026653514933906,
416
+ "eval_dim_64_cosine_recall@3": 0.10211269541567973,
417
+ "eval_dim_64_cosine_recall@5": 0.15297976910096123,
418
+ "eval_dim_768_cosine_accuracy@1": 0.3994878361075544,
419
+ "eval_dim_768_cosine_accuracy@10": 0.4737516005121639,
420
+ "eval_dim_768_cosine_accuracy@3": 0.4046094750320102,
421
+ "eval_dim_768_cosine_accuracy@5": 0.4359795134443022,
422
+ "eval_dim_768_cosine_map@100": 0.48680507317454147,
423
+ "eval_dim_768_cosine_mrr@10": 0.41201019246793846,
424
+ "eval_dim_768_cosine_ndcg@10": 0.4244383191680289,
425
+ "eval_dim_768_cosine_precision@1": 0.3994878361075544,
426
+ "eval_dim_768_cosine_precision@10": 0.352752880921895,
427
+ "eval_dim_768_cosine_precision@3": 0.39820742637644047,
428
+ "eval_dim_768_cosine_precision@5": 0.3868117797695263,
429
+ "eval_dim_768_cosine_recall@1": 0.046132270416131195,
430
+ "eval_dim_768_cosine_recall@10": 0.29681183299989666,
431
+ "eval_dim_768_cosine_recall@3": 0.13453018491697852,
432
+ "eval_dim_768_cosine_recall@5": 0.20078864250336506,
433
+ "eval_runtime": 98.6751,
434
+ "eval_samples_per_second": 0.0,
435
+ "eval_sequential_score": 0.3275369456141822,
436
+ "eval_steps_per_second": 0.0,
437
+ "step": 52
438
+ }
439
+ ],
440
+ "logging_steps": 10,
441
+ "max_steps": 240,
442
+ "num_input_tokens_seen": 0,
443
+ "num_train_epochs": 20,
444
+ "save_steps": 500,
445
+ "stateful_callbacks": {
446
+ "EarlyStoppingCallback": {
447
+ "args": {
448
+ "early_stopping_patience": 2,
449
+ "early_stopping_threshold": 0.0
450
+ },
451
+ "attributes": {
452
+ "early_stopping_patience_counter": 1
453
+ }
454
+ },
455
+ "TrainerControl": {
456
+ "args": {
457
+ "should_epoch_stop": false,
458
+ "should_evaluate": false,
459
+ "should_log": false,
460
+ "should_save": true,
461
+ "should_training_stop": false
462
+ },
463
+ "attributes": {}
464
+ }
465
+ },
466
+ "total_flos": 0.0,
467
+ "train_batch_size": 8,
468
+ "trial_name": null,
469
+ "trial_params": null
470
+ }
checkpoint-52/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd906d94b017c1a7fa871b608776d19ecf4218c10c253401fe78ba8ce84435be
3
+ size 6097
checkpoint-65/1_Pooling/config.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "word_embedding_dimension": 1024,
3
+ "pooling_mode_cls_token": false,
4
+ "pooling_mode_mean_tokens": true,
5
+ "pooling_mode_max_tokens": false,
6
+ "pooling_mode_mean_sqrt_len_tokens": false,
7
+ "pooling_mode_weightedmean_tokens": false,
8
+ "pooling_mode_lasttoken": false,
9
+ "include_prompt": true
10
+ }
checkpoint-65/README.md ADDED
@@ -0,0 +1,1642 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ language:
3
+ - en
4
+ license: apache-2.0
5
+ tags:
6
+ - sentence-transformers
7
+ - sentence-similarity
8
+ - feature-extraction
9
+ - dense
10
+ - generated_from_trainer
11
+ - dataset_size:391
12
+ - loss:MatryoshkaLoss
13
+ - loss:MultipleNegativesRankingLoss
14
+ base_model: intfloat/multilingual-e5-large
15
+ widget:
16
+ - source_sentence: What is the responsibility of assisting and advising the data subjects
17
+ in exercising their rights?
18
+ sentences:
19
+ - '1.Personal data shall be: (a) processed lawfully, fairly and in a transparent
20
+ manner in relation to the data subject (‘lawfulness, fairness and transparency’);
21
+ (b) collected for specified, explicit and legitimate purposes and not further
22
+ processed in a manner that is incompatible with those purposes; further processing
23
+ for archiving purposes in the public interest, scientific or historical research
24
+ purposes or statistical purposes shall, in accordance with Article 89(1), not
25
+ be considered to be incompatible with the initial purposes (‘purpose limitation’);
26
+ (c) adequate, relevant and limited to what is necessary in relation to the purposes
27
+ for which they are processed (‘data minimisation’); (d) accurate and, where necessary,
28
+ kept up to date; every reasonable step must be taken to ensure that personal data
29
+ that are inaccurate, having regard to the purposes for which they are processed,
30
+ are erased or rectified without delay (‘accuracy’); 4.5.2016 L 119/35 (1) Directive
31
+ (EU) 2015/1535 of the European Parliament and of the Council of 9 September 2015
32
+ laying down a procedure for the provision of information in the field of technical
33
+ regulations and of rules on Information Society services (OJ L 241, 17.9.2015,
34
+ p. 1). (e) kept in a form which permits identification of data subjects for no
35
+ longer than is necessary for the purposes for which the personal data are processed;
36
+ personal data may be stored for longer periods insofar as the personal data will
37
+ be processed solely for archiving purposes in the public interest, scientific
38
+ or historical research purposes or statistical purposes in accordance with Article
39
+ 89(1) subject to implementation of the appropriate technical and organisational
40
+ measures required by this Regulation in order to safeguard the rights and freedoms
41
+ of the data subject (‘storage limitation’); (f) processed in a manner that ensures
42
+ appropriate security of the personal data, including protection against unauthorised
43
+ or unlawful processing and against accidental loss, destruction or damage, using
44
+ appropriate technical or organisational measures (‘integrity and confidentiality’).
45
+
46
+ 2.The controller shall be responsible for, and be able to demonstrate compliance
47
+ with, paragraph 1 (‘accountability’).'
48
+ - '1.A transfer of personal data to a third country or an international organisation
49
+ may take place where the Commission has decided that the third country, a territory
50
+ or one or more specified sectors within that third country, or the international
51
+ organisation in question ensures an adequate level of protection. Such a transfer
52
+ shall not require any specific authorisation.
53
+
54
+ 2.When assessing the adequacy of the level of protection, the Commission shall,
55
+ in particular, take account of the following elements: (a) the rule of law, respect
56
+ for human rights and fundamental freedoms, relevant legislation, both general
57
+ and sectoral, including concerning public security, defence, national security
58
+ and criminal law and the access of public authorities to personal data, as well
59
+ as the implementation of such legislation, data protection rules, professional
60
+ rules and security measures, including rules for the onward transfer of personal
61
+ data to another third country or international organisation which are complied
62
+ with in that country or international organisation, case-law, as well as effective
63
+ and enforceable data subject rights and effective administrative and judicial
64
+ redress for the data subjects whose personal data are being transferred; (b) the
65
+ existence and effective functioning of one or more independent supervisory authorities
66
+ in the third country or to which an international organisation is subject, with
67
+ responsibility for ensuring and enforcing compliance with the data protection
68
+ rules, including adequate enforcement powers, for assisting and advising the data
69
+ subjects in exercising their rights and for cooperation with the supervisory authorities
70
+ of the Member States; and (c) the international commitments the third country
71
+ or international organisation concerned has entered into, or other obligations
72
+ arising from legally binding conventions or instruments as well as from its participation
73
+ in multilateral or regional systems, in particular in relation to the protection
74
+ of personal data.
75
+
76
+ 3.The Commission, after assessing the adequacy of the level of protection, may
77
+ decide, by means of implementing act, that a third country, a territory or one
78
+ or more specified sectors within a third country, or an international organisation
79
+ ensures an adequate level of protection within the meaning of paragraph 2 of this
80
+ Article. The implementing act shall provide for a mechanism for a periodic review,
81
+ at least every four years, which shall take into account all relevant developments
82
+ in the third country or international organisation. The implementing act shall
83
+ specify its territorial and sectoral application and, where applicable, identify
84
+ the supervisory authority or authorities referred to in point (b) of paragraph
85
+ 2 of this Article. The implementing act shall be adopted in accordance with the
86
+ examination procedure referred to in Article 93(2).
87
+
88
+ 4.The Commission shall, on an ongoing basis, monitor developments in third countries
89
+ and international organisations that could affect the functioning of decisions
90
+ adopted pursuant to paragraph 3 of this Article and decisions adopted on the basis
91
+ of Article 25(6) of Directive 95/46/EC.
92
+
93
+ 5.The Commission shall, where available information reveals, in particular following
94
+ the review referred to in paragraph 3 of this Article, that a third country, a
95
+ territory or one or more specified sectors within a third country, or an international
96
+ organisation no longer ensures an adequate level of protection within the meaning
97
+ of paragraph 2 of this Article, to the extent necessary, repeal, amend or suspend
98
+ the decision referred to in paragraph 3 of this Article by means of implementing
99
+ acts without retro-active effect. Those implementing acts shall be adopted in
100
+ accordance with the examination procedure referred to in Article 93(2). On duly
101
+ justified imperative grounds of urgency, the Commission shall adopt immediately
102
+ applicable implementing acts in accordance with the procedure referred to in Article
103
+ 93(3).
104
+
105
+ 6.The Commission shall enter into consultations with the third country or international
106
+ organisation with a view to remedying the situation giving rise to the decision
107
+ made pursuant to paragraph 5
108
+
109
+ 7.A decision pursuant to paragraph 5 of this Article is without prejudice to transfers
110
+ of personal data to the third country, a territory or one or more specified sectors
111
+ within that third country, or the international organisation in question pursuant
112
+ to Articles 46 to 49
113
+
114
+ 8.The Commission shall publish in the Official Journal of the European Union and
115
+ on its website a list of the third countries, territories and specified sectors
116
+ within a third country and international organisations for which it has decided
117
+ that an adequate level of protection is or is no longer ensured.
118
+
119
+ 9.Decisions adopted by the Commission on the basis of Article 25(6) of Directive
120
+ 95/46/EC shall remain in force until amended, replaced or repealed by a Commission
121
+ Decision adopted in accordance with paragraph 3 or 5 of this Article.'
122
+ - The legal systems of Denmark and Estonia do not allow for administrative fines
123
+ as set out in this Regulation. The rules on administrative fines may be applied
124
+ in such a manner that in Denmark the fine is imposed by competent national courts
125
+ as a criminal penalty and in Estonia the fine is imposed by the supervisory authority
126
+ in the framework of a misdemeanour procedure, provided that such an application
127
+ of the rules in those Member States has an equivalent effect to administrative
128
+ fines imposed by supervisory authorities. Therefore the competent national courts
129
+ should take into account the recommendation by the supervisory authority initiating
130
+ the fine. In any event, the fines imposed should be effective, proportionate and
131
+ dissuasive.
132
+ - source_sentence: Is the fine mandatory for the described offense?
133
+ sentences:
134
+ - "1.Each supervisory authority shall ensure that the imposition of administrative\
135
+ \ fines pursuant to this Article in respect of infringements of this Regulation\
136
+ \ referred to in paragraphs 4, 5 and 6 shall in each individual case be effective,\
137
+ \ proportionate and dissuasive.\n2.Administrative fines shall, depending on the\
138
+ \ circumstances of each individual case, be imposed in addition to, or instead\
139
+ \ of, measures referred to in points (a) to (h) and (j) of Article 58(2). When\
140
+ \ deciding whether to impose an administrative fine and deciding on the amount\
141
+ \ of the administrative fine in each individual case due regard shall be given\
142
+ \ to the following: (a) the nature, gravity and duration of the infringement\
143
+ \ taking into account the nature scope or purpose of the processing concerned\
144
+ \ as well as the number of data subjects affected and the level of damage suffered\
145
+ \ by them; (b) the intentional or negligent character of the infringement; (c)\
146
+ \ any action taken by the controller or processor to mitigate the damage suffered\
147
+ \ by data subjects; (d) the degree of responsibility of the controller or processor\
148
+ \ taking into account technical and organisational measures implemented by them\
149
+ \ pursuant to Articles 25 and 32; (e) any relevant previous infringements by\
150
+ \ the controller or processor; (f) the degree of cooperation with the supervisory\
151
+ \ authority, in order to remedy the infringement and mitigate the possible adverse\
152
+ \ effects of the infringement; (g) the categories of personal data affected by\
153
+ \ the infringement; (h) the manner in which the infringement became known to\
154
+ \ the supervisory authority, in particular whether, and if so to what extent,\
155
+ \ the controller or processor notified the infringement; (i) where measures referred\
156
+ \ to in Article 58(2) have previously been ordered against the controller or processor\
157
+ \ concerned with regard to the same subject-matter, compliance with those measures;\
158
+ \ (j) adherence to approved codes of conduct pursuant to Article 40 or approved\
159
+ \ certification mechanisms pursuant to Article 42; and (k) any other aggravating\
160
+ \ or mitigating factor applicable to the circumstances of the case, such as financial\
161
+ \ benefits gained, or losses avoided, directly or indirectly, from the infringement.\n\
162
+ 3.If a controller or processor intentionally or negligently, for the same or linked\
163
+ \ processing operations, infringes several provisions of this Regulation, the\
164
+ \ total amount of the administrative fine shall not exceed the amount specified\
165
+ \ for the gravest infringement.\n4.Infringements of the following provisions shall,\
166
+ \ in accordance with paragraph 2, be subject to administrative fines up to 10\
167
+ \ 000 000 EUR, or in the case of an undertaking, up to 2 % of the total worldwide\
168
+ \ annual turnover of the preceding financial year, whichever is higher: (a) the\
169
+ \ obligations of the controller and the processor pursuant to Articles 8, 11,\
170
+ \ 25 to 39 and 42 and 43; (b) the obligations of the certification body pursuant\
171
+ \ to Articles 42 and 43; (c) the obligations of the monitoring body pursuant\
172
+ \ to Article 41(4). 4.5.2016 L 119/82 \n5.Infringements of the following provisions\
173
+ \ shall, in accordance with paragraph 2, be subject to administrative fines up\
174
+ \ to 20 000 000 EUR, or in the case of an undertaking, up to 4 % of the total\
175
+ \ worldwide annual turnover of the preceding financial year, whichever is higher:\
176
+ \ (a) the basic principles for processing, including conditions for consent,\
177
+ \ pursuant to Articles 5, 6, 7 and 9; (b) the data subjects' rights pursuant\
178
+ \ to Articles 12 to 22; (c) the transfers of personal data to a recipient in\
179
+ \ a third country or an international organisation pursuant to Articles 44 to\
180
+ \ 49; (d) any obligations pursuant to Member State law adopted under Chapter\
181
+ \ IX; (e) non-compliance with an order or a temporary or definitive limitation\
182
+ \ on processing or the suspension of data flows by the supervisory authority pursuant\
183
+ \ to Article 58(2) or failure to provide access in violation of Article 58(1).\n\
184
+ 6.Non-compliance with an order by the supervisory authority as referred to in\
185
+ \ Article 58(2) shall, in accordance with paragraph 2 of this Article, be subject\
186
+ \ to administrative fines up to 20 000 000 EUR, or in the case of an undertaking,\
187
+ \ up to 4 % of the total worldwide annual turnover of the preceding financial\
188
+ \ year, whichever is higher.\n7.Without prejudice to the corrective powers of\
189
+ \ supervisory authorities pursuant to Article 58(2), each Member State may lay\
190
+ \ down the rules on whether and to what extent administrative fines may be imposed\
191
+ \ on public authorities and bodies established in that Member State.\n8.The exercise\
192
+ \ by the supervisory authority of its powers under this Article shall be subject\
193
+ \ to appropriate procedural safeguards in accordance with Union and Member State\
194
+ \ law, including effective judicial remedy and due process.\n9.Where the legal\
195
+ \ system of the Member State does not provide for administrative fines, this Article\
196
+ \ may be applied in such a manner that the fine is initiated by the competent\
197
+ \ supervisory authority and imposed by competent national courts, while ensuring\
198
+ \ that those legal remedies are effective and have an equivalent effect to the\
199
+ \ administrative fines imposed by supervisory authorities. In any event, the fines\
200
+ \ imposed shall be effective, proportionate and dissuasive. Those Member States\
201
+ \ shall notify to the Commission the provisions of their laws which they adopt\
202
+ \ pursuant to this paragraph by 25 May 2018 and, without delay, any subsequent\
203
+ \ amendment law or amendment affecting them."
204
+ - "Court (Civil/Criminal): Criminal \nProvisions: Article 386 of the Penal Code\
205
+ \ \nTime of commission of the act: \nResult (innocent, guilty): \nReasoning:\
206
+ \ Conviction for computer fraud committed repeatedly and professionally with a\
207
+ \ total benefit and damage exceeding €30,000. According to the majority opinion,\
208
+ \ the charge is substantiated in both its objective and subjective aspects, and\
209
+ \ the defendant must be declared guilty of the aforementioned criminal acts of\
210
+ \ fraud by means of a computer, committed repeatedly by a perpetrator acting professionally,\
211
+ \ where the total financial benefit and corresponding damage exceed the amount\
212
+ \ of €30,000, as well as for repeated embezzlement.\n\nFacts: The defendant accessed\
213
+ \ a website using a computer, employing, without the knowledge and consent of\
214
+ \ the complainants, the access codes for the electronic management system of the\
215
+ \ bank accounts held by the complainants at a Bank, and transferred money through\
216
+ \ electronically transmitted orders from the complainants' accounts to her own\
217
+ \ account. Specifically, during the period from June 2007 to June 2008, after\
218
+ \ unlawfully acquiring the aforementioned STICK containing the access codes, she\
219
+ \ accessed a website maintained by ..., using, without the complainants' knowledge\
220
+ \ (without their consent or approval), the access codes for the electronic management\
221
+ \ system of the bank accounts held at the aforementioned Bank, transferring through\
222
+ \ electronically transmitted orders to the joint account number ... of the complainants\
223
+ \ from bank accounts numbered ..., ..., and ..., the total amount of €55,710,\
224
+ \ as detailed in the orders, and subsequently, using an ATM card, she gradually\
225
+ \ withdrew from the aforementioned account number ..., the total amount of €55,710,\
226
+ \ making 84 individual withdrawals from automatic teller machines. In addition,\
227
+ \ the defendant, during the period from June 2008 to November 2008, in the same\
228
+ \ exact manner (through the electronic management system of the bank accounts),\
229
+ \ transferred through electronically transmitted orders to account number ...,\
230
+ \ which she had opened at ..., from the complainants' bank accounts numbered ...,\
231
+ \ ..., ..., ..., and ..., the total amount of €73,942, as detailed in the orders\
232
+ \ regarding the transfers of these amounts. Furthermore, during the period from\
233
+ \ February 2008 to November 2008, through multiple acts constituting a continuation\
234
+ \ of the crime, although she had received from the first complainant ... the amounts\
235
+ \ of €695.04, €695.04, and €845.04, in order to pay his insurance contributions\
236
+ \ to O.A.E.E. for the periods of January-February 2008, May-June 2008, and September-October\
237
+ \ 2008, as well as the amounts of €250 and €280, in order to settle credit card\
238
+ \ bills for \"...\", respectively, and from the second complainant ... she received\
239
+ \ the amounts of €283.64, €419.26, and €385.38, to pay the latter's insurance\
240
+ \ contributions to O.A.E.E. for the periods of July-August 2007, May-June 2008,\
241
+ \ September-October 2008, and November-December 2008, as well as the amount of\
242
+ \ €1,888.03 for the settlement of VAT, she never paid the above amounts to settle\
243
+ \ the aforementioned obligations, nor did she return them to the complainants,\
244
+ \ despite being urged to do so, but incorporated them into her assets and wrongfully\
245
+ \ appropriated them. The defendant denies the charges against her and claims that\
246
+ \ the withdrawals were made by the second complainant and that all the amounts\
247
+ \ transferred to her account were transferred to cover the company's expenses\
248
+ \ and their personal expenses, due to her cohabitation with the second complainant\
249
+ \ and with his knowledge, with whom she intended to marry. However, this claim\
250
+ \ is not supported by any evidence; on the contrary, it emerged that she conducted\
251
+ \ the transfers of the money and withdrawals without the complainants' knowledge,\
252
+ \ and when she learned that they had been informed about the account movements\
253
+ \ and met at the Bank, her behavior and demeanor indicated guilt, according to\
254
+ \ the testimony of the prosecution witness ..., an employee of the Pangrati branch\
255
+ \ of ..., who saw her on the same day at the aforementioned Bank when she met\
256
+ \ with the complainants. The ongoing act of fraud using a computer was committed\
257
+ \ by the defendant professionally, as evidenced by her repeated commission of\
258
+ \ the act, as well as the infrastructure she had established with the intent of\
259
+ \ repeated commission, based on a specific plan and methodology (transferring\
260
+ \ smaller amounts to a joint account of the complainants from the remaining accounts\
261
+ \ of the latter, and then withdrawing the transferred amounts with an ATM card,\
262
+ \ as well as directly transferring smaller amounts from the complainants' accounts\
263
+ \ to her personal account she had opened at the same bank), indicating her purpose\
264
+ \ to generate income, with the financial benefit she gained, corresponding to\
265
+ \ the complainants' damage, exceeding a total of €30,000."
266
+ - 'Any person who intentionally, through the technology of information and communication,
267
+ suggests an encounter between an adult and a minor under the age of fifteen, aiming
268
+ at the commitment of the crimes described in par. 1 and 2 of art. 339 and 348Α,
269
+ is sentenced to an imprisonment of at least two years and a fine of fifty to two
270
+ hundred thousand Euros, when the proposal is followed by further actions which
271
+ lead in the commitment of such crimes.
272
+
273
+ '
274
+ - source_sentence: Who should provide authorisation when safeguards are detailed in
275
+ non-legally binding administrative arrangements?
276
+ sentences:
277
+ - In the absence of an adequacy decision, the controller or processor should take
278
+ measures to compensate for the lack of data protection in a third country by way
279
+ of appropriate safeguards for the data subject. Such appropriate safeguards may
280
+ consist of making use of binding corporate rules, standard data protection clauses
281
+ adopted by the Commission, standard data protection clauses adopted by a supervisory
282
+ authority or contractual clauses authorised by a supervisory authority. Those
283
+ safeguards should ensure compliance with data protection requirements and the
284
+ rights of the data subjects appropriate to processing within the Union, including
285
+ the availability of enforceable data subject rights and of effective legal remedies,
286
+ including to obtain effective administrative or judicial redress and to claim
287
+ compensation, in the Union or in a third country. They should relate in particular
288
+ to compliance with the general principles relating to personal data processing,
289
+ the principles of data protection by design and by default. Transfers may also
290
+ be carried out by public authorities or bodies with public authorities or bodies
291
+ in third countries or with international organisations with corresponding duties
292
+ or functions, including on the basis of provisions to be inserted into administrative
293
+ arrangements, such as a memorandum of understanding, providing for enforceable
294
+ and effective rights for data subjects. Authorisation by the competent supervisory
295
+ authority should be obtained when the safeguards are provided for in administrative
296
+ arrangements that are not legally binding.
297
+ - '**Court (Civil/Criminal): Civil**
298
+
299
+
300
+ **Provisions:**
301
+
302
+
303
+ **Time of commission of the act:**
304
+
305
+
306
+ **Outcome (not guilty, guilty):**
307
+
308
+
309
+ **Rationale:**
310
+
311
+
312
+ **Facts:**
313
+
314
+ The plaintiff holds credit card number ............ with the defendant banking
315
+ corporation. Based on the application for alternative networks dated 19/7/2015
316
+ with number ......... submitted at a branch of the defendant, he was granted access
317
+ to the electronic banking service (e-banking) to conduct banking transactions
318
+ (debit, credit, updates, payments) remotely. On 30/11/2020, the plaintiff fell
319
+ victim to electronic fraud through the "phishing" method, whereby an unknown perpetrator
320
+ managed to withdraw a total amount of €3,121.75 from the aforementioned credit
321
+ card. Specifically, the plaintiff received an email at 1:35 PM on 29/11/2020 from
322
+ sender ...... with address ........, informing him that due to an impending system
323
+ change, he needed to verify the mobile phone number linked to the credit card,
324
+ urging him to complete the verification process within the next 24 hours by following
325
+ a link titled ........; otherwise, his account would be locked for security reasons.
326
+ The plaintiff read this email on the afternoon of 30 November 2020 and, believing
327
+ it was from the defendant, followed the instructions and proceeded via the provided
328
+ link to a website that was identical (a clone) to that of the defendant. On this
329
+ page, he was asked to enter the six-digit security code (.........) that had just
330
+ been sent to his mobile phone by the defendant at 3:41 PM, with the note that
331
+ it was an activation code for his ........ card at ........., which he entered.
332
+
333
+
334
+ Subsequently, the plaintiff received, according to his statements, a new email
335
+ (not submitted), which requested him to enter the details of the aforementioned
336
+ credit card, specifically the name of the cardholder and the card number, not
337
+ the PIN, which he also entered, convinced that he was within the online environment
338
+ of the defendant. Then, at 3:47 PM, he received a message on his mobile phone
339
+ from the defendant containing the exact same content as the one he received at
340
+ 3:41 PM, while at 3:50 PM he received a message stating that the activation of
341
+ his ......... card at ....... had been completed. Once the plaintiff read this,
342
+ he became concerned that something was not right, and immediately called (at 4:41
343
+ PM) the defendant''s call center to inform them. There, the employees, with whom
344
+ he finally connected at 5:04 PM due to high call center volume, advised him to
345
+ delete the relevant emails, cancel his credit card, change his access passwords
346
+ for the service, and submit a dispute request regarding the conducted transactions.
347
+ The plaintiff electronically sent this request to the defendant, disputing the
348
+ detailed transactions amounting to €3,121.75, which were conducted on 30/11/2020
349
+ during the time frame of 16:37:45-16:43:34, arguing that he had neither performed
350
+ them himself nor authorized anyone else to do so. The plaintiff specifically disputed
351
+ the following transactions, as evidenced by the account activity of the disputed
352
+ credit card during the aforementioned timeframe: a) transaction number .........
353
+ amounting to €150.62 conducted on 30/11/2020 at 4:43:34 PM, b) transaction number
354
+ ........ amounting to €293.20 conducted on 30/11/2020 at 4:42:40 PM, c) transaction
355
+ number ............ amounting to €295.21 conducted on 30/11/2020 at 4:42:10 PM,
356
+ d) transaction number .......... amounting to €299.22 conducted on 30/11/2020
357
+ at 4:41:31 PM, e) transaction number ........ amounting to €297.21 conducted on
358
+ 30/11/2020 at 4:41:01 PM, f) transaction number ........ amounting to €299.22
359
+ conducted on 30/11/2020 at 4:40:27 PM, g) transaction number ....... amounting
360
+ to €299.22 conducted on 30/11/2020 at 4:39:55 PM, h) transaction number ......
361
+ amounting to €299.22 conducted on 30/11/2020 at 4:39:22 PM, i) transaction number
362
+ ......... amounting to €297.22 conducted on 30/11/2020 at 4:38:52 PM, j) transaction
363
+ number ......... amounting to €295.21 conducted on 30/11/2020 at 4:38:17 PM, and
364
+ k) transaction number ......... amounting to €296.21 conducted on 30/11/2020 at
365
+ 4:37:45 PM. In its response letter dated 21/12/2020, the defendant denied responsibility
366
+ for the costs of the aforementioned transactions, placing the entire blame on
367
+ the plaintiff for the leak of his card details and security code to the fraudulent
368
+ page. The plaintiff, completely denying any fault for the conducted transactions,
369
+ repeatedly contacted the defendant, both by phone and via email (see emails dated
370
+ 15/1/2021 and 11/2/2021), while on 2/3/2021, he electronically sent a report dated
371
+ 1/03/2021 to the Consumer Advocate’s email address, recounting the events and
372
+ requesting that the aforementioned Independent Authority intervene to have the
373
+ disputed debt canceled. In its letter with reference number ...../27.04.2021,
374
+ the aforementioned Independent Authority informed the plaintiff that the case
375
+ was outside its mediating role and was therefore archived. Subsequently, the plaintiff
376
+ sent the defendant on 5/3/2021 his extrajudicial statement dated 4/3/2021, calling
377
+ upon it to fully cancel the debt of €3,121.75 that had been unjustly incurred
378
+ against him within two days and to immediately instruct the representatives of
379
+ the collection agency working with it to cease contacting him regarding the disputed
380
+ case. The defendant sent the plaintiff a message on his mobile phone on 20/04/2021
381
+ informing him that his case was still being processed due to lengthy operational
382
+ requirements, while on 23/04/2021, via email, it informed him that considering
383
+ their good cooperation and his efforts to keep them updated, it had reviewed his
384
+ case and decided to refund him the amounts of the transactions that were conducted
385
+ after his contact with their representatives on 30/11/2020 at 4:41 PM, totaling
386
+ €1,038.25, specifically the following: a) transaction of €150.62 conducted on
387
+ 30/11/2020 at 4:43 PM, b) transaction of €295.21 conducted on 30/11/2020 at 4:42
388
+ PM, c) transaction of €293.20 conducted on 30/11/2020 at 4:42 PM, and d) transaction
389
+ of €299.22 conducted on 30/11/2020 at 4:41 PM. Beyond this, the defendant refused
390
+ to refund the plaintiff the amount of the remaining transactions conducted on
391
+ 30/11/2020, totaling €2,376.08 (and not €2,376.48 as incorrectly stated by the
392
+ plaintiff in his lawsuit), which the plaintiff ultimately fully paid, transferring
393
+ €2,342.77 to the defendant on 7/06/2021 and €33.31 on 15/06/2021 (see related
394
+ deposit receipts).'
395
+ - "Court (Civil/Criminal): Civil \nProvisions: \nTime of commission: July 21,\
396
+ \ 2020 \nOutcome (innocent, guilty): Partially accepts the lawsuit against the\
397
+ \ Bank. \nReasoning: Alongside the bank's responsibility for the ineffective\
398
+ \ protection of its systems against the continually changing and evolving methods\
399
+ \ of deception that affect them, leading to financial damage for its clients who\
400
+ \ entrusted it, which constitutes a breach of its contractual obligations and\
401
+ \ generates contractual liability, there is also the personal responsibility of\
402
+ \ the plaintiff, who did not safeguard, as required, his sensitive banking information\
403
+ \ and disclosed it when he should not have, even though the message that misled\
404
+ \ him came from the context of an SMS conversation with the defendant, even if\
405
+ \ he was directed through the link to a website resembling that of the defendant,\
406
+ \ because he overlooked the relevant instructions and strict recommendations of\
407
+ \ the bank, violating his duty to safeguard them. Therefore, in light of the above,\
408
+ \ the court must partially accept the lawsuit regarding its substance, and with\
409
+ \ the defendant's objection regarding the plaintiff's fault being accepted at\
410
+ \ a rate of 1/6 of the damage suffered, it must be acknowledged – following the\
411
+ \ admissible and lawful modification of the lawsuit's request from a dismissive\
412
+ \ to a declaratory nature as proposed – the defendant's obligation to pay him\
413
+ \ the amount of €2,500, with legal interest, as specified in the operative part.\
414
+ \ Regarding the request to recognize the defendant's obligation to pay him €1,000\
415
+ \ as compensation for the moral damage he suffered from the fraud committed against\
416
+ \ him, this is deemed dismissible as unfounded, because the defendant's liability\
417
+ \ is contractual and not tortious, and there are no special conditions justifying\
418
+ \ the treatment of this specific non-contractual behavior as tortious, making\
419
+ \ it possible to attribute moral damage to the plaintiff from the defendant. \
420
+ \ \nFacts: The plaintiff maintained a joint bank account with his wife and had\
421
+ \ access to the defendant bank's e-banking. On July 21, 2020, following successful\
422
+ \ identification via the agreed-upon credentials (userID, password, OTP), a request\
423
+ \ was made to change the mobile phone number for receiving OTPs, which was completed\
424
+ \ through the bank's platform. However, this change was not made by the plaintiff\
425
+ \ himself, but by a third party who had previously deceived him using the phishing\
426
+ \ method, obtaining his banking details through a misleading SMS. Following the\
427
+ \ phone number change, on July 31, 2020, a transfer of €3,000 was made to a third\
428
+ \ party's account. The transaction was conducted using the necessary credentials\
429
+ \ and OTP sent to the new mobile phone, resulting in the bank considering the\
430
+ \ order valid and executing it. Once the plaintiff realized the transfer, he immediately\
431
+ \ contacted the bank and informed them that he had not given such an order himself.\
432
+ \ Despite the initial assurance that the funds could be recovered, they were ultimately\
433
+ \ not returned, as they had been transferred to a third party's account, and the\
434
+ \ bank denied any responsibility for the loss."
435
+ - source_sentence: When will the periodic review mechanism be conducted?
436
+ sentences:
437
+ - The Commission should monitor the functioning of decisions on the level of protection
438
+ in a third country, a territory or specified sector within a third country, or
439
+ an international organisation, and monitor the functioning of decisions adopted
440
+ on the basis of Article 25(6) or Article 26(4) of Directive 95/46/EC. In its adequacy
441
+ decisions, the Commission should provide for a periodic review mechanism of their
442
+ functioning. That periodic review should be conducted in consultation with the
443
+ third country or international organisation in question and take into account
444
+ all relevant developments in the third country or international organisation.
445
+ For the purposes of monitoring and of carrying out the periodic reviews, the Commission
446
+ should take into consideration the views and findings of the European Parliament
447
+ and of the Council as well as of other relevant bodies and sources. The Commission
448
+ should evaluate, within a reasonable time, the functioning of the latter decisions
449
+ and report any relevant findings to the Committee within the meaning of Regulation
450
+ (EU) No 182/2011 of the European Parliament and of the Council (1) as established
451
+ under this Regulation, to the European Parliament and to the Council.
452
+ - "**Court (Civil/Criminal): Civil** \n**Provisions:** \n**Time of commission\
453
+ \ of the act:** \n**Outcome (not guilty, guilty):** \n**Reasoning:** Partially\
454
+ \ accepts the lawsuit. \n**Facts:** The plaintiff, who works as a lawyer, maintains\
455
+ \ a savings account with the defendant banking corporation under account number\
456
+ \ GR.............. Pursuant to a contract dated June 11, 2010, established in\
457
+ \ Thessaloniki between the defendant and the plaintiff, the plaintiff was granted\
458
+ \ access to the electronic banking system (e-banking) to conduct banking transactions\
459
+ \ remotely. On October 10, 2020, the plaintiff fell victim to electronic fraud\
460
+ \ through the \"phishing\" method, whereby an unknown perpetrator managed to extract\
461
+ \ and transfer €3,000.00 from the plaintiff’s account to another account of the\
462
+ \ same bank. Specifically, on that day at 6:51 a.m., the plaintiff received an\
463
+ \ email from the sender \".........\", with the address ..........., informing\
464
+ \ him that his debit card had been suspended and that online payments and cash\
465
+ \ withdrawals could not be made until the issue was resolved. The email urged\
466
+ \ him to confirm his details within the next 72 hours by following a link titled\
467
+ \ \"card activation.\" \nThe plaintiff read the above email on his mobile phone\
468
+ \ around 8:00 a.m., and believing it came from the defendant, he followed the\
469
+ \ instructions and accessed a website that was identical (a clone) to that of\
470
+ \ the defendant. On this page, he was asked to enter his login credentials to\
471
+ \ connect to the service, which he did, and he was subsequently asked to input\
472
+ \ his debit card details for the alleged activation, which he also provided. Then,\
473
+ \ to complete the process, a number was sent to his mobile phone at 8:07 a.m.\
474
+ \ from the sender ........, which he entered, and two minutes later he received\
475
+ \ a message from the same sender in English stating that the quick access code\
476
+ \ had been activated on his mobile. A few minutes later, at 8:18 a.m., he received\
477
+ \ an email from the defendant informing him of the transfer of €3,000.00 from\
478
+ \ his account to account number GR ........... held at the same bank, with the\
479
+ \ beneficiary's details being .......... As soon as the plaintiff read this, he\
480
+ \ immediately called the defendant's call center and canceled his debit card,\
481
+ \ the access codes for the service ......., and locked the application ..........\
482
+ \ At the same time, he verbally submitted a request to dispute and cancel the\
483
+ \ contested transaction, and in a subsequent phone call, he also canceled his\
484
+ \ credit card. On the same day, he also sent an email to the defendant informing\
485
+ \ them in writing of the above and requesting the cancellation of the transaction\
486
+ \ and the return of the amount of €3,000.00 to his account, as this transfer was\
487
+ \ not made by him but by an unknown perpetrator through electronic fraud and was\
488
+ \ not approved by him. It should also be noted that the plaintiff, as the sole\
489
+ \ beneficiary according to the aforementioned contract for using the defendant's\
490
+ \ Internet Banking service, never received any update via SMS or the VIBER application\
491
+ \ from the bank regarding the transaction details before its completion, nor did\
492
+ \ he receive a one-time code (OTP) to approve the contested transaction. He subsequently\
493
+ \ filed a complaint against unknown persons at the Cyber Crime Division for the\
494
+ \ crime of fraud. The defendant sent an email to the plaintiff on October 16,\
495
+ \ 2020, informing him that his request had been forwarded to the appropriate department\
496
+ \ of the bank for investigation, stating that the bank would never send him an\
497
+ \ email or SMS asking him to enter his personal data and that as of October 7,\
498
+ \ 2020, there was a notice posted for its customers regarding malicious attempts\
499
+ \ to steal personal data in the \"Our News\" section on ....... A month after\
500
+ \ the disputed incident, on November 10, 2020, an amount of €2,296.82 was transferred\
501
+ \ to the plaintiff's account from the account to which the fraudulent credit had\
502
+ \ been made. The plaintiff immediately sent an email to the defendant asking to\
503
+ \ be informed whether this transfer was a return of part of the amount that had\
504
+ \ been illegally withdrawn from his account and requested the return of the remaining\
505
+ \ amount of €703.18. In its response dated January 13, 2021, the defendant confirmed\
506
+ \ that the aforementioned amount indeed came from the account to which the fraudulent\
507
+ \ credit had been made, following a freeze of that account initiated by the defendant\
508
+ \ during the investigation of the incident, but refused to return the remaining\
509
+ \ amount, claiming it bore no responsibility for the leak of the personal codes\
510
+ \ to third parties, according to the terms of the service contract established\
511
+ \ between them. \nFrom the entirety of the evidence presented to the court, there\
512
+ \ is no indication of the authenticity of the contested transaction, as the plaintiff\
513
+ \ did not give his consent for the execution of the transfer of the amount of\
514
+ \ €3,000.00, especially in light of the provision in Article 72 paragraph 2 of\
515
+ \ Law 4537/2018 stating that the mere use of the Internet Banking service by the\
516
+ \ plaintiff does not necessarily constitute sufficient evidence that the payer\
517
+ \ approved the payment action. Specifically, it was proven that the contested\
518
+ \ transaction was not carried out following a strong identification of the plaintiff\
519
+ \ – the sole beneficiary of the account – and his approval, as the latter may\
520
+ \ have entered his personal codes on the counterfeit website; however, he was\
521
+ \ never informed, before the completion of the contested transaction, of the amount\
522
+ \ that would be transferred from his account to a third-party account, nor did\
523
+ \ he receive on his mobile phone, either via SMS or through the VIBER application\
524
+ \ or any other means, the one-time code - extra PIN for its completion, which\
525
+ \ he was required to enter to approve the contested transaction (payment action)\
526
+ \ and thus complete his identification, a fact that was not countered by any evidence\
527
+ \ from the defendant. Furthermore, it is noted that the defendant's claims that\
528
+ \ it bears no responsibility under the terms of the banking services contract,\
529
+ \ whereby it is not liable for any damage to its customer in cases of unauthorized\
530
+ \ use of their personal access codes to the Internet Banking service, are to be\
531
+ \ rejected as fundamentally unfounded. This is because the aforementioned contractual\
532
+ \ terms are invalid according to the provision of Article 103 of Law 4537/2018,\
533
+ \ as they contradict the provisions of Articles 71, 73, and 92 of the same Law,\
534
+ \ which provide for the provider's universal liability and its exemption only\
535
+ \ for unusual and unforeseen circumstances that are beyond the control of the\
536
+ \ party invoking them and whose consequences could not have been avoided despite\
537
+ \ all efforts to the contrary; these provisions establish mandatory law in favor\
538
+ \ of users, as according to Article 103 of Law 4537/2018, payment service providers\
539
+ \ are prohibited from deviating from the provisions to the detriment of payment\
540
+ \ service users, unless the possibility of deviation is explicitly provided and\
541
+ \ they can decide to offer only more favorable terms to payment service users;\
542
+ \ the aforementioned contractual terms do not constitute more favorable terms\
543
+ \ but rather disadvantageous terms for the payment service user. In this case,\
544
+ \ however, the defendant did not prove the authenticity of the transaction and\
545
+ \ its approval by the plaintiff and did not invoke, nor did any unusual and unforeseen\
546
+ \ circumstances beyond its control, the consequences of which could not have been\
547
+ \ avoided despite all efforts to the contrary, come to light. Therefore, the contested\
548
+ \ transaction transferring the amount of €3,000.00 is considered, in the absence\
549
+ \ of demonstrable consent from the plaintiff, unapproved according to the provisions\
550
+ \ of Article 64 of Law 4537/2018, and the defendant's contrary claims are rejected,\
551
+ \ especially since the plaintiff proceeded, according to Article 71 paragraph\
552
+ \ 1 of Law 4537/2018, without undue delay to notify the defendant regarding the\
553
+ \ contested unapproved payment action. Consequently, the defendant is liable for\
554
+ \ compensating the plaintiff for the positive damage he suffered under Article\
555
+ \ 73 of Law 4537/2018 and is obliged to pay him the requested amount of €703.18,\
556
+ \ while the plaintiff’s fault in the occurrence of this damage cannot be established,\
557
+ \ as he entered his personal details in an online environment that was a faithful\
558
+ \ imitation of that of the defendant, as evidenced by the comparison of the screenshots\
559
+ \ of the fake website and the real website provided by the plaintiff, a fact that\
560
+ \ he could not have known while being fully convinced that he was transacting\
561
+ \ with the defendant. Furthermore, the defendant’s liability to compensate the\
562
+ \ plaintiff is based on the provision of Article 8 of Law 2251/1994, which applies\
563
+ \ in this case, as the plaintiff's damage resulted from inadequate fulfillment\
564
+ \ of its obligations in the context of providing its services, but also on the\
565
+ \ provision of Article 914 of the Civil Code in the sense of omission on its part\
566
+ \ of unlawfully and culpably imposed actions. In this case, given that during\
567
+ \ the relevant period there had been a multitude of similar incidents of fraud\
568
+ \ against the defendant's customers, the latter, as a service provider to the\
569
+ \ consumer public and bearing transactional obligations of care and security towards\
570
+ \ them, displayed gross negligence regarding the security provided for electronic\
571
+ \ transaction services, which was compromised by the fraudulent theft of funds,\
572
+ \ as it did not comply with all required high-security measures for executing\
573
+ \ the contested transaction, failing to implement the strict customer identification\
574
+ \ verification process and to check the authenticity of the account to which the\
575
+ \ funds were sent, thus not assuming the suspicious nature of the transaction,\
576
+ \ did not adopt comprehensive and improved protective measures to fully protect\
577
+ \ its customers against malicious attacks and online fraud and to prevent the\
578
+ \ infiltration of unauthorized third parties, nor did it fulfill its obligations\
579
+ \ to inform, accurately inform, and warn its consumers - customers, as it failed\
580
+ \ to adequately inform them of attempts to steal their personal data through the\
581
+ \ sending of informative emails or SMS, while merely posting in a section rather\
582
+ \ than on a central banner (as it later did) does not constitute adequate information\
583
+ \ such that it meets the requirement of protecting its customers and the increased\
584
+ \ safeguarding of their interests. Although the plaintiff acted promptly and informed\
585
+ \ the defendant on the same day about the contested incident, the defendant did\
586
+ \ not act as promptly regarding the investigation of the incident and the freezing\
587
+ \ of the account that held the fraudulent credit to prevent the plaintiff's loss,\
588
+ \ but only returned part of the funds to the plaintiff a month later. This behavior,\
589
+ \ beyond being culpable due to gross negligence, was also unlawful, as it would\
590
+ \ have been illegal even without the contractual relationship, as contrary to\
591
+ \ the provisions of Law 4537/2018 and Law 2251/1994, regarding the lack of security\
592
+ \ of the services that the consumer is legitimately entitled to expect, as well\
593
+ \ as the building of trust that is essential in banking transactions, elements\
594
+ \ that it was obligated to provide within the sphere of the services offered,\
595
+ \ and contrary to the principles of good faith and commercial ethics, as crystallized\
596
+ \ in the provision of Article 288 of the Civil Code, as well as the general duty\
597
+ \ imposed by Article 914 of the Civil Code not to cause harm to another culpably.\
598
+ \ This resulted not only in positive damage to the plaintiff but also in causing\
599
+ \ him moral harm consisting of his mental distress and the disruption, agitation,\
600
+ \ and sorrow he experienced, for which he must be awarded financial compensation.\
601
+ \ Taking into account all the general circumstances of the case, the extent of\
602
+ \ the plaintiff's damage, the severity of the defendant's fault, the mental distress\
603
+ \ suffered by the plaintiff, the insecurity he felt regarding his deposits, the\
604
+ \ sorrow he experienced, and the stress caused by his financial loss, which occurred\
605
+ \ during the pandemic period when his earnings from his professional activity\
606
+ \ had significantly decreased, as well as the financial and social situation of\
607
+ \ the parties, it is the court's opinion that he should be granted, as financial\
608
+ \ compensation for his moral harm, an amount of €250.00, which is deemed reasonable\
609
+ \ and fair. Therefore, the total monetary amount that the plaintiff is entitled\
610
+ \ to for his positive damage and financial compensation for the moral harm suffered\
611
+ \ amounts to a total of (€703.18 + €250.00) = €953.18."
612
+ - 'Failure to notify the Authority of file establishment or permit changes is punished
613
+ by up to three years’ imprisonment and a fine of one to five million Drachmas.
614
+
615
+ Maintaining a file without a permit or violating permit terms is punished by at
616
+ least one year’s imprisonment and a fine of one to five million Drachmas.
617
+
618
+ Unauthorized file interconnection or without permit is punished by up to three
619
+ years’ imprisonment and a fine of one to five million Drachmas.
620
+
621
+ Unlawful interference with personal data is punished by imprisonment and a fine;
622
+ for sensitive data, at least one year’s imprisonment and a fine of one to ten
623
+ million Drachmas.
624
+
625
+ Controllers who fail to comply with Authority decisions or violate data transfer
626
+ rules face at least two years’ imprisonment and a fine of one to five million
627
+ Drachmas.
628
+
629
+ If acts were committed for unlawful benefit or to cause harm, punishment is up
630
+ to ten years’ imprisonment and a fine of two to ten million Drachmas.
631
+
632
+ If acts jeopardize democratic governance or national security, punishment is confinement
633
+ in a penitentiary and a fine of five to ten million Drachmas.
634
+
635
+ Acts committed due to negligence result in at least three months’ imprisonment
636
+ and a fine.
637
+
638
+ If the Controller is not a natural person, the responsible party is the representative
639
+ or head of the organization with administrative or managerial duties.
640
+
641
+ Authorized members of the Authority may carry out preliminary investigations even
642
+ without Prosecutor’s order for certain offenses.
643
+
644
+ The Authority''s President must notify the Public Prosecutor of any offenses under
645
+ investigation, forwarding all relevant evidence.
646
+
647
+ Preliminary investigations must conclude within two months of charges, and trial
648
+ must begin within three months of completion.
649
+
650
+ Continuation of proceedings is allowed only once and for extremely important reasons,
651
+ with adjournment not exceeding two months.
652
+
653
+ Felonies under this law fall under the jurisdiction of the Court of Appeal.
654
+
655
+ '
656
+ - source_sentence: Who must facilitate the exercise of data subject rights?
657
+ sentences:
658
+ - '1.Processing of personal data revealing racial or ethnic origin, political opinions,
659
+ religious or philosophical beliefs, or trade union membership, and the processing
660
+ of genetic data, biometric data for the purpose of uniquely identifying a natural
661
+ person, data concerning health or data concerning a natural person''s sex life
662
+ or sexual orientation shall be prohibited.
663
+
664
+ 2.Paragraph 1 shall not apply if one of the following applies: (a) the data subject
665
+ has given explicit consent to the processing of those personal data for one or
666
+ more specified purposes, except where Union or Member State law provide that the
667
+ prohibition referred to in paragraph 1 may not be lifted by the data subject;
668
+ (b) processing is necessary for the purposes of carrying out the obligations
669
+ and exercising specific rights of the controller or of the data subject in the
670
+ field of employment and social security and social protection law in so far as
671
+ it is authorised by Union or Member State law or a collective agreement pursuant
672
+ to Member State law providing for appropriate safeguards for the fundamental rights
673
+ and the interests of the data subject; (c) processing is necessary to protect
674
+ the vital interests of the data subject or of another natural person where the
675
+ data subject is physically or legally incapable of giving consent; (d) processing
676
+ is carried out in the course of its legitimate activities with appropriate safeguards
677
+ by a foundation, association or any other not-for-profit body with a political,
678
+ philosophical, religious or trade union aim and on condition that the processing
679
+ relates solely to the members or to former members of the body or to persons who
680
+ have regular contact with it in connection with its purposes and that the personal
681
+ data are not disclosed outside that body without the consent of the data subjects;
682
+ (e) processing relates to personal data which are manifestly made public by the
683
+ data subject; (f) processing is necessary for the establishment, exercise or
684
+ defence of legal claims or whenever courts are acting in their judicial capacity;
685
+ (g) processing is necessary for reasons of substantial public interest, on the
686
+ basis of Union or Member State law which shall be proportionate to the aim pursued,
687
+ respect the essence of the right to data protection and provide for suitable and
688
+ specific measures to safeguard the fundamental rights and the interests of the
689
+ data subject; (h) processing is necessary for the purposes of preventive or occupational
690
+ medicine, for the assessment of the working capacity of the employee, medical
691
+ diagnosis, the provision of health or social care or treatment or the management
692
+ of health or social care systems and services on the basis of Union or Member
693
+ State law or pursuant to contract with a health professional and subject to the
694
+ conditions and safeguards referred to in paragraph 3; (i) processing is necessary
695
+ for reasons of public interest in the area of public health, such as protecting
696
+ against serious cross-border threats to health or ensuring high standards of quality
697
+ and safety of health care and of medicinal products or medical devices, on the
698
+ basis of Union or Member State law which provides for suitable and specific measures
699
+ to safeguard the rights and freedoms of the data subject, in particular professional
700
+ secrecy; 4.5.2016 L 119/38 (j) processing is necessary for archiving purposes
701
+ in the public interest, scientific or historical research purposes or statistical
702
+ purposes in accordance with Article 89(1) based on Union or Member State law which
703
+ shall be proportionate to the aim pursued, respect the essence of the right to
704
+ data protection and provide for suitable and specific measures to safeguard the
705
+ fundamental rights and the interests of the data subject.
706
+
707
+ 3.Personal data referred to in paragraph 1 may be processed for the purposes referred
708
+ to in point (h) of paragraph 2 when those data are processed by or under the responsibility
709
+ of a professional subject to the obligation of professional secrecy under Union
710
+ or Member State law or rules established by national competent bodies or by another
711
+ person also subject to an obligation of secrecy under Union or Member State law
712
+ or rules established by national competent bodies.
713
+
714
+ 4.Member States may maintain or introduce further conditions, including limitations,
715
+ with regard to the processing of genetic data, biometric data or data concerning
716
+ health.'
717
+ - Regulation (EC) No 45/2001 of the European Parliament and of the Council (2) applies
718
+ to the processing of personal data by the Union institutions, bodies, offices
719
+ and agencies. Regulation (EC) No 45/2001 and other Union legal acts applicable
720
+ to such processing of personal data should be adapted to the principles and rules
721
+ established in this Regulation and applied in the light of this Regulation. In
722
+ order to provide a strong and coherent data protection framework in the Union,
723
+ the necessary adaptations of Regulation (EC) No 45/2001 should follow after the
724
+ adoption of this Regulation, in order to allow application at the same time as
725
+ this Regulation.
726
+ - "1.The controller shall take appropriate measures to provide any information referred\
727
+ \ to in Articles 13 and 14 and any communication under Articles 15 to 22 and 34\
728
+ \ relating to processing to the data subject in a concise, transparent, intelligible\
729
+ \ and easily accessible form, using clear and plain language, in particular for\
730
+ \ any information addressed specifically to a child. The information shall be\
731
+ \ provided in writing, or by other means, including, where appropriate, by electronic\
732
+ \ means. When requested by the data subject, the information may be provided orally,\
733
+ \ provided that the identity of the data subject is proven by other means. 4.5.2016\
734
+ \ L 119/39 \n2.The controller shall facilitate the exercise of data subject rights\
735
+ \ under Articles 15 to 22. In the cases referred to in Article 11(2), the controller\
736
+ \ shall not refuse to act on the request of the data subject for exercising his\
737
+ \ or her rights under Articles 15 to 22, unless the controller demonstrates that\
738
+ \ it is not in a position to identify the data subject.\n3.The controller shall\
739
+ \ provide information on action taken on a request under Articles 15 to 22 to\
740
+ \ the data subject without undue delay and in any event within one month of receipt\
741
+ \ of the request. That period may be extended by two further months where necessary,\
742
+ \ taking into account the complexity and number of the requests. The controller\
743
+ \ shall inform the data subject of any such extension within one month of receipt\
744
+ \ of the request, together with the reasons for the delay. Where the data subject\
745
+ \ makes the request by electronic form means, the information shall be provided\
746
+ \ by electronic means where possible, unless otherwise requested by the data subject.\n\
747
+ 4.If the controller does not take action on the request of the data subject, the\
748
+ \ controller shall inform the data subject without delay and at the latest within\
749
+ \ one month of receipt of the request of the reasons for not taking action and\
750
+ \ on the possibility of lodging a complaint with a supervisory authority and seeking\
751
+ \ a judicial remedy.\n5.Information provided under Articles 13 and 14 and any\
752
+ \ communication and any actions taken under Articles 15 to 22 and 34 shall be\
753
+ \ provided free of charge. Where requests from a data subject are manifestly unfounded\
754
+ \ or excessive, in particular because of their repetitive character, the controller\
755
+ \ may either: (a) charge a reasonable fee taking into account the administrative\
756
+ \ costs of providing the information or communication or taking the action requested;\
757
+ \ or (b) refuse to act on the request. The controller shall bear the burden of\
758
+ \ demonstrating the manifestly unfounded or excessive character of the request.\n\
759
+ 6.Without prejudice to Article 11, where the controller has reasonable doubts\
760
+ \ concerning the identity of the natural person making the request referred to\
761
+ \ in Articles 15 to 21, the controller may request the provision of additional\
762
+ \ information necessary to confirm the identity of the data subject.\n7.The information\
763
+ \ to be provided to data subjects pursuant to Articles 13 and 14 may be provided\
764
+ \ in combination with standardised icons in order to give in an easily visible,\
765
+ \ intelligible and clearly legible manner a meaningful overview of the intended\
766
+ \ processing. Where the icons are presented electronically they shall be machine-readable.\n\
767
+ 8.The Commission shall be empowered to adopt delegated acts in accordance with\
768
+ \ Article 92 for the purpose of determining the information to be presented by\
769
+ \ the icons and the procedures for providing standardised icons. Section 2 Information\
770
+ \ and access to personal data"
771
+ pipeline_tag: sentence-similarity
772
+ library_name: sentence-transformers
773
+ metrics:
774
+ - cosine_accuracy@1
775
+ - cosine_accuracy@3
776
+ - cosine_accuracy@5
777
+ - cosine_accuracy@10
778
+ - cosine_precision@1
779
+ - cosine_precision@3
780
+ - cosine_precision@5
781
+ - cosine_precision@10
782
+ - cosine_recall@1
783
+ - cosine_recall@3
784
+ - cosine_recall@5
785
+ - cosine_recall@10
786
+ - cosine_ndcg@10
787
+ - cosine_mrr@10
788
+ - cosine_map@100
789
+ model-index:
790
+ - name: multilingual-e5-large
791
+ results:
792
+ - task:
793
+ type: information-retrieval
794
+ name: Information Retrieval
795
+ dataset:
796
+ name: dim 1024
797
+ type: dim_1024
798
+ metrics:
799
+ - type: cosine_accuracy@1
800
+ value: 0.3994878361075544
801
+ name: Cosine Accuracy@1
802
+ - type: cosine_accuracy@3
803
+ value: 0.40973111395646605
804
+ name: Cosine Accuracy@3
805
+ - type: cosine_accuracy@5
806
+ value: 0.44238156209987195
807
+ name: Cosine Accuracy@5
808
+ - type: cosine_accuracy@10
809
+ value: 0.4814340588988476
810
+ name: Cosine Accuracy@10
811
+ - type: cosine_precision@1
812
+ value: 0.3994878361075544
813
+ name: Cosine Precision@1
814
+ - type: cosine_precision@3
815
+ value: 0.3994878361075544
816
+ name: Cosine Precision@3
817
+ - type: cosine_precision@5
818
+ value: 0.3897567221510884
819
+ name: Cosine Precision@5
820
+ - type: cosine_precision@10
821
+ value: 0.3562099871959027
822
+ name: Cosine Precision@10
823
+ - type: cosine_recall@1
824
+ value: 0.046427253250942845
825
+ name: Cosine Recall@1
826
+ - type: cosine_recall@3
827
+ value: 0.1357642561296911
828
+ name: Cosine Recall@3
829
+ - type: cosine_recall@5
830
+ value: 0.20380194680388578
831
+ name: Cosine Recall@5
832
+ - type: cosine_recall@10
833
+ value: 0.30156152834977973
834
+ name: Cosine Recall@10
835
+ - type: cosine_ndcg@10
836
+ value: 0.42824330702763147
837
+ name: Cosine Ndcg@10
838
+ - type: cosine_mrr@10
839
+ value: 0.41413607910086736
840
+ name: Cosine Mrr@10
841
+ - type: cosine_map@100
842
+ value: 0.4960353530991054
843
+ name: Cosine Map@100
844
+ - task:
845
+ type: information-retrieval
846
+ name: Information Retrieval
847
+ dataset:
848
+ name: dim 768
849
+ type: dim_768
850
+ metrics:
851
+ - type: cosine_accuracy@1
852
+ value: 0.3892445582586428
853
+ name: Cosine Accuracy@1
854
+ - type: cosine_accuracy@3
855
+ value: 0.3994878361075544
856
+ name: Cosine Accuracy@3
857
+ - type: cosine_accuracy@5
858
+ value: 0.43661971830985913
859
+ name: Cosine Accuracy@5
860
+ - type: cosine_accuracy@10
861
+ value: 0.47823303457106275
862
+ name: Cosine Accuracy@10
863
+ - type: cosine_precision@1
864
+ value: 0.3892445582586428
865
+ name: Cosine Precision@1
866
+ - type: cosine_precision@3
867
+ value: 0.38988476312419973
868
+ name: Cosine Precision@3
869
+ - type: cosine_precision@5
870
+ value: 0.38156209987195905
871
+ name: Cosine Precision@5
872
+ - type: cosine_precision@10
873
+ value: 0.35147247119078107
874
+ name: Cosine Precision@10
875
+ - type: cosine_recall@1
876
+ value: 0.045140545184589424
877
+ name: Cosine Recall@1
878
+ - type: cosine_recall@3
879
+ value: 0.13218231618768836
880
+ name: Cosine Recall@3
881
+ - type: cosine_recall@5
882
+ value: 0.19882192649305613
883
+ name: Cosine Recall@5
884
+ - type: cosine_recall@10
885
+ value: 0.29727932103829957
886
+ name: Cosine Recall@10
887
+ - type: cosine_ndcg@10
888
+ value: 0.4211330537467249
889
+ name: Cosine Ndcg@10
890
+ - type: cosine_mrr@10
891
+ value: 0.4050812450460335
892
+ name: Cosine Mrr@10
893
+ - type: cosine_map@100
894
+ value: 0.48796722771226453
895
+ name: Cosine Map@100
896
+ - task:
897
+ type: information-retrieval
898
+ name: Information Retrieval
899
+ dataset:
900
+ name: dim 512
901
+ type: dim_512
902
+ metrics:
903
+ - type: cosine_accuracy@1
904
+ value: 0.39436619718309857
905
+ name: Cosine Accuracy@1
906
+ - type: cosine_accuracy@3
907
+ value: 0.4033290653008963
908
+ name: Cosine Accuracy@3
909
+ - type: cosine_accuracy@5
910
+ value: 0.4327784891165173
911
+ name: Cosine Accuracy@5
912
+ - type: cosine_accuracy@10
913
+ value: 0.471190781049936
914
+ name: Cosine Accuracy@10
915
+ - type: cosine_precision@1
916
+ value: 0.39436619718309857
917
+ name: Cosine Precision@1
918
+ - type: cosine_precision@3
919
+ value: 0.39436619718309857
920
+ name: Cosine Precision@3
921
+ - type: cosine_precision@5
922
+ value: 0.38373879641485276
923
+ name: Cosine Precision@5
924
+ - type: cosine_precision@10
925
+ value: 0.348719590268886
926
+ name: Cosine Precision@10
927
+ - type: cosine_recall@1
928
+ value: 0.046001271870766657
929
+ name: Cosine Recall@1
930
+ - type: cosine_recall@3
931
+ value: 0.13434589294029278
932
+ name: Cosine Recall@3
933
+ - type: cosine_recall@5
934
+ value: 0.2006372923557733
935
+ name: Cosine Recall@5
936
+ - type: cosine_recall@10
937
+ value: 0.29407016086576515
938
+ name: Cosine Recall@10
939
+ - type: cosine_ndcg@10
940
+ value: 0.4209567413561994
941
+ name: Cosine Ndcg@10
942
+ - type: cosine_mrr@10
943
+ value: 0.4078435258012718
944
+ name: Cosine Mrr@10
945
+ - type: cosine_map@100
946
+ value: 0.48375387985213597
947
+ name: Cosine Map@100
948
+ - task:
949
+ type: information-retrieval
950
+ name: Information Retrieval
951
+ dataset:
952
+ name: dim 256
953
+ type: dim_256
954
+ metrics:
955
+ - type: cosine_accuracy@1
956
+ value: 0.3764404609475032
957
+ name: Cosine Accuracy@1
958
+ - type: cosine_accuracy@3
959
+ value: 0.382202304737516
960
+ name: Cosine Accuracy@3
961
+ - type: cosine_accuracy@5
962
+ value: 0.41037131882202305
963
+ name: Cosine Accuracy@5
964
+ - type: cosine_accuracy@10
965
+ value: 0.4532650448143406
966
+ name: Cosine Accuracy@10
967
+ - type: cosine_precision@1
968
+ value: 0.3764404609475032
969
+ name: Cosine Precision@1
970
+ - type: cosine_precision@3
971
+ value: 0.3758002560819462
972
+ name: Cosine Precision@3
973
+ - type: cosine_precision@5
974
+ value: 0.365044814340589
975
+ name: Cosine Precision@5
976
+ - type: cosine_precision@10
977
+ value: 0.3325864276568502
978
+ name: Cosine Precision@10
979
+ - type: cosine_recall@1
980
+ value: 0.04345597060609991
981
+ name: Cosine Recall@1
982
+ - type: cosine_recall@3
983
+ value: 0.12739095919345977
984
+ name: Cosine Recall@3
985
+ - type: cosine_recall@5
986
+ value: 0.19108724610052447
987
+ name: Cosine Recall@5
988
+ - type: cosine_recall@10
989
+ value: 0.28270389457679657
990
+ name: Cosine Recall@10
991
+ - type: cosine_ndcg@10
992
+ value: 0.40161260018012396
993
+ name: Cosine Ndcg@10
994
+ - type: cosine_mrr@10
995
+ value: 0.3891762189297396
996
+ name: Cosine Mrr@10
997
+ - type: cosine_map@100
998
+ value: 0.46504361814337597
999
+ name: Cosine Map@100
1000
+ - task:
1001
+ type: information-retrieval
1002
+ name: Information Retrieval
1003
+ dataset:
1004
+ name: dim 128
1005
+ type: dim_128
1006
+ metrics:
1007
+ - type: cosine_accuracy@1
1008
+ value: 0.34699103713188223
1009
+ name: Cosine Accuracy@1
1010
+ - type: cosine_accuracy@3
1011
+ value: 0.3495518565941101
1012
+ name: Cosine Accuracy@3
1013
+ - type: cosine_accuracy@5
1014
+ value: 0.37900128040973113
1015
+ name: Cosine Accuracy@5
1016
+ - type: cosine_accuracy@10
1017
+ value: 0.41613316261203587
1018
+ name: Cosine Accuracy@10
1019
+ - type: cosine_precision@1
1020
+ value: 0.34699103713188223
1021
+ name: Cosine Precision@1
1022
+ - type: cosine_precision@3
1023
+ value: 0.34528382415706355
1024
+ name: Cosine Precision@3
1025
+ - type: cosine_precision@5
1026
+ value: 0.33533930857874517
1027
+ name: Cosine Precision@5
1028
+ - type: cosine_precision@10
1029
+ value: 0.30550576184379
1030
+ name: Cosine Precision@10
1031
+ - type: cosine_recall@1
1032
+ value: 0.04023580723646711
1033
+ name: Cosine Recall@1
1034
+ - type: cosine_recall@3
1035
+ value: 0.11713599313797275
1036
+ name: Cosine Recall@3
1037
+ - type: cosine_recall@5
1038
+ value: 0.17553870970060761
1039
+ name: Cosine Recall@5
1040
+ - type: cosine_recall@10
1041
+ value: 0.2604238007608957
1042
+ name: Cosine Recall@10
1043
+ - type: cosine_ndcg@10
1044
+ value: 0.36965214083548276
1045
+ name: Cosine Ndcg@10
1046
+ - type: cosine_mrr@10
1047
+ value: 0.35818293599983697
1048
+ name: Cosine Mrr@10
1049
+ - type: cosine_map@100
1050
+ value: 0.4291315309956839
1051
+ name: Cosine Map@100
1052
+ - task:
1053
+ type: information-retrieval
1054
+ name: Information Retrieval
1055
+ dataset:
1056
+ name: dim 64
1057
+ type: dim_64
1058
+ metrics:
1059
+ - type: cosine_accuracy@1
1060
+ value: 0.293854033290653
1061
+ name: Cosine Accuracy@1
1062
+ - type: cosine_accuracy@3
1063
+ value: 0.30153649167733676
1064
+ name: Cosine Accuracy@3
1065
+ - type: cosine_accuracy@5
1066
+ value: 0.32714468629961585
1067
+ name: Cosine Accuracy@5
1068
+ - type: cosine_accuracy@10
1069
+ value: 0.3591549295774648
1070
+ name: Cosine Accuracy@10
1071
+ - type: cosine_precision@1
1072
+ value: 0.293854033290653
1073
+ name: Cosine Precision@1
1074
+ - type: cosine_precision@3
1075
+ value: 0.29449423815621
1076
+ name: Cosine Precision@3
1077
+ - type: cosine_precision@5
1078
+ value: 0.288348271446863
1079
+ name: Cosine Precision@5
1080
+ - type: cosine_precision@10
1081
+ value: 0.2681177976952625
1082
+ name: Cosine Precision@10
1083
+ - type: cosine_recall@1
1084
+ value: 0.03212717718240556
1085
+ name: Cosine Recall@1
1086
+ - type: cosine_recall@3
1087
+ value: 0.0944529143897263
1088
+ name: Cosine Recall@3
1089
+ - type: cosine_recall@5
1090
+ value: 0.14311801944731944
1091
+ name: Cosine Recall@5
1092
+ - type: cosine_recall@10
1093
+ value: 0.221706864386852
1094
+ name: Cosine Recall@10
1095
+ - type: cosine_ndcg@10
1096
+ value: 0.3185372635267884
1097
+ name: Cosine Ndcg@10
1098
+ - type: cosine_mrr@10
1099
+ value: 0.30537518037517997
1100
+ name: Cosine Mrr@10
1101
+ - type: cosine_map@100
1102
+ value: 0.3744361264744976
1103
+ name: Cosine Map@100
1104
+ ---
1105
+
1106
+ # multilingual-e5-large
1107
+
1108
+ This is a [sentence-transformers](https://www.SBERT.net) model finetuned from [intfloat/multilingual-e5-large](https://huggingface.co/intfloat/multilingual-e5-large). It maps sentences & paragraphs to a 1024-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
1109
+
1110
+ ## Model Details
1111
+
1112
+ ### Model Description
1113
+ - **Model Type:** Sentence Transformer
1114
+ - **Base model:** [intfloat/multilingual-e5-large](https://huggingface.co/intfloat/multilingual-e5-large) <!-- at revision 0dc5580a448e4284468b8909bae50fa925907bc5 -->
1115
+ - **Maximum Sequence Length:** 512 tokens
1116
+ - **Output Dimensionality:** 1024 dimensions
1117
+ - **Similarity Function:** Cosine Similarity
1118
+ <!-- - **Training Dataset:** Unknown -->
1119
+ - **Language:** en
1120
+ - **License:** apache-2.0
1121
+
1122
+ ### Model Sources
1123
+
1124
+ - **Documentation:** [Sentence Transformers Documentation](https://sbert.net)
1125
+ - **Repository:** [Sentence Transformers on GitHub](https://github.com/UKPLab/sentence-transformers)
1126
+ - **Hugging Face:** [Sentence Transformers on Hugging Face](https://huggingface.co/models?library=sentence-transformers)
1127
+
1128
+ ### Full Model Architecture
1129
+
1130
+ ```
1131
+ SentenceTransformer(
1132
+ (0): Transformer({'max_seq_length': 512, 'do_lower_case': False, 'architecture': 'XLMRobertaModel'})
1133
+ (1): Pooling({'word_embedding_dimension': 1024, 'pooling_mode_cls_token': False, 'pooling_mode_mean_tokens': True, 'pooling_mode_max_tokens': False, 'pooling_mode_mean_sqrt_len_tokens': False, 'pooling_mode_weightedmean_tokens': False, 'pooling_mode_lasttoken': False, 'include_prompt': True})
1134
+ (2): Normalize()
1135
+ )
1136
+ ```
1137
+
1138
+ ## Usage
1139
+
1140
+ ### Direct Usage (Sentence Transformers)
1141
+
1142
+ First install the Sentence Transformers library:
1143
+
1144
+ ```bash
1145
+ pip install -U sentence-transformers
1146
+ ```
1147
+
1148
+ Then you can load this model and run inference.
1149
+ ```python
1150
+ from sentence_transformers import SentenceTransformer
1151
+
1152
+ # Download from the 🤗 Hub (replace the placeholder ID below with this model's Hub repository ID)
1153
+ model = SentenceTransformer("sentence_transformers_model_id")
1154
+ # Run inference
1155
+ sentences = [
1156
+ 'Who must facilitate the exercise of data subject rights?',
1157
+ '1.The controller shall take appropriate measures to provide any information referred to in Articles 13 and 14 and any communication under Articles 15 to 22 and 34 relating to processing to the data subject in a concise, transparent, intelligible and easily accessible form, using clear and plain language, in particular for any information addressed specifically to a child. The information shall be provided in writing, or by other means, including, where appropriate, by electronic means. When requested by the data subject, the information may be provided orally, provided that the identity of the data subject is proven by other means. 4.5.2016 L 119/39 \n2.The controller shall facilitate the exercise of data subject rights under Articles 15 to 22. In the cases referred to in Article 11(2), the controller shall not refuse to act on the request of the data subject for exercising his or her rights under Articles 15 to 22, unless the controller demonstrates that it is not in a position to identify the data subject.\n3.The controller shall provide information on action taken on a request under Articles 15 to 22 to the data subject without undue delay and in any event within one month of receipt of the request. That period may be extended by two further months where necessary, taking into account the complexity and number of the requests. The controller shall inform the data subject of any such extension within one month of receipt of the request, together with the reasons for the delay. 
Where the data subject makes the request by electronic form means, the information shall be provided by electronic means where possible, unless otherwise requested by the data subject.\n4.If the controller does not take action on the request of the data subject, the controller shall inform the data subject without delay and at the latest within one month of receipt of the request of the reasons for not taking action and on the possibility of lodging a complaint with a supervisory authority and seeking a judicial remedy.\n5.Information provided under Articles 13 and 14 and any communication and any actions taken under Articles 15 to 22 and 34 shall be provided free of charge. Where requests from a data subject are manifestly unfounded or excessive, in particular because of their repetitive character, the controller may either: (a) charge a reasonable fee taking into account the administrative costs of providing the information or communication or taking the action requested; or (b) refuse to act on the request. The controller shall bear the burden of demonstrating the manifestly unfounded or excessive character of the request.\n6.Without prejudice to Article 11, where the controller has reasonable doubts concerning the identity of the natural person making the request referred to in Articles 15 to 21, the controller may request the provision of additional information necessary to confirm the identity of the data subject.\n7.The information to be provided to data subjects pursuant to Articles 13 and 14 may be provided in combination with standardised icons in order to give in an easily visible, intelligible and clearly legible manner a meaningful overview of the intended processing. 
Where the icons are presented electronically they shall be machine-readable.\n8.The Commission shall be empowered to adopt delegated acts in accordance with Article 92 for the purpose of determining the information to be presented by the icons and the procedures for providing standardised icons. Section 2 Information and access to personal data',
1158
+ 'Regulation (EC) No 45/2001 of the European Parliament and of the Council (2) applies to the processing of personal data by the Union institutions, bodies, offices and agencies. Regulation (EC) No 45/2001 and other Union legal acts applicable to such processing of personal data should be adapted to the principles and rules established in this Regulation and applied in the light of this Regulation. In order to provide a strong and coherent data protection framework in the Union, the necessary adaptations of Regulation (EC) No 45/2001 should follow after the adoption of this Regulation, in order to allow application at the same time as this Regulation.',
1159
+ ]
1160
+ embeddings = model.encode(sentences)
1161
+ print(embeddings.shape)
1162
+ # (3, 1024)
1163
+
1164
+ # Get the similarity scores for the embeddings
1165
+ similarities = model.similarity(embeddings, embeddings)
1166
+ print(similarities)
1167
+ # tensor([[1.0000, 0.5502, 0.2948],
1168
+ # [0.5502, 1.0000, 0.2162],
1169
+ # [0.2948, 0.2162, 1.0000]])
1170
+ ```
1171
+
1172
+ <!--
1173
+ ### Direct Usage (Transformers)
1174
+
1175
+ <details><summary>Click to see the direct usage in Transformers</summary>
1176
+
1177
+ </details>
1178
+ -->
1179
+
1180
+ <!--
1181
+ ### Downstream Usage (Sentence Transformers)
1182
+
1183
+ You can finetune this model on your own dataset.
1184
+
1185
+ <details><summary>Click to expand</summary>
1186
+
1187
+ </details>
1188
+ -->
1189
+
1190
+ <!--
1191
+ ### Out-of-Scope Use
1192
+
1193
+ *List how the model may foreseeably be misused and address what users ought not to do with the model.*
1194
+ -->
1195
+
1196
+ ## Evaluation
1197
+
1198
+ ### Metrics
1199
+
1200
+ #### Information Retrieval
1201
+
1202
+ * Dataset: `dim_1024`
1203
+ * Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
1204
+ ```json
1205
+ {
1206
+ "truncate_dim": 1024
1207
+ }
1208
+ ```
1209
+
1210
+ | Metric | Value |
1211
+ |:--------------------|:-----------|
1212
+ | cosine_accuracy@1 | 0.3995 |
1213
+ | cosine_accuracy@3 | 0.4097 |
1214
+ | cosine_accuracy@5 | 0.4424 |
1215
+ | cosine_accuracy@10 | 0.4814 |
1216
+ | cosine_precision@1 | 0.3995 |
1217
+ | cosine_precision@3 | 0.3995 |
1218
+ | cosine_precision@5 | 0.3898 |
1219
+ | cosine_precision@10 | 0.3562 |
1220
+ | cosine_recall@1 | 0.0464 |
1221
+ | cosine_recall@3 | 0.1358 |
1222
+ | cosine_recall@5 | 0.2038 |
1223
+ | cosine_recall@10 | 0.3016 |
1224
+ | **cosine_ndcg@10** | **0.4282** |
1225
+ | cosine_mrr@10 | 0.4141 |
1226
+ | cosine_map@100 | 0.496 |
1227
+
1228
+ #### Information Retrieval
1229
+
1230
+ * Dataset: `dim_768`
1231
+ * Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
1232
+ ```json
1233
+ {
1234
+ "truncate_dim": 768
1235
+ }
1236
+ ```
1237
+
1238
+ | Metric | Value |
1239
+ |:--------------------|:-----------|
1240
+ | cosine_accuracy@1 | 0.3892 |
1241
+ | cosine_accuracy@3 | 0.3995 |
1242
+ | cosine_accuracy@5 | 0.4366 |
1243
+ | cosine_accuracy@10 | 0.4782 |
1244
+ | cosine_precision@1 | 0.3892 |
1245
+ | cosine_precision@3 | 0.3899 |
1246
+ | cosine_precision@5 | 0.3816 |
1247
+ | cosine_precision@10 | 0.3515 |
1248
+ | cosine_recall@1 | 0.0451 |
1249
+ | cosine_recall@3 | 0.1322 |
1250
+ | cosine_recall@5 | 0.1988 |
1251
+ | cosine_recall@10 | 0.2973 |
1252
+ | **cosine_ndcg@10** | **0.4211** |
1253
+ | cosine_mrr@10 | 0.4051 |
1254
+ | cosine_map@100 | 0.488 |
1255
+
1256
+ #### Information Retrieval
1257
+
1258
+ * Dataset: `dim_512`
1259
+ * Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
1260
+ ```json
1261
+ {
1262
+ "truncate_dim": 512
1263
+ }
1264
+ ```
1265
+
1266
+ | Metric | Value |
1267
+ |:--------------------|:----------|
1268
+ | cosine_accuracy@1 | 0.3944 |
1269
+ | cosine_accuracy@3 | 0.4033 |
1270
+ | cosine_accuracy@5 | 0.4328 |
1271
+ | cosine_accuracy@10 | 0.4712 |
1272
+ | cosine_precision@1 | 0.3944 |
1273
+ | cosine_precision@3 | 0.3944 |
1274
+ | cosine_precision@5 | 0.3837 |
1275
+ | cosine_precision@10 | 0.3487 |
1276
+ | cosine_recall@1 | 0.046 |
1277
+ | cosine_recall@3 | 0.1343 |
1278
+ | cosine_recall@5 | 0.2006 |
1279
+ | cosine_recall@10 | 0.2941 |
1280
+ | **cosine_ndcg@10** | **0.421** |
1281
+ | cosine_mrr@10 | 0.4078 |
1282
+ | cosine_map@100 | 0.4838 |
1283
+
1284
+ #### Information Retrieval
1285
+
1286
+ * Dataset: `dim_256`
1287
+ * Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
1288
+ ```json
1289
+ {
1290
+ "truncate_dim": 256
1291
+ }
1292
+ ```
1293
+
1294
+ | Metric | Value |
1295
+ |:--------------------|:-----------|
1296
+ | cosine_accuracy@1 | 0.3764 |
1297
+ | cosine_accuracy@3 | 0.3822 |
1298
+ | cosine_accuracy@5 | 0.4104 |
1299
+ | cosine_accuracy@10 | 0.4533 |
1300
+ | cosine_precision@1 | 0.3764 |
1301
+ | cosine_precision@3 | 0.3758 |
1302
+ | cosine_precision@5 | 0.365 |
1303
+ | cosine_precision@10 | 0.3326 |
1304
+ | cosine_recall@1 | 0.0435 |
1305
+ | cosine_recall@3 | 0.1274 |
1306
+ | cosine_recall@5 | 0.1911 |
1307
+ | cosine_recall@10 | 0.2827 |
1308
+ | **cosine_ndcg@10** | **0.4016** |
1309
+ | cosine_mrr@10 | 0.3892 |
1310
+ | cosine_map@100 | 0.465 |
1311
+
1312
+ #### Information Retrieval
1313
+
1314
+ * Dataset: `dim_128`
1315
+ * Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
1316
+ ```json
1317
+ {
1318
+ "truncate_dim": 128
1319
+ }
1320
+ ```
1321
+
1322
+ | Metric | Value |
1323
+ |:--------------------|:-----------|
1324
+ | cosine_accuracy@1 | 0.347 |
1325
+ | cosine_accuracy@3 | 0.3496 |
1326
+ | cosine_accuracy@5 | 0.379 |
1327
+ | cosine_accuracy@10 | 0.4161 |
1328
+ | cosine_precision@1 | 0.347 |
1329
+ | cosine_precision@3 | 0.3453 |
1330
+ | cosine_precision@5 | 0.3353 |
1331
+ | cosine_precision@10 | 0.3055 |
1332
+ | cosine_recall@1 | 0.0402 |
1333
+ | cosine_recall@3 | 0.1171 |
1334
+ | cosine_recall@5 | 0.1755 |
1335
+ | cosine_recall@10 | 0.2604 |
1336
+ | **cosine_ndcg@10** | **0.3697** |
1337
+ | cosine_mrr@10 | 0.3582 |
1338
+ | cosine_map@100 | 0.4291 |
1339
+
1340
+ #### Information Retrieval
1341
+
1342
+ * Dataset: `dim_64`
1343
+ * Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator) with these parameters:
1344
+ ```json
1345
+ {
1346
+ "truncate_dim": 64
1347
+ }
1348
+ ```
1349
+
1350
+ | Metric | Value |
1351
+ |:--------------------|:-----------|
1352
+ | cosine_accuracy@1 | 0.2939 |
1353
+ | cosine_accuracy@3 | 0.3015 |
1354
+ | cosine_accuracy@5 | 0.3271 |
1355
+ | cosine_accuracy@10 | 0.3592 |
1356
+ | cosine_precision@1 | 0.2939 |
1357
+ | cosine_precision@3 | 0.2945 |
1358
+ | cosine_precision@5 | 0.2883 |
1359
+ | cosine_precision@10 | 0.2681 |
1360
+ | cosine_recall@1 | 0.0321 |
1361
+ | cosine_recall@3 | 0.0945 |
1362
+ | cosine_recall@5 | 0.1431 |
1363
+ | cosine_recall@10 | 0.2217 |
1364
+ | **cosine_ndcg@10** | **0.3185** |
1365
+ | cosine_mrr@10 | 0.3054 |
1366
+ | cosine_map@100 | 0.3744 |
1367
+
1368
+ <!--
1369
+ ## Bias, Risks and Limitations
1370
+
1371
+ *What are the known or foreseeable issues stemming from this model? You could also flag here known failure cases or weaknesses of the model.*
1372
+ -->
1373
+
1374
+ <!--
1375
+ ### Recommendations
1376
+
1377
+ *What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
1378
+ -->
1379
+
1380
+ ## Training Details
1381
+
1382
+ ### Training Dataset
1383
+
1384
+ #### Unnamed Dataset
1385
+
1386
+ * Size: 391 training samples
1387
+ * Columns: <code>anchor</code> and <code>positive</code>
1388
+ * Approximate statistics based on the first 391 samples:
1389
+ | | anchor | positive |
1390
+ |:--------|:----------------------------------------------------------------------------------|:-------------------------------------------------------------------------------------|
1391
+ | type | string | string |
1392
+ | details | <ul><li>min: 8 tokens</li><li>mean: 17.16 tokens</li><li>max: 32 tokens</li></ul> | <ul><li>min: 27 tokens</li><li>mean: 377.93 tokens</li><li>max: 512 tokens</li></ul> |
1393
+ * Samples:
1394
+ | anchor | positive |
1395
+ |:-------------------------------------------------------------------------------------------------------------------------------|:---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|
1396
+ | <code>What measures must be taken according to Article 32?</code> | <code>1.Where processing is to be carried out on behalf of a controller, the controller shall use only processors providing sufficient guarantees to implement appropriate technical and organisational measures in such a manner that processing will meet the requirements of this Regulation and ensure the protection of the rights of the data subject.<br>2.The processor shall not engage another processor without prior specific or general written authorisation of the controller. In the case of general written authorisation, the processor shall inform the controller of any intended changes concerning the addition or replacement of other processors, thereby giving the controller the opportunity to object to such changes.<br>3.Processing by a processor shall be governed by a contract or other legal act under Union or Member State law, that is binding on the processor with regard to the controller and that sets out the subject-matter and duration of the processing, the nature and purpose of the processing, ...</code> |
1397
+ | <code>What is the responsibility of assisting and advising the data subjects in exercising their rights?</code> | <code>1.A transfer of personal data to a third country or an international organisation may take place where the Commission has decided that the third country, a territory or one or more specified sectors within that third country, or the international organisation in question ensures an adequate level of protection. Such a transfer shall not require any specific authorisation.<br>2.When assessing the adequacy of the level of protection, the Commission shall, in particular, take account of the following elements: (a) the rule of law, respect for human rights and fundamental freedoms, relevant legislation, both general and sectoral, including concerning public security, defence, national security and criminal law and the access of public authorities to personal data, as well as the implementation of such legislation, data protection rules, professional rules and security measures, including rules for the onward transfer of personal data to another third country or international organisation whi...</code> |
1398
+ | <code>What should Member States be authorized to provide for regarding personal data processing for archiving purposes?</code> | <code>Where personal data are processed for archiving purposes, this Regulation should also apply to that processing, bearing in mind that this Regulation should not apply to deceased persons. Public authorities or public or private bodies that hold records of public interest should be services which, pursuant to Union or Member State law, have a legal obligation to acquire, preserve, appraise, arrange, describe, communicate, promote, disseminate and provide access to records of enduring value for general public interest. Member States should also be authorised to provide for the further processing of personal data for archiving purposes, for example with a view to providing specific information related to the political behaviour under former totalitarian state regimes, genocide, crimes against humanity, in particular the Holocaust, or war crimes. 4.5.2016 L 119/29 Official Journal of the European Union EN</code> |
1399
+ * Loss: [<code>MatryoshkaLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#matryoshkaloss) with these parameters:
1400
+ ```json
1401
+ {
1402
+ "loss": "MultipleNegativesRankingLoss",
1403
+ "matryoshka_dims": [
1404
+ 1024,
1405
+ 768,
1406
+ 512,
1407
+ 256,
1408
+ 128,
1409
+ 64
1410
+ ],
1411
+ "matryoshka_weights": [
1412
+ 1,
1413
+ 1,
1414
+ 1,
1415
+ 1,
1416
+ 1,
1417
+ 1
1418
+ ],
1419
+ "n_dims_per_step": -1
1420
+ }
1421
+ ```
1422
+
1423
+ ### Training Hyperparameters
1424
+ #### Non-Default Hyperparameters
1425
+
1426
+ - `eval_strategy`: epoch
1427
+ - `per_device_eval_batch_size`: 16
1428
+ - `gradient_accumulation_steps`: 4
1429
+ - `learning_rate`: 2e-05
1430
+ - `num_train_epochs`: 20
1431
+ - `lr_scheduler_type`: cosine
1432
+ - `warmup_ratio`: 0.1
1433
+ - `bf16`: True
1434
+ - `load_best_model_at_end`: True
1435
+ - `optim`: adamw_torch_fused
1436
+ - `batch_sampler`: no_duplicates
1437
+
1438
+ #### All Hyperparameters
1439
+ <details><summary>Click to expand</summary>
1440
+
1441
+ - `overwrite_output_dir`: False
1442
+ - `do_predict`: False
1443
+ - `eval_strategy`: epoch
1444
+ - `prediction_loss_only`: True
1445
+ - `per_device_train_batch_size`: 8
1446
+ - `per_device_eval_batch_size`: 16
1447
+ - `per_gpu_train_batch_size`: None
1448
+ - `per_gpu_eval_batch_size`: None
1449
+ - `gradient_accumulation_steps`: 4
1450
+ - `eval_accumulation_steps`: None
1451
+ - `torch_empty_cache_steps`: None
1452
+ - `learning_rate`: 2e-05
1453
+ - `weight_decay`: 0.0
1454
+ - `adam_beta1`: 0.9
1455
+ - `adam_beta2`: 0.999
1456
+ - `adam_epsilon`: 1e-08
1457
+ - `max_grad_norm`: 1.0
1458
+ - `num_train_epochs`: 20
1459
+ - `max_steps`: -1
1460
+ - `lr_scheduler_type`: cosine
1461
+ - `lr_scheduler_kwargs`: {}
1462
+ - `warmup_ratio`: 0.1
1463
+ - `warmup_steps`: 0
1464
+ - `log_level`: passive
1465
+ - `log_level_replica`: warning
1466
+ - `log_on_each_node`: True
1467
+ - `logging_nan_inf_filter`: True
1468
+ - `save_safetensors`: True
1469
+ - `save_on_each_node`: False
1470
+ - `save_only_model`: False
1471
+ - `restore_callback_states_from_checkpoint`: False
1472
+ - `no_cuda`: False
1473
+ - `use_cpu`: False
1474
+ - `use_mps_device`: False
1475
+ - `seed`: 42
1476
+ - `data_seed`: None
1477
+ - `jit_mode_eval`: False
1478
+ - `use_ipex`: False
1479
+ - `bf16`: True
1480
+ - `fp16`: False
1481
+ - `fp16_opt_level`: O1
1482
+ - `half_precision_backend`: auto
1483
+ - `bf16_full_eval`: False
1484
+ - `fp16_full_eval`: False
1485
+ - `tf32`: None
1486
+ - `local_rank`: 0
1487
+ - `ddp_backend`: None
1488
+ - `tpu_num_cores`: None
1489
+ - `tpu_metrics_debug`: False
1490
+ - `debug`: []
1491
+ - `dataloader_drop_last`: False
1492
+ - `dataloader_num_workers`: 0
1493
+ - `dataloader_prefetch_factor`: None
1494
+ - `past_index`: -1
1495
+ - `disable_tqdm`: False
1496
+ - `remove_unused_columns`: True
1497
+ - `label_names`: None
1498
+ - `load_best_model_at_end`: True
1499
+ - `ignore_data_skip`: False
1500
+ - `fsdp`: []
1501
+ - `fsdp_min_num_params`: 0
1502
+ - `fsdp_config`: {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}
1503
+ - `tp_size`: 0
1504
+ - `fsdp_transformer_layer_cls_to_wrap`: None
1505
+ - `accelerator_config`: {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}
1506
+ - `deepspeed`: None
1507
+ - `label_smoothing_factor`: 0.0
1508
+ - `optim`: adamw_torch_fused
1509
+ - `optim_args`: None
1510
+ - `adafactor`: False
1511
+ - `group_by_length`: False
1512
+ - `length_column_name`: length
1513
+ - `ddp_find_unused_parameters`: None
1514
+ - `ddp_bucket_cap_mb`: None
1515
+ - `ddp_broadcast_buffers`: False
1516
+ - `dataloader_pin_memory`: True
1517
+ - `dataloader_persistent_workers`: False
1518
+ - `skip_memory_metrics`: True
1519
+ - `use_legacy_prediction_loop`: False
1520
+ - `push_to_hub`: False
1521
+ - `resume_from_checkpoint`: None
1522
+ - `hub_model_id`: None
1523
+ - `hub_strategy`: every_save
1524
+ - `hub_private_repo`: None
1525
+ - `hub_always_push`: False
1526
+ - `gradient_checkpointing`: False
1527
+ - `gradient_checkpointing_kwargs`: None
1528
+ - `include_inputs_for_metrics`: False
1529
+ - `include_for_metrics`: []
1530
+ - `eval_do_concat_batches`: True
1531
+ - `fp16_backend`: auto
1532
+ - `push_to_hub_model_id`: None
1533
+ - `push_to_hub_organization`: None
1534
+ - `mp_parameters`:
1535
+ - `auto_find_batch_size`: False
1536
+ - `full_determinism`: False
1537
+ - `torchdynamo`: None
1538
+ - `ray_scope`: last
1539
+ - `ddp_timeout`: 1800
1540
+ - `torch_compile`: False
1541
+ - `torch_compile_backend`: None
1542
+ - `torch_compile_mode`: None
1543
+ - `include_tokens_per_second`: False
1544
+ - `include_num_input_tokens_seen`: False
1545
+ - `neftune_noise_alpha`: None
1546
+ - `optim_target_modules`: None
1547
+ - `batch_eval_metrics`: False
1548
+ - `eval_on_start`: False
1549
+ - `use_liger_kernel`: False
1550
+ - `eval_use_gather_object`: False
1551
+ - `average_tokens_across_devices`: False
1552
+ - `prompts`: None
1553
+ - `batch_sampler`: no_duplicates
1554
+ - `multi_dataset_batch_sampler`: proportional
1555
+ - `router_mapping`: {}
1556
+ - `learning_rate_mapping`: {}
1557
+
1558
+ </details>
1559
+
1560
+ ### Training Logs
1561
+ | Epoch | Step | Training Loss | dim_1024_cosine_ndcg@10 | dim_768_cosine_ndcg@10 | dim_512_cosine_ndcg@10 | dim_256_cosine_ndcg@10 | dim_128_cosine_ndcg@10 | dim_64_cosine_ndcg@10 |
1562
+ |:------:|:----:|:-------------:|:-----------------------:|:----------------------:|:----------------------:|:----------------------:|:----------------------:|:---------------------:|
1563
+ | 0.8163 | 10 | 31.5155 | - | - | - | - | - | - |
1564
+ | 1.0 | 13 | - | 0.4494 | 0.4446 | 0.4364 | 0.3947 | 0.3362 | 0.2621 |
1565
+ | 1.5714 | 20 | 19.0409 | - | - | - | - | - | - |
1566
+ | 2.0 | 26 | - | 0.4065 | 0.4004 | 0.4013 | 0.3692 | 0.3418 | 0.2882 |
1567
+ | 2.3265 | 30 | 14.5314 | - | - | - | - | - | - |
1568
+ | 3.0 | 39 | - | 0.4418 | 0.4350 | 0.4329 | 0.4087 | 0.3714 | 0.3372 |
1569
+ | 3.0816 | 40 | 8.6778 | - | - | - | - | - | - |
1570
+ | 3.8980 | 50 | 6.0257 | - | - | - | - | - | - |
1571
+ | 4.0 | 52 | - | 0.4291 | 0.4244 | 0.4282 | 0.3980 | 0.3677 | 0.3275 |
1572
+ | 4.6531 | 60 | 3.3524 | - | - | - | - | - | - |
1573
+ | 5.0 | 65 | - | 0.4282 | 0.4211 | 0.4210 | 0.4016 | 0.3697 | 0.3185 |
1574
+
1575
+
1576
+ ### Framework Versions
1577
+ - Python: 3.12.11
1578
+ - Sentence Transformers: 5.1.0
1579
+ - Transformers: 4.51.3
1580
+ - PyTorch: 2.8.0+cu126
1581
+ - Accelerate: 1.10.1
1582
+ - Datasets: 4.0.0
1583
+ - Tokenizers: 0.21.4
1584
+
1585
+ ## Citation
1586
+
1587
+ ### BibTeX
1588
+
1589
+ #### Sentence Transformers
1590
+ ```bibtex
1591
+ @inproceedings{reimers-2019-sentence-bert,
1592
+ title = "Sentence-BERT: Sentence Embeddings using Siamese BERT-Networks",
1593
+ author = "Reimers, Nils and Gurevych, Iryna",
1594
+ booktitle = "Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing",
1595
+ month = "11",
1596
+ year = "2019",
1597
+ publisher = "Association for Computational Linguistics",
1598
+ url = "https://arxiv.org/abs/1908.10084",
1599
+ }
1600
+ ```
1601
+
1602
+ #### MatryoshkaLoss
1603
+ ```bibtex
1604
+ @misc{kusupati2024matryoshka,
1605
+ title={Matryoshka Representation Learning},
1606
+ author={Aditya Kusupati and Gantavya Bhatt and Aniket Rege and Matthew Wallingford and Aditya Sinha and Vivek Ramanujan and William Howard-Snyder and Kaifeng Chen and Sham Kakade and Prateek Jain and Ali Farhadi},
1607
+ year={2024},
1608
+ eprint={2205.13147},
1609
+ archivePrefix={arXiv},
1610
+ primaryClass={cs.LG}
1611
+ }
1612
+ ```
1613
+
1614
+ #### MultipleNegativesRankingLoss
1615
+ ```bibtex
1616
+ @misc{henderson2017efficient,
1617
+ title={Efficient Natural Language Response Suggestion for Smart Reply},
1618
+ author={Matthew Henderson and Rami Al-Rfou and Brian Strope and Yun-hsuan Sung and Laszlo Lukacs and Ruiqi Guo and Sanjiv Kumar and Balint Miklos and Ray Kurzweil},
1619
+ year={2017},
1620
+ eprint={1705.00652},
1621
+ archivePrefix={arXiv},
1622
+ primaryClass={cs.CL}
1623
+ }
1624
+ ```
1625
+
1626
+ <!--
1627
+ ## Glossary
1628
+
1629
+ *Clearly define terms in order to be accessible across audiences.*
1630
+ -->
1631
+
1632
+ <!--
1633
+ ## Model Card Authors
1634
+
1635
+ *Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
1636
+ -->
1637
+
1638
+ <!--
1639
+ ## Model Card Contact
1640
+
1641
+ *Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
1642
+ -->
checkpoint-65/config.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "XLMRobertaModel"
4
+ ],
5
+ "attention_probs_dropout_prob": 0.1,
6
+ "bos_token_id": 0,
7
+ "classifier_dropout": null,
8
+ "eos_token_id": 2,
9
+ "hidden_act": "gelu",
10
+ "hidden_dropout_prob": 0.1,
11
+ "hidden_size": 1024,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 4096,
14
+ "layer_norm_eps": 1e-05,
15
+ "max_position_embeddings": 514,
16
+ "model_type": "xlm-roberta",
17
+ "num_attention_heads": 16,
18
+ "num_hidden_layers": 24,
19
+ "output_past": true,
20
+ "pad_token_id": 1,
21
+ "position_embedding_type": "absolute",
22
+ "torch_dtype": "float32",
23
+ "transformers_version": "4.51.3",
24
+ "type_vocab_size": 1,
25
+ "use_cache": true,
26
+ "vocab_size": 250002
27
+ }
checkpoint-65/config_sentence_transformers.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_type": "SentenceTransformer",
3
+ "__version__": {
4
+ "sentence_transformers": "5.1.0",
5
+ "transformers": "4.51.3",
6
+ "pytorch": "2.8.0+cu126"
7
+ },
8
+ "prompts": {
9
+ "query": "",
10
+ "document": ""
11
+ },
12
+ "default_prompt_name": null,
13
+ "similarity_fn_name": "cosine"
14
+ }
checkpoint-65/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e170532ef3cecf660eb98f4bc34e8207df70da0a192758efcd848948ff933df
3
+ size 2239607176
checkpoint-65/modules.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "idx": 0,
4
+ "name": "0",
5
+ "path": "",
6
+ "type": "sentence_transformers.models.Transformer"
7
+ },
8
+ {
9
+ "idx": 1,
10
+ "name": "1",
11
+ "path": "1_Pooling",
12
+ "type": "sentence_transformers.models.Pooling"
13
+ },
14
+ {
15
+ "idx": 2,
16
+ "name": "2",
17
+ "path": "2_Normalize",
18
+ "type": "sentence_transformers.models.Normalize"
19
+ }
20
+ ]
checkpoint-65/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7dffac8a08fff2e6cb35978f0a34cfe908c3cc4bad0a978bff7eb74ebbde769
3
+ size 4471067142
checkpoint-65/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26eefef1027f0f7e30b8f30bcbc2af10d09f3fd1f25108c7d6c3ba95b4ac3eb4
3
+ size 14645
checkpoint-65/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ea60534e714390f38db0d7748b2fa3b78ae93b7334ba633bbe797337eca2eae
3
+ size 1465
checkpoint-65/sentence_bert_config.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "max_seq_length": 512,
3
+ "do_lower_case": false
4
+ }
checkpoint-65/sentencepiece.bpe.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865
3
+ size 5069051
checkpoint-65/special_tokens_map.json ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<s>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "cls_token": {
10
+ "content": "<s>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "eos_token": {
17
+ "content": "</s>",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "mask_token": {
24
+ "content": "<mask>",
25
+ "lstrip": true,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ },
30
+ "pad_token": {
31
+ "content": "<pad>",
32
+ "lstrip": false,
33
+ "normalized": false,
34
+ "rstrip": false,
35
+ "single_word": false
36
+ },
37
+ "sep_token": {
38
+ "content": "</s>",
39
+ "lstrip": false,
40
+ "normalized": false,
41
+ "rstrip": false,
42
+ "single_word": false
43
+ },
44
+ "unk_token": {
45
+ "content": "<unk>",
46
+ "lstrip": false,
47
+ "normalized": false,
48
+ "rstrip": false,
49
+ "single_word": false
50
+ }
51
+ }
checkpoint-65/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:883b037111086fd4dfebbbc9b7cee11e1517b5e0c0514879478661440f137085
3
+ size 17082987
checkpoint-65/tokenizer_config.json ADDED
@@ -0,0 +1,55 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "<s>",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "1": {
12
+ "content": "<pad>",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "2": {
20
+ "content": "</s>",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "3": {
28
+ "content": "<unk>",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "250001": {
36
+ "content": "<mask>",
37
+ "lstrip": true,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ }
43
+ },
44
+ "bos_token": "<s>",
45
+ "clean_up_tokenization_spaces": true,
46
+ "cls_token": "<s>",
47
+ "eos_token": "</s>",
48
+ "extra_special_tokens": {},
49
+ "mask_token": "<mask>",
50
+ "model_max_length": 512,
51
+ "pad_token": "<pad>",
52
+ "sep_token": "</s>",
53
+ "tokenizer_class": "XLMRobertaTokenizer",
54
+ "unk_token": "<unk>"
55
+ }
checkpoint-65/trainer_state.json ADDED
@@ -0,0 +1,575 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_global_step": 39,
3
+ "best_metric": 0.37139192897263235,
4
+ "best_model_checkpoint": "intfloat/multilingual-e5-large/checkpoint-39",
5
+ "epoch": 5.0,
6
+ "eval_steps": 500,
7
+ "global_step": 65,
8
+ "is_hyper_param_search": false,
9
+ "is_local_process_zero": true,
10
+ "is_world_process_zero": true,
11
+ "log_history": [
12
+ {
13
+ "epoch": 0.8163265306122449,
14
+ "grad_norm": 307.08624267578125,
15
+ "learning_rate": 7.500000000000001e-06,
16
+ "loss": 31.5155,
17
+ "step": 10
18
+ },
19
+ {
20
+ "epoch": 1.0,
21
+ "eval_dim_1024_cosine_accuracy@1": 0.42509603072983354,
22
+ "eval_dim_1024_cosine_accuracy@10": 0.49295774647887325,
23
+ "eval_dim_1024_cosine_accuracy@3": 0.43085787451984636,
24
+ "eval_dim_1024_cosine_accuracy@5": 0.46030729833546735,
25
+ "eval_dim_1024_cosine_map@100": 0.508986346237021,
26
+ "eval_dim_1024_cosine_mrr@10": 0.4369535394183281,
27
+ "eval_dim_1024_cosine_ndcg@10": 0.4493804868009024,
28
+ "eval_dim_1024_cosine_precision@1": 0.42509603072983354,
29
+ "eval_dim_1024_cosine_precision@10": 0.376056338028169,
30
+ "eval_dim_1024_cosine_precision@3": 0.42402902262057185,
31
+ "eval_dim_1024_cosine_precision@5": 0.4133162612035851,
32
+ "eval_dim_1024_cosine_recall@1": 0.04813624827530403,
33
+ "eval_dim_1024_cosine_recall@10": 0.3150476790176975,
34
+ "eval_dim_1024_cosine_recall@3": 0.1404092551990217,
35
+ "eval_dim_1024_cosine_recall@5": 0.21147403835662126,
36
+ "eval_dim_128_cosine_accuracy@1": 0.31370038412291934,
37
+ "eval_dim_128_cosine_accuracy@10": 0.38156209987195905,
38
+ "eval_dim_128_cosine_accuracy@3": 0.31946222791293216,
39
+ "eval_dim_128_cosine_accuracy@5": 0.34571062740076824,
40
+ "eval_dim_128_cosine_map@100": 0.3991669558616212,
41
+ "eval_dim_128_cosine_mrr@10": 0.32517427799117904,
42
+ "eval_dim_128_cosine_ndcg@10": 0.33618283481296385,
43
+ "eval_dim_128_cosine_precision@1": 0.31370038412291934,
44
+ "eval_dim_128_cosine_precision@10": 0.2764404609475032,
45
+ "eval_dim_128_cosine_precision@3": 0.31284677763551,
46
+ "eval_dim_128_cosine_precision@5": 0.30422535211267604,
47
+ "eval_dim_128_cosine_recall@1": 0.037933385936292925,
48
+ "eval_dim_128_cosine_recall@10": 0.24798465115464788,
49
+ "eval_dim_128_cosine_recall@3": 0.11100168654049715,
50
+ "eval_dim_128_cosine_recall@5": 0.1670926413559068,
51
+ "eval_dim_256_cosine_accuracy@1": 0.36427656850192064,
52
+ "eval_dim_256_cosine_accuracy@10": 0.44814340588988477,
53
+ "eval_dim_256_cosine_accuracy@3": 0.36939820742637647,
54
+ "eval_dim_256_cosine_accuracy@5": 0.4090909090909091,
55
+ "eval_dim_256_cosine_map@100": 0.45841270037343096,
56
+ "eval_dim_256_cosine_mrr@10": 0.37879397597707415,
57
+ "eval_dim_256_cosine_ndcg@10": 0.3947006636735062,
58
+ "eval_dim_256_cosine_precision@1": 0.36427656850192064,
59
+ "eval_dim_256_cosine_precision@10": 0.3289372599231754,
60
+ "eval_dim_256_cosine_precision@3": 0.36363636363636365,
61
+ "eval_dim_256_cosine_precision@5": 0.3560819462227913,
62
+ "eval_dim_256_cosine_recall@1": 0.04277277943657814,
63
+ "eval_dim_256_cosine_recall@10": 0.28617844199333936,
64
+ "eval_dim_256_cosine_recall@3": 0.1253991943934714,
65
+ "eval_dim_256_cosine_recall@5": 0.18947388504512186,
66
+ "eval_dim_512_cosine_accuracy@1": 0.4084507042253521,
67
+ "eval_dim_512_cosine_accuracy@10": 0.4871959026888604,
68
+ "eval_dim_512_cosine_accuracy@3": 0.41357234314980795,
69
+ "eval_dim_512_cosine_accuracy@5": 0.4519846350832266,
70
+ "eval_dim_512_cosine_map@100": 0.495554245202425,
71
+ "eval_dim_512_cosine_mrr@10": 0.42213127248338495,
72
+ "eval_dim_512_cosine_ndcg@10": 0.43644305450989757,
73
+ "eval_dim_512_cosine_precision@1": 0.4084507042253521,
74
+ "eval_dim_512_cosine_precision@10": 0.36606914212548014,
75
+ "eval_dim_512_cosine_precision@3": 0.40738369611609043,
76
+ "eval_dim_512_cosine_precision@5": 0.39846350832266325,
77
+ "eval_dim_512_cosine_recall@1": 0.04628035514721453,
78
+ "eval_dim_512_cosine_recall@10": 0.30419701916496145,
79
+ "eval_dim_512_cosine_recall@3": 0.13522898183596205,
80
+ "eval_dim_512_cosine_recall@5": 0.20394662187726964,
81
+ "eval_dim_64_cosine_accuracy@1": 0.24199743918053776,
82
+ "eval_dim_64_cosine_accuracy@10": 0.29641485275288093,
83
+ "eval_dim_64_cosine_accuracy@3": 0.24775928297055058,
84
+ "eval_dim_64_cosine_accuracy@5": 0.26952624839948786,
85
+ "eval_dim_64_cosine_map@100": 0.31803601064541553,
86
+ "eval_dim_64_cosine_mrr@10": 0.25159771761884414,
87
+ "eval_dim_64_cosine_ndcg@10": 0.2620553065689597,
88
+ "eval_dim_64_cosine_precision@1": 0.24199743918053776,
89
+ "eval_dim_64_cosine_precision@10": 0.21568501920614594,
90
+ "eval_dim_64_cosine_precision@3": 0.24199743918053776,
91
+ "eval_dim_64_cosine_precision@5": 0.23649167733674775,
92
+ "eval_dim_64_cosine_recall@1": 0.029110868794154622,
93
+ "eval_dim_64_cosine_recall@10": 0.19521971714475267,
94
+ "eval_dim_64_cosine_recall@3": 0.08524734139651896,
95
+ "eval_dim_64_cosine_recall@5": 0.12921904680249943,
96
+ "eval_dim_768_cosine_accuracy@1": 0.4193341869398207,
97
+ "eval_dim_768_cosine_accuracy@10": 0.4910371318822023,
98
+ "eval_dim_768_cosine_accuracy@3": 0.4238156209987196,
99
+ "eval_dim_768_cosine_accuracy@5": 0.4551856594110115,
100
+ "eval_dim_768_cosine_map@100": 0.5037778776293926,
101
+ "eval_dim_768_cosine_mrr@10": 0.4315339003719285,
102
+ "eval_dim_768_cosine_ndcg@10": 0.44456410503401034,
103
+ "eval_dim_768_cosine_precision@1": 0.4193341869398207,
104
+ "eval_dim_768_cosine_precision@10": 0.37272727272727274,
105
+ "eval_dim_768_cosine_precision@3": 0.4180537772087068,
106
+ "eval_dim_768_cosine_precision@5": 0.4076824583866837,
107
+ "eval_dim_768_cosine_recall@1": 0.04699592881851732,
108
+ "eval_dim_768_cosine_recall@10": 0.3107289399017082,
109
+ "eval_dim_768_cosine_recall@3": 0.13721565163348118,
110
+ "eval_dim_768_cosine_recall@5": 0.20710427114944024,
111
+ "eval_runtime": 98.6525,
112
+ "eval_samples_per_second": 0.0,
113
+ "eval_sequential_score": 0.2620553065689597,
114
+ "eval_steps_per_second": 0.0,
115
+ "step": 13
116
+ },
117
+ {
118
+ "epoch": 1.5714285714285714,
119
+ "grad_norm": 280.07818603515625,
120
+ "learning_rate": 1.5833333333333333e-05,
121
+ "loss": 19.0409,
122
+ "step": 20
123
+ },
124
+ {
125
+ "epoch": 2.0,
126
+ "eval_dim_1024_cosine_accuracy@1": 0.3854033290653009,
127
+ "eval_dim_1024_cosine_accuracy@10": 0.45454545454545453,
128
+ "eval_dim_1024_cosine_accuracy@3": 0.3886043533930858,
129
+ "eval_dim_1024_cosine_accuracy@5": 0.41101152368758004,
130
+ "eval_dim_1024_cosine_map@100": 0.47259820099791205,
131
+ "eval_dim_1024_cosine_mrr@10": 0.39624870434729537,
132
+ "eval_dim_1024_cosine_ndcg@10": 0.4065329035406967,
133
+ "eval_dim_1024_cosine_precision@1": 0.3854033290653009,
134
+ "eval_dim_1024_cosine_precision@10": 0.3357874519846351,
135
+ "eval_dim_1024_cosine_precision@3": 0.3839095177123346,
136
+ "eval_dim_1024_cosine_precision@5": 0.3713188220230474,
137
+ "eval_dim_1024_cosine_recall@1": 0.0451686782205082,
138
+ "eval_dim_1024_cosine_recall@10": 0.2918225395020212,
139
+ "eval_dim_1024_cosine_recall@3": 0.13200270380544088,
140
+ "eval_dim_1024_cosine_recall@5": 0.19735476247586825,
141
+ "eval_dim_128_cosine_accuracy@1": 0.31562099871959026,
142
+ "eval_dim_128_cosine_accuracy@10": 0.39180537772087065,
143
+ "eval_dim_128_cosine_accuracy@3": 0.3207426376440461,
144
+ "eval_dim_128_cosine_accuracy@5": 0.352112676056338,
145
+ "eval_dim_128_cosine_map@100": 0.40471008477532144,
146
+ "eval_dim_128_cosine_mrr@10": 0.32839105339105285,
147
+ "eval_dim_128_cosine_ndcg@10": 0.34177784905202935,
148
+ "eval_dim_128_cosine_precision@1": 0.31562099871959026,
149
+ "eval_dim_128_cosine_precision@10": 0.280729833546735,
150
+ "eval_dim_128_cosine_precision@3": 0.31455399061032857,
151
+ "eval_dim_128_cosine_precision@5": 0.30640204865556975,
152
+ "eval_dim_128_cosine_recall@1": 0.03888088094516579,
153
+ "eval_dim_128_cosine_recall@10": 0.2550464126190524,
154
+ "eval_dim_128_cosine_recall@3": 0.11341113256173359,
155
+ "eval_dim_128_cosine_recall@5": 0.17046484922169536,
156
+ "eval_dim_256_cosine_accuracy@1": 0.3418693982074264,
157
+ "eval_dim_256_cosine_accuracy@10": 0.4238156209987196,
158
+ "eval_dim_256_cosine_accuracy@3": 0.34763124199743917,
159
+ "eval_dim_256_cosine_accuracy@5": 0.38092189500640206,
160
+ "eval_dim_256_cosine_map@100": 0.43770217754051305,
161
+ "eval_dim_256_cosine_mrr@10": 0.35596482938032165,
162
+ "eval_dim_256_cosine_ndcg@10": 0.36923043791328775,
163
+ "eval_dim_256_cosine_precision@1": 0.3418693982074264,
164
+ "eval_dim_256_cosine_precision@10": 0.30441741357234314,
165
+ "eval_dim_256_cosine_precision@3": 0.34165599658557405,
166
+ "eval_dim_256_cosine_precision@5": 0.3322663252240717,
167
+ "eval_dim_256_cosine_recall@1": 0.041410929155814194,
168
+ "eval_dim_256_cosine_recall@10": 0.2705196189189818,
169
+ "eval_dim_256_cosine_recall@3": 0.1212642412965687,
170
+ "eval_dim_256_cosine_recall@5": 0.18173918651563936,
171
+ "eval_dim_512_cosine_accuracy@1": 0.37708066581306016,
172
+ "eval_dim_512_cosine_accuracy@10": 0.4532650448143406,
173
+ "eval_dim_512_cosine_accuracy@3": 0.38092189500640206,
174
+ "eval_dim_512_cosine_accuracy@5": 0.4084507042253521,
175
+ "eval_dim_512_cosine_map@100": 0.4678017780580059,
176
+ "eval_dim_512_cosine_mrr@10": 0.3893670101416575,
177
+ "eval_dim_512_cosine_ndcg@10": 0.40127522003513455,
178
+ "eval_dim_512_cosine_precision@1": 0.37708066581306016,
179
+ "eval_dim_512_cosine_precision@10": 0.33156209987195906,
180
+ "eval_dim_512_cosine_precision@3": 0.37537345283824153,
181
+ "eval_dim_512_cosine_precision@5": 0.36402048655569774,
182
+ "eval_dim_512_cosine_recall@1": 0.04457309853297402,
183
+ "eval_dim_512_cosine_recall@10": 0.2883968018428671,
184
+ "eval_dim_512_cosine_recall@3": 0.13007205872054822,
185
+ "eval_dim_512_cosine_recall@5": 0.19449520589871025,
186
+ "eval_dim_64_cosine_accuracy@1": 0.26696542893725994,
187
+ "eval_dim_64_cosine_accuracy@10": 0.33098591549295775,
188
+ "eval_dim_64_cosine_accuracy@3": 0.27208706786171577,
189
+ "eval_dim_64_cosine_accuracy@5": 0.293213828425096,
190
+ "eval_dim_64_cosine_map@100": 0.34719730722747555,
191
+ "eval_dim_64_cosine_mrr@10": 0.2776957197731842,
192
+ "eval_dim_64_cosine_ndcg@10": 0.2881905192612941,
193
+ "eval_dim_64_cosine_precision@1": 0.26696542893725994,
194
+ "eval_dim_64_cosine_precision@10": 0.237708066581306,
195
+ "eval_dim_64_cosine_precision@3": 0.26717883055911223,
196
+ "eval_dim_64_cosine_precision@5": 0.2596670934699104,
197
+ "eval_dim_64_cosine_recall@1": 0.031692344067516816,
198
+ "eval_dim_64_cosine_recall@10": 0.21473974122936995,
199
+ "eval_dim_64_cosine_recall@3": 0.09327455064654774,
200
+ "eval_dim_64_cosine_recall@5": 0.14131510912407144,
201
+ "eval_dim_768_cosine_accuracy@1": 0.37451984635083224,
202
+ "eval_dim_768_cosine_accuracy@10": 0.4539052496798976,
203
+ "eval_dim_768_cosine_accuracy@3": 0.37900128040973113,
204
+ "eval_dim_768_cosine_accuracy@5": 0.40973111395646605,
205
+ "eval_dim_768_cosine_map@100": 0.4672061011440217,
206
+ "eval_dim_768_cosine_mrr@10": 0.38746671950897227,
207
+ "eval_dim_768_cosine_ndcg@10": 0.4004027303245026,
208
+ "eval_dim_768_cosine_precision@1": 0.37451984635083224,
209
+ "eval_dim_768_cosine_precision@10": 0.3318181818181818,
210
+ "eval_dim_768_cosine_precision@3": 0.3734528382415706,
211
+ "eval_dim_768_cosine_precision@5": 0.3632522407170295,
212
+ "eval_dim_768_cosine_recall@1": 0.04413921317349132,
213
+ "eval_dim_768_cosine_recall@10": 0.28955317519546525,
214
+ "eval_dim_768_cosine_recall@3": 0.12896663310051748,
215
+ "eval_dim_768_cosine_recall@5": 0.19376203165061448,
216
+ "eval_runtime": 98.4244,
217
+ "eval_samples_per_second": 0.0,
218
+ "eval_sequential_score": 0.2881905192612941,
219
+ "eval_steps_per_second": 0.0,
220
+ "step": 26
221
+ },
222
+ {
223
+ "epoch": 2.326530612244898,
224
+ "grad_norm": 305.66259765625,
225
+ "learning_rate": 1.9973569167005725e-05,
226
+ "loss": 14.5314,
227
+ "step": 30
228
+ },
229
+ {
230
+ "epoch": 3.0,
231
+ "eval_dim_1024_cosine_accuracy@1": 0.4180537772087068,
232
+ "eval_dim_1024_cosine_accuracy@10": 0.49039692701664533,
233
+ "eval_dim_1024_cosine_accuracy@3": 0.42189500640204863,
234
+ "eval_dim_1024_cosine_accuracy@5": 0.4500640204865557,
235
+ "eval_dim_1024_cosine_map@100": 0.506794523350519,
236
+ "eval_dim_1024_cosine_mrr@10": 0.42985717334308843,
237
+ "eval_dim_1024_cosine_ndcg@10": 0.44178501209869797,
238
+ "eval_dim_1024_cosine_precision@1": 0.4180537772087068,
239
+ "eval_dim_1024_cosine_precision@10": 0.36869398207426374,
240
+ "eval_dim_1024_cosine_precision@3": 0.4163465642338881,
241
+ "eval_dim_1024_cosine_precision@5": 0.4043533930857874,
242
+ "eval_dim_1024_cosine_recall@1": 0.04734422767263886,
243
+ "eval_dim_1024_cosine_recall@10": 0.308531274625124,
244
+ "eval_dim_1024_cosine_recall@3": 0.138064233626932,
245
+ "eval_dim_1024_cosine_recall@5": 0.2069980430010945,
246
+ "eval_dim_128_cosine_accuracy@1": 0.34699103713188223,
247
+ "eval_dim_128_cosine_accuracy@10": 0.4212548015364917,
248
+ "eval_dim_128_cosine_accuracy@3": 0.35147247119078107,
249
+ "eval_dim_128_cosine_accuracy@5": 0.37900128040973113,
250
+ "eval_dim_128_cosine_map@100": 0.4338211299784659,
251
+ "eval_dim_128_cosine_mrr@10": 0.35916305916305874,
252
+ "eval_dim_128_cosine_ndcg@10": 0.37139192897263235,
253
+ "eval_dim_128_cosine_precision@1": 0.34699103713188223,
254
+ "eval_dim_128_cosine_precision@10": 0.3042893725992318,
255
+ "eval_dim_128_cosine_precision@3": 0.34571062740076824,
256
+ "eval_dim_128_cosine_precision@5": 0.3352112676056338,
257
+ "eval_dim_128_cosine_recall@1": 0.04217848526747235,
258
+ "eval_dim_128_cosine_recall@10": 0.2706183968947745,
259
+ "eval_dim_128_cosine_recall@3": 0.12288848071178002,
260
+ "eval_dim_128_cosine_recall@5": 0.18344012521240954,
261
+ "eval_dim_256_cosine_accuracy@1": 0.38348271446862997,
262
+ "eval_dim_256_cosine_accuracy@10": 0.4551856594110115,
263
+ "eval_dim_256_cosine_accuracy@3": 0.3886043533930858,
264
+ "eval_dim_256_cosine_accuracy@5": 0.4206145966709347,
265
+ "eval_dim_256_cosine_map@100": 0.4709582085612654,
266
+ "eval_dim_256_cosine_mrr@10": 0.3957850639188662,
267
+ "eval_dim_256_cosine_ndcg@10": 0.4087462230477571,
268
+ "eval_dim_256_cosine_precision@1": 0.38348271446862997,
269
+ "eval_dim_256_cosine_precision@10": 0.33886043533930854,
270
+ "eval_dim_256_cosine_precision@3": 0.382202304737516,
271
+ "eval_dim_256_cosine_precision@5": 0.3718309859154929,
272
+ "eval_dim_256_cosine_recall@1": 0.04466034705404223,
273
+ "eval_dim_256_cosine_recall@10": 0.2892016292717267,
274
+ "eval_dim_256_cosine_recall@3": 0.1301795023253766,
275
+ "eval_dim_256_cosine_recall@5": 0.19500340584044382,
276
+ "eval_dim_512_cosine_accuracy@1": 0.4065300896286812,
277
+ "eval_dim_512_cosine_accuracy@10": 0.4814340588988476,
278
+ "eval_dim_512_cosine_accuracy@3": 0.41229193341869397,
279
+ "eval_dim_512_cosine_accuracy@5": 0.44494238156209986,
280
+ "eval_dim_512_cosine_map@100": 0.49555759572196095,
281
+ "eval_dim_512_cosine_mrr@10": 0.41950236774180394,
282
+ "eval_dim_512_cosine_ndcg@10": 0.4329095460408428,
283
+ "eval_dim_512_cosine_precision@1": 0.4065300896286812,
284
+ "eval_dim_512_cosine_precision@10": 0.3596030729833547,
285
+ "eval_dim_512_cosine_precision@3": 0.4054630815194195,
286
+ "eval_dim_512_cosine_precision@5": 0.3947503201024327,
287
+ "eval_dim_512_cosine_recall@1": 0.047372341735862133,
288
+ "eval_dim_512_cosine_recall@10": 0.3071623578952262,
289
+ "eval_dim_512_cosine_recall@3": 0.1383106496582531,
290
+ "eval_dim_512_cosine_recall@5": 0.20757258542171747,
291
+ "eval_dim_64_cosine_accuracy@1": 0.3207426376440461,
292
+ "eval_dim_64_cosine_accuracy@10": 0.3725992317541613,
293
+ "eval_dim_64_cosine_accuracy@3": 0.322663252240717,
294
+ "eval_dim_64_cosine_accuracy@5": 0.3405889884763124,
295
+ "eval_dim_64_cosine_map@100": 0.3933467041096336,
296
+ "eval_dim_64_cosine_mrr@10": 0.32884732638253733,
297
+ "eval_dim_64_cosine_ndcg@10": 0.3371953828075091,
298
+ "eval_dim_64_cosine_precision@1": 0.3207426376440461,
299
+ "eval_dim_64_cosine_precision@10": 0.2797055057618438,
300
+ "eval_dim_64_cosine_precision@3": 0.3188220230473751,
301
+ "eval_dim_64_cosine_precision@5": 0.3088348271446863,
302
+ "eval_dim_64_cosine_recall@1": 0.036318765090758674,
303
+ "eval_dim_64_cosine_recall@10": 0.23840960718091392,
304
+ "eval_dim_64_cosine_recall@3": 0.10562189493083342,
305
+ "eval_dim_64_cosine_recall@5": 0.15867125525021739,
306
+ "eval_dim_768_cosine_accuracy@1": 0.41037131882202305,
307
+ "eval_dim_768_cosine_accuracy@10": 0.4833546734955186,
308
+ "eval_dim_768_cosine_accuracy@3": 0.4142125480153649,
309
+ "eval_dim_768_cosine_accuracy@5": 0.44430217669654287,
310
+ "eval_dim_768_cosine_map@100": 0.500478306774528,
311
+ "eval_dim_768_cosine_mrr@10": 0.4224889742495374,
312
+ "eval_dim_768_cosine_ndcg@10": 0.4349862241563486,
313
+ "eval_dim_768_cosine_precision@1": 0.41037131882202305,
314
+ "eval_dim_768_cosine_precision@10": 0.36165172855313704,
315
+ "eval_dim_768_cosine_precision@3": 0.4086641058472044,
316
+ "eval_dim_768_cosine_precision@5": 0.3969270166453265,
317
+ "eval_dim_768_cosine_recall@1": 0.047186779325657804,
318
+ "eval_dim_768_cosine_recall@10": 0.30540044861465576,
319
+ "eval_dim_768_cosine_recall@3": 0.1375709294981283,
320
+ "eval_dim_768_cosine_recall@5": 0.20603724780478358,
321
+ "eval_runtime": 98.5908,
322
+ "eval_samples_per_second": 0.0,
323
+ "eval_sequential_score": 0.3371953828075091,
324
+ "eval_steps_per_second": 0.0,
325
+ "step": 39
326
+ },
327
+ {
328
+ "epoch": 3.0816326530612246,
329
+ "grad_norm": 255.65982055664062,
330
+ "learning_rate": 1.9762960071199334e-05,
331
+ "loss": 8.6778,
332
+ "step": 40
333
+ },
334
+ {
335
+ "epoch": 3.8979591836734695,
336
+ "grad_norm": 470.4803771972656,
337
+ "learning_rate": 1.9346189253489888e-05,
338
+ "loss": 6.0257,
339
+ "step": 50
340
+ },
341
+ {
342
+ "epoch": 4.0,
343
+ "eval_dim_1024_cosine_accuracy@1": 0.4046094750320102,
344
+ "eval_dim_1024_cosine_accuracy@10": 0.47823303457106275,
345
+ "eval_dim_1024_cosine_accuracy@3": 0.4090909090909091,
346
+ "eval_dim_1024_cosine_accuracy@5": 0.43918053777208704,
347
+ "eval_dim_1024_cosine_map@100": 0.490599623630225,
348
+ "eval_dim_1024_cosine_mrr@10": 0.4168417068064951,
349
+ "eval_dim_1024_cosine_ndcg@10": 0.42913551824501384,
350
+ "eval_dim_1024_cosine_precision@1": 0.4046094750320102,
351
+ "eval_dim_1024_cosine_precision@10": 0.3565941101152369,
352
+ "eval_dim_1024_cosine_precision@3": 0.40311566367904395,
353
+ "eval_dim_1024_cosine_precision@5": 0.39180537772087065,
354
+ "eval_dim_1024_cosine_recall@1": 0.04660606778759063,
355
+ "eval_dim_1024_cosine_recall@10": 0.3014663479400921,
356
+ "eval_dim_1024_cosine_recall@3": 0.13592596883673455,
357
+ "eval_dim_1024_cosine_recall@5": 0.20379253880710943,
358
+ "eval_dim_128_cosine_accuracy@1": 0.34314980793854033,
359
+ "eval_dim_128_cosine_accuracy@10": 0.4148527528809219,
360
+ "eval_dim_128_cosine_accuracy@3": 0.34763124199743917,
361
+ "eval_dim_128_cosine_accuracy@5": 0.37708066581306016,
362
+ "eval_dim_128_cosine_map@100": 0.4276696379169563,
363
+ "eval_dim_128_cosine_mrr@10": 0.35513180090644836,
364
+ "eval_dim_128_cosine_ndcg@10": 0.36765573601526275,
365
+ "eval_dim_128_cosine_precision@1": 0.34314980793854033,
366
+ "eval_dim_128_cosine_precision@10": 0.302752880921895,
367
+ "eval_dim_128_cosine_precision@3": 0.3418693982074264,
368
+ "eval_dim_128_cosine_precision@5": 0.3322663252240717,
369
+ "eval_dim_128_cosine_recall@1": 0.040652627677675406,
370
+ "eval_dim_128_cosine_recall@10": 0.26330336421247125,
371
+ "eval_dim_128_cosine_recall@3": 0.1184519992454523,
372
+ "eval_dim_128_cosine_recall@5": 0.1774839552040709,
373
+ "eval_dim_256_cosine_accuracy@1": 0.3738796414852753,
374
+ "eval_dim_256_cosine_accuracy@10": 0.44558258642765686,
375
+ "eval_dim_256_cosine_accuracy@3": 0.37772087067861715,
376
+ "eval_dim_256_cosine_accuracy@5": 0.40717029449423814,
377
+ "eval_dim_256_cosine_map@100": 0.45855798848430374,
378
+ "eval_dim_256_cosine_mrr@10": 0.38572571794402755,
379
+ "eval_dim_256_cosine_ndcg@10": 0.3980442434686935,
380
+ "eval_dim_256_cosine_precision@1": 0.3738796414852753,
381
+ "eval_dim_256_cosine_precision@10": 0.3297695262483995,
382
+ "eval_dim_256_cosine_precision@3": 0.37238583013230897,
383
+ "eval_dim_256_cosine_precision@5": 0.3615877080665813,
384
+ "eval_dim_256_cosine_recall@1": 0.043086085492826574,
385
+ "eval_dim_256_cosine_recall@10": 0.2792649180924836,
386
+ "eval_dim_256_cosine_recall@3": 0.125747799799009,
387
+ "eval_dim_256_cosine_recall@5": 0.18837022600852496,
388
+ "eval_dim_512_cosine_accuracy@1": 0.39884763124199746,
389
+ "eval_dim_512_cosine_accuracy@10": 0.47823303457106275,
390
+ "eval_dim_512_cosine_accuracy@3": 0.4052496798975672,
391
+ "eval_dim_512_cosine_accuracy@5": 0.44558258642765686,
392
+ "eval_dim_512_cosine_map@100": 0.4876319198894288,
393
+ "eval_dim_512_cosine_mrr@10": 0.41307745462675005,
394
+ "eval_dim_512_cosine_ndcg@10": 0.42824151108259556,
395
+ "eval_dim_512_cosine_precision@1": 0.39884763124199746,
396
+ "eval_dim_512_cosine_precision@10": 0.35793854033290645,
397
+ "eval_dim_512_cosine_precision@3": 0.3975672215108835,
398
+ "eval_dim_512_cosine_precision@5": 0.3888604353393086,
399
+ "eval_dim_512_cosine_recall@1": 0.04570727180608771,
400
+ "eval_dim_512_cosine_recall@10": 0.2993652309972795,
401
+ "eval_dim_512_cosine_recall@3": 0.13329368345632836,
402
+ "eval_dim_512_cosine_recall@5": 0.2006035854063678,
403
+ "eval_dim_64_cosine_accuracy@1": 0.3079385403329065,
404
+ "eval_dim_64_cosine_accuracy@10": 0.36555697823303457,
405
+ "eval_dim_64_cosine_accuracy@3": 0.31241997439180536,
406
+ "eval_dim_64_cosine_accuracy@5": 0.33290653008962867,
407
+ "eval_dim_64_cosine_map@100": 0.38184314430829974,
408
+ "eval_dim_64_cosine_mrr@10": 0.31748394406845065,
409
+ "eval_dim_64_cosine_ndcg@10": 0.3275369456141822,
410
+ "eval_dim_64_cosine_precision@1": 0.3079385403329065,
411
+ "eval_dim_64_cosine_precision@10": 0.27215108834827145,
412
+ "eval_dim_64_cosine_precision@3": 0.3070849338454972,
413
+ "eval_dim_64_cosine_precision@5": 0.29820742637644043,
414
+ "eval_dim_64_cosine_recall@1": 0.03504677697523653,
415
+ "eval_dim_64_cosine_recall@10": 0.23026653514933906,
416
+ "eval_dim_64_cosine_recall@3": 0.10211269541567973,
417
+ "eval_dim_64_cosine_recall@5": 0.15297976910096123,
418
+ "eval_dim_768_cosine_accuracy@1": 0.3994878361075544,
419
+ "eval_dim_768_cosine_accuracy@10": 0.4737516005121639,
420
+ "eval_dim_768_cosine_accuracy@3": 0.4046094750320102,
421
+ "eval_dim_768_cosine_accuracy@5": 0.4359795134443022,
422
+ "eval_dim_768_cosine_map@100": 0.48680507317454147,
423
+ "eval_dim_768_cosine_mrr@10": 0.41201019246793846,
424
+ "eval_dim_768_cosine_ndcg@10": 0.4244383191680289,
425
+ "eval_dim_768_cosine_precision@1": 0.3994878361075544,
426
+ "eval_dim_768_cosine_precision@10": 0.352752880921895,
427
+ "eval_dim_768_cosine_precision@3": 0.39820742637644047,
428
+ "eval_dim_768_cosine_precision@5": 0.3868117797695263,
429
+ "eval_dim_768_cosine_recall@1": 0.046132270416131195,
430
+ "eval_dim_768_cosine_recall@10": 0.29681183299989666,
431
+ "eval_dim_768_cosine_recall@3": 0.13453018491697852,
432
+ "eval_dim_768_cosine_recall@5": 0.20078864250336506,
433
+ "eval_runtime": 98.6751,
434
+ "eval_samples_per_second": 0.0,
435
+ "eval_sequential_score": 0.3275369456141822,
436
+ "eval_steps_per_second": 0.0,
437
+ "step": 52
438
+ },
439
+ {
440
+ "epoch": 4.653061224489796,
441
+ "grad_norm": 311.2161865234375,
442
+ "learning_rate": 1.8732057547721962e-05,
443
+ "loss": 3.3524,
444
+ "step": 60
445
+ },
446
+ {
447
+ "epoch": 5.0,
448
+ "eval_dim_1024_cosine_accuracy@1": 0.3994878361075544,
449
+ "eval_dim_1024_cosine_accuracy@10": 0.4814340588988476,
450
+ "eval_dim_1024_cosine_accuracy@3": 0.40973111395646605,
451
+ "eval_dim_1024_cosine_accuracy@5": 0.44238156209987195,
452
+ "eval_dim_1024_cosine_map@100": 0.4960353530991054,
453
+ "eval_dim_1024_cosine_mrr@10": 0.41413607910086736,
454
+ "eval_dim_1024_cosine_ndcg@10": 0.42824330702763147,
455
+ "eval_dim_1024_cosine_precision@1": 0.3994878361075544,
456
+ "eval_dim_1024_cosine_precision@10": 0.3562099871959027,
457
+ "eval_dim_1024_cosine_precision@3": 0.3994878361075544,
458
+ "eval_dim_1024_cosine_precision@5": 0.3897567221510884,
459
+ "eval_dim_1024_cosine_recall@1": 0.046427253250942845,
460
+ "eval_dim_1024_cosine_recall@10": 0.30156152834977973,
461
+ "eval_dim_1024_cosine_recall@3": 0.1357642561296911,
462
+ "eval_dim_1024_cosine_recall@5": 0.20380194680388578,
463
+ "eval_dim_128_cosine_accuracy@1": 0.34699103713188223,
464
+ "eval_dim_128_cosine_accuracy@10": 0.41613316261203587,
465
+ "eval_dim_128_cosine_accuracy@3": 0.3495518565941101,
466
+ "eval_dim_128_cosine_accuracy@5": 0.37900128040973113,
467
+ "eval_dim_128_cosine_map@100": 0.4291315309956839,
468
+ "eval_dim_128_cosine_mrr@10": 0.35818293599983697,
469
+ "eval_dim_128_cosine_ndcg@10": 0.36965214083548276,
470
+ "eval_dim_128_cosine_precision@1": 0.34699103713188223,
471
+ "eval_dim_128_cosine_precision@10": 0.30550576184379,
472
+ "eval_dim_128_cosine_precision@3": 0.34528382415706355,
473
+ "eval_dim_128_cosine_precision@5": 0.33533930857874517,
474
+ "eval_dim_128_cosine_recall@1": 0.04023580723646711,
475
+ "eval_dim_128_cosine_recall@10": 0.2604238007608957,
476
+ "eval_dim_128_cosine_recall@3": 0.11713599313797275,
477
+ "eval_dim_128_cosine_recall@5": 0.17553870970060761,
478
+ "eval_dim_256_cosine_accuracy@1": 0.3764404609475032,
479
+ "eval_dim_256_cosine_accuracy@10": 0.4532650448143406,
480
+ "eval_dim_256_cosine_accuracy@3": 0.382202304737516,
481
+ "eval_dim_256_cosine_accuracy@5": 0.41037131882202305,
482
+ "eval_dim_256_cosine_map@100": 0.46504361814337597,
483
+ "eval_dim_256_cosine_mrr@10": 0.3891762189297396,
484
+ "eval_dim_256_cosine_ndcg@10": 0.40161260018012396,
485
+ "eval_dim_256_cosine_precision@1": 0.3764404609475032,
486
+ "eval_dim_256_cosine_precision@10": 0.3325864276568502,
487
+ "eval_dim_256_cosine_precision@3": 0.3758002560819462,
488
+ "eval_dim_256_cosine_precision@5": 0.365044814340589,
489
+ "eval_dim_256_cosine_recall@1": 0.04345597060609991,
490
+ "eval_dim_256_cosine_recall@10": 0.28270389457679657,
491
+ "eval_dim_256_cosine_recall@3": 0.12739095919345977,
492
+ "eval_dim_256_cosine_recall@5": 0.19108724610052447,
493
+ "eval_dim_512_cosine_accuracy@1": 0.39436619718309857,
494
+ "eval_dim_512_cosine_accuracy@10": 0.471190781049936,
495
+ "eval_dim_512_cosine_accuracy@3": 0.4033290653008963,
496
+ "eval_dim_512_cosine_accuracy@5": 0.4327784891165173,
497
+ "eval_dim_512_cosine_map@100": 0.48375387985213597,
498
+ "eval_dim_512_cosine_mrr@10": 0.4078435258012718,
499
+ "eval_dim_512_cosine_ndcg@10": 0.4209567413561994,
500
+ "eval_dim_512_cosine_precision@1": 0.39436619718309857,
501
+ "eval_dim_512_cosine_precision@10": 0.348719590268886,
502
+ "eval_dim_512_cosine_precision@3": 0.39436619718309857,
503
+ "eval_dim_512_cosine_precision@5": 0.38373879641485276,
504
+ "eval_dim_512_cosine_recall@1": 0.046001271870766657,
505
+ "eval_dim_512_cosine_recall@10": 0.29407016086576515,
506
+ "eval_dim_512_cosine_recall@3": 0.13434589294029278,
507
+ "eval_dim_512_cosine_recall@5": 0.2006372923557733,
508
+ "eval_dim_64_cosine_accuracy@1": 0.293854033290653,
509
+ "eval_dim_64_cosine_accuracy@10": 0.3591549295774648,
510
+ "eval_dim_64_cosine_accuracy@3": 0.30153649167733676,
511
+ "eval_dim_64_cosine_accuracy@5": 0.32714468629961585,
512
+ "eval_dim_64_cosine_map@100": 0.3744361264744976,
513
+ "eval_dim_64_cosine_mrr@10": 0.30537518037517997,
514
+ "eval_dim_64_cosine_ndcg@10": 0.3185372635267884,
515
+ "eval_dim_64_cosine_precision@1": 0.293854033290653,
516
+ "eval_dim_64_cosine_precision@10": 0.2681177976952625,
517
+ "eval_dim_64_cosine_precision@3": 0.29449423815621,
518
+ "eval_dim_64_cosine_precision@5": 0.288348271446863,
519
+ "eval_dim_64_cosine_recall@1": 0.03212717718240556,
520
+ "eval_dim_64_cosine_recall@10": 0.221706864386852,
521
+ "eval_dim_64_cosine_recall@3": 0.0944529143897263,
522
+ "eval_dim_64_cosine_recall@5": 0.14311801944731944,
523
+ "eval_dim_768_cosine_accuracy@1": 0.3892445582586428,
524
+ "eval_dim_768_cosine_accuracy@10": 0.47823303457106275,
525
+ "eval_dim_768_cosine_accuracy@3": 0.3994878361075544,
526
+ "eval_dim_768_cosine_accuracy@5": 0.43661971830985913,
527
+ "eval_dim_768_cosine_map@100": 0.48796722771226453,
528
+ "eval_dim_768_cosine_mrr@10": 0.4050812450460335,
529
+ "eval_dim_768_cosine_ndcg@10": 0.4211330537467249,
530
+ "eval_dim_768_cosine_precision@1": 0.3892445582586428,
531
+ "eval_dim_768_cosine_precision@10": 0.35147247119078107,
532
+ "eval_dim_768_cosine_precision@3": 0.38988476312419973,
533
+ "eval_dim_768_cosine_precision@5": 0.38156209987195905,
534
+ "eval_dim_768_cosine_recall@1": 0.045140545184589424,
535
+ "eval_dim_768_cosine_recall@10": 0.29727932103829957,
536
+ "eval_dim_768_cosine_recall@3": 0.13218231618768836,
537
+ "eval_dim_768_cosine_recall@5": 0.19882192649305613,
538
+ "eval_runtime": 98.5973,
539
+ "eval_samples_per_second": 0.0,
540
+ "eval_sequential_score": 0.3185372635267884,
541
+ "eval_steps_per_second": 0.0,
542
+ "step": 65
543
+ }
544
+ ],
545
+ "logging_steps": 10,
546
+ "max_steps": 240,
547
+ "num_input_tokens_seen": 0,
548
+ "num_train_epochs": 20,
549
+ "save_steps": 500,
550
+ "stateful_callbacks": {
551
+ "EarlyStoppingCallback": {
552
+ "args": {
553
+ "early_stopping_patience": 2,
554
+ "early_stopping_threshold": 0.0
555
+ },
556
+ "attributes": {
557
+ "early_stopping_patience_counter": 2
558
+ }
559
+ },
560
+ "TrainerControl": {
561
+ "args": {
562
+ "should_epoch_stop": false,
563
+ "should_evaluate": false,
564
+ "should_log": false,
565
+ "should_save": true,
566
+ "should_training_stop": true
567
+ },
568
+ "attributes": {}
569
+ }
570
+ },
571
+ "total_flos": 0.0,
572
+ "train_batch_size": 8,
573
+ "trial_name": null,
574
+ "trial_params": null
575
+ }
checkpoint-65/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd906d94b017c1a7fa871b608776d19ecf4218c10c253401fe78ba8ce84435be
3
+ size 6097
eval/Information-Retrieval_evaluation_dim_1024_results.csv CHANGED
@@ -1,7 +1,6 @@
1
  epoch,steps,cosine-Accuracy@1,cosine-Accuracy@3,cosine-Accuracy@5,cosine-Accuracy@10,cosine-Precision@1,cosine-Recall@1,cosine-Precision@3,cosine-Recall@3,cosine-Precision@5,cosine-Recall@5,cosine-Precision@10,cosine-Recall@10,cosine-MRR@10,cosine-NDCG@10,cosine-MAP@100
2
- 1.0,98,0.3719590268886043,0.37836107554417414,0.4020486555697823,0.43982074263764404,0.3719590268886043,0.04338670134208909,0.37153222364489963,0.1268773565773867,0.3613316261203585,0.19083511167371434,0.3265044814340589,0.28262195979320087,0.383397099770339,0.3947688545057553,0.4604070214987707
3
- 2.0,196,0.3591549295774648,0.3649167733674776,0.39308578745198464,0.42445582586427655,0.3591549295774648,0.040925664980934,0.35830132309005547,0.11912044022990924,0.3495518565941101,0.17907504115268522,0.31914212548015364,0.2663878590041381,0.37061688311688284,0.38277564232489586,0.4442656203645836
4
- 3.0,294,0.3354673495518566,0.3405889884763124,0.3725992317541613,0.41357234314980795,0.3354673495518566,0.0398374526951408,0.33418693982074266,0.11613369449549121,0.3261203585147247,0.1745427554610417,0.2996798975672215,0.26082122731297214,0.34860069507956787,0.3620561774122382,0.4292335776181432
5
- 1.0,98,0.34571062740076824,0.352112676056338,0.3854033290653009,0.4231754161331626,0.34571062740076824,0.04202665510348477,0.34571062740076824,0.12344281372964075,0.33751600512163893,0.1862277356935127,0.3060179257362356,0.2720738817855689,0.3591188545413894,0.37218117046458954,0.4413040417287197
6
- 2.0,196,0.3290653008962868,0.3348271446862996,0.3559539052496799,0.3886043533930858,0.3290653008962868,0.04062540337753272,0.32885189927443453,0.11937529555421877,0.31869398207426375,0.17929032559391017,0.28380281690140846,0.2609802153031206,0.3392725037091231,0.34967137880514326,0.4165482880126111
7
- 3.0,294,0.3053777208706786,0.31434058898847633,0.34635083226632524,0.3854033290653009,0.3053777208706786,0.03802085156159601,0.30644472897994024,0.11197884027712995,0.2998719590268886,0.16921874866295042,0.27516005121638926,0.2530788160980187,0.31961389549417674,0.3342308256907798,0.3945564342654779
 
1
  epoch,steps,cosine-Accuracy@1,cosine-Accuracy@3,cosine-Accuracy@5,cosine-Accuracy@10,cosine-Precision@1,cosine-Recall@1,cosine-Precision@3,cosine-Recall@3,cosine-Precision@5,cosine-Recall@5,cosine-Precision@10,cosine-Recall@10,cosine-MRR@10,cosine-NDCG@10,cosine-MAP@100
2
+ 1.0,13,0.42509603072983354,0.43085787451984636,0.46030729833546735,0.49295774647887325,0.42509603072983354,0.04813624827530403,0.42402902262057185,0.1404092551990217,0.4133162612035851,0.21147403835662126,0.376056338028169,0.3150476790176975,0.4369535394183281,0.4493804868009024,0.508986346237021
3
+ 2.0,26,0.3854033290653009,0.3886043533930858,0.41101152368758004,0.45454545454545453,0.3854033290653009,0.0451686782205082,0.3839095177123346,0.13200270380544088,0.3713188220230474,0.19735476247586825,0.3357874519846351,0.2918225395020212,0.39624870434729537,0.4065329035406967,0.47259820099791205
4
+ 3.0,39,0.4180537772087068,0.42189500640204863,0.4500640204865557,0.49039692701664533,0.4180537772087068,0.04734422767263886,0.4163465642338881,0.138064233626932,0.4043533930857874,0.2069980430010945,0.36869398207426374,0.308531274625124,0.42985717334308843,0.44178501209869797,0.506794523350519
5
+ 4.0,52,0.4046094750320102,0.4090909090909091,0.43918053777208704,0.47823303457106275,0.4046094750320102,0.04660606778759063,0.40311566367904395,0.13592596883673455,0.39180537772087065,0.20379253880710943,0.3565941101152369,0.3014663479400921,0.4168417068064951,0.42913551824501384,0.490599623630225
6
+ 5.0,65,0.3994878361075544,0.40973111395646605,0.44238156209987195,0.4814340588988476,0.3994878361075544,0.046427253250942845,0.3994878361075544,0.1357642561296911,0.3897567221510884,0.20380194680388578,0.3562099871959027,0.30156152834977973,0.41413607910086736,0.42824330702763147,0.4960353530991054