Amir313n committed on
Commit
f0e0831
·
verified ·
1 Parent(s): aae3f6f

Training in progress, step 500

Browse files
Files changed (28) hide show
  1. .gitattributes +1 -0
  2. config.json +66 -0
  3. model.safetensors +3 -0
  4. runs/Apr06_11-20-31_gp01/events.out.tfevents.1743938436.gp01.4008839.0 +3 -0
  5. runs/Apr06_12-55-42_gp01/events.out.tfevents.1743944147.gp01.4048216.0 +3 -0
  6. runs/Apr07_10-00-55_gp01/events.out.tfevents.1744020060.gp01.313777.0 +3 -0
  7. runs/Apr07_10-18-52_gp01/events.out.tfevents.1744021136.gp01.318140.0 +3 -0
  8. runs/Apr07_10-24-08_gp01/events.out.tfevents.1744021453.gp01.320760.0 +3 -0
  9. runs/Apr07_10-36-39_gp01/events.out.tfevents.1744022204.gp01.326123.0 +3 -0
  10. runs/Apr07_10-42-40_gp01/events.out.tfevents.1744022565.gp01.328824.0 +3 -0
  11. runs/Apr07_12-13-53_gp01/events.out.tfevents.1744028038.gp01.381148.0 +3 -0
  12. runs/Apr07_20-38-06_gp01/events.out.tfevents.1744058290.gp01.491979.0 +3 -0
  13. runs/Apr07_20-43-05_gp01/events.out.tfevents.1744058589.gp01.494154.0 +3 -0
  14. runs/Apr07_20-55-42_gp01/events.out.tfevents.1744059346.gp01.500835.0 +3 -0
  15. runs/Apr12_10-29-06_gp01/events.out.tfevents.1744453751.gp01.3472498.0 +3 -0
  16. runs/Apr12_10-33-44_gp01/events.out.tfevents.1744454029.gp01.3478016.0 +3 -0
  17. runs/Apr12_10-52-43_gp01/events.out.tfevents.1744455168.gp01.3495757.0 +3 -0
  18. runs/Apr12_13-12-32_gp01/events.out.tfevents.1744463556.gp01.3633647.0 +3 -0
  19. runs/Apr12_13-18-11_gp01/events.out.tfevents.1744463896.gp01.3636918.0 +3 -0
  20. runs/Apr21_10-18-25_gp01/events.out.tfevents.1745230712.gp01.2087389.0 +3 -0
  21. runs/Apr21_10-31-04_gp01/events.out.tfevents.1745231470.gp01.2095885.0 +3 -0
  22. runs/Apr21_12-21-30_gp01/events.out.tfevents.1745238097.gp01.2141558.0 +3 -0
  23. runs/Apr21_12-32-12_gp01/events.out.tfevents.1745238738.gp01.2147951.0 +3 -0
  24. runs/Apr21_12-37-41_gp01/events.out.tfevents.1745239067.gp01.2150943.0 +3 -0
  25. special_tokens_map.json +51 -0
  26. tokenizer.json +3 -0
  27. tokenizer_config.json +55 -0
  28. training_args.bin +3 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
config.json ADDED
@@ -0,0 +1,66 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "XLMRobertaLoRA"
4
+ ],
5
+ "attention_probs_dropout_prob": 0.1,
6
+ "auto_map": {
7
+ "AutoConfig": "jinaai/xlm-roberta-flash-implementation--configuration_xlm_roberta.XLMRobertaFlashConfig",
8
+ "AutoModel": "jinaai/xlm-roberta-flash-implementation--modeling_lora.XLMRobertaLoRA",
9
+ "AutoModelForMaskedLM": "jinaai/xlm-roberta-flash-implementation--modeling_xlm_roberta.XLMRobertaForMaskedLM",
10
+ "AutoModelForPreTraining": "jinaai/xlm-roberta-flash-implementation--modeling_xlm_roberta.XLMRobertaForPreTraining"
11
+ },
12
+ "bos_token_id": 0,
13
+ "classifier_dropout": null,
14
+ "emb_pooler": null,
15
+ "eos_token_id": 2,
16
+ "hidden_act": "gelu",
17
+ "hidden_dropout_prob": 0.1,
18
+ "hidden_size": 1024,
19
+ "initializer_range": 0.02,
20
+ "intermediate_size": 4096,
21
+ "layer_norm_eps": 1e-05,
22
+ "load_trained_adapters": true,
23
+ "lora_adaptations": [
24
+ "hadith_retrieval.query",
25
+ "hadith_retrieval.passage",
26
+ "separation",
27
+ "classification",
28
+ "text-matching"
29
+ ],
30
+ "lora_alpha": 1,
31
+ "lora_dropout_p": 0.0,
32
+ "lora_main_params_trainable": false,
33
+ "lora_rank": 4,
34
+ "matryoshka_dimensions": [
35
+ 32,
36
+ 64,
37
+ 128,
38
+ 256,
39
+ 512,
40
+ 768,
41
+ 1024
42
+ ],
43
+ "max_position_embeddings": 8194,
44
+ "model_type": "xlm-roberta",
45
+ "num_attention_heads": 16,
46
+ "num_hidden_layers": 24,
47
+ "output_past": true,
48
+ "pad_token_id": 1,
49
+ "position_embedding_type": "rotary",
50
+ "rotary_emb_base": 20000.0,
51
+ "task_instructions": {
52
+ "classification": "",
53
+ "hadith_retrieval.passage": "Represent the hadith for retrieval: ",
54
+ "hadith_retrieval.query": "Represent the query for retrieving related hadiths: ",
55
+ "separation": "",
56
+ "text-matching": ""
57
+ },
58
+ "torch_dtype": "bfloat16",
59
+ "transformers_version": "4.50.3",
60
+ "truncate_dim": null,
61
+ "type_vocab_size": 1,
62
+ "use_cache": true,
63
+ "use_flash_attn": true,
64
+ "use_reentrant": false,
65
+ "vocab_size": 250002
66
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee6d5757440d99428055d93ab30fe871e38a64f3f9fcf0344302b92040b3d6fc
3
+ size 1144685320
runs/Apr06_11-20-31_gp01/events.out.tfevents.1743938436.gp01.4008839.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd3bc49a88e4e8df4a15a2ab4a5483003c00e28f2071c02066838043423ecb84
3
+ size 4423
runs/Apr06_12-55-42_gp01/events.out.tfevents.1743944147.gp01.4048216.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18bfd406021aa752f76bfb3d0abe142cb8ab0a7ecf9488d2e6efa4acc5ad20e0
3
+ size 4423
runs/Apr07_10-00-55_gp01/events.out.tfevents.1744020060.gp01.313777.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e81abd8250cad167df98021769d00021b19a99fb10270914f6697f7b99270b2c
3
+ size 4771
runs/Apr07_10-18-52_gp01/events.out.tfevents.1744021136.gp01.318140.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb72618276e4093c43b96fcb04a30c95ed03d0b6bd067ff1adc9a6c8e1b052fb
3
+ size 4772
runs/Apr07_10-24-08_gp01/events.out.tfevents.1744021453.gp01.320760.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85c782890440e4112f9b86274f6bae974b9d6f79adb4599621269b3220e88abc
3
+ size 4773
runs/Apr07_10-36-39_gp01/events.out.tfevents.1744022204.gp01.326123.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe47108707d18916b6ce30594338c3ca615f699f9ddb45a81fd5d3e0ed249c30
3
+ size 4424
runs/Apr07_10-42-40_gp01/events.out.tfevents.1744022565.gp01.328824.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f20dc7513c761344d076efbe00a8c8dedf7392415d33193b462f92f6d70c440
3
+ size 6534
runs/Apr07_12-13-53_gp01/events.out.tfevents.1744028038.gp01.381148.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7675eeab03688fd76abe778f44cbf8039b8f3b8568c59f9b639054ff901349c
3
+ size 6534
runs/Apr07_20-38-06_gp01/events.out.tfevents.1744058290.gp01.491979.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b1cf95b5e7cf99bec098a63c0d49263714e8b461dcaaaea576e0df62bf400b4
3
+ size 4424
runs/Apr07_20-43-05_gp01/events.out.tfevents.1744058589.gp01.494154.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:22ad757a0eae378e7ff7fec4a998a47abe5fdd2eaac2e10ad7a56b6882b80c98
3
+ size 4636
runs/Apr07_20-55-42_gp01/events.out.tfevents.1744059346.gp01.500835.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4c6bbf72059c0ec0d11eb02748a2fcace2998155d9b3bd8ebcc96307d6e5d84
3
+ size 14332
runs/Apr12_10-29-06_gp01/events.out.tfevents.1744453751.gp01.3472498.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:27aa67fc107b585c462ea644e3eabcd8dcf5923426c3c7f5c5b84ea62b78cdd0
3
+ size 4877
runs/Apr12_10-33-44_gp01/events.out.tfevents.1744454029.gp01.3478016.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d842973a5c6c603d05f1cb781f7a2f43b88d632fbba0a9014cc978b60b00030b
3
+ size 4877
runs/Apr12_10-52-43_gp01/events.out.tfevents.1744455168.gp01.3495757.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4048e137f685d0cf125ca319158a9b5c253f1f71b91aef9259be89a261f95c8b
3
+ size 6343
runs/Apr12_13-12-32_gp01/events.out.tfevents.1744463556.gp01.3633647.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c12eb4f68f3bdb2ca70a2d3ba01a95200f2ce1342388df32cbe7b2b20d3058ee
3
+ size 4877
runs/Apr12_13-18-11_gp01/events.out.tfevents.1744463896.gp01.3636918.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e4cda083d26d05365b349c28e53a6136688c2fc625ad3dc6e404c7df8c4123f
3
+ size 31129
runs/Apr21_10-18-25_gp01/events.out.tfevents.1745230712.gp01.2087389.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee44c0696e1db5ca035c8dfc5e30d4dc7f1c8a27e8206bd951c916953cdd57b0
3
+ size 4876
runs/Apr21_10-31-04_gp01/events.out.tfevents.1745231470.gp01.2095885.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf7139866f90ec2841c6a05e1bb910a05652ffed755e27d0bae0b5fff9a1bd29
3
+ size 4876
runs/Apr21_12-21-30_gp01/events.out.tfevents.1745238097.gp01.2141558.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afc61eceffafe2dadb522e241248774fd1977d914e88f2fab9ce8191555abd53
3
+ size 5132
runs/Apr21_12-32-12_gp01/events.out.tfevents.1745238738.gp01.2147951.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c32a78ca3afa9bfb5390be5d644ad184b024fc6742c5f5c382a9acd46a292c2d
3
+ size 4877
runs/Apr21_12-37-41_gp01/events.out.tfevents.1745239067.gp01.2150943.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:301740f6368aa8adec46214ae7a2cd554c5eafa0e08f3ae6c769869d0ac27561
3
+ size 5424
special_tokens_map.json ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<s>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "cls_token": {
10
+ "content": "<s>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "eos_token": {
17
+ "content": "</s>",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "mask_token": {
24
+ "content": "<mask>",
25
+ "lstrip": true,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ },
30
+ "pad_token": {
31
+ "content": "<pad>",
32
+ "lstrip": false,
33
+ "normalized": false,
34
+ "rstrip": false,
35
+ "single_word": false
36
+ },
37
+ "sep_token": {
38
+ "content": "</s>",
39
+ "lstrip": false,
40
+ "normalized": false,
41
+ "rstrip": false,
42
+ "single_word": false
43
+ },
44
+ "unk_token": {
45
+ "content": "<unk>",
46
+ "lstrip": false,
47
+ "normalized": false,
48
+ "rstrip": false,
49
+ "single_word": false
50
+ }
51
+ }
tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e19cd8c08f528b481e909f73dbd1fd62b1e8b1117579ba205e477801237f9e0
3
+ size 17082988
tokenizer_config.json ADDED
@@ -0,0 +1,55 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "<s>",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "1": {
12
+ "content": "<pad>",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "2": {
20
+ "content": "</s>",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "3": {
28
+ "content": "<unk>",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "250001": {
36
+ "content": "<mask>",
37
+ "lstrip": true,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ }
43
+ },
44
+ "bos_token": "<s>",
45
+ "clean_up_tokenization_spaces": true,
46
+ "cls_token": "<s>",
47
+ "eos_token": "</s>",
48
+ "extra_special_tokens": {},
49
+ "mask_token": "<mask>",
50
+ "model_max_length": 8194,
51
+ "pad_token": "<pad>",
52
+ "sep_token": "</s>",
53
+ "tokenizer_class": "XLMRobertaTokenizerFast",
54
+ "unk_token": "<unk>"
55
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:efbec979f53d5e9c05d32c9cb9bf8ef20cbfd829f8b126b2a71d818a4e64138c
3
+ size 5816