Dekel Cohen committed on
Commit
ff52183
·
1 Parent(s): c3f415b

new model

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. .gitattributes +1 -0
  2. config.json +33 -0
  3. generation_config.json +7 -0
  4. model-00001-of-00058.safetensors +3 -0
  5. model-00002-of-00058.safetensors +3 -0
  6. model-00003-of-00058.safetensors +3 -0
  7. model-00004-of-00058.safetensors +3 -0
  8. model-00005-of-00058.safetensors +3 -0
  9. model-00006-of-00058.safetensors +3 -0
  10. model-00007-of-00058.safetensors +3 -0
  11. model-00008-of-00058.safetensors +3 -0
  12. model-00009-of-00058.safetensors +3 -0
  13. model-00010-of-00058.safetensors +3 -0
  14. model-00011-of-00058.safetensors +3 -0
  15. model-00012-of-00058.safetensors +3 -0
  16. model-00013-of-00058.safetensors +3 -0
  17. model-00014-of-00058.safetensors +3 -0
  18. model-00015-of-00058.safetensors +3 -0
  19. model-00016-of-00058.safetensors +3 -0
  20. model-00017-of-00058.safetensors +3 -0
  21. model-00018-of-00058.safetensors +3 -0
  22. model-00019-of-00058.safetensors +3 -0
  23. model-00020-of-00058.safetensors +3 -0
  24. model-00021-of-00058.safetensors +3 -0
  25. model-00022-of-00058.safetensors +3 -0
  26. model-00023-of-00058.safetensors +3 -0
  27. model-00024-of-00058.safetensors +3 -0
  28. model-00025-of-00058.safetensors +3 -0
  29. model-00026-of-00058.safetensors +3 -0
  30. model-00027-of-00058.safetensors +3 -0
  31. model-00028-of-00058.safetensors +3 -0
  32. model-00029-of-00058.safetensors +3 -0
  33. model-00030-of-00058.safetensors +3 -0
  34. model-00031-of-00058.safetensors +3 -0
  35. model-00032-of-00058.safetensors +3 -0
  36. model-00033-of-00058.safetensors +3 -0
  37. model-00034-of-00058.safetensors +3 -0
  38. model-00035-of-00058.safetensors +3 -0
  39. model-00036-of-00058.safetensors +3 -0
  40. model-00037-of-00058.safetensors +3 -0
  41. model-00038-of-00058.safetensors +3 -0
  42. model-00039-of-00058.safetensors +3 -0
  43. model-00040-of-00058.safetensors +3 -0
  44. model-00041-of-00058.safetensors +3 -0
  45. model-00042-of-00058.safetensors +3 -0
  46. model-00043-of-00058.safetensors +3 -0
  47. model-00044-of-00058.safetensors +3 -0
  48. model-00045-of-00058.safetensors +3 -0
  49. model-00046-of-00058.safetensors +3 -0
  50. model-00047-of-00058.safetensors +3 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
config.json ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "CohereForAI/aya-101",
3
+ "architectures": [
4
+ "T5ForConditionalGeneration"
5
+ ],
6
+ "classifier_dropout": 0.0,
7
+ "d_ff": 10240,
8
+ "d_kv": 64,
9
+ "d_model": 4096,
10
+ "decoder_start_token_id": 0,
11
+ "dense_act_fn": "gelu_new",
12
+ "dropout_rate": 0.1,
13
+ "eos_token_id": 1,
14
+ "feed_forward_proj": "gated-gelu",
15
+ "initializer_factor": 1.0,
16
+ "is_encoder_decoder": true,
17
+ "is_gated_act": true,
18
+ "layer_norm_epsilon": 1e-06,
19
+ "model_type": "t5",
20
+ "num_decoder_layers": 24,
21
+ "num_heads": 64,
22
+ "num_layers": 24,
23
+ "output_past": true,
24
+ "pad_token_id": 0,
25
+ "relative_attention_max_distance": 128,
26
+ "relative_attention_num_buckets": 32,
27
+ "tie_word_embeddings": false,
28
+ "tokenizer_class": "T5Tokenizer",
29
+ "torch_dtype": "float32",
30
+ "transformers_version": "4.36.2",
31
+ "use_cache": true,
32
+ "vocab_size": 250112
33
+ }
generation_config.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "decoder_start_token_id": 0,
4
+ "eos_token_id": 1,
5
+ "pad_token_id": 0,
6
+ "transformers_version": "4.36.2"
7
+ }
model-00001-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ee5060b747ac7e2c1be9cd97c43f993341d6cc442c2e7ec44d8f6b0cdcbc135
3
+ size 4097835136
model-00002-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1fc6a6cf4b9706b03379d15cf37d27088d75496b488ba120ff1b54115520eafc
3
+ size 838903144
model-00003-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0a05afaa3b956436c6e35d9d84244fc5bcac25c08e11b344d4b7307d8fe32aa
3
+ size 838894816
model-00004-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc1477aa9f6223bc3a1c6e05c08675e7b037a0f34ed8d287d306e0bc4a34c55c
3
+ size 838894816
model-00005-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64ed435ff4e52ff98fbe90ad6cfac524327badccb4f58789addd366852060ec0
3
+ size 838911312
model-00006-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ded232c5ff01a67979c9a3b7134d9a544d8e7f6b8b49cee9fe618d774d425671
3
+ size 771785832
model-00007-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a65651279806c5ba01db2d88b7547b33d757838d322b4b973f0533678cacb3a0
3
+ size 771785832
model-00008-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb3ad0089dbfb62a4461cd98cb1b588235cc509b6c2c94baf34d2bcfeb8ba4a5
3
+ size 771785832
model-00009-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eafebbd578ff50b822cfbb6e415e58eceeb8b90ebe7732e0fa70028240ea9264
3
+ size 771785832
model-00010-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f96b41dcaf37c51d228cb7bb6dd6e871a18f4bab35c2450ec4a8557309a21827
3
+ size 771785832
model-00011-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ae73ffd22765f358d77f406f3f1d78996828fef9981036bfde85a87801d97b0
3
+ size 771785832
model-00012-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:114cd99b4c605f31ad71feacbcce4da22dd3dec7270edc18662e85da2ecc206e
3
+ size 771785840
model-00013-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e75e93617d9a9e229675df8678476b64a7da7261d4b70c5cc79bb48436f5c704
3
+ size 771785840
model-00014-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebbf2c9cdc98a42961a8703194b0b17d5792b7bf4ebee580324ac0c2581f4865
3
+ size 771785840
model-00015-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd94e6654301436f21593bb47a74788b3e9eafe3b0a73428783a00ae9984c018
3
+ size 771785840
model-00016-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fe3d0d091a8ef2dd49fe37a5a23ce21cc690d9bec799a7543d9c20d63b5ade3
3
+ size 771785840
model-00017-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62fd739f7024acabefe0ea168e63d5275ebeecbbcaa8c9d228f7e637f77edd75
3
+ size 771785840
model-00018-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ecb869ffa17e7e6056fcfcaba2ecd4a854e0d4fdafcbdd64cd62314f7153537
3
+ size 771785840
model-00019-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aed4e57f19a24c26d05b8b8a89906a5fa834d5e9acbb3e1378c87bfe45987120
3
+ size 771785840
model-00020-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ae31052dc9294d98526888e4b81545017c1a11bc2b0bf18f39d6878c3c9fbfd
3
+ size 771785840
model-00021-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6c454fe1f9908d53b06b85ee4efb5ee95fa1dd8dc6fa56323a9b6796ad9d8f6
3
+ size 771785840
model-00022-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:278bf79e73b12529614eb6eae2863eb4db644ad5dd1f7b6081e9abba2b7f8692
3
+ size 771785840
model-00023-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cecc02c74b05dad3754c76f56eef4875bf6f16cb8d9265a414687e2de91c8e10
3
+ size 771785840
model-00024-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f4676fd29a15463bb30a1d580709cea57ee1a612c1150c8dd87291fb538f006
3
+ size 771785840
model-00025-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1675e6458803892fa69702dc5d71d53ce2a03a6e9a68e5db1b0a1922566e5d1
3
+ size 838919640
model-00026-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f8a66a3f378c7e87a4911b116a7a63c7e00e3b7d38d955d00da993dc5c0a879
3
+ size 838894824
model-00027-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68248e87be6aa20c413261e8a47e06ebeea41dd33d22617391a9ba5f8d24c3ef
3
+ size 738231520
model-00028-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aded28e602ba7497fe84f3595e6f87183b72a47f532b7f81164ccf3195aeab68
3
+ size 704693704
model-00029-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb61c6be6a65b8ecb356a8c78fc47935cef9f3b1e18ea1a2a777e08730cde4df
3
+ size 838894816
model-00030-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:777c8f9a5ac296282b025a4fe664fd718c1d3dc5da5cff9288ae82cd93d1602d
3
+ size 838894824
model-00031-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29ac25648527804f241393fe0c2b01e811071f9124511e60cf48413f991a98bd
3
+ size 738231520
model-00032-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b792023be12084c3327137ba48d4bb1ce060a3e651fafdfbb090e4ce1d85506
3
+ size 704693704
model-00033-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4dc32aaaff354f03ddde730e1efd7dc2908f24c8bcec12ca156d50ed03d4e4a
3
+ size 838894816
model-00034-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3591afe70cfb8dc911750d114b2b72a687835ab4eeae8c214840be3607722f16
3
+ size 838894824
model-00035-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a26c449662d5b6359c41b131a4eafa6257db948eef198f453d9e220a0fa44b72
3
+ size 738231520
model-00036-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62a483d7c4913ce639d67bb9f8f1ee238f91654460240fbeb65f2090b392c1e9
3
+ size 704693704
model-00037-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a06773b745e76a91802e3afbf07e153884561770b020da1e6bbeb38e63b3067
3
+ size 838894816
model-00038-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b906cab98c13c7a05fa26552be1f0797ba1a8dcf7ad3218c2cd83933758efd7
3
+ size 838894824
model-00039-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23a2d93cfb543368fc54c9033ed6cb46cb2474a771e49fe1ef690d2b5534f400
3
+ size 738231536
model-00040-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3edb4cb42f0212f3f50f67b7be0c2aef7329afb51bc330d2899b022bb905e73
3
+ size 704693720
model-00041-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:752539296b750fe6d73fa93ee71e1cfdcbe18f229b3d0766ba371df873f9710b
3
+ size 838894832
model-00042-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c11e4e96a379c079868284857981448505ff408e37afeea6221792d2e3e39e05
3
+ size 838894832
model-00043-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70cc615c7bd3b2cc50155873392afff29ac41bd8dc5412a6172c73e5492cc3a5
3
+ size 738231536
model-00044-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1562c9c77c11c8eef4631d5c98d8dda9f0ab5fdd7c34f39dcb7163a28befde8d
3
+ size 704693720
model-00045-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4012e5fd75fda64c6d66a2a0f41b9084b0271a0a34fd4fffb4663024f0a300b9
3
+ size 838894832
model-00046-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96514604172115763f9c02d65e68429924d90899bcce54f254d69fb96b752449
3
+ size 838894832
model-00047-of-00058.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f007b3876baaebb7e38f0b7c8a9486a4c068cb17c6a975142c59d34e541583c9
3
+ size 738231536