bruhzair committed on
Commit
ffbf028
·
verified ·
1 Parent(s): 9091bba

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. .gitattributes +1 -0
  2. README.md +42 -0
  3. chat_template.jinja +7 -0
  4. config.json +39 -0
  5. mergekit_config.yml +12 -0
  6. model-00001-of-00063.safetensors +3 -0
  7. model-00002-of-00063.safetensors +3 -0
  8. model-00003-of-00063.safetensors +3 -0
  9. model-00004-of-00063.safetensors +3 -0
  10. model-00005-of-00063.safetensors +3 -0
  11. model-00006-of-00063.safetensors +3 -0
  12. model-00007-of-00063.safetensors +3 -0
  13. model-00008-of-00063.safetensors +3 -0
  14. model-00009-of-00063.safetensors +3 -0
  15. model-00010-of-00063.safetensors +3 -0
  16. model-00011-of-00063.safetensors +3 -0
  17. model-00012-of-00063.safetensors +3 -0
  18. model-00013-of-00063.safetensors +3 -0
  19. model-00014-of-00063.safetensors +3 -0
  20. model-00015-of-00063.safetensors +3 -0
  21. model-00016-of-00063.safetensors +3 -0
  22. model-00017-of-00063.safetensors +3 -0
  23. model-00018-of-00063.safetensors +3 -0
  24. model-00019-of-00063.safetensors +3 -0
  25. model-00020-of-00063.safetensors +3 -0
  26. model-00021-of-00063.safetensors +3 -0
  27. model-00022-of-00063.safetensors +3 -0
  28. model-00023-of-00063.safetensors +3 -0
  29. model-00024-of-00063.safetensors +3 -0
  30. model-00025-of-00063.safetensors +3 -0
  31. model-00026-of-00063.safetensors +3 -0
  32. model-00027-of-00063.safetensors +3 -0
  33. model-00028-of-00063.safetensors +3 -0
  34. model-00029-of-00063.safetensors +3 -0
  35. model-00030-of-00063.safetensors +3 -0
  36. model-00031-of-00063.safetensors +3 -0
  37. model-00032-of-00063.safetensors +3 -0
  38. model-00033-of-00063.safetensors +3 -0
  39. model-00034-of-00063.safetensors +3 -0
  40. model-00035-of-00063.safetensors +3 -0
  41. model-00036-of-00063.safetensors +3 -0
  42. model-00037-of-00063.safetensors +3 -0
  43. model-00038-of-00063.safetensors +3 -0
  44. model-00039-of-00063.safetensors +3 -0
  45. model-00040-of-00063.safetensors +3 -0
  46. model-00041-of-00063.safetensors +3 -0
  47. model-00042-of-00063.safetensors +3 -0
  48. model-00043-of-00063.safetensors +3 -0
  49. model-00044-of-00063.safetensors +3 -0
  50. model-00045-of-00063.safetensors +3 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model: []
3
+ library_name: transformers
4
+ tags:
5
+ - mergekit
6
+ - merge
7
+
8
+ ---
9
+ # prototype-0.4x273
10
+
11
+ This is a merge of pre-trained language models created using [mergekit](https://github.com/cg123/mergekit).
12
+
13
+ ## Merge Details
14
+ ### Merge Method
15
+
16
+ This model was merged using the [Model Stock](https://arxiv.org/abs/2403.19522) merge method, with /workspace/cache/models--BruhzWater--Eden-L3.3-70b-0.3/snapshots/723770586b6603d44ac9bb1d4527e80e86d4dc8b as the base.
17
+
18
+ ### Models Merged
19
+
20
+ The following models were included in the merge:
21
+ * /workspace/cache/models--BruhzWater--Liliths-Whisper-L3.3-70b-0.1/snapshots/2f5b9f0307fbb865a3f2e98eefaeb3c86955cb03
22
+ * /workspace/cache/models--BruhzWater--Apocrypha-L3.3-70b-0.3/snapshots/3facb4c0a7b953ff34a5caa90976830bf82a84c2
23
+ * /workspace/cache/models--BruhzWater--Serpents-Tongue-L3.3-70b-0.3/snapshots/d007a7bcc7047d712abb2dfb6ad940fe03cd2047
24
+
25
+ ### Configuration
26
+
27
+ The following YAML configuration was used to produce this model:
28
+
29
+ ```yaml
30
+ models:
31
+ - model: /workspace/cache/models--BruhzWater--Liliths-Whisper-L3.3-70b-0.1/snapshots/2f5b9f0307fbb865a3f2e98eefaeb3c86955cb03
32
+ - model: /workspace/cache/models--BruhzWater--Serpents-Tongue-L3.3-70b-0.3/snapshots/d007a7bcc7047d712abb2dfb6ad940fe03cd2047
33
+ - model: /workspace/cache/models--BruhzWater--Apocrypha-L3.3-70b-0.3/snapshots/3facb4c0a7b953ff34a5caa90976830bf82a84c2
34
+ base_model: /workspace/cache/models--BruhzWater--Eden-L3.3-70b-0.3/snapshots/723770586b6603d44ac9bb1d4527e80e86d4dc8b
35
+ merge_method: model_stock
36
+ tokenizer:
37
+   source: base
38
+ chat_template: llama3
39
+ int8_mask: true
40
+ pad_to_multiple_of: 8
41
+ dtype: float32
42
+ ```
chat_template.jinja ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {% set loop_messages = messages %}
2
+ {% for message in loop_messages %}
3
+ {% set content = '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'+ message['content'] | trim + '<|eot_id|>' %}
4
+ {% if loop.index0 == 0 %}{% set content = bos_token + content %}{% endif %}
5
+ {{ content }}
6
+ {% endfor %}
7
+ {% if add_generation_prompt %}{{ '<|start_header_id|>assistant<|end_header_id|>\n\n' }}{% endif %}
config.json ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "LlamaForCausalLM"
4
+ ],
5
+ "attention_bias": false,
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 128000,
8
+ "eos_token_id": [
9
+ 128001,
10
+ 128008,
11
+ 128009
12
+ ],
13
+ "head_dim": 128,
14
+ "hidden_act": "silu",
15
+ "hidden_size": 8192,
16
+ "initializer_range": 0.02,
17
+ "intermediate_size": 28672,
18
+ "max_position_embeddings": 131072,
19
+ "mlp_bias": false,
20
+ "model_type": "llama",
21
+ "num_attention_heads": 64,
22
+ "num_hidden_layers": 80,
23
+ "num_key_value_heads": 8,
24
+ "pretraining_tp": 1,
25
+ "rms_norm_eps": 1e-05,
26
+ "rope_scaling": {
27
+ "factor": 8.0,
28
+ "high_freq_factor": 4.0,
29
+ "low_freq_factor": 1.0,
30
+ "original_max_position_embeddings": 8192,
31
+ "rope_type": "llama3"
32
+ },
33
+ "rope_theta": 500000.0,
34
+ "tie_word_embeddings": false,
35
+ "torch_dtype": "float32",
36
+ "transformers_version": "4.54.0",
37
+ "use_cache": true,
38
+ "vocab_size": 128256
39
+ }
mergekit_config.yml ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ models:
2
+ - model: /workspace/cache/models--BruhzWater--Liliths-Whisper-L3.3-70b-0.1/snapshots/2f5b9f0307fbb865a3f2e98eefaeb3c86955cb03
3
+ - model: /workspace/cache/models--BruhzWater--Serpents-Tongue-L3.3-70b-0.3/snapshots/d007a7bcc7047d712abb2dfb6ad940fe03cd2047
4
+ - model: /workspace/cache/models--BruhzWater--Apocrypha-L3.3-70b-0.3/snapshots/3facb4c0a7b953ff34a5caa90976830bf82a84c2
5
+ base_model: /workspace/cache/models--BruhzWater--Eden-L3.3-70b-0.3/snapshots/723770586b6603d44ac9bb1d4527e80e86d4dc8b
6
+ merge_method: model_stock
7
+ tokenizer:
8
+   source: base
9
+ chat_template: llama3
10
+ int8_mask: true
11
+ pad_to_multiple_of: 8
12
+ dtype: float32
model-00001-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28df82549f8acb5ec8431f43f6fb691cb077a91e45475715ade2a261a409ebbf
3
+ size 4697753296
model-00002-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31555cfb05861c71ab6b58e7b8300a0d7b6352c38476dbc6d1984786621ba86d
3
+ size 4697687552
model-00003-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c8d13c6a6ae43940798a540e18293b8862a6453d7a912bccb179b9b68d62cf8
3
+ size 4563502240
model-00004-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04e1a4e71e6d7d3bbcf99d354fbde68ee1b0525d26e24bca1f0f7a924f898ffc
3
+ size 2415952488
model-00005-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc8ca7f82086e70d76371d2ec0a7c2351748cc25fb5123d0c15fe2c3e54bf1ed
3
+ size 4236247288
model-00006-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92cf4f30b8170560c59428d8cbc363402e91d9934e2cdda5bf6acaa823f51845
3
+ size 4160915056
model-00007-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7dcc4cc8b5b927e6b414b9ca02d5b8bc6daa0463daee02d746f61dc82250e52b
3
+ size 4362077112
model-00008-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc5563d6349648785580eee63f71c87c8d6935183d306ccb81cecb8ff740c3e2
3
+ size 4664133016
model-00009-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c2a826f4d446e6f4276b4ecdeedba05ec45ee33cbd60acb1779129a61a8eb31
3
+ size 2415952472
model-00010-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f781782a932e3f34999f09165a644a6464d4e162a44dfaaf499503438a58723d
3
+ size 4202692744
model-00011-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97c1fbee1c9b2de3ee8709a50b1958fa817ca79f50cb0624d9d0d38f3cb5fca5
3
+ size 4764961040
model-00012-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e09e1cf8b2063041de219218589ab2b690e4539aea2de38dfa8eb78b4b52123
3
+ size 4596991016
model-00013-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4316883b0474b4dc9920456e694202f32a078282e81e3b92d3ea497db5a429cb
3
+ size 4596958144
model-00014-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1cd80f20a98befcf0bd5377e983268f4e6c7607bd3011d95ca30489f9a627df9
3
+ size 4093740200
model-00015-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9bed1607ce06846ef29b412f3783fc1424dc39406cee963f4741980e5c3074c2
3
+ size 4127360504
model-00016-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0c4c0030a539b950d00e12e155c95c135b9bb433df9d6d45df81bb95194ea47
3
+ size 4395697424
model-00017-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e83947dd52fd237add07da4bb9e52125387e382628d16569385016c234f0995f
3
+ size 4898948256
model-00018-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fda4558350940799c332b20662a2d7d9059878dfc900b50f5a3211151a52b059
3
+ size 4966188888
model-00019-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb1b4df9f5852a27a41bf526f698ccf2921d2a5abbad451190fcc6089cddc828
3
+ size 4731340744
model-00020-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa128ba82492f2b840c907ef43e3d73d5302fffae9abe1b6642f41a0fdd5d166
3
+ size 4295000896
model-00021-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1cc5151c3a6736b5e6c9d82244c901444ecc36c72b38353b77bb0651bb24ca55
3
+ size 4295000912
model-00022-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ceaa7d8d6435f1fe166f6d104867e8b4616f78abf3394797c500b59b6c605382
3
+ size 4462905176
model-00023-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c85d5a4ff83fe3377d6d26973bf640c7fee06bb77b6bfd8734e8a09df74faa87
3
+ size 4664198768
model-00024-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b064e2ca56e70fa4b5338845a82733c3f9eb8e28c5a56eca30a6fe257e31d367
3
+ size 4664067240
model-00025-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe626bf6f0e1053abd813cd74a10edc5bb4e547fa604bba45be6fa0ab694e9c9
3
+ size 4899014024
model-00026-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd8af77841b97ac92f10fe2263d3a260e252aa39d8cce1ae5ebdcf6be6088912
3
+ size 4462938048
model-00027-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9f6c3eb7fb239e040908998781574746bc508af0c0d6e0f956196e3ea3f999b
3
+ size 4898981144
model-00028-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09d6eda99ce7399c437113a6c041ea2a9d476a7982414821601e79f2c1cd30c3
3
+ size 4328555448
model-00029-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c88a2b1434e52d94b4780cba4c9cd6c3cde79962720b57890667b1a403611439
3
+ size 4362208656
model-00030-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c87f98306b525999925165a246e66e792e7d81659807dff7afbcaedd15e063ad
3
+ size 4832003688
model-00031-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9c235d62ce61ca7804a13894eee98b7d8aaa40ec56246fbf7cb70dc173ff166
3
+ size 4898981152
model-00032-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3ae11765b804bec43e21c8c724596835a51635fbff1e6630ecff7c18b9bbc73
3
+ size 4227859632
model-00033-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e8e201fd4b9e104622ecdb815f0c23cef0a6977bdc3519387cdcb06a3650e9f
3
+ size 4697819080
model-00034-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ad8429cbcbec747055321dbd519aa5b1a1345f6e84df49458c4e69df36a77e8
3
+ size 4160849288
model-00035-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d4b0ac0a620530a8c23fc29446c871aa160cb0b5cd14ca804874c1072fdc2b2
3
+ size 4328555448
model-00036-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1882323501f4816b59dde0f156c688336a075ff1a34f47a8930470d94f791de
3
+ size 4831839160
model-00037-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:822afa97f66a97001037c169da64e465ef6e8b37be6dedc82f60c7881f2e29ab
3
+ size 4228089920
model-00038-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40ea7f3f8ce9a8ea1c96c7eb4723fce677d5fbed82a2ae93b9e697385b4dbf0c
3
+ size 4630611336
model-00039-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:acc1c2e9031dc9c50d65629363d4fdadfd0b1fe9552f6d9eb6c78f6ff0eac736
3
+ size 4898948264
model-00040-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f6b413c71258c44c7179b7d6d993e8340306e991091c6f7889dcd63ccd6324b
3
+ size 4966188872
model-00041-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:316024bf4c1a06cd3b9e8c1a6ff0d42615080bbb04ce1576f4073ba404924201
3
+ size 4160882184
model-00042-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:055918a7a0ebc5063ac24f205805a3618df766404d96b52c612980ca63bdcfc7
3
+ size 4362142880
model-00043-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f518cf3219e78132735ea25b6545fc75dc718378dd25dc54d7e7c70429eb024e
3
+ size 4563403592
model-00044-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e9f83946c8e094fbc7f436f11b3af6ccc7dd6edbb1fb35f94fa0679d74eb130
3
+ size 4596991024
model-00045-of-00063.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d19bab4996e40c76eb31291f1dc4ccdefa252ecdc33ac2016be0ee283989c0ed
3
+ size 4261644448