bruhzair committed on
Commit
c4e7ce2
·
verified ·
1 Parent(s): e8a14c6

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +1 -0
  2. README.md +43 -0
  3. config.json +40 -0
  4. mergekit_config.yml +14 -0
  5. model-00001-of-00049.safetensors +3 -0
  6. model-00002-of-00049.safetensors +3 -0
  7. model-00003-of-00049.safetensors +3 -0
  8. model-00004-of-00049.safetensors +3 -0
  9. model-00005-of-00049.safetensors +3 -0
  10. model-00006-of-00049.safetensors +3 -0
  11. model-00007-of-00049.safetensors +3 -0
  12. model-00008-of-00049.safetensors +3 -0
  13. model-00009-of-00049.safetensors +3 -0
  14. model-00010-of-00049.safetensors +3 -0
  15. model-00011-of-00049.safetensors +3 -0
  16. model-00012-of-00049.safetensors +3 -0
  17. model-00013-of-00049.safetensors +3 -0
  18. model-00014-of-00049.safetensors +3 -0
  19. model-00015-of-00049.safetensors +3 -0
  20. model-00016-of-00049.safetensors +3 -0
  21. model-00017-of-00049.safetensors +3 -0
  22. model-00018-of-00049.safetensors +3 -0
  23. model-00019-of-00049.safetensors +3 -0
  24. model-00020-of-00049.safetensors +3 -0
  25. model-00021-of-00049.safetensors +3 -0
  26. model-00022-of-00049.safetensors +3 -0
  27. model-00023-of-00049.safetensors +3 -0
  28. model-00024-of-00049.safetensors +3 -0
  29. model-00025-of-00049.safetensors +3 -0
  30. model-00026-of-00049.safetensors +3 -0
  31. model-00027-of-00049.safetensors +3 -0
  32. model-00028-of-00049.safetensors +3 -0
  33. model-00029-of-00049.safetensors +3 -0
  34. model-00030-of-00049.safetensors +3 -0
  35. model-00031-of-00049.safetensors +3 -0
  36. model-00032-of-00049.safetensors +3 -0
  37. model-00033-of-00049.safetensors +3 -0
  38. model-00034-of-00049.safetensors +3 -0
  39. model-00035-of-00049.safetensors +3 -0
  40. model-00036-of-00049.safetensors +3 -0
  41. model-00037-of-00049.safetensors +3 -0
  42. model-00038-of-00049.safetensors +3 -0
  43. model-00039-of-00049.safetensors +3 -0
  44. model-00040-of-00049.safetensors +3 -0
  45. model-00041-of-00049.safetensors +3 -0
  46. model-00042-of-00049.safetensors +3 -0
  47. model-00043-of-00049.safetensors +3 -0
  48. model-00044-of-00049.safetensors +3 -0
  49. model-00045-of-00049.safetensors +3 -0
  50. model-00046-of-00049.safetensors +3 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model: []
3
+ library_name: transformers
4
+ tags:
5
+ - mergekit
6
+ - merge
7
+
8
+ ---
9
+ # Test1
10
+
11
+ This is a merge of pre-trained language models created using [mergekit](https://github.com/cg123/mergekit).
12
+
13
+ ## Merge Details
14
+ ### Merge Method
15
+
16
+ This model was merged using the NuSLERP merge method.
17
+
18
+ ### Models Merged
19
+
20
+ The following models were included in the merge:
21
+ * /workspace/cache/models--TheDrummer--Fallen-Command-A-111B-v1/snapshots/5d2b4bdb35d7dff3a4eb51a5f2b231ba27943491
22
+ * /workspace/cache/models--CohereForAI--c4ai-command-a-03-2025/snapshots/6894b671d755c72573bb1a5722cfcfcd86b42b01
23
+
24
+ ### Configuration
25
+
26
+ The following YAML configuration was used to produce this model:
27
+
28
+ ```yaml
29
+ dtype: bfloat16
30
+ merge_method: nuslerp
31
+ modules:
32
+   default:
33
+     slices:
34
+     - sources:
35
+       - layer_range: [0, 64]
36
+         model: /workspace/cache/models--CohereForAI--c4ai-command-a-03-2025/snapshots/6894b671d755c72573bb1a5722cfcfcd86b42b01
37
+         parameters:
38
+           weight: [0.85, 0.8, 0.9, 0.95, 0.9, 0.8, 0.85]
39
+       - layer_range: [0, 64]
40
+         model: /workspace/cache/models--TheDrummer--Fallen-Command-A-111B-v1/snapshots/5d2b4bdb35d7dff3a4eb51a5f2b231ba27943491
41
+         parameters:
42
+           weight: [0.15, 0.2, 0.1, 0.05, 0.1, 0.2, 0.15]
43
+ ```
config.json ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "Cohere2ForCausalLM"
4
+ ],
5
+ "attention_bias": false,
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 5,
8
+ "cache_implementation": "hybrid",
9
+ "eos_token_id": 255001,
10
+ "head_dim": 128,
11
+ "hidden_act": "silu",
12
+ "hidden_size": 12288,
13
+ "initializer_range": 0.02,
14
+ "intermediate_size": 36864,
15
+ "layer_norm_eps": 1e-05,
16
+ "logit_scale": 0.25,
17
+ "max_position_embeddings": 262144,
18
+ "model_type": "cohere2",
19
+ "num_attention_heads": 96,
20
+ "num_hidden_layers": 64,
21
+ "num_key_value_heads": 8,
22
+ "order_of_interleaved_layers": "local_attn_first",
23
+ "pad_token_id": 0,
24
+ "position_embedding_type": "rope_gptj",
25
+ "rope_scaling": null,
26
+ "rope_theta": 50000,
27
+ "rotary_pct": 1.0,
28
+ "sliding_window": 4096,
29
+ "sliding_window_pattern": 4,
30
+ "torch_dtype": "bfloat16",
31
+ "transformers_version": "4.50.3",
32
+ "unsloth_fixed": true,
33
+ "unsloth_version": "2025.3.18",
34
+ "use_cache": true,
35
+ "use_embedding_sharing": true,
36
+ "use_gated_activation": true,
37
+ "use_parallel_block": true,
38
+ "use_parallel_embedding": true,
39
+ "vocab_size": 256000
40
+ }
mergekit_config.yml ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ dtype: bfloat16
2
+ merge_method: nuslerp
3
+ modules:
4
+   default:
5
+     slices:
6
+     - sources:
7
+       - layer_range: [0, 64]
8
+         model: /workspace/cache/models--CohereForAI--c4ai-command-a-03-2025/snapshots/6894b671d755c72573bb1a5722cfcfcd86b42b01
9
+         parameters:
10
+           weight: [0.85, 0.8, 0.9, 0.95, 0.9, 0.8, 0.85]
11
+       - layer_range: [0, 64]
12
+         model: /workspace/cache/models--TheDrummer--Fallen-Command-A-111B-v1/snapshots/5d2b4bdb35d7dff3a4eb51a5f2b231ba27943491
13
+         parameters:
14
+           weight: [0.15, 0.2, 0.1, 0.05, 0.1, 0.2, 0.15]
model-00001-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3b0580b297718a42483245c285bf83479c0f8babffa1e05db0931104243da38
3
+ size 6291456144
model-00002-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa4a943ff834f9318c3041d8329bb288fedb16c1169c8f5795b7fa296c0e9f09
3
+ size 4278240416
model-00003-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ff152143dc8721e37da5a24d0b3a0070cb3aea12c738875a141e5a271720969
3
+ size 4278215736
model-00004-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84ced3598456cddd55f89eacd600d97420fa58beba9ebc47e592635100e68d63
3
+ size 4932552336
model-00005-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49845a3008cade80780e10dda14f4bb8a79fe9bce3eb70f2da90d664ca6cfd8e
3
+ size 4278215744
model-00006-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e81c8720678d94c90795bf6adeb46e58334e1fff6020642d6ae7be14deef1f7
3
+ size 4278215744
model-00007-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8abc550bf04907b7b5b4abbbd87181f9e275ecc0f12d34636cee04f34685821
3
+ size 4932552336
model-00008-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:efa0035bf27b69819f0c9a603cf4ad7259c3c4a1252cbd3031d0ea40419cf132
3
+ size 4278215744
model-00009-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1ab2c97ec3dfe6721e019642455b74c9474d4f52c2f60d120d6b8b3eaabc8ac
3
+ size 4278215744
model-00010-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0234e5aaa7f1051ac254577014a5f5d1194549964498ed8a333e73b7d486b840
3
+ size 4932552328
model-00011-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:230014326a7b939ad4482aa29ba1fddf02c60f6a3cd014a523471b27daa296d8
3
+ size 4278215736
model-00012-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e027c3ffd0907f0b271344921962c1a1dc22db5e26dba2e15c2479b6a238e29
3
+ size 4278215744
model-00013-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb587a4ad954a3c5edc5469953f581de4912fbf98758394b2160dbfe6250228a
3
+ size 4932552336
model-00014-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49e0e2541b7c76ab481c73b7a783b665c7ea9122825a14232dd2e22f92cf8e87
3
+ size 4278215744
model-00015-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b57d62ea42224203b62168ccf1b126b3f2f1d4652626dbb4ad1969b52f97ca02
3
+ size 4278215744
model-00016-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:488d79f14185e949761a98c7069454d4c6dde09a8e732d1f29ad34f7eee2a5e3
3
+ size 4932552336
model-00017-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b258a3f8cc45d97fe3ff673468a7c9b53bd60212938fc537997ae8ee3f53a0d8
3
+ size 4278215744
model-00018-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25a22952186ce33de46d905d09ee7a8c9873b78e44610c7180075f5c08bbf136
3
+ size 4278215744
model-00019-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02e7a2153c1aea192619e65d8b897ba7a667a9073c8261cb99ae0ca893ddf658
3
+ size 4932552328
model-00020-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7feb5068ed884dcd99fcf4f7dbede994eef865405cebfa054a0bf1f40d3fede1
3
+ size 4278215744
model-00021-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38c30888102679f621d4e860601055e14993aea3e78687cb9fa926866df22328
3
+ size 4278215744
model-00022-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8acd5544e3427db315faf9c28de0a678a343428c75e2209a87333298da03ca43
3
+ size 4932552336
model-00023-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:612c9a374e15cdf73298b57d9e250d5c994da67aede154e1d2712d2662fb263d
3
+ size 4278215744
model-00024-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:802ebd683d8faf619c310869136f608bc838113c71d4f3183d47c77336de519c
3
+ size 4278215744
model-00025-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e94aa9211d0161bf503999e2c85e07d69f6d2a84868a9ec2041d0277b3518592
3
+ size 4932552336
model-00026-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0aef782bb909fe1ee030689d7d613655e2af1f2dbd54c3f5f638d153be4ee627
3
+ size 4278215744
model-00027-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f123e8c4a49207bab1260bf64198c2739498e86fba3be11ec5f7aab26833570
3
+ size 4278215744
model-00028-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0b29f20b9426309270dbf5fadb193ba667811e53cdf2dafd69a44de2e3a2802
3
+ size 4932552328
model-00029-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1cad09d68490387199facdf027be131a7786b0698d98c202af6e04650137e2ff
3
+ size 4278215744
model-00030-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6546959ce612a06c3610cdef98e1c33d61a6b85b175270d465be72439e1794b5
3
+ size 4278215744
model-00031-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89451da7703881dc7517c45657884659f9dfd942deb017ad58b4eea05f86cf61
3
+ size 4932552336
model-00032-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2bb788d46a5924136a7f0c7c33171aed0d2fde0f2c14bd9b81fa541bf9118aaa
3
+ size 4278215744
model-00033-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e123a8f9aec7ee96bae788702294dc47857218bb053d488d14e41a86f103a40c
3
+ size 4278215744
model-00034-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5e6ddd9508148bf111b469e101564ffe59df878fb025a6d9b801081cc063a65
3
+ size 4932552336
model-00035-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dbda5842405e076e4d5305e64658d691a6bd1ff48e6dca34e18bfe3aa5da1a12
3
+ size 4278215744
model-00036-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:010fc5bbe2b8321b02c60e3b47b186c2268d46cdb1e9ed0d0a2ac663ba12261b
3
+ size 4278215736
model-00037-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c9e6c19bef1442eb764c8090efe362ef577a6adaf6bc95c5372967e5b5ec640
3
+ size 4932552336
model-00038-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ff529357acb86b8783a41671055a76bf47b8a636e9d6b4f55ebf5362f37769b
3
+ size 4278215744
model-00039-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4df22dccb2695d14a8c1c6ea3085b2d00cff4e74177c812fd852ab959ea6dc4
3
+ size 4278215744
model-00040-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4bac6b24b16f69737e08b7f31e73ec9d3d38b303b7a9d8833bc2bf7df8d54b16
3
+ size 4932552336
model-00041-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a5d175915987cf4badea7cc75a7602412c8f97dbcfda67aac4d78ff62241560
3
+ size 4278215744
model-00042-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e54e69338559462378c4f1e614ed29491f9022c4c57a6a467d3ed07c0065b60
3
+ size 4278215744
model-00043-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:477c1faf63d9681441c92b58fc6e15db2f1e8f0fd16509f79b9499fb77f71cbd
3
+ size 4932552328
model-00044-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91ef158bf3c3785d0fecb43e5a2c57db234038d74b8d1e9a5a78cb11f9fcc957
3
+ size 4278215736
model-00045-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88b22196438e39f2d6ec75f6cde6f7de7991a2e6fc078d61e691eb0a4c0de28e
3
+ size 4278215744
model-00046-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9fbbb83123cc0f948c53b238506515a949772d23c03d34b79cb18bbb33a0170
3
+ size 4932552336