bruhzair committed on
Commit
d0b7141
·
verified ·
1 Parent(s): eb4ce5a

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +1 -0
  2. README.md +43 -0
  3. config.json +40 -0
  4. mergekit_config.yml +14 -0
  5. model-00001-of-00049.safetensors +3 -0
  6. model-00002-of-00049.safetensors +3 -0
  7. model-00003-of-00049.safetensors +3 -0
  8. model-00004-of-00049.safetensors +3 -0
  9. model-00005-of-00049.safetensors +3 -0
  10. model-00006-of-00049.safetensors +3 -0
  11. model-00007-of-00049.safetensors +3 -0
  12. model-00008-of-00049.safetensors +3 -0
  13. model-00009-of-00049.safetensors +3 -0
  14. model-00010-of-00049.safetensors +3 -0
  15. model-00011-of-00049.safetensors +3 -0
  16. model-00012-of-00049.safetensors +3 -0
  17. model-00013-of-00049.safetensors +3 -0
  18. model-00014-of-00049.safetensors +3 -0
  19. model-00015-of-00049.safetensors +3 -0
  20. model-00016-of-00049.safetensors +3 -0
  21. model-00017-of-00049.safetensors +3 -0
  22. model-00018-of-00049.safetensors +3 -0
  23. model-00019-of-00049.safetensors +3 -0
  24. model-00020-of-00049.safetensors +3 -0
  25. model-00021-of-00049.safetensors +3 -0
  26. model-00022-of-00049.safetensors +3 -0
  27. model-00023-of-00049.safetensors +3 -0
  28. model-00024-of-00049.safetensors +3 -0
  29. model-00025-of-00049.safetensors +3 -0
  30. model-00026-of-00049.safetensors +3 -0
  31. model-00027-of-00049.safetensors +3 -0
  32. model-00028-of-00049.safetensors +3 -0
  33. model-00029-of-00049.safetensors +3 -0
  34. model-00030-of-00049.safetensors +3 -0
  35. model-00031-of-00049.safetensors +3 -0
  36. model-00032-of-00049.safetensors +3 -0
  37. model-00033-of-00049.safetensors +3 -0
  38. model-00034-of-00049.safetensors +3 -0
  39. model-00035-of-00049.safetensors +3 -0
  40. model-00036-of-00049.safetensors +3 -0
  41. model-00037-of-00049.safetensors +3 -0
  42. model-00038-of-00049.safetensors +3 -0
  43. model-00039-of-00049.safetensors +3 -0
  44. model-00040-of-00049.safetensors +3 -0
  45. model-00041-of-00049.safetensors +3 -0
  46. model-00042-of-00049.safetensors +3 -0
  47. model-00043-of-00049.safetensors +3 -0
  48. model-00044-of-00049.safetensors +3 -0
  49. model-00045-of-00049.safetensors +3 -0
  50. model-00046-of-00049.safetensors +3 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model: []
3
+ library_name: transformers
4
+ tags:
5
+ - mergekit
6
+ - merge
7
+
8
+ ---
9
+ # Test1
10
+
11
+ This is a merge of pre-trained language models created using [mergekit](https://github.com/cg123/mergekit).
12
+
13
+ ## Merge Details
14
+ ### Merge Method
15
+
16
+ This model was merged using the NuSLERP merge method.
17
+
18
+ ### Models Merged
19
+
20
+ The following models were included in the merge:
21
+ * [TheDrummer/Fallen-Command-A-111B-v1](https://huggingface.co/TheDrummer/Fallen-Command-A-111B-v1) (local snapshot `5d2b4bdb35d7dff3a4eb51a5f2b231ba27943491`)
22
+ * [CohereForAI/c4ai-command-a-03-2025](https://huggingface.co/CohereForAI/c4ai-command-a-03-2025) (local snapshot `6894b671d755c72573bb1a5722cfcfcd86b42b01`)
23
+
24
+ ### Configuration
25
+
26
+ The following YAML configuration was used to produce this model:
27
+
28
+ ```yaml
29
+ dtype: bfloat16
30
+ merge_method: nuslerp
31
+ modules:
32
+   default:
33
+     slices:
34
+     - sources:
35
+       - layer_range: [0, 64]
36
+         model: /workspace/cache/models--CohereForAI--c4ai-command-a-03-2025/snapshots/6894b671d755c72573bb1a5722cfcfcd86b42b01
37
+         parameters:
38
+           weight: [0.9, 0.7, 0.5, 0.35, 0.5, 0.7, 0.9]
39
+       - layer_range: [0, 64]
40
+         model: /workspace/cache/models--TheDrummer--Fallen-Command-A-111B-v1/snapshots/5d2b4bdb35d7dff3a4eb51a5f2b231ba27943491
41
+         parameters:
42
+           weight: [0.1, 0.3, 0.5, 0.65, 0.5, 0.3, 0.1]
43
+ ```
config.json ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "Cohere2ForCausalLM"
4
+ ],
5
+ "attention_bias": false,
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 5,
8
+ "cache_implementation": "hybrid",
9
+ "eos_token_id": 255001,
10
+ "head_dim": 128,
11
+ "hidden_act": "silu",
12
+ "hidden_size": 12288,
13
+ "initializer_range": 0.02,
14
+ "intermediate_size": 36864,
15
+ "layer_norm_eps": 1e-05,
16
+ "logit_scale": 0.25,
17
+ "max_position_embeddings": 262144,
18
+ "model_type": "cohere2",
19
+ "num_attention_heads": 96,
20
+ "num_hidden_layers": 64,
21
+ "num_key_value_heads": 8,
22
+ "order_of_interleaved_layers": "local_attn_first",
23
+ "pad_token_id": 0,
24
+ "position_embedding_type": "rope_gptj",
25
+ "rope_scaling": null,
26
+ "rope_theta": 50000,
27
+ "rotary_pct": 1.0,
28
+ "sliding_window": 4096,
29
+ "sliding_window_pattern": 4,
30
+ "torch_dtype": "bfloat16",
31
+ "transformers_version": "4.50.2",
32
+ "unsloth_fixed": true,
33
+ "unsloth_version": "2025.3.18",
34
+ "use_cache": true,
35
+ "use_embedding_sharing": true,
36
+ "use_gated_activation": true,
37
+ "use_parallel_block": true,
38
+ "use_parallel_embedding": true,
39
+ "vocab_size": 256000
40
+ }
mergekit_config.yml ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ dtype: bfloat16
2
+ merge_method: nuslerp
3
+ modules:
4
+   default:
5
+     slices:
6
+     - sources:
7
+       - layer_range: [0, 64]
8
+         model: /workspace/cache/models--CohereForAI--c4ai-command-a-03-2025/snapshots/6894b671d755c72573bb1a5722cfcfcd86b42b01
9
+         parameters:
10
+           weight: [0.9, 0.7, 0.5, 0.35, 0.5, 0.7, 0.9]
11
+       - layer_range: [0, 64]
12
+         model: /workspace/cache/models--TheDrummer--Fallen-Command-A-111B-v1/snapshots/5d2b4bdb35d7dff3a4eb51a5f2b231ba27943491
13
+         parameters:
14
+           weight: [0.1, 0.3, 0.5, 0.65, 0.5, 0.3, 0.1]
model-00001-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0e5df379091bffb60a5cfe096243a6c44e2b32bff271a9ea515cda309860764
3
+ size 6291456144
model-00002-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a2c563a2247c3e317da7f4df8003a119a9057ddc02b1df5553ea0d3d33be2d6
3
+ size 4278240416
model-00003-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:980b141375a4b5776f87d7a816ca270f63b5f8555c65d617744fb77c55de6976
3
+ size 4278215736
model-00004-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e85b06ca541aaa4cc7193b165d2187dfde6ede803a16890bb637b817a873fa03
3
+ size 4932552336
model-00005-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee68526c8e3991208f6a5d5f3c7900ede46de853e1795a2964b72a3e314af956
3
+ size 4278215744
model-00006-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:edcb012730823afbf0b6fa197eefbbe4e4d003ceb548433ca155b8fdf54183c0
3
+ size 4278215744
model-00007-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba2a8ab6403f533d28754c20cb542c1a7ebd28364d80b1a7dc6d63849279bd45
3
+ size 4932552336
model-00008-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:231abd01ae9dad713a0816198e33e432b7e0b3d4a710cb02e3b7d92d7cc01cea
3
+ size 4278215744
model-00009-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:088b348088173779026af6cd8db85dd73ba275df442f603c6f7bda530e45b571
3
+ size 4278215744
model-00010-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45ea1505df9b45cfa0612cc450a5659b95f4a01aac663324b337207986a2a16a
3
+ size 4932552328
model-00011-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d27ff58f8a8a50827e8c13345b008e95d1b7065361e855543976959528702c27
3
+ size 4278215736
model-00012-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd128a35ca3f4811eecdd87f4386f64333a50a4da81f2295dad78e2d9ca3490b
3
+ size 4278215744
model-00013-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:726b3877fdbaa3cbb49e5b8cd9ec8e30c24a88da1ade5059e5e02f29b56898cd
3
+ size 4932552336
model-00014-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a401f95415fc85296bde907c57141d21a9b64b58ebcbc0d51f3d5ce61473ec38
3
+ size 4278215744
model-00015-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:943735f63795f3cb4457a28cf9df43c41f28c302c7cb14886d9570dc6b38ebde
3
+ size 4278215744
model-00016-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:804e756a062e3663362594fe708cbd2d766dce66dca60a798a2d373ae06ac02d
3
+ size 4932552336
model-00017-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5503e184b5059f49053af6abb87a4d8f87842bcb7296084b70af0fbc3e1efae
3
+ size 4278215744
model-00018-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:728255e1c5790155acbf496259ec9eb54dec1f4e1137ee65670d478f1c0d6bca
3
+ size 4278215744
model-00019-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71cf1f4628665a8bfaa1f8fb58a21a5d4056ff627da907cb7a64efedf114ba88
3
+ size 4932552328
model-00020-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8d365c15f7dee71cd7748b9911b8e3b8cceacde2ac38fa0efd24fd6822a1a97
3
+ size 4278215744
model-00021-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84de165483b355c764be822866c7ff82f37fd839ad930bbe885afc62070847a2
3
+ size 4278215744
model-00022-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:927259e4b098c3350297310ac46125938c0c2bf1844ec8073cbffdee1600a0fc
3
+ size 4932552336
model-00023-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b04cf3dcf7ef0967f8e948e52b931ab48b7a3e8b699135a78c976d49ae0417cc
3
+ size 4278215744
model-00024-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86956081fad43aa8da1645b9790b8f2d733895bf746660535c6fca4b130f28e8
3
+ size 4278215744
model-00025-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e1fc60462ad9017f6f6ddb850278909e599e3d19f0059b1bcc2b7db1521b705
3
+ size 4932552336
model-00026-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57b5994b7c1b7ed2834a52da532b654ae00a754f97a75294be2c9f3fdf843390
3
+ size 4278215744
model-00027-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0213d5bb47ecd74bb6768b9f4a177f3c81e6fb2728e429f568b104b5f683345
3
+ size 4278215744
model-00028-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe32e2c4f369c75b6a44c69feb462e3494334ad38eedf133d2f46f6ece355cc8
3
+ size 4932552328
model-00029-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bdb9cb36fc4b009379a257b89b60041bb14b2e006bdfb563dc7eade32a1d068f
3
+ size 4278215744
model-00030-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2c8bc189e8fbd53df5e56f07661db140a45dca6f06ec7c4f7a2adc685b22505
3
+ size 4278215744
model-00031-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4238630affe9cd39e51149844a9a21a0bd884659d60850d5d3db8e550e586062
3
+ size 4932552336
model-00032-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6b3305507039eb78f18c8dc2bdc26c53bf51a04e136a71461a082a40b8d8367
3
+ size 4278215744
model-00033-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fdfb36d693ac234f75511aa7680039a4a34d8df05e256e23d8e0d4f8876edc82
3
+ size 4278215744
model-00034-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:742dbcf8dff637e1b46c2c3c4f12ce8ec66462c489db9fa72471019973b37f43
3
+ size 4932552336
model-00035-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:438d6125f1fe9bc2204c63fb6aa68099adf4d638676095681da38ed0e3b07339
3
+ size 4278215744
model-00036-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f64cbdb1d14cbf378ce30ea1d802108fdc7a6c566fb01ec759997fe5155538c1
3
+ size 4278215736
model-00037-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6681ed8ef832565fb081f883f170419610333c8246fe662c25626210269114c
3
+ size 4932552336
model-00038-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d93415ae2b48a84198489c3596b986aa2051babdf83fa56266e74e9694a584c
3
+ size 4278215744
model-00039-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc12b5a3a45b843eee819ed4c7ef69cd49b1765724f9b124a1c280ed31c2df23
3
+ size 4278215744
model-00040-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:efe33873d59bf1df381dbbe781cc0bdaddbf6a132592b306792d869632bed35a
3
+ size 4932552336
model-00041-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:847db266f8cdc9c29da12f3cec089b5bbb496c132d409a0bc5c766a0c036777c
3
+ size 4278215744
model-00042-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:749efc76c8566dfd59f7cb4bb01a92f17510dd197bc55feec0129ee427a46d34
3
+ size 4278215744
model-00043-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:186b743f639a031c6d490220e54a8c6d6dc8b4d44307f9f15b1eef47ade5be54
3
+ size 4932552328
model-00044-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d56b13628aff60545b0d39165d7f488fd017286f3883739b753639ccd8defb6
3
+ size 4278215736
model-00045-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08a95e7196ea8a86ee1706cde9377e1bae17456438ffae3ae0c9aa777cc7860b
3
+ size 4278215744
model-00046-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a1e475e0232d8c9c24f4449b7b7923cf6733aff0ad2daf7a2effd3ee3e16b90d
3
+ size 4932552336