bruhzair committed on
Commit
e0a9099
·
verified ·
1 Parent(s): 3f44702

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +1 -0
  2. README.md +43 -0
  3. config.json +40 -0
  4. mergekit_config.yml +14 -0
  5. model-00001-of-00002.safetensors +3 -0
  6. model-00001-of-00049.safetensors +3 -0
  7. model-00002-of-00002.safetensors +3 -0
  8. model-00002-of-00049.safetensors +3 -0
  9. model-00003-of-00049.safetensors +3 -0
  10. model-00004-of-00049.safetensors +3 -0
  11. model-00005-of-00049.safetensors +3 -0
  12. model-00006-of-00049.safetensors +3 -0
  13. model-00007-of-00049.safetensors +3 -0
  14. model-00008-of-00049.safetensors +3 -0
  15. model-00009-of-00049.safetensors +3 -0
  16. model-00010-of-00049.safetensors +3 -0
  17. model-00011-of-00049.safetensors +3 -0
  18. model-00012-of-00049.safetensors +3 -0
  19. model-00013-of-00049.safetensors +3 -0
  20. model-00014-of-00049.safetensors +3 -0
  21. model-00015-of-00049.safetensors +3 -0
  22. model-00016-of-00049.safetensors +3 -0
  23. model-00017-of-00049.safetensors +3 -0
  24. model-00018-of-00049.safetensors +3 -0
  25. model-00019-of-00049.safetensors +3 -0
  26. model-00020-of-00049.safetensors +3 -0
  27. model-00021-of-00049.safetensors +3 -0
  28. model-00022-of-00049.safetensors +3 -0
  29. model-00023-of-00049.safetensors +3 -0
  30. model-00024-of-00049.safetensors +3 -0
  31. model-00025-of-00049.safetensors +3 -0
  32. model-00026-of-00049.safetensors +3 -0
  33. model-00027-of-00049.safetensors +3 -0
  34. model-00028-of-00049.safetensors +3 -0
  35. model-00029-of-00049.safetensors +3 -0
  36. model-00030-of-00049.safetensors +3 -0
  37. model-00031-of-00049.safetensors +3 -0
  38. model-00032-of-00049.safetensors +3 -0
  39. model-00033-of-00049.safetensors +3 -0
  40. model-00034-of-00049.safetensors +3 -0
  41. model-00035-of-00049.safetensors +3 -0
  42. model-00036-of-00049.safetensors +3 -0
  43. model-00037-of-00049.safetensors +3 -0
  44. model-00038-of-00049.safetensors +3 -0
  45. model-00039-of-00049.safetensors +3 -0
  46. model-00040-of-00049.safetensors +3 -0
  47. model-00041-of-00049.safetensors +3 -0
  48. model-00042-of-00049.safetensors +3 -0
  49. model-00043-of-00049.safetensors +3 -0
  50. model-00044-of-00049.safetensors +3 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model: []
3
+ library_name: transformers
4
+ tags:
5
+ - mergekit
6
+ - merge
7
+
8
+ ---
9
+ # Test1
10
+
11
+ This is a merge of pre-trained language models created using [mergekit](https://github.com/cg123/mergekit).
12
+
13
+ ## Merge Details
14
+ ### Merge Method
15
+
16
+ This model was merged using the NuSLERP merge method.
17
+
18
+ ### Models Merged
19
+
20
+ The following models were included in the merge:
21
+ * /workspace/cache/models--TheDrummer--Fallen-Command-A-111B-v1/snapshots/5d2b4bdb35d7dff3a4eb51a5f2b231ba27943491
22
+ * /workspace/cache/models--CohereForAI--c4ai-command-a-03-2025/snapshots/6894b671d755c72573bb1a5722cfcfcd86b42b01
23
+
24
+ ### Configuration
25
+
26
+ The following YAML configuration was used to produce this model:
27
+
28
+ ```yaml
29
+ dtype: bfloat16
30
+ merge_method: nuslerp
31
+ modules:
32
+   default:
33
+     slices:
34
+     - sources:
35
+       - layer_range: [0, 64]
36
+         model: /workspace/cache/models--CohereForAI--c4ai-command-a-03-2025/snapshots/6894b671d755c72573bb1a5722cfcfcd86b42b01
37
+         parameters:
38
+           weight: [0.9, 0.8, 0.75, 0.7, 0.65, 0.7, 0.75, 0.8, 0.9]
39
+       - layer_range: [0, 64]
40
+         model: /workspace/cache/models--TheDrummer--Fallen-Command-A-111B-v1/snapshots/5d2b4bdb35d7dff3a4eb51a5f2b231ba27943491
41
+         parameters:
42
+           weight: [0.1, 0.2, 0.25, 0.3, 0.35, 0.3, 0.25, 0.2, 0.1]
43
+ ```
config.json ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "Cohere2ForCausalLM"
4
+ ],
5
+ "attention_bias": false,
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 5,
8
+ "cache_implementation": "hybrid",
9
+ "eos_token_id": 255001,
10
+ "head_dim": 128,
11
+ "hidden_act": "silu",
12
+ "hidden_size": 12288,
13
+ "initializer_range": 0.02,
14
+ "intermediate_size": 36864,
15
+ "layer_norm_eps": 1e-05,
16
+ "logit_scale": 0.25,
17
+ "max_position_embeddings": 262144,
18
+ "model_type": "cohere2",
19
+ "num_attention_heads": 96,
20
+ "num_hidden_layers": 64,
21
+ "num_key_value_heads": 8,
22
+ "order_of_interleaved_layers": "local_attn_first",
23
+ "pad_token_id": 0,
24
+ "position_embedding_type": "rope_gptj",
25
+ "rope_scaling": null,
26
+ "rope_theta": 50000,
27
+ "rotary_pct": 1.0,
28
+ "sliding_window": 4096,
29
+ "sliding_window_pattern": 4,
30
+ "torch_dtype": "bfloat16",
31
+ "transformers_version": "4.50.2",
32
+ "unsloth_fixed": true,
33
+ "unsloth_version": "2025.3.18",
34
+ "use_cache": true,
35
+ "use_embedding_sharing": true,
36
+ "use_gated_activation": true,
37
+ "use_parallel_block": true,
38
+ "use_parallel_embedding": true,
39
+ "vocab_size": 256000
40
+ }
mergekit_config.yml ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ dtype: bfloat16
2
+ merge_method: nuslerp
3
+ modules:
4
+   default:
5
+     slices:
6
+     - sources:
7
+       - layer_range: [0, 64]
8
+         model: /workspace/cache/models--CohereForAI--c4ai-command-a-03-2025/snapshots/6894b671d755c72573bb1a5722cfcfcd86b42b01
9
+         parameters:
10
+           weight: [0.9, 0.8, 0.75, 0.7, 0.65, 0.7, 0.75, 0.8, 0.9]
11
+       - layer_range: [0, 64]
12
+         model: /workspace/cache/models--TheDrummer--Fallen-Command-A-111B-v1/snapshots/5d2b4bdb35d7dff3a4eb51a5f2b231ba27943491
13
+         parameters:
14
+           weight: [0.1, 0.2, 0.25, 0.3, 0.35, 0.3, 0.25, 0.2, 0.1]
model-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51ffb0f8210cab2ad6831bc661196b1887446b9f2df4299cddf2d767658af037
3
+ size 6291456144
model-00001-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0e5df379091bffb60a5cfe096243a6c44e2b32bff271a9ea515cda309860764
3
+ size 6291456144
model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5ecd58b3bff5b6f7610ea88371cc84b39099cc8b0406a4f725d8988bc97415f
3
+ size 24696
model-00002-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4c92b7a94ef53a0bf6e5d898d43520cb01aec15464488fea5fef80ada24c2c4
3
+ size 4278240416
model-00003-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0bdf9ebb167ab3474457d26f9e558998fc27a7250ff6c71873734f154e12548c
3
+ size 4278215736
model-00004-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37de5a9b3c6cded31e13146ca04d9e42e6a66231217ff771041994cc4d68bb79
3
+ size 4932552336
model-00005-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:082e26ea56404a98b91f80eb4dddf8cd8c4d4a4e51db63b567da00eef25fa3db
3
+ size 4278215744
model-00006-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8529640bb8e39682cbaa93fe911e8b2f022470265fbdb43397bfc1c0638e8f18
3
+ size 4278215744
model-00007-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:42605072ac8ba98de75894d5fe5c8f47474b50fef1f4430ea9b97c9316685634
3
+ size 4932552336
model-00008-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d374ed338857b9e74b51833a559afeaeeb55657e8ffef982e1a93e81bad652af
3
+ size 4278215744
model-00009-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29603fec3da4b0b394069b42dd0329bc8613b3186b00af11237591447992a943
3
+ size 4278215744
model-00010-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:277af3d35e28b911dbbc8389d9c0dda35ae13a71919ea40e32105d0d3f686b59
3
+ size 4932552328
model-00011-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6810512ede1d90a0bef55a68cc24ebc5b6c40f0d4e902e6d0d61c211cd1fd4f6
3
+ size 4278215736
model-00012-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26ad5a3520182ba1eccf7cae63c5a1c46fa9e3ee3ba124cf07d96ae9933b492a
3
+ size 4278215744
model-00013-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e7545d25b4cc6a7d2160bf5c740ebb41037d6edd02c3ee88d0285549b6f120b
3
+ size 4932552336
model-00014-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70459307d42bf703dc8b48da816a7f46982c4d57fbbe4ed1373b6d71ad2b745d
3
+ size 4278215744
model-00015-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4578aefd733a828cc09ba955a8855066c071455845c91bd4bbe5f4188fb836bf
3
+ size 4278215744
model-00016-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44b0ea5fdff70f1c0531eeb35e912729d66d567dcca5e69b17f9302660ee4d34
3
+ size 4932552336
model-00017-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7b53d0ea80fabc20e098c1fdbe02691c38d9cb5804b50d06d74722c3f6e45e1
3
+ size 4278215744
model-00018-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e4ea5cd999c8143a94dff3a62e8081985feb70f223a728b7f8c98ee54f161c2
3
+ size 4278215744
model-00019-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:532008c4604068339fadea5a252cbdd5c7213f1ea8622d30d56cc059d75dbc06
3
+ size 4932552328
model-00020-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af2d3ae9d4e504e56f3a05d511e26147cc19660409025d91d8a55a06d11e8483
3
+ size 4278215744
model-00021-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2fd30f755f8733271887ab31f97dc7413d40575d4324b39fc8834ec3e78d5a43
3
+ size 4278215744
model-00022-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f90cf8c8b7baf5b5020f75939beb8595b767ec63bc7724880dbee6b8f6e274a
3
+ size 4932552336
model-00023-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48198a40801aad6c7972b57e2b6ab9e919c44c7ec50a926309a4538cb394b700
3
+ size 4278215744
model-00024-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5eec02ac479c9d0aadd3016620c5a17f777e4c18680c890acd68e695f4960677
3
+ size 4278215744
model-00025-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff9986ab4a00e27b65b05c99d933d93b60d3cba8c72e19b0405c398c3a2d1763
3
+ size 4932552336
model-00026-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3a0a71b73581b7e3d17319f6d9fe451c23d471358cb8762ead0b26491be331e
3
+ size 4278215744
model-00027-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0848026561b6813ae558168e201cffd48ddb9da9ad4b3c80588cd730e40bfa7
3
+ size 4278215744
model-00028-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a496ce479fad0e680da0a5d45e246a280eab8f557aa6abcbfc573a468bbc787
3
+ size 4932552328
model-00029-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ddff7a3ab976f543538ad828f2203e27fa81ffb4a564bf3976802cc9e3683e1
3
+ size 4278215744
model-00030-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b3b81ae213d566e929141a6452f6b591a817c913bc19dc9bb30ddb17836a04b
3
+ size 4278215744
model-00031-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:817384a3a982193b0ea73499828e9f8a7b5bb5fbfa2b4f778d37742985ae3ea5
3
+ size 4932552336
model-00032-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30b9f8f103a47fcdd5a64d378f6841bb399553fd728009e0273d9ba6cb1901ca
3
+ size 4278215744
model-00033-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8a2f8bd87797fea66f1ea41874f90a4495eac022400361a17f5e36f063e6f7d
3
+ size 4278215744
model-00034-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae69b273e8d66544e4746fccef6741115976314dbe09ba8f92ab1e4b9d6cb092
3
+ size 4932552336
model-00035-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2fed4c229d42df07cf92bb36985fe3e7b95661f7711fcd5cebc0248cdcdbbd6b
3
+ size 4278215744
model-00036-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50547b43af535b8bf0e409d129652cb29547983cca235598cb15990d40784e7f
3
+ size 4278215736
model-00037-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af8e27b4a027fe59fd19e0af15d7d5bb030900d2b8090c260e78fec2b1a0d587
3
+ size 4932552336
model-00038-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d8ddbb27cd62fa05f3d1d0cce83aa373722f71fd14e3256412ded74932bb4ee
3
+ size 4278215744
model-00039-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e57a04bda368e0ee58efe3bfb5222b2d6bfaa80f4d254f39f3c0f7226b502b8
3
+ size 4278215744
model-00040-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16c6fb0e109365620ce7f8fdf6369ca7403531749508a86e41ed9dffc0765da0
3
+ size 4932552336
model-00041-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9672ffbf521faa8f68b4038a161fdec5859e9a98ab1034e3d106625645e16947
3
+ size 4278215744
model-00042-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:782ed0aefae4dd90a954a9cfed14c9af3c2cc7554bcb92665e383218bff45289
3
+ size 4278215744
model-00043-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16fc1cc2b5eafe493fce85edcc4d3b4d06d11b9bb32b65b6407a0870d99b2ae6
3
+ size 4932552328
model-00044-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:292a83ae6ee52c6c0b99fb8ce9427e2c453a2b27bfc26dbe81dcfc3b33ce1798
3
+ size 4278215736