bruhzair committed on
Commit
e540ae4
·
verified ·
1 Parent(s): 6037e6e

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. .gitattributes +1 -0
  2. README.md +43 -0
  3. config.json +40 -0
  4. mergekit_config.yml +14 -0
  5. model-00001-of-00049.safetensors +3 -0
  6. model-00002-of-00049.safetensors +3 -0
  7. model-00003-of-00049.safetensors +3 -0
  8. model-00004-of-00049.safetensors +3 -0
  9. model-00005-of-00049.safetensors +3 -0
  10. model-00006-of-00049.safetensors +3 -0
  11. model-00007-of-00049.safetensors +3 -0
  12. model-00008-of-00049.safetensors +3 -0
  13. model-00009-of-00049.safetensors +3 -0
  14. model-00010-of-00049.safetensors +3 -0
  15. model-00011-of-00049.safetensors +3 -0
  16. model-00012-of-00049.safetensors +3 -0
  17. model-00013-of-00049.safetensors +3 -0
  18. model-00014-of-00049.safetensors +3 -0
  19. model-00015-of-00049.safetensors +3 -0
  20. model-00016-of-00049.safetensors +3 -0
  21. model-00017-of-00049.safetensors +3 -0
  22. model-00018-of-00049.safetensors +3 -0
  23. model-00019-of-00049.safetensors +3 -0
  24. model-00020-of-00049.safetensors +3 -0
  25. model-00021-of-00049.safetensors +3 -0
  26. model-00022-of-00049.safetensors +3 -0
  27. model-00023-of-00049.safetensors +3 -0
  28. model-00024-of-00049.safetensors +3 -0
  29. model-00025-of-00049.safetensors +3 -0
  30. model-00026-of-00049.safetensors +3 -0
  31. model-00027-of-00049.safetensors +3 -0
  32. model-00028-of-00049.safetensors +3 -0
  33. model-00029-of-00049.safetensors +3 -0
  34. model-00030-of-00049.safetensors +3 -0
  35. model-00031-of-00049.safetensors +3 -0
  36. model-00032-of-00049.safetensors +3 -0
  37. model-00033-of-00049.safetensors +3 -0
  38. model-00034-of-00049.safetensors +3 -0
  39. model-00035-of-00049.safetensors +3 -0
  40. model-00036-of-00049.safetensors +3 -0
  41. model-00037-of-00049.safetensors +3 -0
  42. model-00038-of-00049.safetensors +3 -0
  43. model-00039-of-00049.safetensors +3 -0
  44. model-00040-of-00049.safetensors +3 -0
  45. model-00041-of-00049.safetensors +3 -0
  46. model-00042-of-00049.safetensors +3 -0
  47. model-00043-of-00049.safetensors +3 -0
  48. model-00044-of-00049.safetensors +3 -0
  49. model-00045-of-00049.safetensors +3 -0
  50. model-00046-of-00049.safetensors +3 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model: []
3
+ library_name: transformers
4
+ tags:
5
+ - mergekit
6
+ - merge
7
+
8
+ ---
9
+ # Test2
10
+
11
+ This is a merge of pre-trained language models created using [mergekit](https://github.com/cg123/mergekit).
12
+
13
+ ## Merge Details
14
+ ### Merge Method
15
+
16
+ This model was merged using the NuSLERP merge method.
17
+
18
+ ### Models Merged
19
+
20
+ The following models were included in the merge:
21
+ * /workspace/cache/models--TheDrummer--Fallen-Command-A-111B-v1/snapshots/5d2b4bdb35d7dff3a4eb51a5f2b231ba27943491
22
+ * /workspace/cache/models--CohereForAI--c4ai-command-a-03-2025/snapshots/6894b671d755c72573bb1a5722cfcfcd86b42b01
23
+
24
+ ### Configuration
25
+
26
+ The following YAML configuration was used to produce this model:
27
+
28
+ ```yaml
29
+ dtype: bfloat16
30
+ merge_method: nuslerp
31
+ modules:
32
+   default:
33
+     slices:
34
+     - sources:
35
+       - layer_range: [0, 64]
36
+         model: /workspace/cache/models--CohereForAI--c4ai-command-a-03-2025/snapshots/6894b671d755c72573bb1a5722cfcfcd86b42b01
37
+         parameters:
38
+           weight: [0.9, 0.85, 0.95, 0.98, 0.95, 0.85, 0.9]
39
+       - layer_range: [0, 64]
40
+         model: /workspace/cache/models--TheDrummer--Fallen-Command-A-111B-v1/snapshots/5d2b4bdb35d7dff3a4eb51a5f2b231ba27943491
41
+         parameters:
42
+           weight: [0.1, 0.15, 0.05, 0.02, 0.05, 0.15, 0.1]
43
+ ```
config.json ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "Cohere2ForCausalLM"
4
+ ],
5
+ "attention_bias": false,
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 5,
8
+ "cache_implementation": "hybrid",
9
+ "eos_token_id": 255001,
10
+ "head_dim": 128,
11
+ "hidden_act": "silu",
12
+ "hidden_size": 12288,
13
+ "initializer_range": 0.02,
14
+ "intermediate_size": 36864,
15
+ "layer_norm_eps": 1e-05,
16
+ "logit_scale": 0.25,
17
+ "max_position_embeddings": 262144,
18
+ "model_type": "cohere2",
19
+ "num_attention_heads": 96,
20
+ "num_hidden_layers": 64,
21
+ "num_key_value_heads": 8,
22
+ "order_of_interleaved_layers": "local_attn_first",
23
+ "pad_token_id": 0,
24
+ "position_embedding_type": "rope_gptj",
25
+ "rope_scaling": null,
26
+ "rope_theta": 50000,
27
+ "rotary_pct": 1.0,
28
+ "sliding_window": 4096,
29
+ "sliding_window_pattern": 4,
30
+ "torch_dtype": "bfloat16",
31
+ "transformers_version": "4.50.3",
32
+ "unsloth_fixed": true,
33
+ "unsloth_version": "2025.3.18",
34
+ "use_cache": true,
35
+ "use_embedding_sharing": true,
36
+ "use_gated_activation": true,
37
+ "use_parallel_block": true,
38
+ "use_parallel_embedding": true,
39
+ "vocab_size": 256000
40
+ }
mergekit_config.yml ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ dtype: bfloat16
2
+ merge_method: nuslerp
3
+ modules:
4
+   default:
5
+     slices:
6
+     - sources:
7
+       - layer_range: [0, 64]
8
+         model: /workspace/cache/models--CohereForAI--c4ai-command-a-03-2025/snapshots/6894b671d755c72573bb1a5722cfcfcd86b42b01
9
+         parameters:
10
+           weight: [0.9, 0.85, 0.95, 0.98, 0.95, 0.85, 0.9]
11
+       - layer_range: [0, 64]
12
+         model: /workspace/cache/models--TheDrummer--Fallen-Command-A-111B-v1/snapshots/5d2b4bdb35d7dff3a4eb51a5f2b231ba27943491
13
+         parameters:
14
+           weight: [0.1, 0.15, 0.05, 0.02, 0.05, 0.15, 0.1]
model-00001-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0e5df379091bffb60a5cfe096243a6c44e2b32bff271a9ea515cda309860764
3
+ size 6291456144
model-00002-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5eb628afc90039f0809cce10c03226a999e3922b7ff414a4fccce11d223a634
3
+ size 4278240416
model-00003-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de9c6831a77f8a4a81ea5028d0581830559b4b9ab3b18310d9d11dbf0093ec54
3
+ size 4278215736
model-00004-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:939906f892492bb49d34061ed328a65216754849a06aeb7fdb3afc41af961c77
3
+ size 4932552336
model-00005-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d62210cc1626640dee6fbbb6ca7ba712818e5860c75d7ae430f4001cbd4c0e9e
3
+ size 4278215744
model-00006-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:516094025fab83fd98cfe5c34733ea94087bbb7825c413fcac448c5220a4f672
3
+ size 4278215744
model-00007-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:542555d4d1b0f0e795d927c44d9f6f9329a0c07a9de0131a21513bb3b5a297d9
3
+ size 4932552336
model-00008-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:efda5ce305eeb8b47893d9974fb1e634fbcdd7d44fbca8084493daa44002b7cb
3
+ size 4278215744
model-00009-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c6c3d28e1b48a7694632a7e32940c4eed3bd95cbd96c0953e3f3fbe1d5151b1
3
+ size 4278215744
model-00010-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1804be658ecbbabc623752424f541f8d9a70b8a8be87f93f2478ea1f4295ff66
3
+ size 4932552328
model-00011-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dfc258db66d0e39b7ae0cc7b881d7c6f68815c4e7a1e9162aad7c6dd6466a122
3
+ size 4278215736
model-00012-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e72eb7a07fddf8c0177f145185c37cbbb2a82edbcb73281bdb3c7e1026bf051b
3
+ size 4278215744
model-00013-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ffe55ba78d81acc57f0399ba0ddd521dce51c35ebfe93e84137f76e306d91efc
3
+ size 4932552336
model-00014-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39ef2d5dd54d166abe334ad00789ac6ebbf7be21f20c7c2af5c7374e53315944
3
+ size 4278215744
model-00015-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98595c13fe1dfff8ebbfbc50a1def4ce8763c9dc9251376ca9135b73c15252c5
3
+ size 4278215744
model-00016-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e15182e57f980e9577780652cfe293f46ea8b5ccea70ea310c8b629285a61546
3
+ size 4932552336
model-00017-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3047b26b6e8528fdf22b0c554065a02a4adb640f74c6f33726849962bec3cfc8
3
+ size 4278215744
model-00018-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9eab73b28704dddd6934aac8215f77a945eb4734aed6651801d651767bd348fe
3
+ size 4278215744
model-00019-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05bf418b37e68620f5609fc7991e618306f6d8a7b318a3872d256ef9acc8f20a
3
+ size 4932552328
model-00020-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77d73f3d5659715f328c4055744be23df80e4e5f275526677ca1a085355c3e13
3
+ size 4278215744
model-00021-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7278e8c3cd759cff51c1299fb5f079166fb1161662c18906a9c42dac02b6b161
3
+ size 4278215744
model-00022-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92dbef98e750fd85db3d2f149e433e8bb40202b4ae3d29d572dc172e1b486b6d
3
+ size 4932552336
model-00023-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:27c9cff867b209ff2fe17b3d5e4b10bb5f2f589ea349c2a8d2bb493e5a5db541
3
+ size 4278215744
model-00024-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf1be19dbb96a68c5e11774b2956825fb1d0eef327ea832a01b8f5a5d61f7649
3
+ size 4278215744
model-00025-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f697ae9f8ad625eadb1bc7f528eae0bd56530745c70e562d50e4a40d1ead789c
3
+ size 4932552336
model-00026-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86bb53bc0f3c87619de60f971055ad5c345ff095fa587bb0c85b011d18c37b74
3
+ size 4278215744
model-00027-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0296d4c93530d2a1fea35f85a557443a18ac849276834b97909becc1b3086a95
3
+ size 4278215744
model-00028-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9d3b53ffcb8044f6b494c47e03867c7f55f8e1446092d7d38a2b610336acbc0
3
+ size 4932552328
model-00029-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5cdcd3b621922efa80ae8cb1fb36c4cd82e3ba3b760f06752d378e5fe821cb0f
3
+ size 4278215744
model-00030-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a1aa551e8a795c77a869006c1b641a6f9e3536927e1f6ee82d9714e64edc7e8f
3
+ size 4278215744
model-00031-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8524bdf769bd0aa0686ff9c2c7af47a60de639345b4d5be1ce311e84b3339d59
3
+ size 4932552336
model-00032-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:798694e80748e8e0c91b67bc10bea6d34e991bcbd54c447baecabaf10567b874
3
+ size 4278215744
model-00033-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f1cb1017e60301b2d37579975cb24512789a06d7e8d2f1d345749de9771923e
3
+ size 4278215744
model-00034-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:388b62979fb589a74b96be54b84073c2bea661f45d400263b7747dc56f0d8cde
3
+ size 4932552336
model-00035-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf802eb95b16d426d0c804afc515f37ab91b1c44d4660540aef986e10dedd6fb
3
+ size 4278215744
model-00036-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd81eeba26c2077c1f290d70965f50a7dd3331a3e998480209b3f3cbc9fa43d9
3
+ size 4278215736
model-00037-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33891a23f4efb1b35c0c7d931706e8ac715a3f172ebd1ee63e21d37d3e2054f1
3
+ size 4932552336
model-00038-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf74323e9f9bc2374b9bedfaa86708358d4b0d5939c490d48657d1b17ee809a4
3
+ size 4278215744
model-00039-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5c36a03f572d29a3902dbd51b9d7c7b621caf94675ccc61fe962b21a2911a7b
3
+ size 4278215744
model-00040-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a2168129f42da9d9e4e698d1245ed430161d7c718dc6d578d0063b983a5e085
3
+ size 4932552336
model-00041-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:acb7853189bd7bb9de0c8d494e9c4c868c4c361c8dcb69fd27c9d9d42f337003
3
+ size 4278215744
model-00042-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:039bcf00113029b2a5dce637c074b8043ab3d672dc907465fefdd31d27323d96
3
+ size 4278215744
model-00043-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad9f6676c58a3a9f867777aa2b90c9d866c8186f48397ed67fd08d441965210f
3
+ size 4932552328
model-00044-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49cf2bd37059060c0ee842d0ede27027446979d17e9853b63c98e76fd07f08fe
3
+ size 4278215736
model-00045-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eea36c7c70638906b0e210338865725600d8ef22a4bbe0b618f097aaf7ba11a0
3
+ size 4278215744
model-00046-of-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a501ef7a8f9d93104ca43de2165b7bbda9e7ca9db3ff02896a9ccd7eaf9978ce
3
+ size 4932552336