paulml committed on
Commit
6f6a8f2
1 Parent(s): a3613a2

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. README.md +17 -0
  2. added_tokens.json +5 -0
  3. config.json +28 -0
  4. mergekit_config.yml +30 -0
  5. merges.txt +0 -0
  6. model-00001-of-00083.safetensors +3 -0
  7. model-00002-of-00083.safetensors +3 -0
  8. model-00003-of-00083.safetensors +3 -0
  9. model-00004-of-00083.safetensors +3 -0
  10. model-00005-of-00083.safetensors +3 -0
  11. model-00006-of-00083.safetensors +3 -0
  12. model-00007-of-00083.safetensors +3 -0
  13. model-00008-of-00083.safetensors +3 -0
  14. model-00009-of-00083.safetensors +3 -0
  15. model-00010-of-00083.safetensors +3 -0
  16. model-00011-of-00083.safetensors +3 -0
  17. model-00012-of-00083.safetensors +3 -0
  18. model-00013-of-00083.safetensors +3 -0
  19. model-00014-of-00083.safetensors +3 -0
  20. model-00015-of-00083.safetensors +3 -0
  21. model-00016-of-00083.safetensors +3 -0
  22. model-00017-of-00083.safetensors +3 -0
  23. model-00018-of-00083.safetensors +3 -0
  24. model-00019-of-00083.safetensors +3 -0
  25. model-00020-of-00083.safetensors +3 -0
  26. model-00021-of-00083.safetensors +3 -0
  27. model-00022-of-00083.safetensors +3 -0
  28. model-00023-of-00083.safetensors +3 -0
  29. model-00024-of-00083.safetensors +3 -0
  30. model-00025-of-00083.safetensors +3 -0
  31. model-00026-of-00083.safetensors +3 -0
  32. model-00027-of-00083.safetensors +3 -0
  33. model-00028-of-00083.safetensors +3 -0
  34. model-00029-of-00083.safetensors +3 -0
  35. model-00030-of-00083.safetensors +3 -0
  36. model-00031-of-00083.safetensors +3 -0
  37. model-00032-of-00083.safetensors +3 -0
  38. model-00033-of-00083.safetensors +3 -0
  39. model-00034-of-00083.safetensors +3 -0
  40. model-00035-of-00083.safetensors +3 -0
  41. model-00036-of-00083.safetensors +3 -0
  42. model-00037-of-00083.safetensors +3 -0
  43. model-00038-of-00083.safetensors +3 -0
  44. model-00039-of-00083.safetensors +3 -0
  45. model-00040-of-00083.safetensors +3 -0
  46. model-00041-of-00083.safetensors +3 -0
  47. model-00042-of-00083.safetensors +3 -0
  48. model-00043-of-00083.safetensors +3 -0
  49. model-00044-of-00083.safetensors +3 -0
  50. model-00045-of-00083.safetensors +3 -0
README.md ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ tags:
4
+ - merge
5
+ - mergekit
6
+ - lazymergekit
7
+ - Qwen/Qwen2-72B-Instruct
8
+ - cognitivecomputations/dolphin-2.9.2-qwen2-72b
9
+ ---
10
+
11
+ # merge-qwen2-72B
12
+
13
+ merge-qwen2-72B is a merge of the following models using [mergekit](https://github.com/cg123/mergekit):
14
+ * [Qwen/Qwen2-72B-Instruct](https://huggingface.co/Qwen/Qwen2-72B-Instruct)
15
+ * [cognitivecomputations/dolphin-2.9.2-qwen2-72b](https://huggingface.co/cognitivecomputations/dolphin-2.9.2-qwen2-72b)
16
+
17
+ ## 🧩 Configuration
added_tokens.json ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ {
2
+ "<|endoftext|>": 151643,
3
+ "<|im_end|>": 151645,
4
+ "<|im_start|>": 151644
5
+ }
config.json ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "Qwen/Qwen2-72B-Instruct",
3
+ "architectures": [
4
+ "Qwen2ForCausalLM"
5
+ ],
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 151643,
8
+ "eos_token_id": 151645,
9
+ "hidden_act": "silu",
10
+ "hidden_size": 8192,
11
+ "initializer_range": 0.02,
12
+ "intermediate_size": 29568,
13
+ "max_position_embeddings": 32768,
14
+ "max_window_layers": 80,
15
+ "model_type": "qwen2",
16
+ "num_attention_heads": 64,
17
+ "num_hidden_layers": 80,
18
+ "num_key_value_heads": 8,
19
+ "rms_norm_eps": 1e-06,
20
+ "rope_theta": 1000000.0,
21
+ "sliding_window": 131072,
22
+ "tie_word_embeddings": false,
23
+ "torch_dtype": "bfloat16",
24
+ "transformers_version": "4.41.2",
25
+ "use_cache": true,
26
+ "use_sliding_window": false,
27
+ "vocab_size": 152064
28
+ }
mergekit_config.yml ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ base_model: Qwen/Qwen2-72B-Instruct
2
+ dtype: bfloat16
3
+ merge_method: slerp
4
+ parameters:
5
+   t:
6
+   - filter: self_attn
7
+     value:
8
+     - 0
9
+     - 0.5
10
+     - 0.3
11
+     - 0.7
12
+     - 1
13
+   - filter: mlp
14
+     value:
15
+     - 1
16
+     - 0.5
17
+     - 0.7
18
+     - 0.3
19
+     - 0
20
+   - value: 0.5
21
+ slices:
22
+ - sources:
23
+   - layer_range:
24
+     - 0
25
+     - 80
26
+     model: Qwen/Qwen2-72B-Instruct
27
+   - layer_range:
28
+     - 0
29
+     - 80
30
+     model: cognitivecomputations/dolphin-2.9.2-qwen2-72b
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
model-00001-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b99f1e7c9b6594ec8f4d2d0294a54bf0d413301bf406f88c2b10224ab905461d
3
+ size 1270895648
model-00002-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78a300c002dcb4ce782b7081b3b423086319249e602ad96dc59a44a2eaf7564d
3
+ size 2491416720
model-00003-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:309c7eba9dc99c5a456cbeca1fcf756e340d384969e1f78c617d30d514b89dd7
3
+ size 1906384688
model-00004-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0397bdc9a872c0271b4d66667577764978d23a5de89abc97a84eed8aede7a974
3
+ size 1604373528
model-00005-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b3595115efb6eb05852d6e6b595b91b590519d1876a44e2a73701debd0086f3
3
+ size 1572939800
model-00006-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:358880a365934df041486261be4c668f342581725aeece1813808ee02d7bf5db
3
+ size 1755370856
model-00007-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad8779646769c1bc1661da9b9b175b8b9d6fff8f4217c414e4a0d31fa6266554
3
+ size 1906368192
model-00008-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:989f75dbf0801e457e778e2878c8ff77dfb1ebd0f22160dfa7c763296a1cd682
3
+ size 1604373528
model-00009-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57967606a75903bb07341fa25bb08e55b5c41317ba902ecf25ec0caa9a8d1709
3
+ size 1755354360
model-00010-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b594e3f06d32b08b8e29bae9c78bcbfb6ff09ef574f18cd51c6806a073a409f9
3
+ size 1755354360
model-00011-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:437b68ba36fb40e8a93b9f3459742837935bda04baafac2f33e91e01691142c7
3
+ size 1954597896
model-00012-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72180969172a7ed42c59067d32375ed87a6a1d09924a1660222e5e419017a243
3
+ size 1889605208
model-00013-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78022988cac3c1c23937733c0795d65810d9d98c028f2ed848c581ef7bd40252
3
+ size 1604373544
model-00014-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7787629516d59862ecdf59d43751ce3af9ca5b5b47c3d5f3569b1b4afccedd05
3
+ size 1572939808
model-00015-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9675c0113d3f69c6fc1d4699ccf30e0cff825f4160d4a006898e7b688f80d9e6
3
+ size 1755370872
model-00016-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:406486776279ef6f74e513e9af392557351e7c1f85aa7299508dc2898838b619
3
+ size 1906368208
model-00017-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa360f05de979692225b46531ed5b068ee49b47f0fff0574d55388c9421464b1
3
+ size 1604373536
model-00018-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:227a90586b2e266e5126e7b774ded8b8c3033741f00c5ae853cd4a937dd025d4
3
+ size 1755354368
model-00019-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c97ee16715b0ccb0e71580e9b72aa3bad7c6ddaf7c8708c84b2f84ba81a45c6
3
+ size 1755354376
model-00020-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a2a794cf6ccd865a2e52c6c1d281757d7dd10cf2adccf5b672bf3013f40de54
3
+ size 1954597920
model-00021-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c48355d1782627a280addbd5ad61ae1f3110a8d78a9adda86b6810e9614f41a
3
+ size 1889605208
model-00022-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de5c44be0a11c65e883535fde458d59b80fd22a37196e527abebea6e29c51700
3
+ size 1604373536
model-00023-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03e60fb9d409f3b8eeef561f9118dc08f1fd73b4caabbf52fd7999762bfa8241
3
+ size 1572939816
model-00024-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89131e4da14d21975659b19abbdb0e80c0db3824061ec46d0d9e9500d86e030d
3
+ size 1755370872
model-00025-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23c78cbccfe3e43f990cc55e38df6bfc4bccee5290c33cd9fe35b47f8e1649c4
3
+ size 1906368208
model-00026-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a342761a443fcd90f5b88f5a40d8ec0bcb1ff80924b4dd9bfdfa356f6f17618e
3
+ size 1604373536
model-00027-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0057334038135b8247e8bd00450a208e4fe8cb7f708b95a6d94d93e0ebded6a9
3
+ size 1755354368
model-00028-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f34fd026217977a1d492129209d7958a330294feda3a05179546a7e3687c0b63
3
+ size 1755354376
model-00029-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:300e40390a95bebf179f7a7a37eed1d4f3e956d862963602bcebb31e0dc19a5d
3
+ size 1954597920
model-00030-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc5f5bc63b01b8a3760a47f1af1fe579ab2303047cbe0a42de65d3f6c96a1568
3
+ size 1889605208
model-00031-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:686818d5eb0a8eb483c8fb475183a2c927f5d6d788e9409e1d8ae2180af70684
3
+ size 1604373536
model-00032-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d00b0dfd7dd70ddc53d0f06295be0e592a113dade40e9d0af7b0039b9035f605
3
+ size 1572939816
model-00033-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf2c5b88ef821a3cab0dbb1899d44b3ca31c773795f450484d7ce7e1e50cad32
3
+ size 1755370872
model-00034-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f68ec8c51454f0405d4c54c1833755e58773f481b92d6b831def847adff2a2e
3
+ size 1906368208
model-00035-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38f11618b0bace2e3ef438a14a777516d673aa9fb5a069b2536e30ade5e2dee5
3
+ size 1604373536
model-00036-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c95680a7f0ab26bbcce388afb3c42f88a19d761b27235e8d630fa5be0ccae83a
3
+ size 1755354368
model-00037-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9b4a32d385c3d19fdbfc83c5464f53526204fa9c91fa2ee6985ac8d05e925df
3
+ size 1755354376
model-00038-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3885218d54182f1609432d9bfb080c59f8d5789e83641fe6d2880324ac60b3f3
3
+ size 1954597920
model-00039-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41c0395024eb2449da9da90674521d10964b3269591c3dc58d5b11d820da9b31
3
+ size 1889605208
model-00040-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f527983670ff4164b0e5781b3b1415522859808bed6f0f9dbd98076a374ea0ce
3
+ size 1604373536
model-00041-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8e418d0ed704d05de42b21d649e49ee81ae4d27b6504f3c36255e20d2fff634
3
+ size 1572939816
model-00042-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70ba3caa900ab1dda73fc6ce32c3307eb216b030b44cd27d3f9e4284d0c900fc
3
+ size 1755370872
model-00043-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78ca1884195363156a739bc8a5423a08854c40065939e4f74c8362cb02d263d0
3
+ size 1906368208
model-00044-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97cb70e9e2d4ef20feb2d7e62c7a6ebf0c2f30d8f24217e8e534b154d68fe807
3
+ size 1604373536
model-00045-of-00083.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9829cd3dbdc8a9c4093bd2d6bca579d9fde4975df1b1e96267db323f3a8e6bf7
3
+ size 1755354368