Upload folder using huggingface_hub
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- README.md +17 -0
- added_tokens.json +5 -0
- config.json +28 -0
- mergekit_config.yml +30 -0
- merges.txt +0 -0
- model-00001-of-00083.safetensors +3 -0
- model-00002-of-00083.safetensors +3 -0
- model-00003-of-00083.safetensors +3 -0
- model-00004-of-00083.safetensors +3 -0
- model-00005-of-00083.safetensors +3 -0
- model-00006-of-00083.safetensors +3 -0
- model-00007-of-00083.safetensors +3 -0
- model-00008-of-00083.safetensors +3 -0
- model-00009-of-00083.safetensors +3 -0
- model-00010-of-00083.safetensors +3 -0
- model-00011-of-00083.safetensors +3 -0
- model-00012-of-00083.safetensors +3 -0
- model-00013-of-00083.safetensors +3 -0
- model-00014-of-00083.safetensors +3 -0
- model-00015-of-00083.safetensors +3 -0
- model-00016-of-00083.safetensors +3 -0
- model-00017-of-00083.safetensors +3 -0
- model-00018-of-00083.safetensors +3 -0
- model-00019-of-00083.safetensors +3 -0
- model-00020-of-00083.safetensors +3 -0
- model-00021-of-00083.safetensors +3 -0
- model-00022-of-00083.safetensors +3 -0
- model-00023-of-00083.safetensors +3 -0
- model-00024-of-00083.safetensors +3 -0
- model-00025-of-00083.safetensors +3 -0
- model-00026-of-00083.safetensors +3 -0
- model-00027-of-00083.safetensors +3 -0
- model-00028-of-00083.safetensors +3 -0
- model-00029-of-00083.safetensors +3 -0
- model-00030-of-00083.safetensors +3 -0
- model-00031-of-00083.safetensors +3 -0
- model-00032-of-00083.safetensors +3 -0
- model-00033-of-00083.safetensors +3 -0
- model-00034-of-00083.safetensors +3 -0
- model-00035-of-00083.safetensors +3 -0
- model-00036-of-00083.safetensors +3 -0
- model-00037-of-00083.safetensors +3 -0
- model-00038-of-00083.safetensors +3 -0
- model-00039-of-00083.safetensors +3 -0
- model-00040-of-00083.safetensors +3 -0
- model-00041-of-00083.safetensors +3 -0
- model-00042-of-00083.safetensors +3 -0
- model-00043-of-00083.safetensors +3 -0
- model-00044-of-00083.safetensors +3 -0
- model-00045-of-00083.safetensors +3 -0
README.md
ADDED
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
license: apache-2.0
|
3 |
+
tags:
|
4 |
+
- merge
|
5 |
+
- mergekit
|
6 |
+
- lazymergekit
|
7 |
+
- Qwen/Qwen2-72B-Instruct
|
8 |
+
- cognitivecomputations/dolphin-2.9.2-qwen2-72b
|
9 |
+
---
|
10 |
+
|
11 |
+
# merge-qwen2-72B
|
12 |
+
|
13 |
+
merge-qwen2-72B is a merge of the following models using [mergekit](https://github.com/cg123/mergekit):
|
14 |
+
* [Qwen/Qwen2-72B-Instruct](https://huggingface.co/Qwen/Qwen2-72B-Instruct)
|
15 |
+
* [cognitivecomputations/dolphin-2.9.2-qwen2-72b](https://huggingface.co/cognitivecomputations/dolphin-2.9.2-qwen2-72b)
|
16 |
+
|
17 |
+
## 🧩 Configuration
|
added_tokens.json
ADDED
@@ -0,0 +1,5 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"<|endoftext|>": 151643,
|
3 |
+
"<|im_end|>": 151645,
|
4 |
+
"<|im_start|>": 151644
|
5 |
+
}
|
config.json
ADDED
@@ -0,0 +1,28 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "Qwen/Qwen2-72B-Instruct",
|
3 |
+
"architectures": [
|
4 |
+
"Qwen2ForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_dropout": 0.0,
|
7 |
+
"bos_token_id": 151643,
|
8 |
+
"eos_token_id": 151645,
|
9 |
+
"hidden_act": "silu",
|
10 |
+
"hidden_size": 8192,
|
11 |
+
"initializer_range": 0.02,
|
12 |
+
"intermediate_size": 29568,
|
13 |
+
"max_position_embeddings": 32768,
|
14 |
+
"max_window_layers": 80,
|
15 |
+
"model_type": "qwen2",
|
16 |
+
"num_attention_heads": 64,
|
17 |
+
"num_hidden_layers": 80,
|
18 |
+
"num_key_value_heads": 8,
|
19 |
+
"rms_norm_eps": 1e-06,
|
20 |
+
"rope_theta": 1000000.0,
|
21 |
+
"sliding_window": 131072,
|
22 |
+
"tie_word_embeddings": false,
|
23 |
+
"torch_dtype": "bfloat16",
|
24 |
+
"transformers_version": "4.41.2",
|
25 |
+
"use_cache": true,
|
26 |
+
"use_sliding_window": false,
|
27 |
+
"vocab_size": 152064
|
28 |
+
}
|
mergekit_config.yml
ADDED
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
base_model: Qwen/Qwen2-72B-Instruct
|
2 |
+
dtype: bfloat16
|
3 |
+
merge_method: slerp
|
4 |
+
parameters:
|
5 |
+
t:
|
6 |
+
- filter: self_attn
|
7 |
+
value:
|
8 |
+
- 0
|
9 |
+
- 0.5
|
10 |
+
- 0.3
|
11 |
+
- 0.7
|
12 |
+
- 1
|
13 |
+
- filter: mlp
|
14 |
+
value:
|
15 |
+
- 1
|
16 |
+
- 0.5
|
17 |
+
- 0.7
|
18 |
+
- 0.3
|
19 |
+
- 0
|
20 |
+
- value: 0.5
|
21 |
+
slices:
|
22 |
+
- sources:
|
23 |
+
- layer_range:
|
24 |
+
- 0
|
25 |
+
- 80
|
26 |
+
model: Qwen/Qwen2-72B-Instruct
|
27 |
+
- layer_range:
|
28 |
+
- 0
|
29 |
+
- 80
|
30 |
+
model: cognitivecomputations/dolphin-2.9.2-qwen2-72b
|
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
model-00001-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b99f1e7c9b6594ec8f4d2d0294a54bf0d413301bf406f88c2b10224ab905461d
|
3 |
+
size 1270895648
|
model-00002-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:78a300c002dcb4ce782b7081b3b423086319249e602ad96dc59a44a2eaf7564d
|
3 |
+
size 2491416720
|
model-00003-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:309c7eba9dc99c5a456cbeca1fcf756e340d384969e1f78c617d30d514b89dd7
|
3 |
+
size 1906384688
|
model-00004-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0397bdc9a872c0271b4d66667577764978d23a5de89abc97a84eed8aede7a974
|
3 |
+
size 1604373528
|
model-00005-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b3595115efb6eb05852d6e6b595b91b590519d1876a44e2a73701debd0086f3
|
3 |
+
size 1572939800
|
model-00006-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:358880a365934df041486261be4c668f342581725aeece1813808ee02d7bf5db
|
3 |
+
size 1755370856
|
model-00007-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad8779646769c1bc1661da9b9b175b8b9d6fff8f4217c414e4a0d31fa6266554
|
3 |
+
size 1906368192
|
model-00008-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:989f75dbf0801e457e778e2878c8ff77dfb1ebd0f22160dfa7c763296a1cd682
|
3 |
+
size 1604373528
|
model-00009-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:57967606a75903bb07341fa25bb08e55b5c41317ba902ecf25ec0caa9a8d1709
|
3 |
+
size 1755354360
|
model-00010-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b594e3f06d32b08b8e29bae9c78bcbfb6ff09ef574f18cd51c6806a073a409f9
|
3 |
+
size 1755354360
|
model-00011-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:437b68ba36fb40e8a93b9f3459742837935bda04baafac2f33e91e01691142c7
|
3 |
+
size 1954597896
|
model-00012-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:72180969172a7ed42c59067d32375ed87a6a1d09924a1660222e5e419017a243
|
3 |
+
size 1889605208
|
model-00013-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:78022988cac3c1c23937733c0795d65810d9d98c028f2ed848c581ef7bd40252
|
3 |
+
size 1604373544
|
model-00014-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7787629516d59862ecdf59d43751ce3af9ca5b5b47c3d5f3569b1b4afccedd05
|
3 |
+
size 1572939808
|
model-00015-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9675c0113d3f69c6fc1d4699ccf30e0cff825f4160d4a006898e7b688f80d9e6
|
3 |
+
size 1755370872
|
model-00016-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:406486776279ef6f74e513e9af392557351e7c1f85aa7299508dc2898838b619
|
3 |
+
size 1906368208
|
model-00017-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fa360f05de979692225b46531ed5b068ee49b47f0fff0574d55388c9421464b1
|
3 |
+
size 1604373536
|
model-00018-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:227a90586b2e266e5126e7b774ded8b8c3033741f00c5ae853cd4a937dd025d4
|
3 |
+
size 1755354368
|
model-00019-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7c97ee16715b0ccb0e71580e9b72aa3bad7c6ddaf7c8708c84b2f84ba81a45c6
|
3 |
+
size 1755354376
|
model-00020-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a2a794cf6ccd865a2e52c6c1d281757d7dd10cf2adccf5b672bf3013f40de54
|
3 |
+
size 1954597920
|
model-00021-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c48355d1782627a280addbd5ad61ae1f3110a8d78a9adda86b6810e9614f41a
|
3 |
+
size 1889605208
|
model-00022-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:de5c44be0a11c65e883535fde458d59b80fd22a37196e527abebea6e29c51700
|
3 |
+
size 1604373536
|
model-00023-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:03e60fb9d409f3b8eeef561f9118dc08f1fd73b4caabbf52fd7999762bfa8241
|
3 |
+
size 1572939816
|
model-00024-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:89131e4da14d21975659b19abbdb0e80c0db3824061ec46d0d9e9500d86e030d
|
3 |
+
size 1755370872
|
model-00025-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:23c78cbccfe3e43f990cc55e38df6bfc4bccee5290c33cd9fe35b47f8e1649c4
|
3 |
+
size 1906368208
|
model-00026-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a342761a443fcd90f5b88f5a40d8ec0bcb1ff80924b4dd9bfdfa356f6f17618e
|
3 |
+
size 1604373536
|
model-00027-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0057334038135b8247e8bd00450a208e4fe8cb7f708b95a6d94d93e0ebded6a9
|
3 |
+
size 1755354368
|
model-00028-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f34fd026217977a1d492129209d7958a330294feda3a05179546a7e3687c0b63
|
3 |
+
size 1755354376
|
model-00029-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:300e40390a95bebf179f7a7a37eed1d4f3e956d862963602bcebb31e0dc19a5d
|
3 |
+
size 1954597920
|
model-00030-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cc5f5bc63b01b8a3760a47f1af1fe579ab2303047cbe0a42de65d3f6c96a1568
|
3 |
+
size 1889605208
|
model-00031-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:686818d5eb0a8eb483c8fb475183a2c927f5d6d788e9409e1d8ae2180af70684
|
3 |
+
size 1604373536
|
model-00032-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d00b0dfd7dd70ddc53d0f06295be0e592a113dade40e9d0af7b0039b9035f605
|
3 |
+
size 1572939816
|
model-00033-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf2c5b88ef821a3cab0dbb1899d44b3ca31c773795f450484d7ce7e1e50cad32
|
3 |
+
size 1755370872
|
model-00034-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9f68ec8c51454f0405d4c54c1833755e58773f481b92d6b831def847adff2a2e
|
3 |
+
size 1906368208
|
model-00035-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:38f11618b0bace2e3ef438a14a777516d673aa9fb5a069b2536e30ade5e2dee5
|
3 |
+
size 1604373536
|
model-00036-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c95680a7f0ab26bbcce388afb3c42f88a19d761b27235e8d630fa5be0ccae83a
|
3 |
+
size 1755354368
|
model-00037-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f9b4a32d385c3d19fdbfc83c5464f53526204fa9c91fa2ee6985ac8d05e925df
|
3 |
+
size 1755354376
|
model-00038-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3885218d54182f1609432d9bfb080c59f8d5789e83641fe6d2880324ac60b3f3
|
3 |
+
size 1954597920
|
model-00039-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:41c0395024eb2449da9da90674521d10964b3269591c3dc58d5b11d820da9b31
|
3 |
+
size 1889605208
|
model-00040-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f527983670ff4164b0e5781b3b1415522859808bed6f0f9dbd98076a374ea0ce
|
3 |
+
size 1604373536
|
model-00041-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e8e418d0ed704d05de42b21d649e49ee81ae4d27b6504f3c36255e20d2fff634
|
3 |
+
size 1572939816
|
model-00042-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:70ba3caa900ab1dda73fc6ce32c3307eb216b030b44cd27d3f9e4284d0c900fc
|
3 |
+
size 1755370872
|
model-00043-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:78ca1884195363156a739bc8a5423a08854c40065939e4f74c8362cb02d263d0
|
3 |
+
size 1906368208
|
model-00044-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:97cb70e9e2d4ef20feb2d7e62c7a6ebf0c2f30d8f24217e8e534b154d68fe807
|
3 |
+
size 1604373536
|
model-00045-of-00083.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9829cd3dbdc8a9c4093bd2d6bca579d9fde4975df1b1e96267db323f3a8e6bf7
|
3 |
+
size 1755354368
|