DBDXSS
committed on
Commit
·
1b19d95
1
Parent(s):
4691746
init
Browse files
- campplus.onnx +3 -0
- config.json +27 -0
- configuration.json +1 -0
- flow.cache.pt +3 -0
- flow.decoder.estimator.fp32.onnx +3 -0
- flow.encoder.fp16.zip +3 -0
- flow.encoder.fp32.zip +3 -0
- flow.pt +3 -0
- hift.pt +3 -0
- llm-checkpoint.pt +3 -0
- llm.pt +3 -0
- merges.txt +0 -0
- prompt_info.py +41 -0
- speech_tokenizer_v2.onnx +3 -0
- spk2info.pt +3 -0
- tokenizer_config.json +48 -0
- vocab.json +0 -0
campplus.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a6ac6a63997761ae2997373e2ee1c47040854b4b759ea41ec48e4e42df0f4d73
|
3 |
+
size 28303423
|
config.json
ADDED
@@ -0,0 +1,27 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"architectures": [
|
3 |
+
"CosyVoice2Model"
|
4 |
+
],
|
5 |
+
"attention_dropout": 0.0,
|
6 |
+
"bos_token_id": 151643,
|
7 |
+
"eos_token_id": 6561,
|
8 |
+
"hidden_act": "silu",
|
9 |
+
"hidden_size": 896,
|
10 |
+
"initializer_range": 0.02,
|
11 |
+
"intermediate_size": 4864,
|
12 |
+
"max_position_embeddings": 32768,
|
13 |
+
"max_window_layers": 24,
|
14 |
+
"model_type": "qwen2",
|
15 |
+
"num_attention_heads": 14,
|
16 |
+
"num_hidden_layers": 24,
|
17 |
+
"num_key_value_heads": 2,
|
18 |
+
"rms_norm_eps": 1e-06,
|
19 |
+
"rope_theta": 1000000.0,
|
20 |
+
"sliding_window": 32768,
|
21 |
+
"tie_word_embeddings": true,
|
22 |
+
"torch_dtype": "float32",
|
23 |
+
"transformers_version": "4.40.1",
|
24 |
+
"use_cache": true,
|
25 |
+
"use_sliding_window": false,
|
26 |
+
"vocab_size": 151936
|
27 |
+
}
|
configuration.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"framework":"Pytorch","task":"text-to-speech"}
|
flow.cache.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ebde248652c6eed855e08bb6a263af3847039a1361f8019bdb27f5f680a1dc4
|
3 |
+
size 450496991
|
flow.decoder.estimator.fp32.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e5b37b9c065b41d88d04678300f788b30bf621ead115d5a6c2bd7f05cd7a99e
|
3 |
+
size 286644900
|
flow.encoder.fp16.zip
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dab6eeb31aeaf88b443a0fb44ee75b74a0937c32f4bf64ee3a2830dfc5fbf507
|
3 |
+
size 185950580
|
flow.encoder.fp32.zip
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:541f5bb298ac03c3b37b2ec54389b07350d148ffd2f94b490a9ce4de6e31f66f
|
3 |
+
size 330818868
|
flow.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ff4c2f867674411e0a08cee702996df13fa67c1cd864c06108da88d16d088541
|
3 |
+
size 450575567
|
hift.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1d4af0d661a416c69544eec83ff9c070dc80c37ee53ef44af3a37d910c95bc21
|
3 |
+
size 83364158
|
llm-checkpoint.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1104c6a3638e0376dc1f304bd21e73a0984632dc9a785506c2511846e91b02ff
|
3 |
+
size 2036166186
|
llm.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b144ef55b51ce8cfb79a73c90dbba0bdaba4e451c0ebcfab20f769264f84a608
|
3 |
+
size 2023316821
|
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
prompt_info.py
ADDED
@@ -0,0 +1,41 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
"""Reference-voice prompt table.

``ref_audio`` maps a role name to a dict with two keys:

* ``"audio"`` -- path of the reference recording for that role.
* ``"text"``  -- the text paired with that recording.

The ``"audio"`` values are written relative to the parent of this file's
directory and are rewritten to absolute paths when the module is imported.
"""
import os

# Directory containing this file.  Deliberately NOT named ``__dir__``: a
# module-level ``__dir__`` is the PEP 562 hook that ``dir(module)`` calls, so
# binding it to a string makes ``dir()`` on this module raise TypeError.
_MODULE_DIR = os.path.dirname(os.path.abspath(__file__))


# Commented-out entries are disabled roles kept for reference.
# NOTE(review): every disabled entry has non-Chinese prompt text -- presumably
# the reason they are disabled; confirm before re-enabling.
ref_audio = {
    "孙悟空": {"audio": "../../data/audio/孙悟空.WAV", "text": "齐天大圣下凡,与两位师弟共保大唐高僧,西天取经的。"},
    "李白": {"audio": "../../data/audio/李白原声.MP3", "text": "神游千山外,化墨入深潭;但承青莲有侠志,莫道红尘无剑仙。"},
    "唐僧": {"audio": "../../data/audio/唐僧.WAV", "text": "佛心四大皆空,贫僧尘念已绝"},
    "猪八戒": {"audio": "../../data/audio/猪八戒.WAV", "text": "一听说抓妖怪,就跟见你外公似的你看"},
    "沙僧": {"audio": "../../data/audio/沙僧.WAV", "text": "取些水来把火扑灭,我们不就得救了吗"},
    "圣诞老人": {"audio": "../../data/audio/圣诞老人.MP3", "text": "我是你的老朋友圣诞老人,今年圣诞节,我会驾驶驯鹿雪橇,从芬兰北部出发"},
    # "埃隆·马斯克":{"audio":"../../data/audio/马斯克.MP3","text":"videos of rockets blowing up,and made me watch those,just didn't want me to lose all my money"},
    # "特朗普":{"audio":"../../data/audio/特朗普.WAV","text":"we will make America strong again. we will make America wealthy again."},
    "观音菩萨": {"audio": "../../data/audio/观音菩萨.WAV", "text": "莫伤他命,我那骆伽山后山无人看管,就让他做个守山大神吧"},
    # "权志龙":{"audio":"../../data/audio/权志龙.WAV","text":"제자신이저를제일잘알겠죠그래서마약을하지않았기때문에이번마약범죄"},
    "甄嬛": {"audio": "../../data/audio/甄嬛.WAV", "text": "能不能让娘娘容下,是嫔妾的本事。溃疡烂到一定程度,才好动刀除去"},
    "路飞": {"audio": "../../data/audio/路飞.WAV", "text": "我还以为一跳就上去了,可恶,还真不容易啊,再试一次,我走了"},
    # "柯南":{"audio":"../../data/audio/柯南日.WAV","text":"函館、肘方俊三の日本刀を狙い、キッドからの予告状が。なぜ奴が、ビッグジュエルでもない刀を狙う。"},
    "林黛玉": {"audio": "../../data/audio/黛玉原声.MP3", "text": "今儿他来,明儿我再来,这样间错开来着,不至于太冷落,也不至于太热闹"},
    "诸葛亮": {"audio": "../../data/audio/诸葛亮原音.MP3", "text": "后值倾覆,受任于败军之际,奉命于危难之间。"},
    "吕布": {"audio": "../../data/audio/吕布原声.MP3", "text": "谁能和我相比!我才是当世无敌的强者,神的怒火,你要如何熄灭。"},
    # "鸣人":{"audio":"../../data/audio/鸣人原音.MP3","text":"俺ってばちゃんと飯食ってから大丈夫だって言ってくれえしねえでいろいろ食べてんだ本骨にエミソに"},
    # "悟空":{"audio":"../../data/audio/龙珠悟空.MP3","text":"えーたちに殺された。 やるためにも。 目をぶっ倒す。"},
    # "小樱":{"audio":"../../data/audio/小樱原声.MP3","text":"闇の力を秘めし、鍵よ、真の姿を我の前に示せ。 ダメージ。"},
    # "白雪公主":{"audio":"../../data/audio/白雪公主原声.MP3","text":"oh, she'll never find me here, and if you let me stay. I'll keep house for you."},
    "哪吒": {"audio": "../../data/audio/哪吒原声.MP3", "text": "替天行道是使命,斩妖除魔我最擅长"},
    "白素贞": {"audio": "../../data/audio/白娘子原声.MP3", "text": "无论他在世间何处,无论他是何模样,无论他还记不记得我,我都要找到他"},
    # "初音未来":{"audio":"../../data/audio/初音未来原音.MP3","text":"来てくれてありが。 思いっきり歌っちゃう。"},
    "洛天依": {"audio": "../../data/audio/洛天依原声.MP3", "text": "早上好,中午好,晚上好,我是天依,不知道我们此时相遇的时间,所以我把一天的问候都送给你啦"},
    "言和": {"audio": "../../data/audio/言和原声.MP3", "text": "你好,我是虚拟歌手言和,很高兴你听我唱歌"},
    # "凯尔希":{"audio":"../../data/audio/凯尔希原声.MP3","text":"第一に芽吹いた命はどれも強く。 基本的なじゅんや抵抗は? ようにして徒労に終わる。"},
    "艾希": {"audio": "../../data/audio/艾希原声.MP3", "text": "我是艾希,葛伦娜之女,阿瓦罗萨部族的战母"},
    # "蜘蛛侠":{"audio":"../../data/audio/蜘蛛侠原声.MP3","text":"Are you afraid that i'm going to turn into some kind of criminal, don' worry about me. Okay? something is different, i'll figure it out, stop lecturing me."},
    # "哈利·波特":{"audio":"../../data/audio/哈利波特原声.MP3","text":"when you are a second away from being murdered or watching a friend die right before your eyes"},
    # "哈利波特":{"audio":"../../data/audio/哈利波特原声.MP3","text":"when you are a second away from being murdered or watching a friend die right before your eyes"},
}

# Rewrite each relative "audio" entry in place as an absolute, normalised path
# anchored at the parent of this file's directory.  Only values are replaced
# (no keys added or removed), so mutating while iterating is safe.
for entry in ref_audio.values():
    entry["audio"] = os.path.abspath(
        os.path.join(_MODULE_DIR, '..', entry["audio"])
    )
|
speech_tokenizer_v2.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d43342aa12163a80bf07bffb94c9de2e120a8df2f9917cd2f642e7f4219c6f71
|
3 |
+
size 496082973
|
spk2info.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b57f4fa23fd0c921ed263fc4fa7dc5139afaa35c03000d53762e3213c1813047
|
3 |
+
size 3216336
|
tokenizer_config.json
ADDED
@@ -0,0 +1,48 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"add_prefix_space": false,
|
3 |
+
"added_tokens_decoder": {
|
4 |
+
"151643": {
|
5 |
+
"content": "<|endoftext|>",
|
6 |
+
"lstrip": false,
|
7 |
+
"normalized": false,
|
8 |
+
"rstrip": false,
|
9 |
+
"single_word": false,
|
10 |
+
"special": true
|
11 |
+
},
|
12 |
+
"151644": {
|
13 |
+
"content": "<|im_start|>",
|
14 |
+
"lstrip": false,
|
15 |
+
"normalized": false,
|
16 |
+
"rstrip": false,
|
17 |
+
"single_word": false,
|
18 |
+
"special": true
|
19 |
+
},
|
20 |
+
"151645": {
|
21 |
+
"content": "<|im_end|>",
|
22 |
+
"lstrip": false,
|
23 |
+
"normalized": false,
|
24 |
+
"rstrip": false,
|
25 |
+
"single_word": false,
|
26 |
+
"special": true
|
27 |
+
}
|
28 |
+
},
|
29 |
+
"additional_special_tokens": [
|
30 |
+
"<|im_start|>", "<|im_end|>", "<|endofprompt|>",
|
31 |
+
"[breath]", "<strong>", "</strong>", "[noise]",
|
32 |
+
"[laughter]", "[cough]", "[clucking]", "[accent]",
|
33 |
+
"[quick_breath]",
|
34 |
+
"<laughter>", "</laughter>",
|
35 |
+
"[hissing]", "[sigh]", "[vocalized-noise]",
|
36 |
+
"[lipsmack]", "[mn]"
|
37 |
+
],
|
38 |
+
"bos_token": null,
|
39 |
+
"chat_template": "{% for message in messages %}{% if loop.first and messages[0]['role'] != 'system' %}{{ '<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n' }}{% endif %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
|
40 |
+
"clean_up_tokenization_spaces": false,
|
41 |
+
"eos_token": "<|im_end|>",
|
42 |
+
"errors": "replace",
|
43 |
+
"model_max_length": 32768,
|
44 |
+
"pad_token": "<|endoftext|>",
|
45 |
+
"split_special_tokens": false,
|
46 |
+
"tokenizer_class": "Qwen2Tokenizer",
|
47 |
+
"unk_token": null
|
48 |
+
}
|
vocab.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|