init

Files changed (17) hide show

campplus.onnx +3 -0
config.json +27 -0
configuration.json +1 -0
flow.cache.pt +3 -0
flow.decoder.estimator.fp32.onnx +3 -0
flow.encoder.fp16.zip +3 -0
flow.encoder.fp32.zip +3 -0
flow.pt +3 -0
hift.pt +3 -0
llm-checkpoint.pt +3 -0
llm.pt +3 -0
merges.txt +0 -0
prompt_info.py +41 -0
speech_tokenizer_v2.onnx +3 -0
spk2info.pt +3 -0
tokenizer_config.json +48 -0
vocab.json +0 -0

campplus.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a6ac6a63997761ae2997373e2ee1c47040854b4b759ea41ec48e4e42df0f4d73
+size 28303423

config.json ADDED Viewed

	@@ -0,0 +1,27 @@

+{
+  "architectures": [
+    "CosyVoice2Model"
+  ],
+  "attention_dropout": 0.0,
+  "bos_token_id": 151643,
+  "eos_token_id": 6561,
+  "hidden_act": "silu",
+  "hidden_size": 896,
+  "initializer_range": 0.02,
+  "intermediate_size": 4864,
+  "max_position_embeddings": 32768,
+  "max_window_layers": 24,
+  "model_type": "qwen2",
+  "num_attention_heads": 14,
+  "num_hidden_layers": 24,
+  "num_key_value_heads": 2,
+  "rms_norm_eps": 1e-06,
+  "rope_theta": 1000000.0,
+  "sliding_window": 32768,
+  "tie_word_embeddings": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.40.1",
+  "use_cache": true,
+  "use_sliding_window": false,
+  "vocab_size": 151936
+}

configuration.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ {"framework":"Pytorch","task":"text-to-speech"}

flow.cache.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3ebde248652c6eed855e08bb6a263af3847039a1361f8019bdb27f5f680a1dc4
+size 450496991

flow.decoder.estimator.fp32.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4e5b37b9c065b41d88d04678300f788b30bf621ead115d5a6c2bd7f05cd7a99e
+size 286644900

flow.encoder.fp16.zip ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:dab6eeb31aeaf88b443a0fb44ee75b74a0937c32f4bf64ee3a2830dfc5fbf507
+size 185950580

flow.encoder.fp32.zip ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:541f5bb298ac03c3b37b2ec54389b07350d148ffd2f94b490a9ce4de6e31f66f
+size 330818868

flow.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ff4c2f867674411e0a08cee702996df13fa67c1cd864c06108da88d16d088541
+size 450575567

hift.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1d4af0d661a416c69544eec83ff9c070dc80c37ee53ef44af3a37d910c95bc21
+size 83364158

llm-checkpoint.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1104c6a3638e0376dc1f304bd21e73a0984632dc9a785506c2511846e91b02ff
+size 2036166186

llm.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b144ef55b51ce8cfb79a73c90dbba0bdaba4e451c0ebcfab20f769264f84a608
+size 2023316821

merges.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

prompt_info.py ADDED Viewed

	@@ -0,0 +1,41 @@

+import os
+__dir__ = os.path.dirname(os.path.abspath(__file__))  # absolute directory containing this file. NOTE(review): a module-level `__dir__` is also the PEP 562 hook consulted by dir(module); binding a str here may break dir() on this module - consider renaming
+ref_audio = {  # role name -> {"audio": path of a reference clip, "text": string paired with it (presumably the clip's transcript - confirm)}; "audio" starts out relative and is rewritten to an absolute path by the loop at the bottom
+          "孙悟空":{"audio":"../../data/audio/孙悟空.WAV","text":"齐天大圣下凡，与两位师弟共保大唐高僧，西天取经的。"},
+          "李白":{"audio":"../../data/audio/李白原声.MP3","text":"神游千山外，化墨入深潭；但承青莲有侠志，莫道红尘无剑仙。"},
+          "唐僧":{"audio":"../../data/audio/唐僧.WAV","text":"佛心四大皆空，贫僧尘念已绝"},
+          "猪八戒":{"audio":"../../data/audio/猪八戒.WAV","text":"一听说抓妖怪，就跟见你外公似的你看"},
+          "沙僧":{"audio":"../../data/audio/沙僧.WAV","text":"取些水来把火扑灭，我们不就得救了吗"},
+          "圣诞老人":{"audio":"../../data/audio/圣诞老人.MP3","text":"我是你的老朋友圣诞老人，今年圣诞节，我会驾驶驯鹿雪橇，从芬兰北部出发"},
+        #   "埃隆·马斯克":{"audio":"../../data/audio/马斯克.MP3","text":"videos of rockets blowing up，and made me watch those，just didn't want me to lose all my money"},
+        #   "特朗普":{"audio":"../../data/audio/特朗普.WAV","text":"we will make America strong again. we will make America wealthy again."},
+          "观音菩萨":{"audio":"../../data/audio/观音菩萨.WAV","text":"莫伤他命，我那骆伽山后山无人看管，就让他做个守山大神吧"},
+        #   "权志龙":{"audio":"../../data/audio/权志龙.WAV","text":"제자신이저를제일잘알겠죠그래서마약을하지않았기때문에이번마약범죄"},
+          "甄嬛":{"audio":"../../data/audio/甄嬛.WAV","text":"能不能让娘娘容下，是嫔妾的本事。溃疡烂到一定程度，才好动刀除去"},
+          "路飞":{"audio":"../../data/audio/路飞.WAV","text":"我还以为一跳就上去了，可恶，还真不容易啊，再试一次，我走了"},
+        #   "柯南":{"audio":"../../data/audio/柯南日.WAV","text":"函館、肘方俊三の日本刀を狙い、キッドからの予告状が。なぜ奴が、ビッグジュエルでもない刀を狙う。"},
+          "林黛玉":{"audio":"../../data/audio/黛玉原声.MP3","text":"今儿他来，明儿我再来，这样间错开来着，不至于太冷落，也不至于太热闹"},
+          "诸葛亮":{"audio":"../../data/audio/诸葛亮原音.MP3","text":"后值倾覆，受任于败军之际，奉命于危难之间。"},
+          "吕布":{"audio":"../../data/audio/吕布原声.MP3","text":"谁能和我相比！我才是当世无敌的强者，神的怒火，你要如何熄灭。"},
+        #   "鸣人":{"audio":"../../data/audio/鸣人原音.MP3","text":"俺ってばちゃんと飯食ってから大丈夫だって言ってくれえしねえでいろいろ食べてんだ本骨にエミソに"},
+        #   "悟空":{"audio":"../../data/audio/龙珠悟空.MP3","text":"えーたちに殺された。 やるためにも。 目をぶっ倒す。"},
+        #   "小樱":{"audio":"../../data/audio/小樱原声.MP3","text":"闇の力を秘めし、鍵よ、真の姿を我の前に示せ。 ダメージ。"},
+        #   "白雪公主":{"audio":"../../data/audio/白雪公主原声.MP3","text":"oh, she'll never find me here, and if you let me stay. I'll keep house for you."},
+          "哪吒":{"audio":"../../data/audio/哪吒原声.MP3","text":"替天行道是使命，斩妖除魔我最擅长"},
+          "白素贞":{"audio":"../../data/audio/白娘子原声.MP3","text":"无论他在世间何处，无论他是何模样，无论他还记不记得我，我都要找到他"},
+        #   "初音未来":{"audio":"../../data/audio/初音未来原音.MP3","text":"来てくれてありが。 思いっきり歌っちゃう。"},
+          "洛天依":{"audio":"../../data/audio/洛天依原声.MP3","text":"早上好，中午好，晚上好，我是天依，不知道我们此时相遇的时间，所以我把一天的问候都送给你啦"},
+          "言和":{"audio":"../../data/audio/言和原声.MP3","text":"你好，我是虚拟歌手言和，很高兴你听我唱歌"},
+        #   "凯尔希":{"audio":"../../data/audio/凯尔希原声.MP3","text":"第一に芽吹いた命はどれも強く。 基本的なじゅんや抵抗は？ ようにして徒労に終わる。"},
+          "艾希":{"audio":"../../data/audio/艾希原声.MP3","text":"我是艾希，葛伦娜之女，阿瓦罗萨部族的战母"},
+        #   "蜘蛛侠":{"audio":"../../data/audio/蜘蛛侠原声.MP3","text":"Are you afraid that i'm going to turn into some kind of criminal, don' worry about me. Okay? something is different, i'll figure it out, stop lecturing me."},
+        #   "哈利·波特":{"audio":"../../data/audio/哈利波特原声.MP3","text":"when you are a second away from being murdered or watching a friend die right before your eyes"},
+        #   "哈利波特":{"audio":"../../data/audio/哈利波特原声.MP3","text":"when you are a second away from being murdered or watching a friend die right before your eyes"},
+         }
+for role in ref_audio:  # runs at import time: rewrite every entry's "audio" value in place to an absolute path
+    path = ref_audio[role]["audio"]
+    path = os.path.abspath(os.path.join(__dir__, '..', path))  # the extra '..' plus the '../../' prefix in each entry resolves three levels above this file's directory; NOTE(review): confirm data/audio really lives there
+    ref_audio[role]["audio"] = path  # no existence check is made here; a missing clip is not detected by this module

speech_tokenizer_v2.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d43342aa12163a80bf07bffb94c9de2e120a8df2f9917cd2f642e7f4219c6f71
+size 496082973

spk2info.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b57f4fa23fd0c921ed263fc4fa7dc5139afaa35c03000d53762e3213c1813047
+size 3216336

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,48 @@

+{
+  "add_prefix_space": false,
+  "added_tokens_decoder": {
+    "151643": {
+      "content": "<|endoftext|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151644": {
+      "content": "<|im_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151645": {
+      "content": "<|im_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "additional_special_tokens": [
+    "<|im_start|>", "<|im_end|>", "<|endofprompt|>",
+    "[breath]", "<strong>", "</strong>", "[noise]",
+    "[laughter]", "[cough]", "[clucking]", "[accent]",
+    "[quick_breath]",
+    "<laughter>", "</laughter>",
+    "[hissing]", "[sigh]", "[vocalized-noise]",
+    "[lipsmack]", "[mn]"
+  ],
+  "bos_token": null,
+  "chat_template": "{% for message in messages %}{% if loop.first and messages[0]['role'] != 'system' %}{{ '<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n' }}{% endif %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "<|im_end|>",
+  "errors": "replace",
+  "model_max_length": 32768,
+  "pad_token": "<|endoftext|>",
+  "split_special_tokens": false,
+  "tokenizer_class": "Qwen2Tokenizer",
+  "unk_token": null
+}

vocab.json ADDED Viewed

The diff for this file is too large to render. See raw diff