Roi Feng commited on
Commit
2e9bf0c
1 Parent(s): 14dc496
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .idea/.name +1 -0
  2. .idea/workspace.xml +202 -0
  3. .pre-commit-config.yaml +3 -3
  4. README.md +42 -12
  5. app.py +0 -229
  6. bert/bert-base-japanese-v3/.gitattributes +34 -0
  7. bert/bert-large-japanese-v2/.gitattributes +34 -0
  8. bert/bert-large-japanese-v2/README.md +53 -0
  9. bert/bert-large-japanese-v2/config.json +19 -0
  10. bert/bert-large-japanese-v2/flax_model.msgpack +3 -0
  11. bert/bert-large-japanese-v2/pytorch_model.bin +3 -0
  12. bert/bert-large-japanese-v2/tf_model.h5 +3 -0
  13. bert/bert-large-japanese-v2/tokenizer_config.json +10 -0
  14. bert/bert-large-japanese-v2/vocab.txt +0 -0
  15. bert/bert_models.json +14 -0
  16. bert/chinese-roberta-wwm-ext-large/.gitignore +0 -1
  17. bert/deberta-v2-large-japanese-char-wwm/.gitattributes +34 -0
  18. bert/deberta-v2-large-japanese-char-wwm/README.md +89 -0
  19. bert/deberta-v2-large-japanese-char-wwm/config.json +37 -0
  20. bert/deberta-v2-large-japanese-char-wwm/model.safetensors +3 -0
  21. bert/deberta-v2-large-japanese-char-wwm/pytorch_model.bin +3 -0
  22. bert/deberta-v2-large-japanese-char-wwm/special_tokens_map.json +7 -0
  23. bert/deberta-v2-large-japanese-char-wwm/tokenizer_config.json +19 -0
  24. bert/deberta-v2-large-japanese-char-wwm/vocab.txt +0 -0
  25. bert/deberta-v2-large-japanese/.gitattributes +34 -0
  26. bert/deberta-v2-large-japanese/README.md +111 -0
  27. bert/deberta-v2-large-japanese/config.json +38 -0
  28. bert/deberta-v2-large-japanese/model.safetensors +3 -0
  29. bert/deberta-v2-large-japanese/pytorch_model.bin +3 -0
  30. bert/deberta-v2-large-japanese/special_tokens_map.json +9 -0
  31. logs/hanser/G_9000_2nd.pth → bert/deberta-v2-large-japanese/spm.model +2 -2
  32. bert/deberta-v2-large-japanese/tokenizer.json +0 -0
  33. bert/deberta-v2-large-japanese/tokenizer_config.json +15 -0
  34. bert/deberta-v3-large/.gitattributes +27 -0
  35. bert/deberta-v3-large/README.md +93 -0
  36. bert/deberta-v3-large/config.json +22 -0
  37. bert/deberta-v3-large/generator_config.json +22 -0
  38. logs/hanser/G_26000.pth → bert/deberta-v3-large/pytorch_model.bin +2 -2
  39. logs/hanser/G_8000.pth → bert/deberta-v3-large/pytorch_model.generator.bin +2 -2
  40. bert/deberta-v3-large/spm.model +3 -0
  41. bert/deberta-v3-large/tf_model.h5 +3 -0
  42. bert/deberta-v3-large/tokenizer_config.json +4 -0
  43. bert_gen.py +32 -17
  44. clap_gen.py +64 -0
  45. clap_wrapper.py +49 -0
  46. commons.py +6 -8
  47. compress_model.py +89 -0
  48. config.py +248 -0
  49. configs/config.json +868 -10
  50. css/custom.css +18 -0
.idea/.name ADDED
@@ -0,0 +1 @@
 
 
1
+ infer.py
.idea/workspace.xml ADDED
@@ -0,0 +1,202 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <?xml version="1.0" encoding="UTF-8"?>
2
+ <project version="4">
3
+ <component name="AutoImportSettings">
4
+ <option name="autoReloadType" value="SELECTIVE" />
5
+ </component>
6
+ <component name="ChangeListManager">
7
+ <list default="true" id="57daa15b-1002-473f-a1f9-e5d1a7c43662" name="更改" comment="new 2.2" />
8
+ <option name="SHOW_DIALOG" value="false" />
9
+ <option name="HIGHLIGHT_CONFLICTS" value="true" />
10
+ <option name="HIGHLIGHT_NON_ACTIVE_CHANGELIST" value="false" />
11
+ <option name="LAST_RESOLUTION" value="IGNORE" />
12
+ </component>
13
+ <component name="Git.Settings">
14
+ <option name="RECENT_GIT_ROOT_PATH" value="$PROJECT_DIR$" />
15
+ <option name="RESET_MODE" value="HARD" />
16
+ </component>
17
+ <component name="MarkdownSettingsMigration">
18
+ <option name="stateVersion" value="1" />
19
+ </component>
20
+ <component name="ProjectColorInfo">{
21
+ &quot;associatedIndex&quot;: 0
22
+ }</component>
23
+ <component name="ProjectId" id="2Wh18f8c0EzBeG8Gv7V4qN17QRN" />
24
+ <component name="ProjectLevelVcsManager">
25
+ <ConfirmationsSetting value="2" id="Add" />
26
+ </component>
27
+ <component name="ProjectViewState">
28
+ <option name="hideEmptyMiddlePackages" value="true" />
29
+ <option name="showLibraryContents" value="true" />
30
+ </component>
31
+ <component name="PropertiesComponent"><![CDATA[{
32
+ "keyToString": {
33
+ "ASKED_ADD_EXTERNAL_FILES": "true",
34
+ "RunOnceActivity.OpenProjectViewOnStart": "true",
35
+ "RunOnceActivity.ShowReadmeOnStart": "true",
36
+ "WebServerToolWindowFactoryState": "false",
37
+ "last_opened_file_path": "D:/AI/hanser-tts/git/huggingface/hanser-Bert-VITS2",
38
+ "node.js.detected.package.eslint": "true",
39
+ "node.js.detected.package.tslint": "true",
40
+ "node.js.selected.package.eslint": "(autodetect)",
41
+ "node.js.selected.package.tslint": "(autodetect)",
42
+ "nodejs_package_manager_path": "npm",
43
+ "settings.editor.selected.configurable": "project.propVCSSupport.CommitDialog",
44
+ "vue.rearranger.settings.migration": "true"
45
+ }
46
+ }]]></component>
47
+ <component name="SharedIndexes">
48
+ <attachedChunks>
49
+ <set>
50
+ <option value="bundled-python-sdk-7a29c1521ef0-c986f194a52a-com.jetbrains.pycharm.pro.sharedIndexes.bundled-PY-233.11799.298" />
51
+ </set>
52
+ </attachedChunks>
53
+ </component>
54
+ <component name="SpellCheckerSettings" RuntimeDictionaries="0" Folders="0" CustomDictionaries="0" DefaultDictionary="应用程序级" UseSingleDictionary="true" transferred="true" />
55
+ <component name="TaskManager">
56
+ <task active="true" id="Default" summary="默认任务">
57
+ <changelist id="57daa15b-1002-473f-a1f9-e5d1a7c43662" name="更改" comment="" />
58
+ <created>1697169839670</created>
59
+ <option name="number" value="Default" />
60
+ <option name="presentableId" value="Default" />
61
+ <updated>1697169839670</updated>
62
+ <workItem from="1697169840726" duration="1501000" />
63
+ <workItem from="1697171613511" duration="10000" />
64
+ <workItem from="1697171658870" duration="123000" />
65
+ <workItem from="1697407390249" duration="56000" />
66
+ <workItem from="1697408996084" duration="639000" />
67
+ <workItem from="1697521636207" duration="44000" />
68
+ <workItem from="1697945418812" duration="55000" />
69
+ <workItem from="1697946142695" duration="24000" />
70
+ <workItem from="1697946175706" duration="3000" />
71
+ <workItem from="1697946610680" duration="1000" />
72
+ <workItem from="1697947997308" duration="58000" />
73
+ <workItem from="1698505506621" duration="10000" />
74
+ <workItem from="1702591070149" duration="1513000" />
75
+ <workItem from="1702592634434" duration="187000" />
76
+ <workItem from="1702592831699" duration="1603000" />
77
+ <workItem from="1702594451453" duration="141000" />
78
+ <workItem from="1702688265810" duration="124000" />
79
+ </task>
80
+ <task id="LOCAL-00001" summary="initialize hanser">
81
+ <option name="closed" value="true" />
82
+ <created>1697170034064</created>
83
+ <option name="number" value="00001" />
84
+ <option name="presentableId" value="LOCAL-00001" />
85
+ <option name="project" value="LOCAL" />
86
+ <updated>1697170034064</updated>
87
+ </task>
88
+ <task id="LOCAL-00002" summary="initialize hanser">
89
+ <option name="closed" value="true" />
90
+ <created>1697171752499</created>
91
+ <option name="number" value="00002" />
92
+ <option name="presentableId" value="LOCAL-00002" />
93
+ <option name="project" value="LOCAL" />
94
+ <updated>1697171752499</updated>
95
+ </task>
96
+ <task id="LOCAL-00003" summary="new model 26000">
97
+ <option name="closed" value="true" />
98
+ <created>1697407426756</created>
99
+ <option name="number" value="00003" />
100
+ <option name="presentableId" value="LOCAL-00003" />
101
+ <option name="project" value="LOCAL" />
102
+ <updated>1697407426756</updated>
103
+ </task>
104
+ <task id="LOCAL-00004" summary="add new acknowledge">
105
+ <option name="closed" value="true" />
106
+ <created>1697521672965</created>
107
+ <option name="number" value="00004" />
108
+ <option name="presentableId" value="LOCAL-00004" />
109
+ <option name="project" value="LOCAL" />
110
+ <updated>1697521672965</updated>
111
+ </task>
112
+ <task id="LOCAL-00005" summary="add new 2nd generation 9000 model">
113
+ <option name="closed" value="true" />
114
+ <created>1697945452959</created>
115
+ <option name="number" value="00005" />
116
+ <option name="presentableId" value="LOCAL-00005" />
117
+ <option name="project" value="LOCAL" />
118
+ <updated>1697945452959</updated>
119
+ </task>
120
+ <task id="LOCAL-00006" summary="fix new 2nd generation 9000 model">
121
+ <option name="closed" value="true" />
122
+ <created>1697946163919</created>
123
+ <option name="number" value="00006" />
124
+ <option name="presentableId" value="LOCAL-00006" />
125
+ <option name="project" value="LOCAL" />
126
+ <updated>1697946163919</updated>
127
+ </task>
128
+ <task id="LOCAL-00007" summary="new default speech text">
129
+ <option name="closed" value="true" />
130
+ <created>1697948048951</created>
131
+ <option name="number" value="00007" />
132
+ <option name="presentableId" value="LOCAL-00007" />
133
+ <option name="project" value="LOCAL" />
134
+ <updated>1697948048951</updated>
135
+ </task>
136
+ <task id="LOCAL-00008" summary="new 2.2 model">
137
+ <option name="closed" value="true" />
138
+ <created>1702591884134</created>
139
+ <option name="number" value="00008" />
140
+ <option name="presentableId" value="LOCAL-00008" />
141
+ <option name="project" value="LOCAL" />
142
+ <updated>1702591884134</updated>
143
+ </task>
144
+ <task id="LOCAL-00009" summary="new 2.2">
145
+ <option name="closed" value="true" />
146
+ <created>1702592975256</created>
147
+ <option name="number" value="00009" />
148
+ <option name="presentableId" value="LOCAL-00009" />
149
+ <option name="project" value="LOCAL" />
150
+ <updated>1702592975256</updated>
151
+ </task>
152
+ <task id="LOCAL-00010" summary="new 2.2 part 1">
153
+ <option name="closed" value="true" />
154
+ <created>1702594098010</created>
155
+ <option name="number" value="00010" />
156
+ <option name="presentableId" value="LOCAL-00010" />
157
+ <option name="project" value="LOCAL" />
158
+ <updated>1702594098010</updated>
159
+ </task>
160
+ <option name="localTasksCounter" value="11" />
161
+ <servers />
162
+ </component>
163
+ <component name="TypeScriptGeneratedFilesManager">
164
+ <option name="version" value="3" />
165
+ </component>
166
+ <component name="Vcs.Log.Tabs.Properties">
167
+ <option name="TAB_STATES">
168
+ <map>
169
+ <entry key="MAIN">
170
+ <value>
171
+ <State>
172
+ <option name="FILTERS">
173
+ <map>
174
+ <entry key="branch">
175
+ <value>
176
+ <list>
177
+ <option value="main" />
178
+ </list>
179
+ </value>
180
+ </entry>
181
+ </map>
182
+ </option>
183
+ </State>
184
+ </value>
185
+ </entry>
186
+ </map>
187
+ </option>
188
+ </component>
189
+ <component name="VcsManagerConfiguration">
190
+ <option name="ADD_EXTERNAL_FILES_SILENTLY" value="true" />
191
+ <MESSAGE value="initialize hanser" />
192
+ <MESSAGE value="new model 26000" />
193
+ <MESSAGE value="add new acknowledge" />
194
+ <MESSAGE value="add new 2nd generation 9000 model" />
195
+ <MESSAGE value="fix new 2nd generation 9000 model" />
196
+ <MESSAGE value="new default speech text" />
197
+ <MESSAGE value="new 2.2 model" />
198
+ <MESSAGE value="new 2.2" />
199
+ <MESSAGE value="new 2.2 part 1" />
200
+ <option name="LAST_COMMIT_MESSAGE" value="new 2.2 part 1" />
201
+ </component>
202
+ </project>
.pre-commit-config.yaml CHANGED
@@ -1,19 +1,19 @@
1
  repos:
2
  - repo: https://github.com/pre-commit/pre-commit-hooks
3
- rev: v4.4.0
4
  hooks:
5
  - id: check-yaml
6
  - id: end-of-file-fixer
7
  - id: trailing-whitespace
8
 
9
  - repo: https://github.com/astral-sh/ruff-pre-commit
10
- rev: v0.0.292
11
  hooks:
12
  - id: ruff
13
  args: [ --fix ]
14
 
15
  - repo: https://github.com/psf/black
16
- rev: 23.9.1
17
  hooks:
18
  - id: black
19
 
 
1
  repos:
2
  - repo: https://github.com/pre-commit/pre-commit-hooks
3
+ rev: v4.5.0
4
  hooks:
5
  - id: check-yaml
6
  - id: end-of-file-fixer
7
  - id: trailing-whitespace
8
 
9
  - repo: https://github.com/astral-sh/ruff-pre-commit
10
+ rev: v0.1.7
11
  hooks:
12
  - id: ruff
13
  args: [ --fix ]
14
 
15
  - repo: https://github.com/psf/black
16
+ rev: 23.11.0
17
  hooks:
18
  - id: black
19
 
README.md CHANGED
@@ -1,12 +1,42 @@
1
- ---
2
- title: AI Hanser
3
- emoji: 📊
4
- colorFrom: yellow
5
- colorTo: indigo
6
- sdk: gradio
7
- sdk_version: 3.47.1
8
- app_file: app.py
9
- pinned: false
10
- ---
11
-
12
- Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <div align="center">
2
+
3
+ <img alt="LOGO" src="https://cdn.jsdelivr.net/gh/fishaudio/fish-diffusion@main/images/logo_512x512.png" width="256" height="256" />
4
+
5
+ # Bert-VITS2
6
+
7
+ VITS2 Backbone with multilingual bert
8
+
9
+ For quick guide, please refer to `webui_preprocess.py`.
10
+
11
+ 简易教程请参见 `webui_preprocess.py`。
12
+
13
+ ## 请注意,本项目核心思路来源于[anyvoiceai/MassTTS](https://github.com/anyvoiceai/MassTTS) 一个非常好的tts项目
14
+ ## MassTTS的演示demo为[ai版峰哥锐评峰哥本人,并找回了在金三角失落的腰子](https://www.bilibili.com/video/BV1w24y1c7z9)
15
+
16
+ [//]: # (## 本项目与[PlayVoice/vits_chinese]&#40;https://github.com/PlayVoice/vits_chinese&#41; 没有任何关系)
17
+
18
+ [//]: # ()
19
+ [//]: # (本仓库来源于之前朋友分享了ai峰哥的视频,本人被其中的效果惊艳,在自己尝试MassTTS以后发现fs在音质方面与vits有一定差距,并且training的pipeline比vits更复杂,因此按照其思路将bert)
20
+
21
+ ## 成熟的旅行者/开拓者/舰长/博士/sensei/猎魔人/喵喵露/V应当参阅代码自己学习如何训练。
22
+
23
+ ### 严禁将此项目用于一切违反《中华人民共和国宪法》,《中华人民共和国刑法》,《中华人民共和国治安管理处罚法》和《中华人民共和国民法典》之用途。
24
+ ### 严禁用于任何政治相关用途。
25
+ #### Video:https://www.bilibili.com/video/BV1hp4y1K78E
26
+ #### Demo:https://www.bilibili.com/video/BV1TF411k78w
27
+ #### QQ Group:815818430
28
+ ## References
29
+ + [anyvoiceai/MassTTS](https://github.com/anyvoiceai/MassTTS)
30
+ + [jaywalnut310/vits](https://github.com/jaywalnut310/vits)
31
+ + [p0p4k/vits2_pytorch](https://github.com/p0p4k/vits2_pytorch)
32
+ + [svc-develop-team/so-vits-svc](https://github.com/svc-develop-team/so-vits-svc)
33
+ + [PaddlePaddle/PaddleSpeech](https://github.com/PaddlePaddle/PaddleSpeech)
34
+ + [emotional-vits](https://github.com/innnky/emotional-vits)
35
+ + [Bert-VITS2-en](https://github.com/xwan07017/Bert-VITS2-en)
36
+ + [Bert-VITS2-UI](https://github.com/jiangyuxiaoxiao/Bert-VITS2-UI)
37
+ ## 感谢所有贡献者作出的努力
38
+ <a href="https://github.com/fishaudio/Bert-VITS2/graphs/contributors" target="_blank">
39
+ <img src="https://contrib.rocks/image?repo=fishaudio/Bert-VITS2"/>
40
+ </a>
41
+
42
+ [//]: # (# 本项目所有代码引用均已写明,bert部分代码思路来源于[AI峰哥]&#40;https://www.bilibili.com/video/BV1w24y1c7z9&#41;,与[vits_chinese]&#40;https://github.com/PlayVoice/vits_chinese&#41;无任何关系。欢迎各位查阅代码。同时,我们也对该开发者的[碰瓷,乃至开盒开发者的行为]&#40;https://www.bilibili.com/read/cv27101514/&#41;表示强烈谴责。)
app.py DELETED
@@ -1,229 +0,0 @@
1
- # flake8: noqa: E402
2
-
3
- import sys, os
4
- import logging
5
-
6
- logging.getLogger("numba").setLevel(logging.WARNING)
7
- logging.getLogger("markdown_it").setLevel(logging.WARNING)
8
- logging.getLogger("urllib3").setLevel(logging.WARNING)
9
- logging.getLogger("matplotlib").setLevel(logging.WARNING)
10
-
11
- logging.basicConfig(
12
- level=logging.INFO, format="| %(name)s | %(levelname)s | %(message)s"
13
- )
14
-
15
- logger = logging.getLogger(__name__)
16
-
17
- import torch
18
- import argparse
19
- import commons
20
- import utils
21
- from models import SynthesizerTrn
22
- from text.symbols import symbols
23
- from text import cleaned_text_to_sequence, get_bert
24
- from text.cleaner import clean_text
25
- import gradio as gr
26
- import webbrowser
27
- import numpy as np
28
-
29
- net_g = None
30
-
31
- if sys.platform == "darwin" and torch.backends.mps.is_available():
32
- device = "mps"
33
- os.environ["PYTORCH_ENABLE_MPS_FALLBACK"] = "1"
34
- else:
35
- device = "cuda"
36
-
37
-
38
- def get_text(text, language_str, hps):
39
- norm_text, phone, tone, word2ph = clean_text(text, language_str)
40
- phone, tone, language = cleaned_text_to_sequence(phone, tone, language_str)
41
-
42
- if hps.data.add_blank:
43
- phone = commons.intersperse(phone, 0)
44
- tone = commons.intersperse(tone, 0)
45
- language = commons.intersperse(language, 0)
46
- for i in range(len(word2ph)):
47
- word2ph[i] = word2ph[i] * 2
48
- word2ph[0] += 1
49
- bert = get_bert(norm_text, word2ph, language_str, device)
50
- del word2ph
51
- assert bert.shape[-1] == len(phone), phone
52
-
53
- if language_str == "ZH":
54
- bert = bert
55
- ja_bert = torch.zeros(768, len(phone))
56
- elif language_str == "JP":
57
- ja_bert = bert
58
- bert = torch.zeros(1024, len(phone))
59
- else:
60
- bert = torch.zeros(1024, len(phone))
61
- ja_bert = torch.zeros(768, len(phone))
62
-
63
- assert bert.shape[-1] == len(
64
- phone
65
- ), f"Bert seq len {bert.shape[-1]} != {len(phone)}"
66
-
67
- phone = torch.LongTensor(phone)
68
- tone = torch.LongTensor(tone)
69
- language = torch.LongTensor(language)
70
- return bert, ja_bert, phone, tone, language
71
-
72
-
73
- def infer(text, sdp_ratio, noise_scale, noise_scale_w, length_scale, sid, language):
74
- global net_g
75
- bert, ja_bert, phones, tones, lang_ids = get_text(text, language, hps)
76
- with torch.no_grad():
77
- x_tst = phones.to(device).unsqueeze(0)
78
- tones = tones.to(device).unsqueeze(0)
79
- lang_ids = lang_ids.to(device).unsqueeze(0)
80
- bert = bert.to(device).unsqueeze(0)
81
- ja_bert = ja_bert.to(device).unsqueeze(0)
82
- x_tst_lengths = torch.LongTensor([phones.size(0)]).to(device)
83
- del phones
84
- speakers = torch.LongTensor([hps.data.spk2id[sid]]).to(device)
85
- audio = (
86
- net_g.infer(
87
- x_tst,
88
- x_tst_lengths,
89
- speakers,
90
- tones,
91
- lang_ids,
92
- bert,
93
- ja_bert,
94
- sdp_ratio=sdp_ratio,
95
- noise_scale=noise_scale,
96
- noise_scale_w=noise_scale_w,
97
- length_scale=length_scale,
98
- )[0][0, 0]
99
- .data.cpu()
100
- .float()
101
- .numpy()
102
- )
103
- del x_tst, tones, lang_ids, bert, x_tst_lengths, speakers
104
- torch.cuda.empty_cache()
105
- return audio
106
-
107
-
108
- def tts_fn(text, speaker, sdp_ratio, noise_scale, noise_scale_w, length_scale, language):
109
- slices = text.split("|")
110
- audio_list = []
111
- with torch.no_grad():
112
- for slice in slices:
113
- audio = infer(slice, sdp_ratio=sdp_ratio, noise_scale=noise_scale, noise_scale_w=noise_scale_w, length_scale=length_scale, sid=speaker, language=language)
114
- audio_list.append(audio)
115
- silence = np.zeros(hps.data.sampling_rate) # 生成1秒的静音
116
- audio_list.append(silence) # 将静音添加到列表中
117
- audio_concat = np.concatenate(audio_list)
118
- return "Success", (hps.data.sampling_rate, audio_concat)
119
-
120
- if __name__ == "__main__":
121
- parser = argparse.ArgumentParser()
122
- parser.add_argument(
123
- "-m", "--model", default="./logs/hanser/G_9000_2nd.pth", help="path of your model"
124
- )
125
- parser.add_argument(
126
- "-c",
127
- "--config",
128
- default="./configs/config.json",
129
- help="path of your config file",
130
- )
131
- parser.add_argument(
132
- "--share", default=False, help="make link public", action="store_true"
133
- )
134
- parser.add_argument(
135
- "-d", "--debug", action="store_true", help="enable DEBUG-LEVEL log"
136
- )
137
-
138
- args = parser.parse_args()
139
- if args.debug:
140
- logger.info("Enable DEBUG-LEVEL log")
141
- logging.basicConfig(level=logging.DEBUG)
142
- hps = utils.get_hparams_from_file(args.config)
143
-
144
- device = (
145
- "cuda:0"
146
- if torch.cuda.is_available()
147
- else (
148
- "mps"
149
- if sys.platform == "darwin" and torch.backends.mps.is_available()
150
- else "cpu"
151
- )
152
- )
153
- net_g = SynthesizerTrn(
154
- len(symbols),
155
- hps.data.filter_length // 2 + 1,
156
- hps.train.segment_size // hps.data.hop_length,
157
- n_speakers=hps.data.n_speakers,
158
- **hps.model,
159
- ).to(device)
160
- _ = net_g.eval()
161
-
162
- _ = utils.load_checkpoint(args.model, net_g, None, skip_optimizer=True)
163
-
164
- speaker_ids = hps.data.spk2id
165
- speakers = list(speaker_ids.keys())
166
- languages = ["ZH", "JP"]
167
- with gr.Blocks() as app:
168
- with gr.Row():
169
- with gr.Column():
170
- gr.Markdown(value="""
171
- 🤖 【AI Hanser】在线语音合成 Bert-Vits2 🤖\n
172
- 📝 作者:Rayzggz 📰博客 https://roi.moe 📺B站 https://space.bilibili.com/10501326 📝\n
173
- 🎤 声音来源:Hanser https://space.bilibili.com/11073 🎤\n
174
- 🔗 Bert-VITS2:https://github.com/fishaudio/Bert-VITS2 🔗\n
175
- ✅ 使用本模型请遵守中华人民共和国和美利坚合众国法律 ✅\n
176
- 🏷️ 使用基于本模型的所有生成内容均需标注「使用Bert-VITS2 AI生成」、「本项目地址」、「作者名称」和「声音来源」 🏷️\n
177
- """)
178
- text = gr.TextArea(
179
- label="Text",
180
- placeholder="Input Text Here",
181
- value="大家好,我是憨色,今天给大家看看我的摩托车车",
182
- )
183
- speaker = gr.Dropdown(
184
- choices=speakers, value=speakers[0], label="Speaker"
185
- )
186
- sdp_ratio = gr.Slider(
187
- minimum=0, maximum=1, value=0.2, step=0.1, label="SDP Ratio"
188
- )
189
- noise_scale = gr.Slider(
190
- minimum=0.1, maximum=2, value=0.6, step=0.1, label="Noise Scale"
191
- )
192
- noise_scale_w = gr.Slider(
193
- minimum=0.1, maximum=2, value=0.8, step=0.1, label="Noise Scale W"
194
- )
195
- length_scale = gr.Slider(
196
- minimum=0.1, maximum=2, value=1, step=0.1, label="Length Scale"
197
- )
198
- language = gr.Dropdown(
199
- choices=languages, value=languages[0], label="Language"
200
- )
201
- btn = gr.Button("Generate 生成!", variant="primary")
202
- with gr.Column():
203
- text_output = gr.Textbox(label="Message")
204
- audio_output = gr.Audio(label="Output Audio")
205
- gr.Markdown(value="""
206
- 👏 鸣谢: 👏\n
207
- 👤 团子是咸鱼 https://space.bilibili.com/10685437 👤\n
208
- 👤 领航员未鸟 https://space.bilibili.com/2403955 👤\n
209
- 👤 Xz乔希 https://space.bilibili.com/5859321 👤\n
210
- 👤 怎么好就怎么来 https://space.bilibili.com/259582714 👤\n
211
- 🧠 Google Colab https://colab.research.google.com/ 🧠\n
212
- 📧 如果你是“Hanser”,并且希望对此模型主张权利,请通过上方“作者”部分的联系方式联系,我将积极配合处理。📧 \n
213
- """)
214
-
215
- btn.click(
216
- tts_fn,
217
- inputs=[
218
- text,
219
- speaker,
220
- sdp_ratio,
221
- noise_scale,
222
- noise_scale_w,
223
- length_scale,
224
- language,
225
- ],
226
- outputs=[text_output, audio_output],
227
- )
228
-
229
- app.launch(show_error=True)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
bert/bert-base-japanese-v3/.gitattributes ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
6
+ *.ftz filter=lfs diff=lfs merge=lfs -text
7
+ *.gz filter=lfs diff=lfs merge=lfs -text
8
+ *.h5 filter=lfs diff=lfs merge=lfs -text
9
+ *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
+ *.model filter=lfs diff=lfs merge=lfs -text
13
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
14
+ *.npy filter=lfs diff=lfs merge=lfs -text
15
+ *.npz filter=lfs diff=lfs merge=lfs -text
16
+ *.onnx filter=lfs diff=lfs merge=lfs -text
17
+ *.ot filter=lfs diff=lfs merge=lfs -text
18
+ *.parquet filter=lfs diff=lfs merge=lfs -text
19
+ *.pb filter=lfs diff=lfs merge=lfs -text
20
+ *.pickle filter=lfs diff=lfs merge=lfs -text
21
+ *.pkl filter=lfs diff=lfs merge=lfs -text
22
+ *.pt filter=lfs diff=lfs merge=lfs -text
23
+ *.pth filter=lfs diff=lfs merge=lfs -text
24
+ *.rar filter=lfs diff=lfs merge=lfs -text
25
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
26
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
28
+ *.tflite filter=lfs diff=lfs merge=lfs -text
29
+ *.tgz filter=lfs diff=lfs merge=lfs -text
30
+ *.wasm filter=lfs diff=lfs merge=lfs -text
31
+ *.xz filter=lfs diff=lfs merge=lfs -text
32
+ *.zip filter=lfs diff=lfs merge=lfs -text
33
+ *.zst filter=lfs diff=lfs merge=lfs -text
34
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
bert/bert-large-japanese-v2/.gitattributes ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
6
+ *.ftz filter=lfs diff=lfs merge=lfs -text
7
+ *.gz filter=lfs diff=lfs merge=lfs -text
8
+ *.h5 filter=lfs diff=lfs merge=lfs -text
9
+ *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
+ *.model filter=lfs diff=lfs merge=lfs -text
13
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
14
+ *.npy filter=lfs diff=lfs merge=lfs -text
15
+ *.npz filter=lfs diff=lfs merge=lfs -text
16
+ *.onnx filter=lfs diff=lfs merge=lfs -text
17
+ *.ot filter=lfs diff=lfs merge=lfs -text
18
+ *.parquet filter=lfs diff=lfs merge=lfs -text
19
+ *.pb filter=lfs diff=lfs merge=lfs -text
20
+ *.pickle filter=lfs diff=lfs merge=lfs -text
21
+ *.pkl filter=lfs diff=lfs merge=lfs -text
22
+ *.pt filter=lfs diff=lfs merge=lfs -text
23
+ *.pth filter=lfs diff=lfs merge=lfs -text
24
+ *.rar filter=lfs diff=lfs merge=lfs -text
25
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
26
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
28
+ *.tflite filter=lfs diff=lfs merge=lfs -text
29
+ *.tgz filter=lfs diff=lfs merge=lfs -text
30
+ *.wasm filter=lfs diff=lfs merge=lfs -text
31
+ *.xz filter=lfs diff=lfs merge=lfs -text
32
+ *.zip filter=lfs diff=lfs merge=lfs -text
33
+ *.zst filter=lfs diff=lfs merge=lfs -text
34
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
bert/bert-large-japanese-v2/README.md ADDED
@@ -0,0 +1,53 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ datasets:
4
+ - cc100
5
+ - wikipedia
6
+ language:
7
+ - ja
8
+ widget:
9
+ - text: 東北大学で[MASK]の研究をしています。
10
+ ---
11
+
12
+ # BERT large Japanese (unidic-lite with whole word masking, CC-100 and jawiki-20230102)
13
+
14
+ This is a [BERT](https://github.com/google-research/bert) model pretrained on texts in the Japanese language.
15
+
16
+ This version of the model processes input texts with word-level tokenization based on the Unidic 2.1.2 dictionary (available in [unidic-lite](https://pypi.org/project/unidic-lite/) package), followed by the WordPiece subword tokenization.
17
+ Additionally, the model is trained with the whole word masking enabled for the masked language modeling (MLM) objective.
18
+
19
+ The codes for the pretraining are available at [cl-tohoku/bert-japanese](https://github.com/cl-tohoku/bert-japanese/).
20
+
21
+ ## Model architecture
22
+
23
+ The model architecture is the same as the original BERT large model; 24 layers, 1024 dimensions of hidden states, and 16 attention heads.
24
+
25
+ ## Training Data
26
+
27
+ The model is trained on the Japanese portion of [CC-100 dataset](https://data.statmt.org/cc-100/) and the Japanese version of Wikipedia.
28
+ For Wikipedia, we generated a text corpus from the [Wikipedia Cirrussearch dump file](https://dumps.wikimedia.org/other/cirrussearch/) as of January 2, 2023.
29
+ The corpus files generated from CC-100 and Wikipedia are 74.3GB and 4.9GB in size and consist of approximately 392M and 34M sentences, respectively.
30
+
31
+ For the purpose of splitting texts into sentences, we used [fugashi](https://github.com/polm/fugashi) with [mecab-ipadic-NEologd](https://github.com/neologd/mecab-ipadic-neologd) dictionary (v0.0.7).
32
+
33
+ ## Tokenization
34
+
35
+ The texts are first tokenized by MeCab with the Unidic 2.1.2 dictionary and then split into subwords by the WordPiece algorithm.
36
+ The vocabulary size is 32768.
37
+
38
+ We used [fugashi](https://github.com/polm/fugashi) and [unidic-lite](https://github.com/polm/unidic-lite) packages for the tokenization.
39
+
40
+ ## Training
41
+
42
+ We trained the model first on the CC-100 corpus for 1M steps and then on the Wikipedia corpus for another 1M steps.
43
+ For training of the MLM (masked language modeling) objective, we introduced whole word masking in which all of the subword tokens corresponding to a single word (tokenized by MeCab) are masked at once.
44
+
45
+ For training of each model, we used a v3-8 instance of Cloud TPUs provided by [TPU Research Cloud](https://sites.research.google/trc/about/).
46
+
47
+ ## Licenses
48
+
49
+ The pretrained models are distributed under the Apache License 2.0.
50
+
51
+ ## Acknowledgments
52
+
53
+ This model is trained with Cloud TPUs provided by [TPU Research Cloud](https://sites.research.google/trc/about/) program.
bert/bert-large-japanese-v2/config.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "BertForPreTraining"
4
+ ],
5
+ "attention_probs_dropout_prob": 0.1,
6
+ "hidden_act": "gelu",
7
+ "hidden_dropout_prob": 0.1,
8
+ "hidden_size": 1024,
9
+ "initializer_range": 0.02,
10
+ "intermediate_size": 4096,
11
+ "layer_norm_eps": 1e-12,
12
+ "max_position_embeddings": 512,
13
+ "model_type": "bert",
14
+ "num_attention_heads": 16,
15
+ "num_hidden_layers": 24,
16
+ "pad_token_id": 0,
17
+ "type_vocab_size": 2,
18
+ "vocab_size": 32768
19
+ }
bert/bert-large-japanese-v2/flax_model.msgpack ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5bc5b4b74742d76529fddd0e7699dd9464ed79361f90f8c04f70eda28a0d5f0f
3
+ size 1354127270
bert/bert-large-japanese-v2/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50212d714f79af45d3e47205faa356d0e5030e1c9a37138eadda544180f9e7c9
3
+ size 1354248201
bert/bert-large-japanese-v2/tf_model.h5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2cdea8775c5dd96ec0055e6fffe42773aa23811bf14e8c04343e1d85c822fe8e
3
+ size 1491013624
bert/bert-large-japanese-v2/tokenizer_config.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "tokenizer_class": "BertJapaneseTokenizer",
3
+ "model_max_length": 512,
4
+ "do_lower_case": false,
5
+ "word_tokenizer_type": "mecab",
6
+ "subword_tokenizer_type": "wordpiece",
7
+ "mecab_kwargs": {
8
+ "mecab_dic": "unidic_lite"
9
+ }
10
+ }
bert/bert-large-japanese-v2/vocab.txt ADDED
The diff for this file is too large to render. See raw diff
 
bert/bert_models.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "deberta-v2-large-japanese-char-wwm": {
3
+ "repo_id": "ku-nlp/deberta-v2-large-japanese-char-wwm",
4
+ "files": ["pytorch_model.bin"]
5
+ },
6
+ "chinese-roberta-wwm-ext-large": {
7
+ "repo_id": "hfl/chinese-roberta-wwm-ext-large",
8
+ "files": ["pytorch_model.bin"]
9
+ },
10
+ "deberta-v3-large": {
11
+ "repo_id": "microsoft/deberta-v3-large",
12
+ "files": ["spm.model", "pytorch_model.bin"]
13
+ }
14
+ }
bert/chinese-roberta-wwm-ext-large/.gitignore DELETED
@@ -1 +0,0 @@
1
- *.bin
 
 
bert/deberta-v2-large-japanese-char-wwm/.gitattributes ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
6
+ *.ftz filter=lfs diff=lfs merge=lfs -text
7
+ *.gz filter=lfs diff=lfs merge=lfs -text
8
+ *.h5 filter=lfs diff=lfs merge=lfs -text
9
+ *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
+ *.model filter=lfs diff=lfs merge=lfs -text
13
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
14
+ *.npy filter=lfs diff=lfs merge=lfs -text
15
+ *.npz filter=lfs diff=lfs merge=lfs -text
16
+ *.onnx filter=lfs diff=lfs merge=lfs -text
17
+ *.ot filter=lfs diff=lfs merge=lfs -text
18
+ *.parquet filter=lfs diff=lfs merge=lfs -text
19
+ *.pb filter=lfs diff=lfs merge=lfs -text
20
+ *.pickle filter=lfs diff=lfs merge=lfs -text
21
+ *.pkl filter=lfs diff=lfs merge=lfs -text
22
+ *.pt filter=lfs diff=lfs merge=lfs -text
23
+ *.pth filter=lfs diff=lfs merge=lfs -text
24
+ *.rar filter=lfs diff=lfs merge=lfs -text
25
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
26
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
28
+ *.tflite filter=lfs diff=lfs merge=lfs -text
29
+ *.tgz filter=lfs diff=lfs merge=lfs -text
30
+ *.wasm filter=lfs diff=lfs merge=lfs -text
31
+ *.xz filter=lfs diff=lfs merge=lfs -text
32
+ *.zip filter=lfs diff=lfs merge=lfs -text
33
+ *.zst filter=lfs diff=lfs merge=lfs -text
34
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
bert/deberta-v2-large-japanese-char-wwm/README.md ADDED
@@ -0,0 +1,89 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ language: ja
3
+ license: cc-by-sa-4.0
4
+ library_name: transformers
5
+ tags:
6
+ - deberta
7
+ - deberta-v2
8
+ - fill-mask
9
+ - character
10
+ - wwm
11
+ datasets:
12
+ - wikipedia
13
+ - cc100
14
+ - oscar
15
+ metrics:
16
+ - accuracy
17
+ mask_token: "[MASK]"
18
+ widget:
19
+ - text: "京都大学で自然言語処理を[MASK][MASK]する。"
20
+ ---
21
+
22
+ # Model Card for Japanese character-level DeBERTa V2 large
23
+
24
+ ## Model description
25
+
26
+ This is a Japanese DeBERTa V2 large model pre-trained on Japanese Wikipedia, the Japanese portion of CC-100, and the Japanese portion of OSCAR.
27
+ This model is trained with character-level tokenization and whole word masking.
28
+
29
+ ## How to use
30
+
31
+ You can use this model for masked language modeling as follows:
32
+
33
+ ```python
34
+ from transformers import AutoTokenizer, AutoModelForMaskedLM
35
+ tokenizer = AutoTokenizer.from_pretrained('ku-nlp/deberta-v2-large-japanese-char-wwm')
36
+ model = AutoModelForMaskedLM.from_pretrained('ku-nlp/deberta-v2-large-japanese-char-wwm')
37
+
38
+ sentence = '京都大学で自然言語処理を[MASK][MASK]する。'
39
+ encoding = tokenizer(sentence, return_tensors='pt')
40
+ ...
41
+ ```
42
+
43
+ You can also fine-tune this model on downstream tasks.
44
+
45
+ ## Tokenization
46
+
47
+ There is no need to tokenize texts in advance, and you can give raw texts to the tokenizer.
48
+ The texts are tokenized into character-level tokens by [sentencepiece](https://github.com/google/sentencepiece).
49
+
50
+ ## Training data
51
+
52
+ We used the following corpora for pre-training:
53
+
54
+ - Japanese Wikipedia (as of 20221020, 3.2GB, 27M sentences, 1.3M documents)
55
+ - Japanese portion of CC-100 (85GB, 619M sentences, 66M documents)
56
+ - Japanese portion of OSCAR (54GB, 326M sentences, 25M documents)
57
+
58
+ Note that we filtered out documents annotated with "header", "footer", or "noisy" tags in OSCAR.
59
+ Also note that Japanese Wikipedia was duplicated 10 times to make the total size of the corpus comparable to that of CC-100 and OSCAR. As a result, the total size of the training data is 171GB.
60
+
61
+ ## Training procedure
62
+
63
+ We first segmented texts in the corpora into words using [Juman++ 2.0.0-rc3](https://github.com/ku-nlp/jumanpp/releases/tag/v2.0.0-rc3) for whole word masking.
64
+ Then, we built a sentencepiece model with 22,012 tokens including all characters that appear in the training corpus.
65
+
66
+ We tokenized raw corpora into character-level subwords using the sentencepiece model and trained the Japanese DeBERTa model using [transformers](https://github.com/huggingface/transformers) library.
67
+ The training took 26 days using 16 NVIDIA A100-SXM4-40GB GPUs.
68
+
69
+ The following hyperparameters were used during pre-training:
70
+
71
+ - learning_rate: 1e-4
72
+ - per_device_train_batch_size: 26
73
+ - distributed_type: multi-GPU
74
+ - num_devices: 16
75
+ - gradient_accumulation_steps: 8
76
+ - total_train_batch_size: 3,328
77
+ - max_seq_length: 512
78
+ - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-06
79
+ - lr_scheduler_type: linear schedule with warmup (lr = 0 at 300k steps)
80
+ - training_steps: 260,000
81
+ - warmup_steps: 10,000
82
+
83
+ The accuracy of the trained model on the masked language modeling task was 0.795.
84
+ The evaluation set consists of 5,000 randomly sampled documents from each of the training corpora.
85
+
86
+ ## Acknowledgments
87
+
88
+ This work was supported by Joint Usage/Research Center for Interdisciplinary Large-scale Information Infrastructures (JHPCN) through General Collaboration Project no. jh221004, "Developing a Platform for Constructing and Sharing of Large-Scale Japanese Language Models".
89
+ For training models, we used the mdx: a platform for the data-driven future.
bert/deberta-v2-large-japanese-char-wwm/config.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "DebertaV2ForMaskedLM"
4
+ ],
5
+ "attention_head_size": 64,
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "conv_act": "gelu",
8
+ "conv_kernel_size": 3,
9
+ "hidden_act": "gelu",
10
+ "hidden_dropout_prob": 0.1,
11
+ "hidden_size": 1024,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 4096,
14
+ "layer_norm_eps": 1e-07,
15
+ "max_position_embeddings": 512,
16
+ "max_relative_positions": -1,
17
+ "model_type": "deberta-v2",
18
+ "norm_rel_ebd": "layer_norm",
19
+ "num_attention_heads": 16,
20
+ "num_hidden_layers": 24,
21
+ "pad_token_id": 0,
22
+ "pooler_dropout": 0,
23
+ "pooler_hidden_act": "gelu",
24
+ "pooler_hidden_size": 1024,
25
+ "pos_att_type": [
26
+ "p2c",
27
+ "c2p"
28
+ ],
29
+ "position_biased_input": false,
30
+ "position_buckets": 256,
31
+ "relative_attention": true,
32
+ "share_att_key": true,
33
+ "torch_dtype": "float16",
34
+ "transformers_version": "4.25.1",
35
+ "type_vocab_size": 0,
36
+ "vocab_size": 22012
37
+ }
bert/deberta-v2-large-japanese-char-wwm/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2630f547d018524a7b03506a42c700cbac49e29bdc441845b0615bfb3b5d74d2
3
+ size 1318453704
bert/deberta-v2-large-japanese-char-wwm/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf0dab8ad87bd7c22e85ec71e04f2240804fda6d33196157d6b5923af6ea1201
3
+ size 1318456639
bert/deberta-v2-large-japanese-char-wwm/special_tokens_map.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "mask_token": "[MASK]",
4
+ "pad_token": "[PAD]",
5
+ "sep_token": "[SEP]",
6
+ "unk_token": "[UNK]"
7
+ }
bert/deberta-v2-large-japanese-char-wwm/tokenizer_config.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "do_lower_case": false,
4
+ "do_subword_tokenize": true,
5
+ "do_word_tokenize": true,
6
+ "jumanpp_kwargs": null,
7
+ "mask_token": "[MASK]",
8
+ "mecab_kwargs": null,
9
+ "model_max_length": 1000000000000000019884624838656,
10
+ "never_split": null,
11
+ "pad_token": "[PAD]",
12
+ "sep_token": "[SEP]",
13
+ "special_tokens_map_file": null,
14
+ "subword_tokenizer_type": "character",
15
+ "sudachi_kwargs": null,
16
+ "tokenizer_class": "BertJapaneseTokenizer",
17
+ "unk_token": "[UNK]",
18
+ "word_tokenizer_type": "basic"
19
+ }
bert/deberta-v2-large-japanese-char-wwm/vocab.txt ADDED
The diff for this file is too large to render. See raw diff
 
bert/deberta-v2-large-japanese/.gitattributes ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
6
+ *.ftz filter=lfs diff=lfs merge=lfs -text
7
+ *.gz filter=lfs diff=lfs merge=lfs -text
8
+ *.h5 filter=lfs diff=lfs merge=lfs -text
9
+ *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
+ *.model filter=lfs diff=lfs merge=lfs -text
13
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
14
+ *.npy filter=lfs diff=lfs merge=lfs -text
15
+ *.npz filter=lfs diff=lfs merge=lfs -text
16
+ *.onnx filter=lfs diff=lfs merge=lfs -text
17
+ *.ot filter=lfs diff=lfs merge=lfs -text
18
+ *.parquet filter=lfs diff=lfs merge=lfs -text
19
+ *.pb filter=lfs diff=lfs merge=lfs -text
20
+ *.pickle filter=lfs diff=lfs merge=lfs -text
21
+ *.pkl filter=lfs diff=lfs merge=lfs -text
22
+ *.pt filter=lfs diff=lfs merge=lfs -text
23
+ *.pth filter=lfs diff=lfs merge=lfs -text
24
+ *.rar filter=lfs diff=lfs merge=lfs -text
25
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
26
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
28
+ *.tflite filter=lfs diff=lfs merge=lfs -text
29
+ *.tgz filter=lfs diff=lfs merge=lfs -text
30
+ *.wasm filter=lfs diff=lfs merge=lfs -text
31
+ *.xz filter=lfs diff=lfs merge=lfs -text
32
+ *.zip filter=lfs diff=lfs merge=lfs -text
33
+ *.zst filter=lfs diff=lfs merge=lfs -text
34
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
bert/deberta-v2-large-japanese/README.md ADDED
@@ -0,0 +1,111 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ language: ja
3
+ license: cc-by-sa-4.0
4
+ library_name: transformers
5
+ tags:
6
+ - deberta
7
+ - deberta-v2
8
+ - fill-mask
9
+ datasets:
10
+ - wikipedia
11
+ - cc100
12
+ - oscar
13
+ metrics:
14
+ - accuracy
15
+ mask_token: "[MASK]"
16
+ widget:
17
+ - text: "京都 大学 で 自然 言語 処理 を [MASK] する 。"
18
+ ---
19
+
20
+ # Model Card for Japanese DeBERTa V2 large
21
+
22
+ ## Model description
23
+
24
+ This is a Japanese DeBERTa V2 large model pre-trained on Japanese Wikipedia, the Japanese portion of CC-100, and the
25
+ Japanese portion of OSCAR.
26
+
27
+ ## How to use
28
+
29
+ You can use this model for masked language modeling as follows:
30
+
31
+ ```python
32
+ from transformers import AutoTokenizer, AutoModelForMaskedLM
33
+
34
+ tokenizer = AutoTokenizer.from_pretrained('ku-nlp/deberta-v2-large-japanese')
35
+ model = AutoModelForMaskedLM.from_pretrained('ku-nlp/deberta-v2-large-japanese')
36
+
37
+ sentence = '京都 大学 で 自然 言語 処理 を [MASK] する 。' # input should be segmented into words by Juman++ in advance
38
+ encoding = tokenizer(sentence, return_tensors='pt')
39
+ ...
40
+ ```
41
+
42
+ You can also fine-tune this model on downstream tasks.
43
+
44
+ ## Tokenization
45
+
46
+ The input text should be segmented into words by [Juman++](https://github.com/ku-nlp/jumanpp) in
47
+ advance. [Juman++ 2.0.0-rc3](https://github.com/ku-nlp/jumanpp/releases/tag/v2.0.0-rc3) was used for pre-training. Each
48
+ word is tokenized into subwords by [sentencepiece](https://github.com/google/sentencepiece).
49
+
50
+ ## Training data
51
+
52
+ We used the following corpora for pre-training:
53
+
54
+ - Japanese Wikipedia (as of 20221020, 3.2GB, 27M sentences, 1.3M documents)
55
+ - Japanese portion of CC-100 (85GB, 619M sentences, 66M documents)
56
+ - Japanese portion of OSCAR (54GB, 326M sentences, 25M documents)
57
+
58
+ Note that we filtered out documents annotated with "header", "footer", or "noisy" tags in OSCAR.
59
+ Also note that Japanese Wikipedia was duplicated 10 times to make the total size of the corpus comparable to that of
60
+ CC-100 and OSCAR. As a result, the total size of the training data is 171GB.
61
+
62
+ ## Training procedure
63
+
64
+ We first segmented texts in the corpora into words using [Juman++](https://github.com/ku-nlp/jumanpp).
65
+ Then, we built a sentencepiece model with 32000 tokens including words ([JumanDIC](https://github.com/ku-nlp/JumanDIC))
66
+ and subwords induced by the unigram language model of [sentencepiece](https://github.com/google/sentencepiece).
67
+
68
+ We tokenized the segmented corpora into subwords using the sentencepiece model and trained the Japanese DeBERTa model
69
+ using [transformers](https://github.com/huggingface/transformers) library.
70
+ The training took 36 days using 8 NVIDIA A100-SXM4-40GB GPUs.
71
+
72
+ The following hyperparameters were used during pre-training:
73
+
74
+ - learning_rate: 1e-4
75
+ - per_device_train_batch_size: 18
76
+ - distributed_type: multi-GPU
77
+ - num_devices: 8
78
+ - gradient_accumulation_steps: 16
79
+ - total_train_batch_size: 2,304
80
+ - max_seq_length: 512
81
+ - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-06
82
+ - lr_scheduler_type: linear schedule with warmup
83
+ - training_steps: 300,000
84
+ - warmup_steps: 10,000
85
+
86
+ The accuracy of the trained model on the masked language modeling task was 0.799.
87
+ The evaluation set consists of 5,000 randomly sampled documents from each of the training corpora.
88
+
89
+ ## Fine-tuning on NLU tasks
90
+
91
+ We fine-tuned the following models and evaluated them on the dev set of JGLUE.
92
+ We tuned learning rate and training epochs for each model and task
93
+ following [the JGLUE paper](https://www.jstage.jst.go.jp/article/jnlp/30/1/30_63/_pdf/-char/ja).
94
+
95
+ | Model | MARC-ja/acc | JSTS/pearson | JSTS/spearman | JNLI/acc | JSQuAD/EM | JSQuAD/F1 | JComQA/acc |
96
+ |-------------------------------|-------------|--------------|---------------|----------|-----------|-----------|------------|
97
+ | Waseda RoBERTa base | 0.965 | 0.913 | 0.876 | 0.905 | 0.853 | 0.916 | 0.853 |
98
+ | Waseda RoBERTa large (seq512) | 0.969 | 0.925 | 0.890 | 0.928 | 0.910 | 0.955 | 0.900 |
99
+ | LUKE Japanese base* | 0.965 | 0.916 | 0.877 | 0.912 | - | - | 0.842 |
100
+ | LUKE Japanese large* | 0.965 | 0.932 | 0.902 | 0.927 | - | - | 0.893 |
101
+ | DeBERTaV2 base | 0.970 | 0.922 | 0.886 | 0.922 | 0.899 | 0.951 | 0.873 |
102
+ | DeBERTaV2 large | 0.968 | 0.925 | 0.892 | 0.924 | 0.912 | 0.959 | 0.890 |
103
+
104
+ *The scores of LUKE are from [the official repository](https://github.com/studio-ousia/luke).
105
+
106
+ ## Acknowledgments
107
+
108
+ This work was supported by Joint Usage/Research Center for Interdisciplinary Large-scale Information Infrastructures (
109
+ JHPCN) through General Collaboration Project no. jh221004, "Developing a Platform for Constructing and Sharing of
110
+ Large-Scale Japanese Language Models".
111
+ For training models, we used the mdx: a platform for the data-driven future.
bert/deberta-v2-large-japanese/config.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "configs/deberta_v2_large.json",
3
+ "architectures": [
4
+ "DebertaV2ForMaskedLM"
5
+ ],
6
+ "attention_head_size": 64,
7
+ "attention_probs_dropout_prob": 0.1,
8
+ "conv_act": "gelu",
9
+ "conv_kernel_size": 3,
10
+ "hidden_act": "gelu",
11
+ "hidden_dropout_prob": 0.1,
12
+ "hidden_size": 1024,
13
+ "initializer_range": 0.02,
14
+ "intermediate_size": 4096,
15
+ "layer_norm_eps": 1e-07,
16
+ "max_position_embeddings": 512,
17
+ "max_relative_positions": -1,
18
+ "model_type": "deberta-v2",
19
+ "norm_rel_ebd": "layer_norm",
20
+ "num_attention_heads": 16,
21
+ "num_hidden_layers": 24,
22
+ "pad_token_id": 0,
23
+ "pooler_dropout": 0,
24
+ "pooler_hidden_act": "gelu",
25
+ "pooler_hidden_size": 1024,
26
+ "pos_att_type": [
27
+ "p2c",
28
+ "c2p"
29
+ ],
30
+ "position_biased_input": false,
31
+ "position_buckets": 256,
32
+ "relative_attention": true,
33
+ "share_att_key": true,
34
+ "torch_dtype": "float32",
35
+ "transformers_version": "4.23.1",
36
+ "type_vocab_size": 0,
37
+ "vocab_size": 32000
38
+ }
bert/deberta-v2-large-japanese/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:726bd655468fba70cf5348751a560b0fc969f4064e23759287461aa54b9e27e2
3
+ size 1490606906
bert/deberta-v2-large-japanese/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6c15feac0dea77ab8835c70e1befa4cf4c2137862c6fb2443b1553f70840047
3
+ size 1490693213
bert/deberta-v2-large-japanese/special_tokens_map.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "[CLS]",
3
+ "cls_token": "[CLS]",
4
+ "eos_token": "[SEP]",
5
+ "mask_token": "[MASK]",
6
+ "pad_token": "[PAD]",
7
+ "sep_token": "[SEP]",
8
+ "unk_token": "[UNK]"
9
+ }
logs/hanser/G_9000_2nd.pth → bert/deberta-v2-large-japanese/spm.model RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2cc7b8dc2f8c63a8ccfa6739e6ac49c41af0788cfa628ec39bb487ce5eb32ef4
3
- size 857912686
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c111c16e2e52366dcac46b886e40650bb843fe2938a65f5970271fc5697a127
3
+ size 805061
bert/deberta-v2-large-japanese/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
bert/deberta-v2-large-japanese/tokenizer_config.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "[CLS]",
3
+ "cls_token": "[CLS]",
4
+ "do_lower_case": false,
5
+ "eos_token": "[SEP]",
6
+ "keep_accents": true,
7
+ "mask_token": "[MASK]",
8
+ "pad_token": "[PAD]",
9
+ "sep_token": "[SEP]",
10
+ "sp_model_kwargs": {},
11
+ "special_tokens_map_file": null,
12
+ "split_by_punct": false,
13
+ "tokenizer_class": "DebertaV2Tokenizer",
14
+ "unk_token": "[UNK]"
15
+ }
bert/deberta-v3-large/.gitattributes ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bin.* filter=lfs diff=lfs merge=lfs -text
5
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
6
+ *.ftz filter=lfs diff=lfs merge=lfs -text
7
+ *.gz filter=lfs diff=lfs merge=lfs -text
8
+ *.h5 filter=lfs diff=lfs merge=lfs -text
9
+ *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.model filter=lfs diff=lfs merge=lfs -text
12
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
13
+ *.onnx filter=lfs diff=lfs merge=lfs -text
14
+ *.ot filter=lfs diff=lfs merge=lfs -text
15
+ *.parquet filter=lfs diff=lfs merge=lfs -text
16
+ *.pb filter=lfs diff=lfs merge=lfs -text
17
+ *.pt filter=lfs diff=lfs merge=lfs -text
18
+ *.pth filter=lfs diff=lfs merge=lfs -text
19
+ *.rar filter=lfs diff=lfs merge=lfs -text
20
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
21
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
22
+ *.tflite filter=lfs diff=lfs merge=lfs -text
23
+ *.tgz filter=lfs diff=lfs merge=lfs -text
24
+ *.xz filter=lfs diff=lfs merge=lfs -text
25
+ *.zip filter=lfs diff=lfs merge=lfs -text
26
+ *.zstandard filter=lfs diff=lfs merge=lfs -text
27
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
bert/deberta-v3-large/README.md ADDED
@@ -0,0 +1,93 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ language: en
3
+ tags:
4
+ - deberta
5
+ - deberta-v3
6
+ - fill-mask
7
+ thumbnail: https://huggingface.co/front/thumbnails/microsoft.png
8
+ license: mit
9
+ ---
10
+
11
+ ## DeBERTaV3: Improving DeBERTa using ELECTRA-Style Pre-Training with Gradient-Disentangled Embedding Sharing
12
+
13
+ [DeBERTa](https://arxiv.org/abs/2006.03654) improves the BERT and RoBERTa models using disentangled attention and enhanced mask decoder. With those two improvements, DeBERTa out perform RoBERTa on a majority of NLU tasks with 80GB training data.
14
+
15
+ In [DeBERTa V3](https://arxiv.org/abs/2111.09543), we further improved the efficiency of DeBERTa using ELECTRA-Style pre-training with Gradient Disentangled Embedding Sharing. Compared to DeBERTa, our V3 version significantly improves the model performance on downstream tasks. You can find more technique details about the new model from our [paper](https://arxiv.org/abs/2111.09543).
16
+
17
+ Please check the [official repository](https://github.com/microsoft/DeBERTa) for more implementation details and updates.
18
+
19
+ The DeBERTa V3 large model comes with 24 layers and a hidden size of 1024. It has 304M backbone parameters with a vocabulary containing 128K tokens which introduces 131M parameters in the Embedding layer. This model was trained using the 160GB data as DeBERTa V2.
20
+
21
+
22
+ #### Fine-tuning on NLU tasks
23
+
24
+ We present the dev results on SQuAD 2.0 and MNLI tasks.
25
+
26
+ | Model |Vocabulary(K)|Backbone #Params(M)| SQuAD 2.0(F1/EM) | MNLI-m/mm(ACC)|
27
+ |-------------------|----------|-------------------|-----------|----------|
28
+ | RoBERTa-large |50 |304 | 89.4/86.5 | 90.2 |
29
+ | XLNet-large |32 |- | 90.6/87.9 | 90.8 |
30
+ | DeBERTa-large |50 |- | 90.7/88.0 | 91.3 |
31
+ | **DeBERTa-v3-large**|128|304 | **91.5/89.0**| **91.8/91.9**|
32
+
33
+
34
+ #### Fine-tuning with HF transformers
35
+
36
+ ```bash
37
+ #!/bin/bash
38
+
39
+ cd transformers/examples/pytorch/text-classification/
40
+
41
+ pip install datasets
42
+ export TASK_NAME=mnli
43
+
44
+ output_dir="ds_results"
45
+
46
+ num_gpus=8
47
+
48
+ batch_size=8
49
+
50
+ python -m torch.distributed.launch --nproc_per_node=${num_gpus} \
51
+ run_glue.py \
52
+ --model_name_or_path microsoft/deberta-v3-large \
53
+ --task_name $TASK_NAME \
54
+ --do_train \
55
+ --do_eval \
56
+ --evaluation_strategy steps \
57
+ --max_seq_length 256 \
58
+ --warmup_steps 50 \
59
+ --per_device_train_batch_size ${batch_size} \
60
+ --learning_rate 6e-6 \
61
+ --num_train_epochs 2 \
62
+ --output_dir $output_dir \
63
+ --overwrite_output_dir \
64
+ --logging_steps 1000 \
65
+ --logging_dir $output_dir
66
+
67
+ ```
68
+
69
+ ### Citation
70
+
71
+ If you find DeBERTa useful for your work, please cite the following papers:
72
+
73
+ ``` latex
74
+ @misc{he2021debertav3,
75
+ title={DeBERTaV3: Improving DeBERTa using ELECTRA-Style Pre-Training with Gradient-Disentangled Embedding Sharing},
76
+ author={Pengcheng He and Jianfeng Gao and Weizhu Chen},
77
+ year={2021},
78
+ eprint={2111.09543},
79
+ archivePrefix={arXiv},
80
+ primaryClass={cs.CL}
81
+ }
82
+ ```
83
+
84
+ ``` latex
85
+ @inproceedings{
86
+ he2021deberta,
87
+ title={DEBERTA: DECODING-ENHANCED BERT WITH DISENTANGLED ATTENTION},
88
+ author={Pengcheng He and Xiaodong Liu and Jianfeng Gao and Weizhu Chen},
89
+ booktitle={International Conference on Learning Representations},
90
+ year={2021},
91
+ url={https://openreview.net/forum?id=XPZIaotutsD}
92
+ }
93
+ ```
bert/deberta-v3-large/config.json ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_type": "deberta-v2",
3
+ "attention_probs_dropout_prob": 0.1,
4
+ "hidden_act": "gelu",
5
+ "hidden_dropout_prob": 0.1,
6
+ "hidden_size": 1024,
7
+ "initializer_range": 0.02,
8
+ "intermediate_size": 4096,
9
+ "max_position_embeddings": 512,
10
+ "relative_attention": true,
11
+ "position_buckets": 256,
12
+ "norm_rel_ebd": "layer_norm",
13
+ "share_att_key": true,
14
+ "pos_att_type": "p2c|c2p",
15
+ "layer_norm_eps": 1e-7,
16
+ "max_relative_positions": -1,
17
+ "position_biased_input": false,
18
+ "num_attention_heads": 16,
19
+ "num_hidden_layers": 24,
20
+ "type_vocab_size": 0,
21
+ "vocab_size": 128100
22
+ }
bert/deberta-v3-large/generator_config.json ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_type": "deberta-v2",
3
+ "attention_probs_dropout_prob": 0.1,
4
+ "hidden_act": "gelu",
5
+ "hidden_dropout_prob": 0.1,
6
+ "hidden_size": 1024,
7
+ "initializer_range": 0.02,
8
+ "intermediate_size": 4096,
9
+ "max_position_embeddings": 512,
10
+ "relative_attention": true,
11
+ "position_buckets": 256,
12
+ "norm_rel_ebd": "layer_norm",
13
+ "share_att_key": true,
14
+ "pos_att_type": "p2c|c2p",
15
+ "layer_norm_eps": 1e-7,
16
+ "max_relative_positions": -1,
17
+ "position_biased_input": false,
18
+ "num_attention_heads": 16,
19
+ "num_hidden_layers": 12,
20
+ "type_vocab_size": 0,
21
+ "vocab_size": 128100
22
+ }
logs/hanser/G_26000.pth → bert/deberta-v3-large/pytorch_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:78bbd64ec6b6dbdced5f2597fa6489164e54dcad3a459aff008b8bf00d8d6508
3
- size 857922317
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd5b5d93e2db101aaf281df0ea1216c07ad73620ff59c5b42dccac4bf2eef5b5
3
+ size 873673253
logs/hanser/G_8000.pth → bert/deberta-v3-large/pytorch_model.generator.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:782249a78ac551bda545bdf2126bd20acec871d0f69a027f5047b6f87564e68d
3
- size 857912255
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff85455c562822ea7001f810d026a68da8a24ffdae5a095081dfe7e84e27989d
3
+ size 571293153
bert/deberta-v3-large/spm.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c679fbf93643d19aab7ee10c0b99e460bdbc02fedf34b92b05af343b4af586fd
3
+ size 2464616
bert/deberta-v3-large/tf_model.h5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20462c6c76990df31b0e82ee5d1e2b7cb06e0a3823334149fbb3b169826ed476
3
+ size 1736592160
bert/deberta-v3-large/tokenizer_config.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "do_lower_case": false,
3
+ "vocab_type": "spm"
4
+ }
bert_gen.py CHANGED
@@ -1,19 +1,26 @@
 
 
 
1
  import torch
2
- from multiprocessing import Pool
 
 
3
  import commons
4
  import utils
5
- from tqdm import tqdm
6
  from text import cleaned_text_to_sequence, get_bert
7
- import argparse
8
- import torch.multiprocessing as mp
9
 
10
 
11
  def process_line(line):
12
- rank = mp.current_process()._identity
13
- rank = rank[0] if len(rank) > 0 else 0
14
- if torch.cuda.is_available():
15
- gpu_id = rank % torch.cuda.device_count()
16
- device = torch.device(f"cuda:{gpu_id}")
 
 
 
 
17
  wav_path, _, language_str, text, phones, tone, word2ph = line.strip().split("|")
18
  phone = phones.split(" ")
19
  tone = [int(i) for i in tone.split(" ")]
@@ -28,7 +35,7 @@ def process_line(line):
28
  word2ph[i] = word2ph[i] * 2
29
  word2ph[0] += 1
30
 
31
- bert_path = wav_path.replace(".wav", ".bert.pt")
32
 
33
  try:
34
  bert = torch.load(bert_path)
@@ -39,11 +46,17 @@ def process_line(line):
39
  torch.save(bert, bert_path)
40
 
41
 
 
 
42
  if __name__ == "__main__":
43
  parser = argparse.ArgumentParser()
44
- parser.add_argument("-c", "--config", type=str, default="configs/config.json")
45
- parser.add_argument("--num_processes", type=int, default=2)
46
- args = parser.parse_args()
 
 
 
 
47
  config_path = args.config
48
  hps = utils.get_hparams_from_file(config_path)
49
  lines = []
@@ -52,8 +65,10 @@ if __name__ == "__main__":
52
 
53
  with open(hps.data.validation_files, encoding="utf-8") as f:
54
  lines.extend(f.readlines())
 
 
 
 
 
55
 
56
- num_processes = args.num_processes
57
- with Pool(processes=num_processes) as pool:
58
- for _ in tqdm(pool.imap_unordered(process_line, lines), total=len(lines)):
59
- pass
 
1
+ import argparse
2
+ from multiprocessing import Pool, cpu_count
3
+
4
  import torch
5
+ import torch.multiprocessing as mp
6
+ from tqdm import tqdm
7
+
8
  import commons
9
  import utils
10
+ from config import config
11
  from text import cleaned_text_to_sequence, get_bert
 
 
12
 
13
 
14
  def process_line(line):
15
+ device = config.bert_gen_config.device
16
+ if config.bert_gen_config.use_multi_device:
17
+ rank = mp.current_process()._identity
18
+ rank = rank[0] if len(rank) > 0 else 0
19
+ if torch.cuda.is_available():
20
+ gpu_id = rank % torch.cuda.device_count()
21
+ device = torch.device(f"cuda:{gpu_id}")
22
+ else:
23
+ device = torch.device("cpu")
24
  wav_path, _, language_str, text, phones, tone, word2ph = line.strip().split("|")
25
  phone = phones.split(" ")
26
  tone = [int(i) for i in tone.split(" ")]
 
35
  word2ph[i] = word2ph[i] * 2
36
  word2ph[0] += 1
37
 
38
+ bert_path = wav_path.replace(".WAV", ".wav").replace(".wav", ".bert.pt")
39
 
40
  try:
41
  bert = torch.load(bert_path)
 
46
  torch.save(bert, bert_path)
47
 
48
 
49
+ preprocess_text_config = config.preprocess_text_config
50
+
51
  if __name__ == "__main__":
52
  parser = argparse.ArgumentParser()
53
+ parser.add_argument(
54
+ "-c", "--config", type=str, default=config.bert_gen_config.config_path
55
+ )
56
+ parser.add_argument(
57
+ "--num_processes", type=int, default=config.bert_gen_config.num_processes
58
+ )
59
+ args, _ = parser.parse_known_args()
60
  config_path = args.config
61
  hps = utils.get_hparams_from_file(config_path)
62
  lines = []
 
65
 
66
  with open(hps.data.validation_files, encoding="utf-8") as f:
67
  lines.extend(f.readlines())
68
+ if len(lines) != 0:
69
+ num_processes = min(args.num_processes, cpu_count())
70
+ with Pool(processes=num_processes) as pool:
71
+ for _ in tqdm(pool.imap_unordered(process_line, lines), total=len(lines)):
72
+ pass
73
 
74
+ print(f"bert生成完毕!, 共有{len(lines)}个bert.pt生成!")
 
 
 
clap_gen.py ADDED
@@ -0,0 +1,64 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import argparse
2
+ from multiprocessing import Pool, cpu_count
3
+
4
+ import torch
5
+ import torch.multiprocessing as mp
6
+ from tqdm import tqdm
7
+
8
+ import utils
9
+ from config import config
10
+ from clap_wrapper import get_clap_audio_feature
11
+ import librosa
12
+ import os
13
+
14
+ os.environ["OMP_NUM_THREADS"] = "1"
15
+ os.environ["MKL_NUM_THREADS"] = "1"
16
+
17
+
18
+ def process_line(line):
19
+ device = config.emo_gen_config.device
20
+ if config.emo_gen_config.use_multi_device:
21
+ rank = mp.current_process()._identity
22
+ rank = rank[0] if len(rank) > 0 else 0
23
+ if torch.cuda.is_available():
24
+ gpu_id = rank % torch.cuda.device_count()
25
+ device = torch.device(f"cuda:{gpu_id}")
26
+ else:
27
+ device = torch.device("cpu")
28
+ wav_path, _, language_str, text, phones, tone, word2ph = line.strip().split("|")
29
+
30
+ clap_path = wav_path.replace(".WAV", ".wav").replace(".wav", ".emo.npy")
31
+ if os.path.isfile(clap_path):
32
+ return
33
+
34
+ audio = librosa.load(wav_path, 48000)[0]
35
+ # audio = librosa.resample(audio, 44100, 48000)
36
+
37
+ clap = get_clap_audio_feature(audio, device)
38
+ torch.save(clap, clap_path)
39
+
40
+
41
+ if __name__ == "__main__":
42
+ parser = argparse.ArgumentParser()
43
+ parser.add_argument(
44
+ "-c", "--config", type=str, default=config.emo_gen_config.config_path
45
+ )
46
+ parser.add_argument(
47
+ "--num_processes", type=int, default=config.emo_gen_config.num_processes
48
+ )
49
+ args, _ = parser.parse_known_args()
50
+ config_path = args.config
51
+ hps = utils.get_hparams_from_file(config_path)
52
+ lines = []
53
+ with open(hps.data.training_files, encoding="utf-8") as f:
54
+ lines.extend(f.readlines())
55
+
56
+ with open(hps.data.validation_files, encoding="utf-8") as f:
57
+ lines.extend(f.readlines())
58
+ if len(lines) != 0:
59
+ num_processes = min(args.num_processes, cpu_count())
60
+ with Pool(processes=num_processes) as pool:
61
+ for _ in tqdm(pool.imap_unordered(process_line, lines), total=len(lines)):
62
+ pass
63
+
64
+ print(f"clap生成完毕!, 共有{len(lines)}个emo.pt生成!")
clap_wrapper.py ADDED
@@ -0,0 +1,49 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import sys
2
+
3
+ import torch
4
+ from transformers import ClapModel, ClapProcessor
5
+
6
+ from config import config
7
+
8
+ models = dict()
9
+ processor = ClapProcessor.from_pretrained("./emotional/clap-htsat-fused")
10
+
11
+
12
def get_clap_audio_feature(audio_data, device=config.bert_gen_config.device):
    """Return the transposed CLAP audio embedding for a 48 kHz waveform."""
    # On macOS, prefer the MPS backend whenever "cpu" was requested.
    if sys.platform == "darwin" and torch.backends.mps.is_available() and device == "cpu":
        device = "mps"
    if not device:
        device = "cuda"
    # One model instance is created lazily per device and cached in `models`.
    if device not in models:
        clap_model = ClapModel.from_pretrained("./emotional/clap-htsat-fused")
        models[device] = clap_model.to(device)
    with torch.no_grad():
        batch = processor(
            audios=audio_data, return_tensors="pt", sampling_rate=48000
        ).to(device)
        emb = models[device].get_audio_features(**batch)
    return emb.T
31
+
32
+
33
def get_clap_text_feature(text, device=config.bert_gen_config.device):
    """Return the transposed CLAP text embedding for `text`."""
    # On macOS, prefer the MPS backend whenever "cpu" was requested.
    if sys.platform == "darwin" and torch.backends.mps.is_available() and device == "cpu":
        device = "mps"
    if not device:
        device = "cuda"
    # One model instance is created lazily per device and cached in `models`.
    if device not in models:
        clap_model = ClapModel.from_pretrained("./emotional/clap-htsat-fused")
        models[device] = clap_model.to(device)
    with torch.no_grad():
        batch = processor(text=text, return_tensors="pt").to(device)
        emb = models[device].get_text_features(**batch)
    return emb.T
commons.py CHANGED
@@ -46,20 +46,18 @@ def rand_gumbel_like(x):
46
 
47
 
48
  def slice_segments(x, ids_str, segment_size=4):
49
- ret = torch.zeros_like(x[:, :, :segment_size])
50
- for i in range(x.size(0)):
51
- idx_str = ids_str[i]
52
- idx_end = idx_str + segment_size
53
- ret[i] = x[i, :, idx_str:idx_end]
54
- return ret
55
 
56
 
57
  def rand_slice_segments(x, x_lengths=None, segment_size=4):
58
  b, d, t = x.size()
59
  if x_lengths is None:
60
  x_lengths = t
61
- ids_str_max = x_lengths - segment_size + 1
62
- ids_str = (torch.rand([b]).to(device=x.device) * ids_str_max).to(dtype=torch.long)
63
  ret = slice_segments(x, ids_str, segment_size)
64
  return ret, ids_str
65
 
 
46
 
47
 
48
def slice_segments(x, ids_str, segment_size=4):
    """Extract one length-`segment_size` window per batch item along dim 2.

    x:       (B, C, T) tensor.
    ids_str: (B,) long tensor of per-item window start indices.
    Returns a (B, C, segment_size) tensor, gathered without a Python loop.
    """
    offsets = torch.arange(segment_size, device=x.device)
    # (B, 1, 1) starts repeated over channels broadcast against offsets -> (B, C, S)
    starts = ids_str.view(x.size(0), 1, 1).repeat(1, x.size(1), 1)
    return torch.gather(x, 2, starts + offsets)
 
 
53
 
54
 
55
def rand_slice_segments(x, x_lengths=None, segment_size=4):
    """Randomly slice a length-`segment_size` window per batch item.

    x:         (B, C, T) tensor.
    x_lengths: optional (B,) tensor of valid lengths; defaults to T for all.
    Returns (slices, ids_str) where slices is (B, C, segment_size).
    """
    b, d, t = x.size()
    if x_lengths is None:
        # BUGFIX: the original assigned the plain int `t`, and
        # torch.clamp(int, min=0) raises; build a per-batch tensor instead.
        x_lengths = torch.full((b,), t, dtype=torch.long, device=x.device)
    # Clamp so fully-short items start at 0 instead of a negative index.
    ids_str_max = torch.clamp(x_lengths - segment_size + 1, min=0)
    ids_str = (torch.rand([b], device=x.device) * ids_str_max).to(dtype=torch.long)
    ret = slice_segments(x, ids_str, segment_size)
    return ret, ids_str
63
 
compress_model.py ADDED
@@ -0,0 +1,89 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from collections import OrderedDict
2
+ from text.symbols import symbols
3
+ import torch
4
+
5
+ from tools.log import logger
6
+ import utils
7
+ from models import SynthesizerTrn
8
+ import os
9
+
10
+
11
def copyStateDict(state_dict):
    """Return a copy of `state_dict` with any leading "module." prefix stripped.

    Checkpoints saved from DataParallel/DDP-wrapped models prefix every key
    with "module."; this normalizes such keys so they load into a bare model.
    Keys without the prefix are returned unchanged.
    """
    if list(state_dict.keys())[0].startswith("module"):
        start_idx = 1
    else:
        start_idx = 0
    new_state_dict = OrderedDict()
    for k, v in state_dict.items():
        # BUGFIX: rejoin with "." — the original ",".join rewrote dotted keys
        # like "enc_p.emb.weight" into "enc_p,emb,weight", corrupting them.
        name = ".".join(k.split(".")[start_idx:])
        new_state_dict[name] = v
    return new_state_dict
21
+
22
+
23
def removeOptimizer(config: str, input_model: str, ishalf: bool, output_model: str):
    """Write a slimmed release checkpoint: drop enc_q weights and optimizer state.

    config:       path to the hparams JSON used to rebuild the generator.
    input_model:  source checkpoint path.
    ishalf:       cast the kept weights to fp16 when True.
    output_model: destination checkpoint path.
    """
    hps = utils.get_hparams_from_file(config)

    net_g = SynthesizerTrn(
        len(symbols),
        hps.data.filter_length // 2 + 1,
        hps.train.segment_size // hps.data.hop_length,
        n_speakers=hps.data.n_speakers,
        **hps.model,
    )

    # A fresh AdamW state dict is saved so the output keeps the expected layout.
    optim_g = torch.optim.AdamW(
        net_g.parameters(),
        hps.train.learning_rate,
        betas=hps.train.betas,
        eps=hps.train.eps,
    )

    state_dict_g = torch.load(input_model, map_location="cpu")
    new_dict_g = copyStateDict(state_dict_g)

    # The posterior encoder (enc_q) is only needed during training.
    kept_keys = [k for k in new_dict_g["model"] if "enc_q" not in k]

    new_dict_g = {
        k: (new_dict_g["model"][k].half() if ishalf else new_dict_g["model"][k])
        for k in kept_keys
    }

    torch.save(
        {
            "model": new_dict_g,
            "iteration": 0,
            "optimizer": optim_g.state_dict(),
            "learning_rate": 0.0001,
        },
        output_model,
    )
64
+
65
+
66
+ if __name__ == "__main__":
67
+ import argparse
68
+
69
+ parser = argparse.ArgumentParser()
70
+ parser.add_argument("-c", "--config", type=str, default="configs/config.json")
71
+ parser.add_argument("-i", "--input", type=str)
72
+ parser.add_argument("-o", "--output", type=str, default=None)
73
+ parser.add_argument(
74
+ "-hf", "--half", action="store_true", default=False, help="Save as FP16"
75
+ )
76
+
77
+ args = parser.parse_args()
78
+
79
+ output = args.output
80
+
81
+ if output is None:
82
+ import os.path
83
+
84
+ filename, ext = os.path.splitext(args.input)
85
+ half = "_half" if args.half else ""
86
+ output = filename + "_release" + half + ext
87
+
88
+ removeOptimizer(args.config, args.input, args.half, output)
89
+ logger.info(f"压缩模型成功, 输出模型: {os.path.abspath(output)}")
config.py ADDED
@@ -0,0 +1,248 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ @Desc: 全局配置文件读取
3
+ """
4
+ import argparse
5
+ import yaml
6
+ from typing import Dict, List
7
+ import os
8
+ import shutil
9
+ import sys
10
+
11
+
12
class Resample_config:
    """Settings for the audio resampling step."""

    def __init__(self, in_dir: str, out_dir: str, sampling_rate: int = 44100):
        self.sampling_rate: int = sampling_rate  # target sample rate
        self.in_dir: str = in_dir  # directory of source audio
        self.out_dir: str = out_dir  # directory for resampled output

    @classmethod
    def from_dict(cls, dataset_path: str, data: Dict[str, any]):
        """Build an instance; both directories are resolved under dataset_path."""
        # Path validity is deliberately not checked here; resample.py does that.
        data["in_dir"] = os.path.join(dataset_path, data["in_dir"])
        data["out_dir"] = os.path.join(dataset_path, data["out_dir"])
        return cls(**data)
29
+
30
+
31
class Preprocess_text_config:
    """Settings for the text preprocessing step."""

    def __init__(
        self,
        transcription_path: str,
        cleaned_path: str,
        train_path: str,
        val_path: str,
        config_path: str,
        val_per_lang: int = 5,
        max_val_total: int = 10000,
        clean: bool = True,
    ):
        # Raw transcription file; each line is {wav_path}|{speaker}|{language}|{text}.
        self.transcription_path: str = transcription_path
        self.cleaned_path: str = cleaned_path  # cleaned-text output (optional)
        self.train_path: str = train_path  # training filelist output
        self.val_path: str = val_path  # validation filelist output
        self.config_path: str = config_path  # model config path
        self.val_per_lang: int = val_per_lang  # validation lines kept per speaker
        self.max_val_total: int = max_val_total  # cap on total validation lines
        self.clean: bool = clean  # whether to run text cleaning

    @classmethod
    def from_dict(cls, dataset_path: str, data: Dict[str, any]):
        """Build an instance, resolving every path relative to dataset_path."""
        data["transcription_path"] = os.path.join(
            dataset_path, data["transcription_path"]
        )
        # Empty / missing cleaned_path means "derive it next to the source file".
        if data["cleaned_path"] == "" or data["cleaned_path"] is None:
            data["cleaned_path"] = None
        else:
            data["cleaned_path"] = os.path.join(dataset_path, data["cleaned_path"])
        data["train_path"] = os.path.join(dataset_path, data["train_path"])
        data["val_path"] = os.path.join(dataset_path, data["val_path"])
        data["config_path"] = os.path.join(dataset_path, data["config_path"])
        return cls(**data)
70
+
71
+
72
class Bert_gen_config:
    """Settings for BERT feature generation (bert_gen)."""

    def __init__(
        self,
        config_path: str,
        num_processes: int = 2,
        device: str = "cuda",
        use_multi_device: bool = False,
    ):
        self.config_path = config_path  # hparams file for the generation run
        self.num_processes = num_processes  # worker process count
        self.device = device  # default compute device
        self.use_multi_device = use_multi_device  # spread workers over GPUs

    @classmethod
    def from_dict(cls, dataset_path: str, data: Dict[str, any]):
        """Build an instance, resolving config_path relative to dataset_path."""
        data["config_path"] = os.path.join(dataset_path, data["config_path"])

        return cls(**data)
92
+
93
+
94
class Emo_gen_config:
    """Settings for emotion/CLAP feature generation (emo_gen)."""

    def __init__(
        self,
        config_path: str,
        num_processes: int = 2,
        device: str = "cuda",
        use_multi_device: bool = False,
    ):
        self.config_path = config_path  # hparams file for the generation run
        self.num_processes = num_processes  # worker process count
        self.device = device  # default compute device
        self.use_multi_device = use_multi_device  # spread workers over GPUs

    @classmethod
    def from_dict(cls, dataset_path: str, data: Dict[str, any]):
        """Build an instance, resolving config_path relative to dataset_path."""
        data["config_path"] = os.path.join(dataset_path, data["config_path"])

        return cls(**data)
114
+
115
+
116
class Train_ms_config:
    """Settings for multi-speaker training (train_ms)."""

    def __init__(
        self,
        config_path: str,
        env: Dict[str, any],
        base: Dict[str, any],
        model: str,
        num_workers: int,
        spec_cache: bool,
        keep_ckpts: int,
    ):
        self.env = env  # environment variables to export for the run
        self.base = base  # base-model (pretrain) settings
        # Checkpoint directory, relative to dataset_path rather than repo root.
        self.model = model
        self.config_path = config_path  # hparams file path
        self.num_workers = num_workers  # dataloader worker count
        self.spec_cache = spec_cache  # cache spectrograms between epochs
        self.keep_ckpts = keep_ckpts  # number of checkpoints to retain

    @classmethod
    def from_dict(cls, dataset_path: str, data: Dict[str, any]):
        """Build an instance; only config_path is resolved under dataset_path."""
        # data["model"] = os.path.join(dataset_path, data["model"])
        data["config_path"] = os.path.join(dataset_path, data["config_path"])

        return cls(**data)
143
+
144
+
145
class Webui_config:
    """Settings for the web UI.

    NOTE(review): the original inline comments were shuffled across the wrong
    attributes (e.g. "port" annotated on `model`); they are corrected here.
    """

    def __init__(
        self,
        device: str,
        model: str,
        config_path: str,
        language_identification_library: str,
        port: int = 7860,
        share: bool = False,
        debug: bool = False,
    ):
        self.device: str = device  # inference device
        self.model: str = model  # model checkpoint path
        self.config_path: str = config_path  # model config file path
        self.port: int = port  # HTTP port to serve on
        self.share: bool = share  # expose a public share link
        self.debug: bool = debug  # enable debug mode
        self.language_identification_library: str = (
            language_identification_library  # language-identification backend
        )

    @classmethod
    def from_dict(cls, dataset_path: str, data: Dict[str, any]):
        """Build an instance, resolving model and config paths under dataset_path."""
        data["config_path"] = os.path.join(dataset_path, data["config_path"])
        data["model"] = os.path.join(dataset_path, data["model"])
        return cls(**data)
173
+
174
+
175
class Server_config:
    """Settings for the inference API server."""

    def __init__(
        self, models: List[Dict[str, any]], port: int = 5000, device: str = "cuda"
    ):
        self.models: List[Dict[str, any]] = models  # configs of models to load
        self.port: int = port  # port to listen on
        self.device: str = device  # default device for loaded models

    @classmethod
    def from_dict(cls, data: Dict[str, any]):
        """Build an instance directly from the raw YAML mapping."""
        return cls(**data)
186
+
187
+
188
class Translate_config:
    """Credentials for the translation API."""

    def __init__(self, app_key: str, secret_key: str):
        self.app_key = app_key  # API application key
        self.secret_key = secret_key  # API secret key

    @classmethod
    def from_dict(cls, data: Dict[str, any]):
        """Build an instance directly from the raw YAML mapping."""
        return cls(**data)
198
+
199
+
200
class Config:
    """Top-level configuration loaded from a YAML file.

    If the file is missing, default_config.yml is copied into place and the
    process exits so the user can fill it in before rerunning.
    """

    def __init__(self, config_path: str):
        if not os.path.isfile(config_path) and os.path.isfile("default_config.yml"):
            shutil.copy(src="default_config.yml", dst=config_path)
            print(
                f"已根据默认配置文件default_config.yml生成配置文件{config_path}。请按该配置文件的说明进行配置后重新运行。"
            )
            print("如无特殊需求,请勿修改default_config.yml或备份该文件。")
            sys.exit(0)
        with open(file=config_path, mode="r", encoding="utf-8") as file:
            yaml_config: Dict[str, any] = yaml.safe_load(file.read())
        dataset_path: str = yaml_config["dataset_path"]
        self.dataset_path: str = dataset_path
        self.mirror: str = yaml_config["mirror"]
        self.openi_token: str = yaml_config["openi_token"]
        # Each section below is parsed by its own config class; path-like
        # fields are resolved relative to dataset_path inside from_dict.
        self.resample_config: Resample_config = Resample_config.from_dict(
            dataset_path, yaml_config["resample"]
        )
        self.preprocess_text_config: Preprocess_text_config = (
            Preprocess_text_config.from_dict(dataset_path, yaml_config["preprocess_text"])
        )
        self.bert_gen_config: Bert_gen_config = Bert_gen_config.from_dict(
            dataset_path, yaml_config["bert_gen"]
        )
        self.emo_gen_config: Emo_gen_config = Emo_gen_config.from_dict(
            dataset_path, yaml_config["emo_gen"]
        )
        self.train_ms_config: Train_ms_config = Train_ms_config.from_dict(
            dataset_path, yaml_config["train_ms"]
        )
        self.webui_config: Webui_config = Webui_config.from_dict(
            dataset_path, yaml_config["webui"]
        )
        self.server_config: Server_config = Server_config.from_dict(
            yaml_config["server"]
        )
        self.translate_config: Translate_config = Translate_config.from_dict(
            yaml_config["translate"]
        )
242
+
243
+
244
# Module-level singleton: parse the YAML path and load the configuration once.
parser = argparse.ArgumentParser()
# Renamed ("-y/--yml_config") to avoid clashing with the legacy config.json flag.
parser.add_argument("-y", "--yml_config", type=str, default="config.yml")
args, _ = parser.parse_known_args()
config = Config(args.yml_config)
configs/config.json CHANGED
@@ -2,23 +2,26 @@
2
  "train": {
3
  "log_interval": 200,
4
  "eval_interval": 1000,
5
- "seed": 52,
6
- "epochs": 10000,
7
- "learning_rate": 0.0003,
8
  "betas": [
9
  0.8,
10
  0.99
11
  ],
12
  "eps": 1e-09,
13
- "batch_size": 8,
14
  "fp16_run": false,
15
- "lr_decay": 0.999875,
16
  "segment_size": 16384,
17
  "init_lr_ratio": 1,
18
  "warmup_epochs": 0,
19
  "c_mel": 45,
20
  "c_kl": 1.0,
21
- "skip_optimizer": true
 
 
 
22
  },
23
  "data": {
24
  "training_files": "filelists/train.list",
@@ -32,10 +35,864 @@
32
  "mel_fmin": 0.0,
33
  "mel_fmax": null,
34
  "add_blank": true,
35
- "n_speakers": 256,
36
  "cleaned_text": true,
37
  "spk2id": {
38
- "hanser": 0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
39
  }
40
  },
41
  "model": {
@@ -91,5 +948,6 @@
91
  "n_layers_q": 3,
92
  "use_spectral_norm": false,
93
  "gin_channels": 256
94
- }
95
- }
 
 
2
  "train": {
3
  "log_interval": 200,
4
  "eval_interval": 1000,
5
+ "seed": 42,
6
+ "epochs": 1000,
7
+ "learning_rate": 0.0002,
8
  "betas": [
9
  0.8,
10
  0.99
11
  ],
12
  "eps": 1e-09,
13
+ "batch_size": 12,
14
  "fp16_run": false,
15
+ "lr_decay": 0.99995,
16
  "segment_size": 16384,
17
  "init_lr_ratio": 1,
18
  "warmup_epochs": 0,
19
  "c_mel": 45,
20
  "c_kl": 1.0,
21
+ "skip_optimizer": true,
22
+ "freeze_ZH_bert": false,
23
+ "freeze_JP_bert": false,
24
+ "freeze_EN_bert": false
25
  },
26
  "data": {
27
  "training_files": "filelists/train.list",
 
35
  "mel_fmin": 0.0,
36
  "mel_fmax": null,
37
  "add_blank": true,
38
+ "n_speakers": 896,
39
  "cleaned_text": true,
40
  "spk2id": {
41
+ "派蒙_ZH": 0,
42
+ "纳西妲_ZH": 1,
43
+ "凯亚_ZH": 2,
44
+ "阿贝多_ZH": 3,
45
+ "温迪_ZH": 4,
46
+ "枫原万叶_ZH": 5,
47
+ "钟离_ZH": 6,
48
+ "荒泷一斗_ZH": 7,
49
+ "八重神子_ZH": 8,
50
+ "艾尔海森_ZH": 9,
51
+ "提纳里_ZH": 10,
52
+ "迪希雅_ZH": 11,
53
+ "卡维_ZH": 12,
54
+ "宵宫_ZH": 13,
55
+ "那维莱特_ZH": 14,
56
+ "莱依拉_ZH": 15,
57
+ "赛诺_ZH": 16,
58
+ "莫娜_ZH": 17,
59
+ "诺艾尔_ZH": 18,
60
+ "托马_ZH": 19,
61
+ "凝光_ZH": 20,
62
+ "林尼_ZH": 21,
63
+ "北斗_ZH": 22,
64
+ "柯莱_ZH": 23,
65
+ "神里绫华_ZH": 24,
66
+ "可莉_ZH": 25,
67
+ "芭芭拉_ZH": 26,
68
+ "雷电将军_ZH": 27,
69
+ "娜维娅_ZH": 28,
70
+ "芙宁娜_ZH": 29,
71
+ "珊瑚宫心海_ZH": 30,
72
+ "鹿野院平藏_ZH": 31,
73
+ "迪奥娜_ZH": 32,
74
+ "琴_ZH": 33,
75
+ "五郎_ZH": 34,
76
+ "班尼特_ZH": 35,
77
+ "达达利亚_ZH": 36,
78
+ "安柏_ZH": 37,
79
+ "莱欧斯利_ZH": 38,
80
+ "夜兰_ZH": 39,
81
+ "妮露_ZH": 40,
82
+ "辛焱_ZH": 41,
83
+ "丽莎_ZH": 42,
84
+ "珐露珊_ZH": 43,
85
+ "魈_ZH": 44,
86
+ "香菱_ZH": 45,
87
+ "迪卢克_ZH": 46,
88
+ "砂糖_ZH": 47,
89
+ "烟绯_ZH": 48,
90
+ "早柚_ZH": 49,
91
+ "云堇_ZH": 50,
92
+ "刻晴_ZH": 51,
93
+ "重云_ZH": 52,
94
+ "优菈_ZH": 53,
95
+ "胡桃_ZH": 54,
96
+ "流浪者_ZH": 55,
97
+ "久岐忍_ZH": 56,
98
+ "神里绫人_ZH": 57,
99
+ "甘雨_ZH": 58,
100
+ "戴因斯雷布_ZH": 59,
101
+ "菲谢尔_ZH": 60,
102
+ "白术_ZH": 61,
103
+ "行秋_ZH": 62,
104
+ "九条裟罗_ZH": 63,
105
+ "夏洛蒂_ZH": 64,
106
+ "雷泽_ZH": 65,
107
+ "申鹤_ZH": 66,
108
+ "荧_ZH": 67,
109
+ "空_ZH": 68,
110
+ "迪娜泽黛_ZH": 69,
111
+ "凯瑟琳_ZH": 70,
112
+ "多莉_ZH": 71,
113
+ "坎蒂丝_ZH": 72,
114
+ "琳妮特_ZH": 73,
115
+ "萍姥姥_ZH": 74,
116
+ "罗莎莉亚_ZH": 75,
117
+ "埃德_ZH": 76,
118
+ "爱贝尔_ZH": 77,
119
+ "伊迪娅_ZH": 78,
120
+ "留云借风真君_ZH": 79,
121
+ "绮良良_ZH": 80,
122
+ "七七_ZH": 81,
123
+ "式大将_ZH": 82,
124
+ "瑶瑶_ZH": 83,
125
+ "奥兹_ZH": 84,
126
+ "菲米尼_ZH": 85,
127
+ "米卡_ZH": 86,
128
+ "哲平_ZH": 87,
129
+ "大肉丸_ZH": 88,
130
+ "托克_ZH": 89,
131
+ "蒂玛乌斯_ZH": 90,
132
+ "昆钧_ZH": 91,
133
+ "欧菲妮_ZH": 92,
134
+ "塞琉斯_ZH": 93,
135
+ "仆人_ZH": 94,
136
+ "迈勒斯_ZH": 95,
137
+ "希格雯_ZH": 96,
138
+ "阿守_ZH": 97,
139
+ "拉赫曼_ZH": 98,
140
+ "杜拉夫_ZH": 99,
141
+ "伊利亚斯_ZH": 100,
142
+ "阿晃_ZH": 101,
143
+ "旁白_ZH": 102,
144
+ "爱德琳_ZH": 103,
145
+ "埃洛伊_ZH": 104,
146
+ "德沃沙克_ZH": 105,
147
+ "玛乔丽_ZH": 106,
148
+ "塞塔蕾_ZH": 107,
149
+ "柊千里_ZH": 108,
150
+ "海芭夏_ZH": 109,
151
+ "九条镰治_ZH": 110,
152
+ "阿娜耶_ZH": 111,
153
+ "笼钓瓶一心_ZH": 112,
154
+ "回声海螺_ZH": 113,
155
+ "劳维克_ZH": 114,
156
+ "元太_ZH": 115,
157
+ "阿扎尔_ZH": 116,
158
+ "查尔斯_ZH": 117,
159
+ "阿洛瓦_ZH": 118,
160
+ "埃勒曼_ZH": 119,
161
+ "纳比尔_ZH": 120,
162
+ "莎拉_ZH": 121,
163
+ "康纳_ZH": 122,
164
+ "博来_ZH": 123,
165
+ "玛塞勒_ZH": 124,
166
+ "阿祇_ZH": 125,
167
+ "博士_ZH": 126,
168
+ "玛格丽特_ZH": 127,
169
+ "迪尔菲_ZH": 128,
170
+ "宛烟_ZH": 129,
171
+ "羽生田千鹤_ZH": 130,
172
+ "海妮耶_ZH": 131,
173
+ "旅行者_ZH": 132,
174
+ "霍夫曼_ZH": 133,
175
+ "佐西摩斯_ZH": 134,
176
+ "鹿野奈奈_ZH": 135,
177
+ "舒伯特_ZH": 136,
178
+ "天叔_ZH": 137,
179
+ "艾莉丝_ZH": 138,
180
+ "龙二_ZH": 139,
181
+ "莺儿_ZH": 140,
182
+ "嘉良_ZH": 141,
183
+ "一心传名刀_ZH": 142,
184
+ "费迪南德_ZH": 143,
185
+ "珊瑚_ZH": 144,
186
+ "言笑_ZH": 145,
187
+ "久利须_ZH": 146,
188
+ "嘉玛_ZH": 147,
189
+ "艾文_ZH": 148,
190
+ "克洛琳德_ZH": 149,
191
+ "丹吉尔_ZH": 150,
192
+ "女士_ZH": 151,
193
+ "白老先生_ZH": 152,
194
+ "天目十五_ZH": 153,
195
+ "老孟_ZH": 154,
196
+ "巴达维_ZH": 155,
197
+ "长生_ZH": 156,
198
+ "吴船长_ZH": 157,
199
+ "拉齐_ZH": 158,
200
+ "艾伯特_ZH": 159,
201
+ "松浦_ZH": 160,
202
+ "埃泽_ZH": 161,
203
+ "阿圆_ZH": 162,
204
+ "莫塞伊思_ZH": 163,
205
+ "阿拉夫_ZH": 164,
206
+ "杜吉耶_ZH": 165,
207
+ "石头_ZH": 166,
208
+ "百闻_ZH": 167,
209
+ "波洛_ZH": 168,
210
+ "斯坦利_ZH": 169,
211
+ "博易_ZH": 170,
212
+ "迈蒙_ZH": 171,
213
+ "掇星攫辰天君_ZH": 172,
214
+ "毗伽尔_ZH": 173,
215
+ "芙卡洛斯_ZH": 174,
216
+ "恶龙_ZH": 175,
217
+ "恕筠_ZH": 176,
218
+ "知易_ZH": 177,
219
+ "克列门特_ZH": 178,
220
+ "大慈树王_ZH": 179,
221
+ "西拉杰_ZH": 180,
222
+ "上杉_ZH": 181,
223
+ "阿尔卡米_ZH": 182,
224
+ "纯水精灵_ZH": 183,
225
+ "常九爷_ZH": 184,
226
+ "沙扎曼_ZH": 185,
227
+ "田铁嘴_ZH": 186,
228
+ "克罗索_ZH": 187,
229
+ "阿巴图伊_ZH": 188,
230
+ "悦_ZH": 189,
231
+ "阿佩普_ZH": 190,
232
+ "埃尔欣根_ZH": 191,
233
+ "萨赫哈蒂_ZH": 192,
234
+ "塔杰·拉德卡尼_ZH": 193,
235
+ "安西_ZH": 194,
236
+ "埃舍尔_ZH": 195,
237
+ "萨齐因_ZH": 196,
238
+ "派蒙_JP": 197,
239
+ "纳西妲_JP": 198,
240
+ "凯亚_JP": 199,
241
+ "阿贝多_JP": 200,
242
+ "温迪_JP": 201,
243
+ "枫原万叶_JP": 202,
244
+ "钟离_JP": 203,
245
+ "荒泷一斗_JP": 204,
246
+ "八重神子_JP": 205,
247
+ "艾尔海森_JP": 206,
248
+ "提纳里_JP": 207,
249
+ "迪希雅_JP": 208,
250
+ "卡维_JP": 209,
251
+ "宵宫_JP": 210,
252
+ "那维莱特_JP": 211,
253
+ "莱依拉_JP": 212,
254
+ "赛诺_JP": 213,
255
+ "莫娜_JP": 214,
256
+ "诺艾尔_JP": 215,
257
+ "托马_JP": 216,
258
+ "凝光_JP": 217,
259
+ "林尼_JP": 218,
260
+ "北斗_JP": 219,
261
+ "柯莱_JP": 220,
262
+ "神里绫华_JP": 221,
263
+ "可莉_JP": 222,
264
+ "芭芭拉_JP": 223,
265
+ "雷电将军_JP": 224,
266
+ "娜维娅_JP": 225,
267
+ "芙宁娜_JP": 226,
268
+ "珊瑚宫心海_JP": 227,
269
+ "鹿野院平藏_JP": 228,
270
+ "迪奥娜_JP": 229,
271
+ "琴_JP": 230,
272
+ "五郎_JP": 231,
273
+ "班尼特_JP": 232,
274
+ "达达利亚_JP": 233,
275
+ "安柏_JP": 234,
276
+ "莱欧斯利_JP": 235,
277
+ "夜兰_JP": 236,
278
+ "妮露_JP": 237,
279
+ "辛焱_JP": 238,
280
+ "丽莎_JP": 239,
281
+ "珐露珊_JP": 240,
282
+ "魈_JP": 241,
283
+ "香菱_JP": 242,
284
+ "迪卢克_JP": 243,
285
+ "砂糖_JP": 244,
286
+ "烟绯_JP": 245,
287
+ "早柚_JP": 246,
288
+ "云堇_JP": 247,
289
+ "刻晴_JP": 248,
290
+ "重云_JP": 249,
291
+ "优菈_JP": 250,
292
+ "胡桃_JP": 251,
293
+ "流浪者_JP": 252,
294
+ "久岐忍_JP": 253,
295
+ "神里绫人_JP": 254,
296
+ "甘雨_JP": 255,
297
+ "戴因斯雷布_JP": 256,
298
+ "菲谢尔_JP": 257,
299
+ "白术_JP": 258,
300
+ "行秋_JP": 259,
301
+ "九条裟罗_JP": 260,
302
+ "夏洛蒂_JP": 261,
303
+ "雷泽_JP": 262,
304
+ "申鹤_JP": 263,
305
+ "空_JP": 264,
306
+ "荧_JP": 265,
307
+ "迪娜泽黛_JP": 266,
308
+ "凯瑟琳_JP": 267,
309
+ "多莉_JP": 268,
310
+ "坎蒂丝_JP": 269,
311
+ "琳妮特_JP": 270,
312
+ "萍姥姥_JP": 271,
313
+ "罗莎莉亚_JP": 272,
314
+ "埃德_JP": 273,
315
+ "爱贝尔_JP": 274,
316
+ "伊迪娅_JP": 275,
317
+ "留云借风真君_JP": 276,
318
+ "绮良良_JP": 277,
319
+ "七七_JP": 278,
320
+ "式大将_JP": 279,
321
+ "瑶瑶_JP": 280,
322
+ "奥兹_JP": 281,
323
+ "菲米尼_JP": 282,
324
+ "米卡_JP": 283,
325
+ "哲平_JP": 284,
326
+ "大肉丸_JP": 285,
327
+ "托克_JP": 286,
328
+ "蒂玛乌斯_JP": 287,
329
+ "昆钧_JP": 288,
330
+ "欧菲妮_JP": 289,
331
+ "塞琉斯_JP": 290,
332
+ "仆人_JP": 291,
333
+ "迈勒斯_JP": 292,
334
+ "希格雯_JP": 293,
335
+ "阿守_JP": 294,
336
+ "拉赫曼_JP": 295,
337
+ "杜拉夫_JP": 296,
338
+ "伊利亚斯_JP": 297,
339
+ "阿晃_JP": 298,
340
+ "旁白_JP": 299,
341
+ "爱德琳_JP": 300,
342
+ "埃洛伊_JP": 301,
343
+ "德沃沙克_JP": 302,
344
+ "玛乔丽_JP": 303,
345
+ "塞塔蕾_JP": 304,
346
+ "柊千里_JP": 305,
347
+ "海芭夏_JP": 306,
348
+ "九条镰治_JP": 307,
349
+ "阿娜耶_JP": 308,
350
+ "笼钓瓶一心_JP": 309,
351
+ "回声海螺_JP": 310,
352
+ "劳维克_JP": 311,
353
+ "元太_JP": 312,
354
+ "阿扎尔_JP": 313,
355
+ "查尔斯_JP": 314,
356
+ "阿洛瓦_JP": 315,
357
+ "埃勒曼_JP": 316,
358
+ "纳比尔_JP": 317,
359
+ "莎拉_JP": 318,
360
+ "康纳_JP": 319,
361
+ "博来_JP": 320,
362
+ "玛塞勒_JP": 321,
363
+ "阿祇_JP": 322,
364
+ "博士_JP": 323,
365
+ "迪尔菲_JP": 324,
366
+ "玛格丽特_JP": 325,
367
+ "宛烟_JP": 326,
368
+ "羽生田千鹤_JP": 327,
369
+ "海妮耶_JP": 328,
370
+ "霍夫曼_JP": 329,
371
+ "旅行者_JP": 330,
372
+ "佐西摩斯_JP": 331,
373
+ "舒伯特_JP": 332,
374
+ "鹿野奈奈_JP": 333,
375
+ "天叔_JP": 334,
376
+ "龙二_JP": 335,
377
+ "艾莉丝_JP": 336,
378
+ "莺儿_JP": 337,
379
+ "嘉良_JP": 338,
380
+ "珊瑚_JP": 339,
381
+ "言笑_JP": 340,
382
+ "一心传名刀_JP": 341,
383
+ "费迪南德_JP": 342,
384
+ "久利须_JP": 343,
385
+ "嘉玛_JP": 344,
386
+ "艾文_JP": 345,
387
+ "克洛琳德_JP": 346,
388
+ "丹吉尔_JP": 347,
389
+ "天目十五_JP": 348,
390
+ "女士_JP": 349,
391
+ "老孟_JP": 350,
392
+ "白老先生_JP": 351,
393
+ "舍利夫_JP": 352,
394
+ "巴达维_JP": 353,
395
+ "拉齐_JP": 354,
396
+ "长生_JP": 355,
397
+ "吴船长_JP": 356,
398
+ "艾伯特_JP": 357,
399
+ "松浦_JP": 358,
400
+ "埃泽_JP": 359,
401
+ "阿圆_JP": 360,
402
+ "阿拉夫_JP": 361,
403
+ "莫塞伊思_JP": 362,
404
+ "石头_JP": 363,
405
+ "百闻_JP": 364,
406
+ "杜吉耶_JP": 365,
407
+ "波洛_JP": 366,
408
+ "掇星攫辰天君_JP": 367,
409
+ "迈蒙_JP": 368,
410
+ "博易_JP": 369,
411
+ "诗筠_JP": 370,
412
+ "斯坦利_JP": 371,
413
+ "毗伽尔_JP": 372,
414
+ "芙卡洛斯_JP": 373,
415
+ "恶龙_JP": 374,
416
+ "小仓澪_JP": 375,
417
+ "恕筠_JP": 376,
418
+ "知易_JP": 377,
419
+ "克列门特_JP": 378,
420
+ "大慈树王_JP": 379,
421
+ "望雅_JP": 380,
422
+ "黑田_JP": 381,
423
+ "卡莉娜_JP": 382,
424
+ "马姆杜_JP": 383,
425
+ "科林斯_JP": 384,
426
+ "上杉_JP": 385,
427
+ "西拉杰_JP": 386,
428
+ "菲尔戈黛特_JP": 387,
429
+ "一平_JP": 388,
430
+ "纯水精灵_JP": 389,
431
+ "阿尔卡米_JP": 390,
432
+ "老戴_JP": 391,
433
+ "谢赫祖拜尔_JP": 392,
434
+ "沙扎曼_JP": 393,
435
+ "田铁嘴_JP": 394,
436
+ "小野寺_JP": 395,
437
+ "百识_JP": 396,
438
+ "克罗索_JP": 397,
439
+ "莱斯格_JP": 398,
440
+ "芷巧_JP": 399,
441
+ "加藤洋平_JP": 400,
442
+ "阿巴图伊_JP": 401,
443
+ "埃尔欣根_JP": 402,
444
+ "斯嘉莉_JP": 403,
445
+ "阿佩普_JP": 404,
446
+ "巫女_JP": 405,
447
+ "卡布斯_JP": 406,
448
+ "洛伦佐_JP": 407,
449
+ "萨赫哈蒂_JP": 408,
450
+ "娜德瓦_JP": 409,
451
+ "塞德娜_JP": 410,
452
+ "塔杰·拉德卡尼_JP": 411,
453
+ "绘星_JP": 412,
454
+ "泽田_JP": 413,
455
+ "安西_JP": 414,
456
+ "拉伊德_JP": 415,
457
+ "亚卡巴_JP": 416,
458
+ "有乐斋_JP": 417,
459
+ "莱昂_JP": 418,
460
+ "尤苏波夫_JP": 419,
461
+ "夏妮_JP": 420,
462
+ "埃舍尔_JP": 421,
463
+ "萨齐因_JP": 422,
464
+ "古山_JP": 423,
465
+ "自称渊上之物_JP": 424,
466
+ "丹羽_JP": 425,
467
+ "塞萨尔的日记_JP": 426,
468
+ "派蒙_EN": 427,
469
+ "纳西妲_EN": 428,
470
+ "凯亚_EN": 429,
471
+ "阿贝多_EN": 430,
472
+ "温迪_EN": 431,
473
+ "枫原万叶_EN": 432,
474
+ "钟离_EN": 433,
475
+ "荒泷一斗_EN": 434,
476
+ "八重神子_EN": 435,
477
+ "艾尔海森_EN": 436,
478
+ "提纳里_EN": 437,
479
+ "迪希雅_EN": 438,
480
+ "卡维_EN": 439,
481
+ "宵宫_EN": 440,
482
+ "莱依拉_EN": 441,
483
+ "那维莱特_EN": 442,
484
+ "赛诺_EN": 443,
485
+ "莫娜_EN": 444,
486
+ "诺艾尔_EN": 445,
487
+ "托马_EN": 446,
488
+ "凝光_EN": 447,
489
+ "林尼_EN": 448,
490
+ "北斗_EN": 449,
491
+ "柯莱_EN": 450,
492
+ "神里绫华_EN": 451,
493
+ "可莉_EN": 452,
494
+ "芭芭拉_EN": 453,
495
+ "雷电将军_EN": 454,
496
+ "娜维娅_EN": 455,
497
+ "芙宁娜_EN": 456,
498
+ "珊瑚宫心海_EN": 457,
499
+ "鹿野院平藏_EN": 458,
500
+ "迪奥娜_EN": 459,
501
+ "五郎_EN": 460,
502
+ "琴_EN": 461,
503
+ "班尼特_EN": 462,
504
+ "达达利亚_EN": 463,
505
+ "安柏_EN": 464,
506
+ "莱欧斯利_EN": 465,
507
+ "夜兰_EN": 466,
508
+ "妮露_EN": 467,
509
+ "辛焱_EN": 468,
510
+ "珐露珊_EN": 469,
511
+ "丽莎_EN": 470,
512
+ "魈_EN": 471,
513
+ "香菱_EN": 472,
514
+ "迪卢克_EN": 473,
515
+ "砂糖_EN": 474,
516
+ "烟绯_EN": 475,
517
+ "早柚_EN": 476,
518
+ "云堇_EN": 477,
519
+ "刻晴_EN": 478,
520
+ "重云_EN": 479,
521
+ "优菈_EN": 480,
522
+ "胡桃_EN": 481,
523
+ "流浪者_EN": 482,
524
+ "久岐忍_EN": 483,
525
+ "神里绫人_EN": 484,
526
+ "甘雨_EN": 485,
527
+ "戴因斯雷布_EN": 486,
528
+ "菲谢尔_EN": 487,
529
+ "白术_EN": 488,
530
+ "行秋_EN": 489,
531
+ "九条裟罗_EN": 490,
532
+ "夏洛蒂_EN": 491,
533
+ "雷泽_EN": 492,
534
+ "申鹤_EN": 493,
535
+ "荧_EN": 494,
536
+ "空_EN": 495,
537
+ "迪娜泽黛_EN": 496,
538
+ "凯瑟琳_EN": 497,
539
+ "多莉_EN": 498,
540
+ "坎蒂丝_EN": 499,
541
+ "琳妮特_EN": 500,
542
+ "萍姥姥_EN": 501,
543
+ "罗莎莉亚_EN": 502,
544
+ "埃德_EN": 503,
545
+ "爱贝尔_EN": 504,
546
+ "伊迪娅_EN": 505,
547
+ "留云借风真君_EN": 506,
548
+ "绮良良_EN": 507,
549
+ "七七_EN": 508,
550
+ "式大将_EN": 509,
551
+ "瑶瑶_EN": 510,
552
+ "奥兹_EN": 511,
553
+ "菲米尼_EN": 512,
554
+ "米卡_EN": 513,
555
+ "哲平_EN": 514,
556
+ "大肉丸_EN": 515,
557
+ "托克_EN": 516,
558
+ "蒂玛乌斯_EN": 517,
559
+ "昆钧_EN": 518,
560
+ "欧菲妮_EN": 519,
561
+ "塞琉斯_EN": 520,
562
+ "仆人_EN": 521,
563
+ "迈勒斯_EN": 522,
564
+ "希格雯_EN": 523,
565
+ "阿守_EN": 524,
566
+ "拉赫曼_EN": 525,
567
+ "杜拉夫_EN": 526,
568
+ "伊利亚斯_EN": 527,
569
+ "阿晃_EN": 528,
570
+ "���白_EN": 529,
571
+ "爱德琳_EN": 530,
572
+ "埃洛伊_EN": 531,
573
+ "德沃沙克_EN": 532,
574
+ "玛乔丽_EN": 533,
575
+ "塞塔蕾_EN": 534,
576
+ "柊千里_EN": 535,
577
+ "海芭夏_EN": 536,
578
+ "九条镰治_EN": 537,
579
+ "阿娜耶_EN": 538,
580
+ "笼钓瓶一心_EN": 539,
581
+ "回声海螺_EN": 540,
582
+ "劳维克_EN": 541,
583
+ "元太_EN": 542,
584
+ "阿扎尔_EN": 543,
585
+ "查尔斯_EN": 544,
586
+ "阿洛瓦_EN": 545,
587
+ "埃勒曼_EN": 546,
588
+ "纳比尔_EN": 547,
589
+ "莎拉_EN": 548,
590
+ "康纳_EN": 549,
591
+ "博来_EN": 550,
592
+ "玛塞勒_EN": 551,
593
+ "阿祇_EN": 552,
594
+ "博士_EN": 553,
595
+ "迪尔菲_EN": 554,
596
+ "宛烟_EN": 555,
597
+ "玛格丽特_EN": 556,
598
+ "羽生田千鹤_EN": 557,
599
+ "海妮耶_EN": 558,
600
+ "霍夫曼_EN": 559,
601
+ "旅行者_EN": 560,
602
+ "佐西摩斯_EN": 561,
603
+ "鹿野奈奈_EN": 562,
604
+ "舒伯特_EN": 563,
605
+ "天叔_EN": 564,
606
+ "艾莉丝_EN": 565,
607
+ "龙二_EN": 566,
608
+ "莺儿_EN": 567,
609
+ "嘉良_EN": 568,
610
+ "珊瑚_EN": 569,
611
+ "费迪南德_EN": 570,
612
+ "言笑_EN": 571,
613
+ "一心传名刀_EN": 572,
614
+ "久利须_EN": 573,
615
+ "嘉玛_EN": 574,
616
+ "艾文_EN": 575,
617
+ "克洛琳德_EN": 576,
618
+ "丹吉尔_EN": 577,
619
+ "女士_EN": 578,
620
+ "天目十五_EN": 579,
621
+ "老孟_EN": 580,
622
+ "白老先生_EN": 581,
623
+ "舍利夫_EN": 582,
624
+ "巴达维_EN": 583,
625
+ "拉齐_EN": 584,
626
+ "长生_EN": 585,
627
+ "吴船长_EN": 586,
628
+ "艾伯特_EN": 587,
629
+ "松浦_EN": 588,
630
+ "埃泽_EN": 589,
631
+ "阿圆_EN": 590,
632
+ "阿拉夫_EN": 591,
633
+ "莫塞伊思_EN": 592,
634
+ "石头_EN": 593,
635
+ "百闻_EN": 594,
636
+ "杜吉耶_EN": 595,
637
+ "波洛_EN": 596,
638
+ "斯坦利_EN": 597,
639
+ "掇星攫辰天君_EN": 598,
640
+ "迈蒙_EN": 599,
641
+ "博易_EN": 600,
642
+ "诗筠_EN": 601,
643
+ "毗伽尔_EN": 602,
644
+ "慧心_EN": 603,
645
+ "芙卡洛斯_EN": 604,
646
+ "恶龙_EN": 605,
647
+ "小仓澪_EN": 606,
648
+ "恕筠_EN": 607,
649
+ "知易_EN": 608,
650
+ "克列门特_EN": 609,
651
+ "大慈树王_EN": 610,
652
+ "维多利亚_EN": 611,
653
+ "黑田_EN": 612,
654
+ "马姆杜_EN": 613,
655
+ "科林斯_EN": 614,
656
+ "上杉_EN": 615,
657
+ "西拉杰_EN": 616,
658
+ "宁禄_EN": 617,
659
+ "纯水精灵_EN": 618,
660
+ "常九爷_EN": 619,
661
+ "阿尔卡米_EN": 620,
662
+ "沙扎曼_EN": 621,
663
+ "田铁嘴_EN": 622,
664
+ "加萨尼_EN": 623,
665
+ "克罗索_EN": 624,
666
+ "星稀_EN": 625,
667
+ "莱斯格_EN": 626,
668
+ "阿巴图伊_EN": 627,
669
+ "悦_EN": 628,
670
+ "德田_EN": 629,
671
+ "埃尔欣根_EN": 630,
672
+ "阿佩普_EN": 631,
673
+ "萨赫哈蒂_EN": 632,
674
+ "洛伦佐_EN": 633,
675
+ "塔杰·拉德卡尼_EN": 634,
676
+ "泽田_EN": 635,
677
+ "安西_EN": 636,
678
+ "理水叠山真君_EN": 637,
679
+ "埃舍尔_EN": 638,
680
+ "萨齐因_EN": 639,
681
+ "古田_EN": 640,
682
+ "三月七_ZH": 641,
683
+ "丹恒_ZH": 642,
684
+ "希儿_ZH": 643,
685
+ "娜塔莎_ZH": 644,
686
+ "希露瓦_ZH": 645,
687
+ "瓦尔特_ZH": 646,
688
+ "佩拉_ZH": 647,
689
+ "布洛妮娅_ZH": 648,
690
+ "虎克_ZH": 649,
691
+ "素裳_ZH": 650,
692
+ "克拉拉_ZH": 651,
693
+ "符玄_ZH": 652,
694
+ "白露_ZH": 653,
695
+ "杰帕德_ZH": 654,
696
+ "景元_ZH": 655,
697
+ "藿藿_ZH": 656,
698
+ "姬子_ZH": 657,
699
+ "穹_ZH": 658,
700
+ "星_ZH": 659,
701
+ "卡芙卡_ZH": 660,
702
+ "桂乃芬_ZH": 661,
703
+ "艾丝妲_ZH": 662,
704
+ "玲可_ZH": 663,
705
+ "彦卿_ZH": 664,
706
+ "托帕_ZH": 665,
707
+ "驭空_ZH": 666,
708
+ "浮烟_ZH": 667,
709
+ "停云_ZH": 668,
710
+ "镜流_ZH": 669,
711
+ "罗刹_ZH": 670,
712
+ "卢卡_ZH": 671,
713
+ "史瓦罗_ZH": 672,
714
+ "黑塔_ZH": 673,
715
+ "桑博_ZH": 674,
716
+ "伦纳德_ZH": 675,
717
+ "明曦_ZH": 676,
718
+ "银狼_ZH": 677,
719
+ "帕姆_ZH": 678,
720
+ "青雀_ZH": 679,
721
+ "乔瓦尼_ZH": 680,
722
+ "公输师傅_ZH": 681,
723
+ "晴霓_ZH": 682,
724
+ "螺丝咕姆_ZH": 683,
725
+ "阿兰_ZH": 684,
726
+ "奥列格_ZH": 685,
727
+ "丹枢_ZH": 686,
728
+ "尾巴_ZH": 687,
729
+ "寒鸦_ZH": 688,
730
+ "雪衣_ZH": 689,
731
+ "可可利亚_ZH": 690,
732
+ "青镞_ZH": 691,
733
+ "半夏_ZH": 692,
734
+ "银枝_ZH": 693,
735
+ "大毫_ZH": 694,
736
+ "霄翰_ZH": 695,
737
+ "信使_ZH": 696,
738
+ "费斯曼_ZH": 697,
739
+ "绿芙蓉_ZH": 698,
740
+ "dev_成男_ZH": 699,
741
+ "金人会长_ZH": 700,
742
+ "维利特_ZH": 701,
743
+ "维尔德_ZH": 702,
744
+ "斯科特_ZH": 703,
745
+ "卡波特_ZH": 704,
746
+ "刃_ZH": 705,
747
+ "岩明_ZH": 706,
748
+ "浣溪_ZH": 707,
749
+ "三月七_JP": 708,
750
+ "丹恒_JP": 709,
751
+ "希儿_JP": 710,
752
+ "娜塔莎_JP": 711,
753
+ "希露瓦_JP": 712,
754
+ "瓦尔特_JP": 713,
755
+ "佩拉_JP": 714,
756
+ "布洛妮娅_JP": 715,
757
+ "虎克_JP": 716,
758
+ "素裳_JP": 717,
759
+ "克拉拉_JP": 718,
760
+ "符玄_JP": 719,
761
+ "白露_JP": 720,
762
+ "杰帕德_JP": 721,
763
+ "景元_JP": 722,
764
+ "藿藿_JP": 723,
765
+ "姬子_JP": 724,
766
+ "卡芙卡_JP": 725,
767
+ "穹_JP": 726,
768
+ "星_JP": 727,
769
+ "桂乃芬_JP": 728,
770
+ "艾丝妲_JP": 729,
771
+ "彦卿_JP": 730,
772
+ "玲可_JP": 731,
773
+ "托帕_JP": 732,
774
+ "驭空_JP": 733,
775
+ "浮烟_JP": 734,
776
+ "停云_JP": 735,
777
+ "镜流_JP": 736,
778
+ "罗刹_JP": 737,
779
+ "卢卡_JP": 738,
780
+ "史瓦罗_JP": 739,
781
+ "黑塔_JP": 740,
782
+ "桑博_JP": 741,
783
+ "伦纳德_JP": 742,
784
+ "明曦_JP": 743,
785
+ "银狼_JP": 744,
786
+ "帕姆_JP": 745,
787
+ "青雀_JP": 746,
788
+ "乔瓦尼_JP": 747,
789
+ "公输师傅_JP": 748,
790
+ "晴霓_JP": 749,
791
+ "螺丝咕姆_JP": 750,
792
+ "阿兰_JP": 751,
793
+ "奥列格_JP": 752,
794
+ "丹枢_JP": 753,
795
+ "尾巴_JP": 754,
796
+ "寒鸦_JP": 755,
797
+ "雪衣_JP": 756,
798
+ "可可利亚_JP": 757,
799
+ "青镞_JP": 758,
800
+ "半夏_JP": 759,
801
+ "银枝_JP": 760,
802
+ "大毫_JP": 761,
803
+ "霄翰_JP": 762,
804
+ "信使_JP": 763,
805
+ "费斯曼_JP": 764,
806
+ "绿芙蓉_JP": 765,
807
+ "dev_成男_JP": 766,
808
+ "金人会长_JP": 767,
809
+ "维利特_JP": 768,
810
+ "维尔德_JP": 769,
811
+ "斯科特_JP": 770,
812
+ "刃_JP": 771,
813
+ "卡波特_JP": 772,
814
+ "岩明_JP": 773,
815
+ "浣溪_JP": 774,
816
+ "净砚_JP": 775,
817
+ "紫月季_JP": 776,
818
+ "歌蒂_JP": 777,
819
+ "奇怪的云骑_JP": 778,
820
+ "幻胧_JP": 779,
821
+ "斯薇塔_JP": 780,
822
+ "隐书_JP": 781,
823
+ "三月七_EN": 782,
824
+ "丹恒_EN": 783,
825
+ "希儿_EN": 784,
826
+ "娜塔莎_EN": 785,
827
+ "希露瓦_EN": 786,
828
+ "瓦尔特_EN": 787,
829
+ "佩拉_EN": 788,
830
+ "布洛妮娅_EN": 789,
831
+ "虎克_EN": 790,
832
+ "素裳_EN": 791,
833
+ "克拉拉_EN": 792,
834
+ "符玄_EN": 793,
835
+ "白露_EN": 794,
836
+ "杰帕德_EN": 795,
837
+ "景元_EN": 796,
838
+ "藿藿_EN": 797,
839
+ "姬子_EN": 798,
840
+ "卡芙卡_EN": 799,
841
+ "穹_EN": 800,
842
+ "星_EN": 801,
843
+ "桂乃芬_EN": 802,
844
+ "艾丝妲_EN": 803,
845
+ "彦卿_EN": 804,
846
+ "玲可_EN": 805,
847
+ "托帕_EN": 806,
848
+ "驭空_EN": 807,
849
+ "浮烟_EN": 808,
850
+ "停云_EN": 809,
851
+ "镜流_EN": 810,
852
+ "罗刹_EN": 811,
853
+ "卢卡_EN": 812,
854
+ "史瓦罗_EN": 813,
855
+ "黑塔_EN": 814,
856
+ "桑博_EN": 815,
857
+ "伦纳德_EN": 816,
858
+ "明曦_EN": 817,
859
+ "银狼_EN": 818,
860
+ "帕姆_EN": 819,
861
+ "青雀_EN": 820,
862
+ "乔瓦尼_EN": 821,
863
+ "公输师傅_EN": 822,
864
+ "晴霓_EN": 823,
865
+ "螺丝咕姆_EN": 824,
866
+ "阿兰_EN": 825,
867
+ "奥列格_EN": 826,
868
+ "丹枢_EN": 827,
869
+ "尾巴_EN": 828,
870
+ "寒鸦_EN": 829,
871
+ "雪衣_EN": 830,
872
+ "可可利亚_EN": 831,
873
+ "青镞_EN": 832,
874
+ "半夏_EN": 833,
875
+ "银枝_EN": 834,
876
+ "大毫_EN": 835,
877
+ "霄翰_EN": 836,
878
+ "信使_EN": 837,
879
+ "费斯曼_EN": 838,
880
+ "绿芙蓉_EN": 839,
881
+ "dev_成男_EN": 840,
882
+ "金人会长_EN": 841,
883
+ "维利特_EN": 842,
884
+ "维尔德_EN": 843,
885
+ "刃_EN": 844,
886
+ "卡波特_EN": 845,
887
+ "岩明_EN": 846,
888
+ "浣溪_EN": 847,
889
+ "紫月季_EN": 848,
890
+ "幻胧_EN": 849,
891
+ "女声_EN": 850,
892
+ "陆景和": 851,
893
+ "莫弈": 852,
894
+ "左然": 853,
895
+ "夏彦": 854
896
  }
897
  },
898
  "model": {
 
948
  "n_layers_q": 3,
949
  "use_spectral_norm": false,
950
  "gin_channels": 256
951
+ },
952
+ "version": "2.2"
953
+ }
css/custom.css ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
/* Tall, scrollable code panels for the YAML and JSON editors. */
#yml_code,
#json_code {
  height: 600px;
  flex-grow: inherit;
  overflow-y: auto;
}

/* Shorter scrollable panel for the GPU info view. */
#gpu_code {
  height: 300px;
  flex-grow: inherit;
  overflow-y: auto;
}