Skip to content

Commit 43b2f41

Browse files
committedJun 18, 2023
Merge remote-tracking branch 'upstream/main'
2 parents 00c70e7 + c1ace16 commit 43b2f41

File tree

4 files changed

+48
-26
lines changed

4 files changed

+48
-26
lines changed
 

‎Changelog_CN.md

+21-9
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,24 @@
1+
### 20230618更新
2+
- v2增加32k和48k两个新预训练模型
3+
- 修复非f0模型推理报错
4+
- 对于超过一小时的训练集的索引建立环节,自动kmeans缩小特征处理以加速索引训练、加入和查询
5+
- 附送一个人声转吉他玩具仓库
6+
- 数据处理剔除异常值切片
7+
- onnx导出选项卡
8+
9+
失败的实验:
10+
- ~~特征检索增加时序维度:寄,没啥效果~~
11+
- ~~特征检索增加PCAR降维可选项:寄,数据大用kmeans缩小数据量,数据小降维操作耗时比省下的匹配耗时还多~~
12+
- ~~支持onnx推理(附带仅推理的小压缩包):寄,生成nsf还是需要pytorch~~
13+
- ~~训练时在音高、gender、eq、噪声等方面对输入进行随机增强:寄,没啥效果~~
14+
15+
todolist:
16+
- 接入小型声码器调研
17+
- 训练集音高识别支持crepe
18+
- crepe的精度支持和RVC-config同步
19+
- 对接F0编辑器
20+
21+
122
### 20230528更新
223
- 增加v2的jupyter notebook,韩文changelog,增加一些环境依赖
324
- 增加呼吸、清辅音、齿音保护模式
@@ -7,15 +28,6 @@
728
- 人声伴奏分离、推理批量导出增加音频导出格式选项
829
- 废弃32k模型的训练
930

10-
todolist:
11-
- ~~特征检索增加时序维度:寄,没啥效果~~
12-
- 特征检索增加pre-kmeans可选项
13-
- ~~特征检索增加PCAR降维可选项:寄,数据大用kmeans缩小数据量,数据小降维操作耗时比省下的匹配耗时还多~~
14-
- ~~支持onnx推理(附带仅推理的小压缩包):寄,生成nsf还是需要pytorch~~
15-
- ~~训练时在音高、gender、eq、噪声等方面对输入进行随机增强:寄,没啥效果~~
16-
- 补全v2版本的48k预训练模型
17-
18-
1931
### 20230513更新
2032
- 清除一键包内部老版本runtime内残留的infer_pack和uvr5_pack
2133
- 修复训练集预处理伪多进程的bug

‎Changelog_EN.md

+20-9
Original file line numberDiff line numberDiff line change
@@ -1,19 +1,30 @@
1+
### 2023-06-18
2+
- New pretrained v2 models: 32k and 48k
3+
- Fix non-f0 model inference errors
4+
- For training sets exceeding 1 hour, automatically apply minibatch k-means to reduce the amount of feature data, so that index training, adding, and searching are much faster.
5+
- Provide a toy vocal2guitar huggingface space
6+
- Automatically delete outlier short slices from the training-set audio
7+
- Onnx export tab
8+
9+
Failed experiments:
10+
- ~~Feature retrieval: add temporal feature retrieval: not effective~~
11+
- ~~Feature retrieval: add PCAR dimensionality reduction: searching is even slower~~
12+
- ~~Random data augmentation when training: not effective~~
13+
14+
todolist:
15+
- Vocos-RVC (tiny vocoder)
16+
- Crepe support for training
17+
- Half precision crepe inference
18+
- F0 editor support
19+
120
### 2023-05-28
221
- Add v2 jupyter notebook, Korean changelog, fix some environment requirements
322
- Add voiceless consonant and breath protection mode
423
- Support crepe-full pitch detection
524
- UVR5 vocal separation: support dereverb models and de-echo models
625
- Add experiment name and version on the name of index
726
- Support users to manually select export format of output audios when batch voice conversion processing and UVR5 vocal separation
8-
- 32k model training is no more supported
9-
10-
todolist:
11-
- Feature retrieval: add temporal feature retrieval
12-
- Feature retrieval: add pre-kmeans option
13-
- Feature retrieval: add PCAR dimensionality reduction
14-
- Add onnx inference support
15-
- Random data augmentation when training: pitch, gender, eq, noise
16-
- Add v2 version pretrained-models
27+
- v1 32k model training is no longer supported
1728

1829
### 2023-05-13
1930
- Clear the redundant code in the old version of runtime in the one-click-package: infer_pack and uvr5_pack

‎infer-web.py

+6-7
Original file line numberDiff line numberDiff line change
@@ -666,12 +666,12 @@ def change_sr2(sr2, if_f0_3, version19):
666666
if_pretrained_discriminator_exist = os.access(
667667
"pretrained%s/%sD%s.pth" % (path_str, f0_str, sr2), os.F_OK
668668
)
669-
if if_pretrained_generator_exist is not False:
669+
if not if_pretrained_generator_exist:
670670
print(
671671
"pretrained%s/%sG%s.pth" % (path_str, f0_str, sr2),
672672
"not exist, will not use pretrained model",
673673
)
674-
if if_pretrained_discriminator_exist is not False:
674+
if not if_pretrained_discriminator_exist:
675675
print(
676676
"pretrained%s/%sD%s.pth" % (path_str, f0_str, sr2),
677677
"not exist, will not use pretrained model",
@@ -683,7 +683,6 @@ def change_sr2(sr2, if_f0_3, version19):
683683
"pretrained%s/%sD%s.pth" % (path_str, f0_str, sr2)
684684
if if_pretrained_discriminator_exist
685685
else "",
686-
{"visible": True, "__type__": "update"},
687686
)
688687

689688

@@ -692,9 +691,9 @@ def change_version19(sr2, if_f0_3, version19):
692691
if sr2 == "32k" and version19 == "v1":
693692
sr2 = "40k"
694693
to_return_sr2 = (
695-
{"choices": ["40k", "48k"], "__type__": "update"}
694+
{"choices": ["40k", "48k"], "__type__": "update", "value": sr2}
696695
if version19 == "v1"
697-
else {"choices": ["32k", "40k", "48k"], "__type__": "update"}
696+
else {"choices": ["40k", "48k", "32k"], "__type__": "update", "value": sr2}
698697
)
699698
f0_str = "f0" if if_f0_3 else ""
700699
if_pretrained_generator_exist = os.access(
@@ -2106,7 +2105,7 @@ def get_presets():
21062105
sr2.change(
21072106
change_sr2,
21082107
[sr2, if_f0_3, version19],
2109-
[pretrained_G14, pretrained_D15, version19],
2108+
[pretrained_G14, pretrained_D15],
21102109
)
21112110
version19.change(
21122111
change_version19,
@@ -2289,7 +2288,7 @@ def get_presets():
22892288
version_1 = gr.Radio(
22902289
label=i18n("模型版本型号"),
22912290
choices=["v1", "v2"],
2292-
value="v1",
2291+
value="v2",
22932292
interactive=True,
22942293
)
22952294
info___ = gr.Textbox(

‎train/utils.py

+1-1
Original file line numberDiff line numberDiff line change
@@ -360,7 +360,7 @@ def get_hparams(init=True):
360360
if not os.path.exists(experiment_dir):
361361
os.makedirs(experiment_dir)
362362

363-
if(args.version=="v1"or args.sample_rate=="40k"):
363+
if args.version == "v1" or args.sample_rate == "40k":
364364
config_path = "configs/%s.json" % args.sample_rate
365365
else:
366366
config_path = "configs/%s_v2.json" % args.sample_rate

0 commit comments

Comments
 (0)