Skip to content

Commit

Permalink
update
Browse files Browse the repository at this point in the history
  • Loading branch information
aijianiula0601@gmail.com committed Feb 21, 2022
1 parent 2d2f39c commit c04f334
Show file tree
Hide file tree
Showing 32 changed files with 193 additions and 27 deletions.
94 changes: 67 additions & 27 deletions audio/gen_html.py
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,7 @@
sys.path.append(pdj)
print(pdj)

speaker_info_file = "/Users/jia/Downloads/speaker-info.txt"
speaker_info_file = "/Users/jiahong/Downloads/speaker-info.txt"
speaker_gender_dic = {}
with open(speaker_info_file, 'r', encoding='utf-8') as f:
i = 0
Expand Down Expand Up @@ -166,12 +166,68 @@ def gen_tb_html(vits_save_base_dir, vq_save_base_dir, source_wav_name, target_wa
# target_wav_name = to_sp.split("_to_")[1]
# process_data(source_wav_name, target_wav_name)

# target wavs in libritts
# # target wavs in libritts
#
#
# base_dir = "/Users/jia/Downloads"
# vits_save_base_dir = "audio/vits_vctk_vc_to_libritts"
# vq_save_base_dir = "audio/vqmivc_vctk_vc_to_libritts"
#
#
# def process_data(source_wav_name, target_wav_name):
# tq_html = gen_tb_html(vits_save_base_dir, vq_save_base_dir, source_wav_name, target_wav_name)
# print(tq_html)
# cmd = f"cp -rf {base_dir}/{vits_save_base_dir.split('/')[-1]}/{source_wav_name}_to_{target_wav_name} {pdj}/{vits_save_base_dir}/ && cp -rf {base_dir}/{vq_save_base_dir.split('/')[-1]}/{source_wav_name}_to_{target_wav_name} {pdj}/{vq_save_base_dir}/"
# os.system(cmd)
#
#
# to_sp = "p231_406_to_7127_75947_000082_000005"
# source_wav_name = to_sp.split("_to_")[0]
# target_wav_name = to_sp.split("_to_")[1]
# process_data(source_wav_name, target_wav_name)
# # --------------------------------------------------------------
# to_sp = "p231_406_to_8555_284447_000039_000002"
# source_wav_name = to_sp.split("_to_")[0]
# target_wav_name = to_sp.split("_to_")[1]
# process_data(source_wav_name, target_wav_name)
# # --------------------------------------------------------------
# to_sp = "p251_010_to_6829_68771_000042_000002"
# source_wav_name = to_sp.split("_to_")[0]
# target_wav_name = to_sp.split("_to_")[1]
# process_data(source_wav_name, target_wav_name)
# # --------------------------------------------------------------
# to_sp = "p274_247_to_2830_3979_000021_000000"
# source_wav_name = to_sp.split("_to_")[0]
# target_wav_name = to_sp.split("_to_")[1]
# process_data(source_wav_name, target_wav_name)
# # --------------------------------------------------------------
# to_sp = "p284_213_to_1995_1826_000031_000003_16k"
# source_wav_name = to_sp.split("_to_")[0]
# target_wav_name = to_sp.split("_to_")[1]
# process_data(source_wav_name, target_wav_name)
# # --------------------------------------------------------------
# to_sp = "p293_287_to_121_127105_000041_000001"
# source_wav_name = to_sp.split("_to_")[0]
# target_wav_name = to_sp.split("_to_")[1]
# process_data(source_wav_name, target_wav_name)
# # --------------------------------------------------------------
# to_sp = "p326_294_to_121_127105_000041_000001"
# source_wav_name = to_sp.split("_to_")[0]
# target_wav_name = to_sp.split("_to_")[1]
# process_data(source_wav_name, target_wav_name)
# # --------------------------------------------------------------
# to_sp = "p334_210_to_237_126133_000011_000000_16k"
# source_wav_name = to_sp.split("_to_")[0]
# target_wav_name = to_sp.split("_to_")[1]
# process_data(source_wav_name, target_wav_name)
# # --------------------------------------------------------------


# More difficult conversion cases

base_dir = "/Users/jia/Downloads"
vits_save_base_dir = "audio/vits_vctk_vc_to_libritts"
vq_save_base_dir = "audio/vqmivc_vctk_vc_to_libritts"
base_dir = "/Users/jiahong/Documents/vcc/FlowCPCVC论文/提交做mos评分音频"
vits_save_base_dir = "audio/vits_yuqi"
vq_save_base_dir = "audio/vq_yuqi"


def process_data(source_wav_name, target_wav_name):
Expand All @@ -181,43 +237,27 @@ def process_data(source_wav_name, target_wav_name):
os.system(cmd)


to_sp = "p231_406_to_7127_75947_000082_000005"
to_sp = "03-01-05-01-01-01-16_to_p334_018"
source_wav_name = to_sp.split("_to_")[0]
target_wav_name = to_sp.split("_to_")[1]
process_data(source_wav_name, target_wav_name)
# --------------------------------------------------------------
to_sp = "p231_406_to_8555_284447_000039_000002"
to_sp = "0011_001750_to_20_205_000031_000000"
source_wav_name = to_sp.split("_to_")[0]
target_wav_name = to_sp.split("_to_")[1]
process_data(source_wav_name, target_wav_name)
# --------------------------------------------------------------
to_sp = "p251_010_to_6829_68771_000042_000002"
to_sp = "男2_to_10011"
source_wav_name = to_sp.split("_to_")[0]
target_wav_name = to_sp.split("_to_")[1]
process_data(source_wav_name, target_wav_name)
# --------------------------------------------------------------
to_sp = "p274_247_to_2830_3979_000021_000000"
to_sp = "EMD6_to_p231_012"
source_wav_name = to_sp.split("_to_")[0]
target_wav_name = to_sp.split("_to_")[1]
process_data(source_wav_name, target_wav_name)
# --------------------------------------------------------------
to_sp = "p284_213_to_1995_1826_000031_000003_16k"
to_sp = "obm2_to_en-US-ElizabethNeural_1624631702559"
source_wav_name = to_sp.split("_to_")[0]
target_wav_name = to_sp.split("_to_")[1]
process_data(source_wav_name, target_wav_name)
# --------------------------------------------------------------
to_sp = "p293_287_to_121_127105_000041_000001"
source_wav_name = to_sp.split("_to_")[0]
target_wav_name = to_sp.split("_to_")[1]
process_data(source_wav_name, target_wav_name)
# --------------------------------------------------------------
to_sp = "p326_294_to_121_127105_000041_000001"
source_wav_name = to_sp.split("_to_")[0]
target_wav_name = to_sp.split("_to_")[1]
process_data(source_wav_name, target_wav_name)
# --------------------------------------------------------------
to_sp = "p334_210_to_237_126133_000011_000000_16k"
source_wav_name = to_sp.split("_to_")[0]
target_wav_name = to_sp.split("_to_")[1]
process_data(source_wav_name, target_wav_name)
# --------------------------------------------------------------
process_data(source_wav_name, target_wav_name)
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file added audio/vits_yuqi/EMD6_to_p231_012/EMD6.wav
Binary file not shown.
Binary file not shown.
Binary file added audio/vits_yuqi/EMD6_to_p231_012/p231_012.wav
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file added audio/vits_yuqi/男2_to_10011/10011.wav
Binary file not shown.
Binary file added audio/vits_yuqi/男2_to_10011/男2.wav
Binary file not shown.
Binary file added audio/vits_yuqi/男2_to_10011/男2_to_10011.wav
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file added audio/vq_yuqi/EMD6_to_p231_012/EMD6.wav
Binary file not shown.
Binary file not shown.
Binary file added audio/vq_yuqi/EMD6_to_p231_012/p231_012.wav
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file added audio/vq_yuqi/男2_to_10011/10011.wav
Binary file not shown.
Binary file added audio/vq_yuqi/男2_to_10011/男2.wav
Binary file not shown.
Binary file added audio/vq_yuqi/男2_to_10011/男2_to_10011.wav
Binary file not shown.
126 changes: 126 additions & 0 deletions index.md
Original file line number Diff line number Diff line change
@@ -1,4 +1,5 @@
# FlowCPCVC

## Audio Demo for "FlowCPCVC: A flow contrastive predictive coding voice conversion system"


Expand Down Expand Up @@ -645,3 +646,128 @@ ___
</td>
</tr>
</table>

## Results for audio samples that are more difficult to convert

<table>
<tr>
<th>source</th>
<th>target</th>
<th>FlowCPCVC</th>
<th>VQMIVC</th>
</tr>
<tr>
<td>
<audio id="audio" controls="" preload="none">
<source id="wav" src="audio/vits_yuqi/03-01-05-01-01-01-16_to_p334_018/03-01-05-01-01-01-16.wav">
</audio>
</td>
<td>
<audio id="audio" controls="" preload="none">
<source id="wav" src="audio/vits_yuqi/03-01-05-01-01-01-16_to_p334_018/p334_018.wav">
</audio>
</td>
<td>
<audio id="audio" controls="" preload="none">
<source id="wav" src="audio/vits_yuqi/03-01-05-01-01-01-16_to_p334_018/03-01-05-01-01-01-16_to_p334_018.wav">
</audio>
</td>
<td>
<audio id="audio" controls="" preload="none">
<source id="wav" src="audio/vq_yuqi/03-01-05-01-01-01-16_to_p334_018/03-01-05-01-01-01-16_to_p334_018.wav">
</audio>
</td>
</tr>

<tr>
<td>
<audio id="audio" controls="" preload="none">
<source id="wav" src="audio/vits_yuqi/0011_001750_to_20_205_000031_000000/0011_001750.wav">
</audio>
</td>
<td>
<audio id="audio" controls="" preload="none">
<source id="wav" src="audio/vits_yuqi/0011_001750_to_20_205_000031_000000/20_205_000031_000000.wav">
</audio>
</td>
<td>
<audio id="audio" controls="" preload="none">
<source id="wav" src="audio/vits_yuqi/0011_001750_to_20_205_000031_000000/0011_001750_to_20_205_000031_000000.wav">
</audio>
</td>
<td>
<audio id="audio" controls="" preload="none">
<source id="wav" src="audio/vq_yuqi/0011_001750_to_20_205_000031_000000/0011_001750_to_20_205_000031_000000.wav">
</audio>
</td>
</tr>

<tr>
<td>
<audio id="audio" controls="" preload="none">
<source id="wav" src="audio/vits_yuqi/男2_to_10011/男2.wav">
</audio>
</td>
<td>
<audio id="audio" controls="" preload="none">
<source id="wav" src="audio/vits_yuqi/男2_to_10011/10011.wav">
</audio>
</td>
<td>
<audio id="audio" controls="" preload="none">
<source id="wav" src="audio/vits_yuqi/男2_to_10011/男2_to_10011.wav">
</audio>
</td>
<td>
<audio id="audio" controls="" preload="none">
<source id="wav" src="audio/vq_yuqi/男2_to_10011/男2_to_10011.wav">
</audio>
</td>
</tr>

<tr>
<td>
<audio id="audio" controls="" preload="none">
<source id="wav" src="audio/vits_yuqi/EMD6_to_p231_012/EMD6.wav">
</audio>
</td>
<td>
<audio id="audio" controls="" preload="none">
<source id="wav" src="audio/vits_yuqi/EMD6_to_p231_012/p231_012.wav">
</audio>
</td>
<td>
<audio id="audio" controls="" preload="none">
<source id="wav" src="audio/vits_yuqi/EMD6_to_p231_012/EMD6_to_p231_012.wav">
</audio>
</td>
<td>
<audio id="audio" controls="" preload="none">
<source id="wav" src="audio/vq_yuqi/EMD6_to_p231_012/EMD6_to_p231_012.wav">
</audio>
</td>
</tr>

<tr>
<td>
<audio id="audio" controls="" preload="none">
<source id="wav" src="audio/vits_yuqi/obm2_to_en-US-ElizabethNeural_1624631702559/obm2.wav">
</audio>
</td>
<td>
<audio id="audio" controls="" preload="none">
<source id="wav" src="audio/vits_yuqi/obm2_to_en-US-ElizabethNeural_1624631702559/en-US-ElizabethNeural_1624631702559.wav">
</audio>
</td>
<td>
<audio id="audio" controls="" preload="none">
<source id="wav" src="audio/vits_yuqi/obm2_to_en-US-ElizabethNeural_1624631702559/obm2_to_en-US-ElizabethNeural_1624631702559.wav">
</audio>
</td>
<td>
<audio id="audio" controls="" preload="none">
<source id="wav" src="audio/vq_yuqi/obm2_to_en-US-ElizabethNeural_1624631702559/obm2_to_en-US-ElizabethNeural_1624631702559.wav">
</audio>
</td>
</tr>
</table>

0 comments on commit c04f334

Please sign in to comment.