Skip to content

Commit 8f8232a

Browse files
authored
ずんだもんのID修正漏れ対応 (#154)
* fix requirements.txt
* READMEのモデル配置URLの変更等
  モデル配置URLの変更、dataset内のファイル構成を実際に作成される内容に則した物に変更
* PIXIV FANBOX問い合わせ先追加
  READMEにPIXIV FANBOXの問い合わせ先を追加
* ずんだもんのID修正漏れ対応
  ・ID100の場合にずんだもん指定だった状態を修正(現在は101がずんだもん)
  ・IDの値をプログラムの最初に変数定義する表記に変更
  ・multi_speakerの内容を現在の上限等に合わせた物に変更
1 parent 3940993 commit 8f8232a

File tree

3 files changed

+31
-18
lines changed

3 files changed

+31
-18
lines changed

create_dataset_jtalk.py

Lines changed: 19 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -5,6 +5,15 @@
55
import pyopenjtalk
66
import json
77

8+
MY_ID = 0
9+
ZUNDAMON_ID = 101
10+
SORA_ID = 102
11+
METHANE_ID = 103
12+
TSUMUGI_ID = 104
13+
KIRITAN_ID = 106
14+
15+
MAX_ID = 255
16+
817
def mozi2phone(mozi):
918
text = pyopenjtalk.g2p(mozi)
1019
text = "sil " + text + " sil"
@@ -58,7 +67,7 @@ def create_dataset(filename):
5867
counter = counter +1
5968
Correspondence_list.append(str(speaker_id)+"|"+os.path.basename(d) + "\n")
6069
speaker_id = speaker_id + 1
61-
if speaker_id > 255:
70+
if speaker_id > MAX_ID:
6271
break
6372

6473
for d in textless_dir_list:
@@ -103,7 +112,7 @@ def create_dataset_zundamon(filename):
103112

104113
#set list wav and text
105114
#myvoice
106-
speaker_id = 0
115+
speaker_id = MY_ID
107116
d = my_path
108117
wav_file_list = glob.glob(d + "/wav/*.wav")
109118
lab_file_list = glob.glob(d + "/text/*.txt")
@@ -127,7 +136,7 @@ def create_dataset_zundamon(filename):
127136
counter = counter +1
128137
Correspondence_list.append(str(speaker_id)+"|"+os.path.basename(d) + "\n")
129138

130-
speaker_id = 101
139+
speaker_id = ZUNDAMON_ID
131140
d = zundamon_path
132141
wav_file_list = glob.glob(d + "/wav/*.wav")
133142
lab_file_list = glob.glob(d + "/text/*.txt")
@@ -175,7 +184,7 @@ def create_dataset_zundamon(filename):
175184
f.writelines(output_file_list_val_textless)
176185
with open('filelists/' + filename + '_Correspondence.txt', 'w', encoding='utf-8', newline='\n') as f:
177186
f.writelines(Correspondence_list)
178-
return 255
187+
return MAX_ID
179188

180189
def create_dataset_character(filename, tid):
181190
textful_dir_list = glob.glob("dataset/textful/*")
@@ -193,7 +202,7 @@ def create_dataset_character(filename, tid):
193202

194203
#set list wav and text
195204
#myvoice
196-
speaker_id = 0
205+
speaker_id = MY_ID
197206
d = my_path
198207
wav_file_list = glob.glob(d + "/wav/*.wav")
199208
lab_file_list = glob.glob(d + "/text/*.txt")
@@ -265,7 +274,7 @@ def create_dataset_character(filename, tid):
265274
f.writelines(output_file_list_val_textless)
266275
with open('filelists/' + filename + '_Correspondence.txt', 'w', encoding='utf-8', newline='\n') as f:
267276
f.writelines(Correspondence_list)
268-
return 255
277+
return MAX_ID
269278

270279
def create_dataset_multi_character(filename, file_path):
271280
Correspondence_list = list()
@@ -311,7 +320,7 @@ def create_dataset_multi_character(filename, file_path):
311320
f.writelines(output_file_list_val_textless)
312321
with open('filelists/' + filename + '_Correspondence.txt', 'w', encoding='utf-8', newline='\n') as f:
313322
f.writelines(Correspondence_list)
314-
return 255
323+
return MAX_ID
315324

316325
def main():
317326
parser = argparse.ArgumentParser()
@@ -320,17 +329,17 @@ def main():
320329
parser.add_argument('-s', '--sr', type=int, default=24000,
321330
help='sampling rate (default = 24000)')
322331
parser.add_argument('-t', '--target', type=int, default=9999,
323-
help='pre_traind targetid (zundamon = 100, sora = 101, methane = 102, tsumugi = 103)')
332+
help='pre_traind targetid (zundamon = {ZUNDAMON_ID}, sora = {SORA_ID}, methane = {METHANE_ID}, tsumugi = {TSUMUGI_ID}, kiritan = {KIRITAN_ID})')
324333
parser.add_argument('-m', '--multi_target', type=str, default=None,
325-
help='pre_traind targetid (zundamon = 100, sora = 101, methane = 102, tsumugi = 103)')
334+
help='pre_traind targetid (zundamon = {ZUNDAMON_ID}, sora = {SORA_ID}, methane = {METHANE_ID}, tsumugi = {TSUMUGI_ID}, kiritan = {KIRITAN_ID})')
326335
parser.add_argument('-c', '--config', type=str, default="./configs/baseconfig.json",
327336
help='JSON file for configuration')
328337
args = parser.parse_args()
329338
filename = args.filename
330339
print(filename)
331340
if args.multi_target != None:
332341
n_spk = create_dataset_multi_character(filename, args.multi_target)
333-
elif args.target != 9999 and args.target == 100:
342+
elif args.target != 9999 and args.target == ZUNDAMON_ID:
334343
n_spk = create_dataset_zundamon(filename)
335344
elif args.target != 9999:
336345
n_spk = create_dataset_character(filename, args.target)
Lines changed: 11 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,11 @@
1-
00_myvoice|107
2-
01_target|108
3-
02_target|109
4-
03_target|0
5-
04_target|1
6-
05_target|2
7-
1205_zundamon|100
1+
00_myvoice|0
2+
01_target|1
3+
02_target|2
4+
03_target|252
5+
04_target|253
6+
05_target|254
7+
1205_zundamon|101
8+
912_sora|102
9+
459_metahne|103
10+
344_tsumugi|104
11+
106_kiritan|106

version.txt

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1 +1 @@
1-
v1.3.2.10
1+
v1.3.2.11

0 commit comments

Comments
 (0)