rm test dataset that is never used

This commit is contained in:
Lengyue 2023-03-24 00:43:29 -04:00
parent eb8ef9a305
commit 2854013a8a
No known key found for this signature in database
GPG Key ID: 67CD446B0133EF95
2 changed files with 1 addition and 14 deletions

View File

@@ -25,13 +25,11 @@ if __name__ == "__main__":
parser = argparse.ArgumentParser()
parser.add_argument("--train_list", type=str, default="./filelists/train.txt", help="path to train list")
parser.add_argument("--val_list", type=str, default="./filelists/val.txt", help="path to val list")
parser.add_argument("--test_list", type=str, default="./filelists/test.txt", help="path to test list")
parser.add_argument("--source_dir", type=str, default="./dataset/44k", help="path to source dir")
args = parser.parse_args()
train = []
val = []
test = []
idx = 0
spk_dict = {}
spk_id = 0
@@ -51,13 +49,11 @@ if __name__ == "__main__":
new_wavs.append(file)
wavs = new_wavs
shuffle(wavs)
train += wavs[2:-2]
train += wavs[2:]
val += wavs[:2]
test += wavs[-2:]
shuffle(train)
shuffle(val)
shuffle(test)
print("Writing", args.train_list)
with open(args.train_list, "w") as f:
@@ -70,12 +66,6 @@ if __name__ == "__main__":
for fname in tqdm(val):
wavpath = fname
f.write(wavpath + "\n")
print("Writing", args.test_list)
with open(args.test_list, "w") as f:
for fname in tqdm(test):
wavpath = fname
f.write(wavpath + "\n")
config_template["spk"] = spk_dict
config_template["model"]["n_speakers"] = spk_id

View File

@@ -11,12 +11,9 @@ config = json.loads(data)
hps = HParams(**config)
train_dataset = TextAudioSpeakerLoader("filelists/train.txt", hps)
test_dataset = TextAudioSpeakerLoader("filelists/test.txt", hps)
eval_dataset = TextAudioSpeakerLoader("filelists/val.txt", hps)
for _ in tqdm(train_dataset):
pass
for _ in tqdm(eval_dataset):
pass
for _ in tqdm(test_dataset):
pass