| |
| |
| |
| |
|
|
| """ |
| Standard ("golden") sample Uids of the source datasets, and helpers that look up their indexes within a split. |
| """ |
|
|
| from collections import defaultdict |
| import os |
| import json |
|
|
# Names of the datasets treated as speech datasets.
SPEECH_DATASETS = ["vctk", "vctksample"]


# Golden (standard) test-sample Uids, keyed by dataset name.  Because this is
# a defaultdict, indexing a dataset that is not listed yields an empty list.
GOLDEN_TEST_SAMPLES = defaultdict(
    list,
    {
        "m4singer": [
            "Alto-1_美错_0014",
            "Bass-1_十年_0008",
            "Soprano-2_同桌的你_0018",
            "Tenor-5_爱笑的眼睛_0010",
        ],
        "svcc": [
            # IDF1_* entries
            "IDF1_10030",
            "IDF1_10120",
            "IDF1_10140",
            # IDM1_* entries
            "IDM1_10001",
            "IDM1_10030",
            "IDM1_10120",
            # CDF1_* entries
            "CDF1_10030",
            "CDF1_10120",
            "CDF1_10140",
            # CDM1_* entries
            "CDM1_10001",
            "CDM1_10030",
            "CDM1_10120",
        ],
        "svcceval": [
            # SF1_* entries
            "SF1_30001",
            "SF1_30002",
            "SF1_30003",
            # SM1_* entries
            "SM1_30001",
            "SM1_30002",
            "SM1_30003",
        ],
        "popbutfy": [
            "Female1#you_are_my_sunshine_Professional#0",
            "Female4#Someone_Like_You_Professional#10",
            "Male2#Lemon_Tree_Professional#12",
            "Male5#can_you_feel_the_love_tonight_Professional#20",
        ],
        "opensinger": [
            "Man_0_大鱼_10",
            "Man_21_丑八怪_14",
            "Woman_39_mojito_22",
            "Woman_40_易燃易爆炸_12",
        ],
        "nus48e": [
            "ADIZ_read#01#0000",
            "MCUR_sing#10#0000",
            "JLEE_read#08#0001",
            "SAMF_sing#18#0001",
        ],
        "popcs": [
            "明天会更好_0004",
            "欧若拉_0005",
            "虫儿飞_0006",
            "隐形的翅膀_0008",
        ],
        "kising": [
            "421_0040",
            "424_0013",
            "431_0026",
        ],
        "csd": [
            "en_004a_0001",
            "en_042b_0006",
            "kr_013a_0006",
            "kr_045b_0004",
        ],
        "opera": [
            "fem_01#neg_1#0000",
            "fem_12#pos_3#0003",
            "male_02#neg_1#0002",
            "male_11#pos_2#0001",
        ],
        "lijian": [
            "058矜持_0000",
            "079绒花_0000",
            "120遥远的天空底下_0000",
        ],
        "cdmusiceval": ["陶喆_普通朋友", "蔡琴_给电影人的情书"],
    },
)


# Golden training-sample Uids, keyed by dataset name (none are registered here).
GOLDEN_TRAIN_SAMPLES = defaultdict(list)
|
|
|
|
def get_golden_samples_indexes(
    dataset_name,
    dataset_dir=None,
    cfg=None,
    split=None,
    min_samples=5,
):
    """Return the indexes of the golden (standard) samples inside a split.

    The utterances are loaded from ``<dataset_dir>/<split>.json`` and each
    utterance's ``"Uid"`` is compared with the golden Uids registered for
    ``dataset_name``.

    Args:
        dataset_name: Key used to look up the golden Uids.
        dataset_dir: Directory containing the split JSON files. When ``None``
            it is built from ``cfg`` as
            ``<cfg.OUTPUT_PATH>/preprocess/<cfg.PREPROCESS_VERSION>_version/<dataset_name>``.
        cfg: Configuration object; only needed when ``dataset_dir`` is ``None``.
        split: Name of the split file without the ``.json`` suffix. A name
            containing ``"test"`` selects ``GOLDEN_TEST_SAMPLES``, otherwise
            one containing ``"train"`` selects ``GOLDEN_TRAIN_SAMPLES``; any
            other name has no golden samples.
        min_samples: Number of leading utterances returned as a fallback when
            no golden sample is found.

    Returns:
        Ascending list of utterance indexes without duplicates. When nothing
        matches, the first ``min_samples`` indexes (or fewer if the split is
        shorter) are returned instead.

    Raises:
        AssertionError: If ``split`` is ``None``, or if both ``dataset_dir``
            and ``cfg`` are ``None``.
    """
    if dataset_dir is None:
        assert cfg is not None, "cfg is required when dataset_dir is not given"
        dataset_dir = os.path.join(
            cfg.OUTPUT_PATH,
            "preprocess/{}_version".format(cfg.PREPROCESS_VERSION),
            dataset_name,
        )

    assert split is not None, "split must be provided"
    utt_file = os.path.join(dataset_dir, "{}.json".format(split))
    with open(utt_file, "r", encoding="utf-8") as f:
        samples = json.load(f)

    # "test" wins when a split name contains both words. A split matching
    # neither (e.g. "valid") simply has no golden samples instead of leaving
    # the variable unbound. ``.get`` avoids inserting keys into the
    # module-level defaultdicts for unknown datasets.
    if "test" in split:
        golden_samples = GOLDEN_TEST_SAMPLES.get(dataset_name, [])
    elif "train" in split:
        golden_samples = GOLDEN_TRAIN_SAMPLES.get(dataset_name, [])
    else:
        golden_samples = []
    golden_uids = set(golden_samples)

    # For "cdmusiceval" the golden entries are matched against the first two
    # "_"-separated fields of the Uid as well as against the whole Uid.
    match_prefix = dataset_name == "cdmusiceval"

    res = []
    for idx, utt in enumerate(samples):
        uid = utt["Uid"]
        # A single combined test so an index is never appended twice.
        if uid in golden_uids or (
            match_prefix and "_".join(uid.split("_")[:2]) in golden_uids
        ):
            res.append(idx)

    if not res:
        # Fallback: the leading samples, clamped so every index is valid.
        res = list(range(min(min_samples, len(samples))))

    return res
|
|
|
|
def get_specific_singer_indexes(dataset_dir, singer_name, split):
    """Return the indexes of all utterances of one singer inside a split.

    Args:
        dataset_dir: Directory containing the split JSON files.
        singer_name: Value compared against each utterance's ``"Singer"``.
        split: Name of the split file without the ``.json`` suffix.

    Returns:
        Ascending list of indexes of the utterances whose ``"Singer"`` equals
        ``singer_name``.

    Raises:
        AssertionError: If no utterance of ``singer_name`` is found.
    """
    utt_file = os.path.join(dataset_dir, "{}.json".format(split))
    with open(utt_file, "r", encoding="utf-8") as f:
        samples = json.load(f)

    res = [idx for idx, utt in enumerate(samples) if utt["Singer"] == singer_name]

    # Name the singer and file so an empty selection is easy to diagnose.
    assert res, "No utterance of singer {!r} found in {}".format(
        singer_name, utt_file
    )
    return res
|
|
|
|
def get_uids_and_wav_paths(
    cfg, dataset, dataset_type="train", only_specific_singer=None, return_singers=False
):
    """Collect the Uids and wav paths (optionally singers) of a dataset split.

    The utterances are read from
    ``<cfg.OUTPUT_PATH>/preprocess/<cfg.PREPROCESS_VERSION>_version/<dataset>/<split>.json``
    where ``<split>`` is the part of ``dataset_type`` after its last ``"_"``.

    Args:
        cfg: Configuration object providing ``OUTPUT_PATH`` and
            ``PREPROCESS_VERSION``.
        dataset: Dataset name (sub-directory of the preprocess folder).
        dataset_type: Split selector such as ``"train"``, ``"test"`` or
            ``"golden_test"``. When it contains ``"golden"`` only the golden
            samples of the split are kept.
        only_specific_singer: When not ``None``, keep only the utterances of
            this singer. This selection replaces the golden selection; the
            two are not intersected.
        return_singers: When true, also return the singer of each utterance.

    Returns:
        ``(uids, wav_paths)``, or ``(uids, wav_paths, singers)`` when
        ``return_singers`` is true. All lists are aligned by position.
    """
    dataset_dir = os.path.join(
        cfg.OUTPUT_PATH, "preprocess/{}_version".format(cfg.PREPROCESS_VERSION), dataset
    )
    # e.g. "golden_test" -> "test": the split is what names the JSON file.
    split = dataset_type.split("_")[-1]
    dataset_file = os.path.join(dataset_dir, "{}.json".format(split))
    # Explicit UTF-8 (as in the sibling loaders): Uids may contain non-ASCII
    # text and must not depend on the platform's default encoding.
    with open(dataset_file, "r", encoding="utf-8") as f:
        utterances = json.load(f)

    indexes = range(len(utterances))
    if "golden" in dataset_type:
        indexes = get_golden_samples_indexes(dataset, dataset_dir, split=split)
    if only_specific_singer is not None:
        # Pass the split, not the raw dataset_type, so the same JSON file is
        # opened ("golden_test" would otherwise look for golden_test.json).
        indexes = get_specific_singer_indexes(
            dataset_dir, only_specific_singer, split
        )

    selected = [utterances[i] for i in indexes]
    uids = [utt["Uid"] for utt in selected]
    wav_paths = [utt["Path"] for utt in selected]

    if not return_singers:
        return uids, wav_paths

    # Only read "Singer" when the caller asked for it.
    singers = [utt["Singer"] for utt in selected]
    return uids, wav_paths, singers
|
|