Open Dream-High opened 2 years ago
@Dream-High to help with debugging, could you copy-paste the code into a comment here instead of using a screenshot?
@Dream-High to help with debugging, could you copy-paste the code into a comment here instead of using a screenshot? Thanks very much.
Below is my code
import os
import crepe
import librosa
import json
import numpy as np
import pandas as pd
from mir_eval.melody import raw_pitch_accuracy, to_cent_voicing, voicing_measures
audio_file = r'D:\联合模型\Data\MIR-1K\Wavfile'
label_file = r'D:\联合模型\Data\MIR-1K\PitchLabel'
rpa_list = []
vr_list = []
vfa_list = []
with open('../split_details.json', 'r') as f:
split_details = json.load(f)
test_dict = split_details['test']
for file in test_dict.values():
audio, sr = librosa.load(os.path.join(audio_file, file), 16000, mono=False)
# audio, sr = librosa.load(os.path.join(audio_file, file), 16000, mono=True)
audio_v = np.array(audio[1])
# audio_v = audio
time, frequency, confidence, activation = crepe.predict(audio_v, sr, viterbi=True, step_size=10)
df_p = pd.DataFrame(columns=['times', 'freqs', 'confi', 'cent', 'midi'])
df_p['times'] = time
df_p['freqs'] = frequency
df_p['confi'] = confidence
est_f = frequency[1:-1]
ref = []
with open(os.path.join(label_file, file.replace('.wav', '.pv')), 'r') as f:
lines = f.readlines()
for line in lines:
ref.append(line)
ref = np.array(ref).astype(float)
ref_f = np.power(2, (ref-69)/12)*440
assert len(est_f) == len(ref_f)
ref_v, ref_c, est_v, est_c = to_cent_voicing(time[1:-1], ref_f, time[1:-1], est_f)
vr, vfa = voicing_measures(ref_v, est_v)
rpa = raw_pitch_accuracy(ref_v, ref_c, est_v, est_c)
rpa_list.append(rpa)
vr_list.append(vr)
vfa_list.append(vfa)
print(len(rpa_list), '\t', rpa, '\t', vr, '\t', vfa)
{"train": {"0": "amy_11_01.wav", "1": "davidson_1_09.wav", "2": "leon_1_07.wav", "3": "davidson_3_14.wav", "4": "yifen_3_06.wav", "5": "leon_1_09.wav", "6": "davidson_2_01.wav", "7": "davidson_2_09.wav", "8": "leon_5_10.wav", "9": "leon_8_12.wav", "10": "geniusturtle_7_02.wav", "11": "amy_4_02.wav", "12": "jmzen_1_01.wav", "13": "amy_4_09.wav", "14": "bug_5_01.wav", "15": "amy_14_05.wav", "16": "bug_5_11.wav", "17": "fdps_2_07.wav", "18": "khair_2_02.wav", "19": "annar_3_02.wav", "20": "Kenshin_3_06.wav", "21": "yifen_1_15.wav", "22": "leon_5_07.wav", "23": "amy_12_02.wav", "24": "bug_3_06.wav", "25": "geniusturtle_3_01.wav", "26": "tammy_1_03.wav", "27": "yifen_1_06.wav", "28": "davidson_3_04.wav", "29": "leon_5_01.wav", "30": "titon_2_09.wav", "31": "davidson_3_11.wav", "32": "amy_6_06.wav", "33": "stool_3_01.wav", "34": "bobon_2_07.wav", "35": "amy_11_05.wav", "36": "khair_1_07.wav", "37": "leon_8_08.wav", "38": "khair_6_04.wav", "39": "leon_2_03.wav", "40": "fdps_2_02.wav", "41": "Kenshin_3_08.wav", "42": "Kenshin_1_10.wav", "43": "amy_16_03.wav", "44": "annar_5_05.wav", "45": "davidson_5_11.wav", "46": "amy_9_01.wav", "47": "heycat_2_01.wav", "48": "ariel_4_02.wav", "49": "tammy_1_08.wav", "50": "amy_13_04.wav", "51": "amy_11_04.wav", "52": "yifen_2_02.wav", "53": "fdps_1_06.wav", "54": "leon_4_02.wav", "55": "Kenshin_2_06.wav", "56": "amy_10_08.wav", "57": "Kenshin_2_02.wav", "58": "khair_5_01.wav", "59": "Kenshin_3_07.wav", "60": "abjones_5_06.wav", "61": "leon_1_10.wav", "62": "leon_7_04.wav", "63": "abjones_2_04.wav", "64": "bobon_1_08.wav", "65": "leon_6_04.wav", "66": "Ani_5_01.wav", "67": "Kenshin_4_07.wav", "68": "ariel_5_05.wav", "69": "annar_3_05.wav", "70": "tammy_1_05.wav", "71": "leon_6_01.wav", "72": "yifen_5_10.wav", "73": "geniusturtle_3_08.wav", "74": "khair_4_02.wav", "75": "titon_2_08.wav", "76": "bobon_4_05.wav", "77": "bug_4_03.wav", "78": "bug_5_14.wav", "79": "yifen_5_05.wav", "80": "abjones_5_08.wav", "81": "amy_8_05.wav", "82": "amy_4_05.wav", "83": "ariel_2_05.wav", "84": "bobon_2_05.wav", "85": "amy_13_03.wav", "86": "stool_5_07.wav", "87": "yifen_4_05.wav", "88": "leon_1_03.wav", "89": "ariel_1_05.wav", "90": "fdps_1_07.wav", "91": "davidson_4_01.wav", "92": "heycat_3_06.wav", "93": "leon_5_08.wav", "94": "Ani_5_03.wav", "95": "fdps_2_03.wav", "96": "leon_1_11.wav", "97": "Kenshin_1_07.wav", "98": "Kenshin_5_07.wav", "99": "stool_2_01.wav", "100": "geniusturtle_2_07.wav", "101": "heycat_4_03.wav", "102": "titon_1_05.wav", "103": "Ani_4_01.wav", "104": "bobon_4_03.wav", "105": "leon_6_08.wav", "106": "fdps_5_03.wav", "107": "titon_2_01.wav", "108": "titon_4_07.wav", "109": "Kenshin_1_09.wav", "110": "amy_7_07.wav", "111": "ariel_3_05.wav", "112": "annar_5_07.wav", "113": "leon_5_02.wav", "114": "abjones_2_12.wav", "115": "khair_6_06.wav", "116": "abjones_3_06.wav", "117": "bug_2_06.wav", "118": "khair_2_03.wav", "119": "yifen_1_10.wav", "120": "leon_3_09.wav", "121": "amy_7_04.wav", "122": "davidson_3_02.wav", "123": "heycat_4_09.wav", "124": "stool_5_02.wav", "125": "khair_2_04.wav", "126": "yifen_5_06.wav", "127": "amy_2_05.wav", "128": "Ani_5_07.wav", "129": "leon_8_07.wav", "130": "geniusturtle_7_06.wav", "131": "annar_4_02.wav", "132": "titon_5_03.wav", "133": "heycat_1_07.wav", "134": "geniusturtle_1_03.wav", "135": "heycat_3_03.wav", "136": "leon_2_08.wav", "137": "amy_13_07.wav", "138": "leon_4_03.wav", "139": "amy_4_08.wav", "140": "davidson_1_08.wav", "141": "annar_5_06.wav", "142": "Ani_5_04.wav", "143": "abjones_3_11.wav", "144": "heycat_3_04.wav", "145": "jmzen_2_09.wav", "146": "ariel_5_07.wav", "147": "davidson_1_01.wav", "148": "ariel_2_02.wav", "149": "stool_4_06.wav", "150": "yifen_2_04.wav", "151": "khair_2_01.wav", "152": "Ani_3_04.wav", "153": "yifen_1_14.wav", "154": "khair_2_05.wav", "155": "ariel_1_06.wav", "156": "heycat_5_08.wav", "157": "ariel_2_09.wav", "158": "Kenshin_2_07.wav", "159": "leon_3_06.wav", "160": "geniusturtle_6_01.wav", "161": "abjones_3_10.wav", "162": "geniusturtle_3_05.wav", "163": "bug_5_10.wav", "164": "Ani_1_06.wav", "165": "amy_12_07.wav", "166": "abjones_2_09.wav", "167": "heycat_2_05.wav", "168": "jmzen_4_05.wav", "169": "bug_4_01.wav", "170": "fdps_5_06.wav", "171": "amy_14_02.wav", "172": "jmzen_4_01.wav", "173": "bobon_1_07.wav", "174": "leon_9_06.wav", "175": "khair_1_03.wav", "176": "leon_5_04.wav", "177": "amy_2_04.wav", "178": "amy_8_04.wav", "179": "fdps_2_08.wav", "180": "abjones_2_11.wav", "181": "Ani_3_05.wav", "182": "titon_5_09.wav", "183": "Kenshin_2_03.wav", "184": "yifen_3_01.wav", "185": "jmzen_4_02.wav", "186": "geniusturtle_4_04.wav", "187": "amy_8_06.wav", "188": "Kenshin_5_02.wav", "189": "bobon_3_08.wav", "190": "jmzen_1_07.wav", "191": "Kenshin_2_05.wav", "192": "geniusturtle_6_03.wav", "193": "Ani_3_02.wav", "194": "titon_3_01.wav", "195": "geniusturtle_4_10.wav", "196": "bobon_4_07.wav", "197": "amy_3_04.wav", "198": "khair_5_07.wav", "199": "titon_4_01.wav", "200": "leon_2_01.wav", "201": "titon_1_03.wav", "202": "amy_6_02.wav", "203": "heycat_1_02.wav", "204": "Kenshin_1_04.wav", "205": "stool_1_03.wav", "206": "jmzen_3_02.wav", "207": "stool_1_01.wav", "208": "leon_7_03.wav", "209": "abjones_3_14.wav", "210": "leon_9_04.wav", "211": "bobon_4_08.wav", "212": "jmzen_4_10.wav", "213": "Ani_1_05.wav", "214": "bug_3_08.wav", "215": "titon_4_09.wav", "216": "annar_3_06.wav", "217": "bug_3_05.wav", "218": "amy_7_03.wav", "219": "geniusturtle_6_07.wav", "220": "Ani_4_09.wav", "221": "Ani_5_06.wav", "222": "geniusturtle_2_01.wav", "223": "amy_2_03.wav", "224": "khair_3_06.wav", "225": "jmzen_2_06.wav", "226": "amy_7_01.wav", "227": "heycat_4_02.wav", "228": "geniusturtle_1_06.wav", "229": "leon_7_02.wav", "230": "khair_5_06.wav", "231": "bobon_5_06.wav", "232": "fdps_1_05.wav", "233": "annar_5_03.wav", "234": "yifen_4_02.wav", "235": "jmzen_5_01.wav", "236": "geniusturtle_4_12.wav", "237": "geniusturtle_7_05.wav", "238": "amy_9_07.wav", "239": "davidson_5_01.wav", "240": "davidson_5_05.wav", "241": "leon_2_07.wav", "242": "bobon_5_05.wav", "243": "fdps_2_05.wav", "244": "davidson_2_03.wav", "245": "annar_1_05.wav", "246": "Kenshin_1_08.wav", "247": "stool_3_09.wav", "248": "khair_3_03.wav", "249": "jmzen_3_01.wav", "250": "Ani_1_01.wav", "251": "fdps_3_05.wav", "252": "fdps_5_04.wav", "253": "annar_2_07.wav", "254": "jmzen_1_09.wav", "255": "Kenshin_2_04.wav", "256": "amy_1_07.wav", "257": "Ani_2_07.wav", "258": "leon_9_05.wav", "259": "bug_5_07.wav", "260": "titon_4_08.wav", "261": "heycat_5_06.wav", "262": "leon_1_08.wav", "263": "stool_1_05.wav", "264": "yifen_2_13.wav", "265": "bug_2_08.wav", "266": "Ani_1_07.wav", "267": "geniusturtle_3_03.wav", "268": "heycat_1_03.wav", "269": "geniusturtle_8_05.wav", "270": "fdps_4_04.wav", "271": "jmzen_3_09.wav", "272": "leon_4_06.wav", "273": "geniusturtle_8_08.wav", "274": "amy_6_09.wav", "275": "bobon_3_06.wav", "276": "jmzen_2_07.wav", "277": "davidson_1_06.wav", "278": "heycat_2_07.wav", "279": "Kenshin_5_05.wav", "280": "amy_1_01.wav", "281": "amy_7_02.wav", "282": "heycat_3_08.wav", "283": "Ani_2_04.wav", "284": "davidson_2_08.wav", "285": "Kenshin_3_03.wav", "286": "amy_15_03.wav", "287": "amy_13_02.wav", "288": "leon_2_09.wav", "289": "geniusturtle_8_02.wav", "290": "stool_4_09.wav", "291": "bug_1_09.wav", "292": "leon_5_03.wav", "293": "khair_3_05.wav", "294": "leon_2_04.wav", "295": "ariel_4_03.wav", "296": "leon_8_10.wav", "297": "yifen_3_03.wav", "298": "jmzen_2_11.wav", "299": "Ani_5_05.wav", "300": "davidson_5_08.wav", "301": "davidson_5_09.wav", "302": "ariel_5_06.wav", "303": "leon_3_04.wav", "304": "ariel_4_04.wav", "305": "bug_3_02.wav", "306": "titon_4_11.wav", "307": "yifen_3_08.wav", "308": "yifen_2_12.wav", "309": "Kenshin_4_06.wav", "310": "geniusturtle_7_14.wav", "311": "Kenshin_4_01.wav", "312": "amy_8_02.wav", "313": "yifen_1_11.wav", "314": "annar_1_07.wav", "315": "yifen_5_04.wav", "316": "geniusturtle_1_07.wav", "317": "ariel_5_04.wav", "318": "leon_9_02.wav", "319": "titon_1_04.wav", "320": "ariel_4_05.wav", "321": "ariel_4_01.wav", "322": "Kenshin_5_12.wav", "323": "leon_5_06.wav", "324": "davidson_1_10.wav", "325": "amy_7_08.wav", "326": "amy_5_01.wav", "327": "Ani_2_02.wav", "328": "fdps_4_03.wav", "329": "bobon_5_03.wav", "330": "bug_5_05.wav", "331": "jmzen_2_10.wav", "332": "Ani_3_06.wav", "333": "geniusturtle_3_04.wav", "334": "amy_2_07.wav", "335": "khair_4_08.wav", "336": "amy_15_08.wav", "337": "amy_10_01.wav", "338": "abjones_5_05.wav", "339": "davidson_3_03.wav", "340": "davidson_2_02.wav", "341": "jmzen_5_08.wav", "342": "titon_3_05.wav", "343": "leon_8_03.wav", "344": "Kenshin_5_13.wav", "345": "bug_5_09.wav", "346": "Kenshin_3_02.wav", "347": "khair_1_04.wav", "348": "jmzen_5_04.wav", "349": "stool_3_06.wav", "350": "yifen_5_03.wav", "351": "khair_6_05.wav", "352": "amy_10_04.wav", "353": "ariel_2_04.wav", "354": "yifen_2_11.wav", "355": "leon_4_04.wav", "356": "yifen_1_12.wav", "357": "leon_7_06.wav", "358": "davidson_5_10.wav", "359": "tammy_1_06.wav", "360": "annar_2_03.wav", "361": "amy_5_05.wav", "362": "geniusturtle_7_01.wav", "363": "yifen_5_08.wav", "364": "stool_1_09.wav", "365": "abjones_2_07.wav", "366": "bobon_5_11.wav", "367": "fdps_2_06.wav", "368": "bug_5_04.wav", "369": "jmzen_2_02.wav", "370": "annar_4_04.wav", "371": "davidson_5_04.wav", "372": "amy_15_09.wav", "373": "geniusturtle_1_01.wav", "374": "geniusturtle_4_09.wav", "375": "khair_6_03.wav", "376": "jmzen_1_08.wav", "377": "leon_2_05.wav", "378": "amy_12_06.wav", "379": "jmzen_5_09.wav", "380": "bug_2_04.wav", "381": "jmzen_1_05.wav", "382": "amy_4_01.wav", "383": "heycat_4_01.wav", "384": "titon_5_01.wav", "385": "jmzen_4_06.wav", "386": "amy_3_02.wav", "387": "amy_5_08.wav", "388": "yifen_5_01.wav", "389": "abjones_2_06.wav", "390": "titon_5_08.wav", "391": "abjones_4_01.wav", "392": "geniusturtle_5_04.wav", "393": "amy_4_07.wav", "394": "abjones_4_07.wav", "395": "yifen_1_01.wav", "396": "Ani_4_03.wav", "397": "leon_5_11.wav", "398": "Kenshin_1_11.wav", "399": "abjones_5_01.wav", "400": "geniusturtle_5_02.wav", "401": "leon_7_01.wav", "402": "amy_6_10.wav", "403": "Kenshin_1_06.wav", "404": "fdps_2_09.wav", "405": "titon_3_08.wav", "406": "geniusturtle_2_05.wav", "407": "heycat_4_07.wav", "408": "amy_2_06.wav", "409": "abjones_2_02.wav", "410": "stool_1_02.wav", "411": "heycat_4_05.wav", "412": "titon_4_10.wav", "413": "tammy_1_07.wav", "414": "amy_14_01.wav", "415": "geniusturtle_4_02.wav", "416": "yifen_1_07.wav", "417": "leon_1_01.wav", "418": "khair_5_04.wav", "419": "amy_5_03.wav", "420": "geniusturtle_7_12.wav", "421": "geniusturtle_2_06.wav", "422": "titon_2_04.wav", "423": "khair_1_05.wav", "424": "jmzen_3_10.wav", "425": "annar_2_01.wav", "426": "Kenshin_3_04.wav", "427": "amy_15_07.wav", "428": "davidson_3_01.wav", "429": "Kenshin_1_05.wav", "430": "bobon_2_02.wav", "431": "leon_3_03.wav", "432": "jmzen_5_03.wav", "433": "fdps_5_07.wav", "434": "titon_4_06.wav", "435": "bobon_4_01.wav", "436": "titon_2_06.wav", "437": "abjones_2_01.wav", "438": "fdps_1_11.wav", "439": "Ani_4_05.wav", "440": "khair_4_01.wav", "441": "tammy_1_04.wav", "442": "yifen_2_03.wav", "443": "Kenshin_2_11.wav", "444": "titon_5_04.wav", "445": "amy_13_01.wav", "446": "jmzen_4_03.wav", "447": "ariel_5_02.wav", "448": "bug_5_12.wav", "449": "amy_15_04.wav", "450": "abjones_5_03.wav", "451": "annar_5_08.wav", "452": "davidson_5_02.wav", "453": "yifen_4_01.wav", "454": "amy_8_07.wav", "455": "davidson_4_07.wav", "456": "abjones_4_03.wav", "457": "amy_6_03.wav", "458": "annar_4_03.wav", "459": "amy_5_04.wav", "460": "abjones_5_02.wav", "461": "yifen_3_12.wav", "462": "stool_1_08.wav", "463": "geniusturtle_7_03.wav", "464": "fdps_1_14.wav", "465": "amy_6_07.wav", "466": "fdps_4_02.wav", "467": "stool_3_05.wav", "468": "ariel_2_08.wav", "469": "jmzen_3_04.wav", "470": "yifen_5_07.wav", "471": "amy_15_13.wav", "472": "leon_7_07.wav", "473": "davidson_2_10.wav", "474": "geniusturtle_3_07.wav", "475": "fdps_4_06.wav", "476": "fdps_5_09.wav", "477": "khair_1_02.wav", "478": "leon_8_09.wav", "479": "ariel_5_08.wav", "480": "amy_15_02.wav", "481": "davidson_2_07.wav", "482": "abjones_4_02.wav", "483": "Kenshin_3_05.wav", "484": "leon_2_11.wav", "485": "bobon_5_10.wav", "486": "amy_1_04.wav", "487": "yifen_5_02.wav", "488": "yifen_3_04.wav", "489": "Kenshin_4_09.wav", "490": "amy_16_01.wav", "491": "tammy_1_01.wav", "492": "jmzen_3_03.wav", "493": "bug_3_09.wav", "494": "bobon_5_01.wav", "495": "amy_6_04.wav", "496": "amy_4_10.wav", "497": "geniusturtle_6_05.wav", "498": "khair_6_01.wav", "499": "annar_1_04.wav", "500": "abjones_4_06.wav", "501": "fdps_1_13.wav", "502": "bobon_4_06.wav", "503": "stool_2_02.wav", "504": "jmzen_4_08.wav", "505": "annar_3_08.wav", "506": "amy_15_01.wav", "507": "fdps_1_12.wav", "508": "yifen_1_03.wav", "509": "geniusturtle_6_02.wav", "510": "amy_16_05.wav", "511": "bug_5_06.wav", "512": "amy_11_06.wav", "513": "annar_2_04.wav", "514": "yifen_4_10.wav", "515": "jmzen_1_10.wav", "516": "ariel_1_02.wav", "517": "davidson_1_04.wav", "518": "amy_1_06.wav", "519": "leon_8_02.wav", "520": "davidson_2_05.wav", "521": "yifen_4_03.wav", "522": "stool_5_03.wav", "523": "leon_3_01.wav", "524": "titon_4_03.wav", "525": "titon_2_05.wav", "526": "fdps_3_01.wav", "527": "Ani_3_03.wav", "528": "Kenshin_2_10.wav", "529": "amy_6_01.wav", "530": "geniusturtle_8_04.wav", "531": "yifen_4_09.wav", "532": "ariel_5_01.wav", "533": "heycat_2_04.wav", "534": "heycat_3_02.wav", "535": "yifen_1_02.wav", "536": "stool_5_08.wav", "537": "leon_4_07.wav", "538": "amy_4_06.wav", "539": "yifen_4_08.wav", "540": "abjones_2_03.wav", "541": "bobon_5_02.wav", "542": "yifen_3_07.wav", "543": "annar_5_09.wav", "544": "leon_8_05.wav", "545": "heycat_1_04.wav", "546": "titon_3_03.wav", "547": "yifen_2_06.wav", "548": "khair_6_02.wav", "549": "Kenshin_4_11.wav", "550": "leon_1_06.wav", "551": "amy_16_04.wav", "552": "yifen_5_09.wav", "553": "amy_6_05.wav", "554": "ariel_3_02.wav", "555": "amy_14_06.wav", "556": "titon_5_05.wav", "557": "Ani_3_01.wav", "558": "leon_6_09.wav", "559": "amy_9_05.wav", "560": "amy_10_02.wav", "561": "jmzen_2_04.wav", "562": "Ani_2_03.wav", "563": "abjones_3_12.wav", "564": "khair_1_01.wav", "565": "Ani_4_07.wav", "566": "amy_15_11.wav", "567": "ariel_3_04.wav", "568": "Ani_4_08.wav", "569": "jmzen_1_03.wav", "570": "annar_5_04.wav", "571": "davidson_1_07.wav", "572": "geniusturtle_1_09.wav", "573": "bobon_5_12.wav", "574": "davidson_4_04.wav", "575": "khair_2_07.wav", "576": "annar_4_05.wav", "577": "leon_4_01.wav", "578": "davidson_3_06.wav", "579": "geniusturtle_4_03.wav", "580": "fdps_1_01.wav", "581": "fdps_1_09.wav", "582": "titon_1_06.wav", "583": "geniusturtle_8_06.wav", "584": "Kenshin_4_10.wav", "585": "yifen_3_10.wav", "586": "davidson_3_12.wav", "587": "Kenshin_1_03.wav", "588": "khair_4_07.wav", "589": "yifen_5_11.wav", "590": "stool_3_07.wav", "591": "bug_3_03.wav", "592": "amy_13_05.wav", "593": "bug_3_07.wav", "594": "khair_3_01.wav", "595": "leon_7_13.wav", "596": "titon_4_05.wav", "597": "khair_3_02.wav", "598": "Ani_4_06.wav", "599": "stool_5_04.wav", "600": "annar_4_08.wav", "601": "fdps_4_05.wav", "602": "heycat_3_07.wav", "603": "Kenshin_5_08.wav", "604": "yifen_2_05.wav", "605": "titon_5_07.wav", "606": "bobon_2_06.wav", "607": "amy_16_07.wav", "608": "leon_7_11.wav", "609": "amy_11_07.wav", "610": "abjones_3_09.wav", "611": "heycat_4_04.wav", "612": "amy_2_01.wav", "613": "heycat_5_05.wav", "614": "geniusturtle_7_15.wav", "615": "Kenshin_4_08.wav", "616": "bobon_5_08.wav", "617": "ariel_4_06.wav", "618": "amy_15_12.wav", "619": "Kenshin_1_02.wav", "620": "leon_5_05.wav", "621": "amy_9_09.wav", "622": "leon_1_04.wav", "623": "heycat_1_05.wav", "624": "davidson_3_09.wav", "625": "amy_10_03.wav", "626": "leon_6_05.wav", "627": "geniusturtle_1_04.wav", "628": "ariel_3_06.wav", "629": "annar_4_01.wav", "630": "stool_1_07.wav", "631": "geniusturtle_4_07.wav", "632": "amy_5_02.wav", "633": "leon_3_05.wav", "634": "heycat_1_08.wav", "635": "ariel_3_03.wav", "636": "bobon_1_09.wav", "637": "amy_12_03.wav", "638": "ariel_2_03.wav", "639": "khair_6_07.wav", "640": "geniusturtle_6_04.wav", "641": "stool_2_07.wav", "642": "stool_2_04.wav", "643": "fdps_3_02.wav", "644": "amy_4_11.wav", "645": "abjones_3_03.wav", "646": "yifen_2_10.wav", "647": "fdps_3_06.wav", "648": "davidson_4_06.wav", "649": "yifen_1_16.wav", "650": "titon_2_07.wav", "651": "geniusturtle_2_08.wav", "652": "geniusturtle_4_05.wav", "653": "bobon_3_09.wav", "654": "leon_8_01.wav", "655": "ariel_2_06.wav", "656": "geniusturtle_4_08.wav", "657": "davidson_1_02.wav", "658": "bug_5_08.wav", "659": "geniusturtle_8_01.wav", "660": "bobon_3_04.wav", "661": "bobon_4_02.wav", "662": "amy_11_03.wav", "663": "ariel_5_03.wav", "664": "heycat_5_01.wav", "665": "abjones_2_08.wav", "666": "jmzen_3_07.wav", "667": "leon_6_02.wav", "668": "Kenshin_1_01.wav", "669": "bobon_3_02.wav", "670": "leon_2_10.wav", "671": "annar_3_03.wav", "672": "davidson_1_03.wav", "673": "abjones_1_03.wav", "674": "geniusturtle_7_04.wav", "675": "davidson_4_03.wav", "676": "Ani_1_04.wav", "677": "geniusturtle_7_11.wav", "678": "leon_7_10.wav", "679": "leon_3_08.wav", "680": "heycat_2_06.wav", "681": "fdps_2_11.wav", "682": "jmzen_3_08.wav", "683": "leon_4_08.wav", "684": "khair_1_08.wav", "685": "bobon_1_10.wav", "686": "ariel_3_08.wav", "687": "abjones_3_01.wav", "688": "fdps_5_05.wav", "689": "leon_2_06.wav", "690": "amy_6_11.wav", "691": "heycat_4_08.wav", "692": "davidson_3_05.wav", "693": "amy_4_03.wav", "694": "tammy_1_02.wav", "695": "bug_2_02.wav", "696": "Kenshin_5_06.wav", "697": "bug_2_03.wav", "698": "ariel_1_03.wav", "699": "geniusturtle_2_02.wav", "700": "amy_8_01.wav", "701": "khair_4_06.wav", "702": "jmzen_3_11.wav", "703": "geniusturtle_8_03.wav", "704": "yifen_4_11.wav", "705": "davidson_2_06.wav", "706": "geniusturtle_8_07.wav", "707": "Ani_4_10.wav", "708": "annar_3_07.wav", "709": "stool_4_08.wav", "710": "stool_3_04.wav", "711": "yifen_3_11.wav", "712": "amy_16_02.wav", "713": "abjones_3_04.wav", "714": "geniusturtle_7_08.wav", "715": "stool_4_10.wav", "716": "Kenshin_2_01.wav", "717": "ariel_4_08.wav", "718": "bobon_2_08.wav", "719": "stool_5_01.wav", "720": "fdps_3_03.wav", "721": "stool_4_05.wav", "722": "fdps_4_01.wav", "723": "annar_5_02.wav", "724": "leon_6_03.wav", "725": "leon_3_10.wav", "726": "davidson_4_05.wav", "727": "jmzen_1_04.wav", "728": "heycat_5_07.wav", "729": "amy_1_02.wav", "730": "abjones_2_10.wav", "731": "khair_3_07.wav", "732": "annar_2_06.wav", "733": "amy_9_08.wav", "734": "bobon_1_05.wav", "735": "leon_1_02.wav", "736": "ariel_1_07.wav", "737": "davidson_3_08.wav", "738": "Ani_4_04.wav", "739": "bug_1_07.wav", "740": "geniusturtle_7_09.wav", "741": "davidson_3_07.wav", "742": "geniusturtle_3_02.wav", "743": "jmzen_1_12.wav", "744": "leon_3_07.wav", "745": "leon_4_05.wav", "746": "geniusturtle_4_01.wav", "747": "yifen_2_01.wav", "748": "davidson_5_03.wav", "749": "davidson_4_02.wav", "750": "yifen_1_09.wav", "751": "jmzen_4_04.wav", "752": "amy_12_01.wav", "753": "yifen_1_05.wav", "754": "geniusturtle_5_03.wav", "755": "bug_4_02.wav", "756": "leon_5_12.wav", "757": "amy_14_03.wav", "758": "jmzen_5_06.wav", "759": "khair_4_03.wav", "760": "bobon_5_09.wav", "761": "titon_3_04.wav", "762": "bobon_2_01.wav", "763": "bobon_3_07.wav", "764": "ariel_2_01.wav", "765": "stool_1_04.wav", "766": "heycat_3_01.wav", "767": "amy_3_08.wav", "768": "titon_1_07.wav", "769": "jmzen_5_07.wav", "770": "heycat_1_06.wav", "771": "heycat_1_01.wav", "772": "bobon_1_06.wav", "773": "Ani_2_06.wav", "774": "stool_1_06.wav", "775": "annar_2_05.wav", "776": "stool_4_03.wav", "777": "amy_4_04.wav", "778": "amy_14_04.wav", "779": "stool_4_02.wav", "780": "khair_5_03.wav", "781": "annar_4_07.wav", "782": "amy_7_06.wav", "783": "leon_3_12.wav", "784": "bobon_3_05.wav", "785": "khair_3_04.wav", "786": "geniusturtle_7_13.wav", "787": "fdps_5_08.wav", "788": "leon_5_09.wav", "789": "Ani_4_02.wav", "790": "jmzen_1_11.wav", "791": "bug_3_01.wav", "792": "Kenshin_4_05.wav", "793": "davidson_3_13.wav", "794": "geniusturtle_7_10.wav", "795": "bobon_4_09.wav", "796": "abjones_4_04.wav", "797": "Kenshin_5_09.wav", "798": "bobon_2_04.wav", "799": "ariel_4_07.wav"}, "test": {"0": "heycat_5_02.wav", "1": "stool_4_04.wav", "2": "bobon_1_02.wav", "3": "geniusturtle_6_06.wav", "4": "abjones_3_02.wav", "5": "bobon_1_01.wav", "6": "bobon_2_03.wav", "7": "davidson_2_04.wav", "8": "amy_9_04.wav", "9": "amy_8_08.wav", "10": "bug_2_07.wav", "11": "fdps_1_08.wav", "12": "abjones_4_05.wav", "13": "stool_2_08.wav", "14": "leon_3_02.wav", "15": "abjones_2_05.wav", "16": "amy_12_04.wav", "17": "Kenshin_5_01.wav", "18": "yifen_3_05.wav", "19": "fdps_1_10.wav", "20": "stool_2_06.wav", "21": "jmzen_1_02.wav", "22": "leon_7_09.wav", "23": "titon_2_02.wav", "24": "amy_2_02.wav", "25": "Kenshin_3_01.wav", "26": "jmzen_2_12.wav", "27": "bug_2_01.wav", "28": "leon_2_02.wav", "29": "Kenshin_5_04.wav", "30": "leon_8_06.wav", "31": "abjones_5_07.wav", "32": "leon_6_07.wav", "33": "stool_4_01.wav", "34": "heycat_4_06.wav", "35": "Kenshin_4_04.wav", "36": "fdps_3_04.wav", "37": "fdps_2_04.wav", "38": "amy_1_03.wav", "39": "khair_4_05.wav", "40": "leon_9_01.wav", "41": "yifen_2_07.wav", "42": "amy_7_05.wav", "43": "abjones_5_04.wav", "44": "leon_7_08.wav", "45": "yifen_3_09.wav", "46": "geniusturtle_1_02.wav", "47": "geniusturtle_4_11.wav", "48": "bobon_1_04.wav", "49": "yifen_2_09.wav", "50": "leon_6_06.wav", "51": "stool_5_05.wav", "52": "jmzen_5_02.wav", "53": "amy_15_06.wav", "54": "Ani_5_08.wav", "55": "amy_3_05.wav", "56": "jmzen_5_05.wav", "57": "bobon_3_01.wav", "58": "yifen_2_15.wav", "59": "ariel_1_04.wav", "60": "stool_2_05.wav", "61": "amy_3_07.wav", "62": "yifen_3_02.wav", "63": "bobon_3_10.wav", "64": "khair_5_05.wav", "65": "amy_5_06.wav", "66": "leon_8_13.wav", "67": "titon_5_02.wav", "68": "khair_4_04.wav", "69": "leon_8_11.wav", "70": "titon_1_08.wav", "71": "ariel_2_07.wav", "72": "titon_2_03.wav", "73": "fdps_2_01.wav", "74": "jmzen_4_07.wav", "75": "Kenshin_4_03.wav", "76": "geniusturtle_5_01.wav", "77": "yifen_1_13.wav", "78": "annar_5_01.wav", "79": "amy_13_06.wav", "80": "Ani_2_01.wav", "81": "stool_3_10.wav", "82": "annar_4_09.wav", "83": "bug_5_02.wav", "84": "yifen_4_04.wav", "85": "annar_1_03.wav", "86": "amy_5_07.wav", "87": "yifen_2_14.wav", "88": "titon_1_01.wav", "89": "Ani_2_05.wav", "90": "titon_5_06.wav", "91": "heycat_3_05.wav", "92": "Kenshin_5_11.wav", "93": "amy_6_08.wav", "94": "amy_16_08.wav", "95": "leon_7_12.wav", "96": "amy_9_06.wav", "97": "heycat_2_02.wav", "98": "ariel_3_01.wav", "99": "amy_11_02.wav", "100": "fdps_1_02.wav", "101": "amy_3_06.wav", "102": "bobon_3_03.wav", "103": "khair_5_02.wav", "104": "jmzen_2_03.wav", "105": "abjones_1_02.wav", "106": "ariel_3_07.wav", "107": "titon_3_02.wav", "108": "heycat_5_04.wav", "109": "davidson_1_05.wav", "110": "yifen_4_06.wav", "111": "Ani_1_03.wav", "112": "bug_1_08.wav", "113": "leon_9_03.wav", "114": "geniusturtle_3_06.wav", "115": "bobon_5_07.wav", "116": "annar_3_04.wav", "117": "bobon_1_03.wav", "118": "jmzen_4_09.wav", "119": "leon_7_05.wav", "120": "fdps_5_02.wav", "121": "bobon_5_04.wav", "122": "amy_15_05.wav", "123": "geniusturtle_4_06.wav", "124": "Kenshin_5_10.wav", "125": "titon_3_07.wav", "126": "jmzen_2_01.wav", "127": "khair_2_06.wav", "128": "fdps_1_03.wav", "129": "stool_3_02.wav", "130": "amy_9_03.wav", "131": "bug_5_13.wav", "132": "annar_1_06.wav", "133": "annar_1_01.wav", "134": "titon_4_02.wav", "135": "heycat_5_03.wav", "136": "stool_5_06.wav", "137": "abjones_1_04.wav", "138": "yifen_1_04.wav", "139": "leon_8_04.wav", "140": "amy_3_01.wav", "141": "titon_4_04.wav", "142": "heycat_2_03.wav", "143": "geniusturtle_1_05.wav", "144": "amy_9_02.wav", "145": "amy_10_07.wav", "146": "bobon_4_10.wav", "147": "bug_2_05.wav", "148": "yifen_4_07.wav", "149": "davidson_3_10.wav", "150": "amy_10_05.wav", "151": "geniusturtle_1_08.wav", "152": "fdps_5_01.wav", "153": "jmzen_3_05.wav", "154": "fdps_2_10.wav", "155": "abjones_4_08.wav", "156": "Ani_5_02.wav", "157": "titon_1_02.wav", "158": "stool_2_03.wav", "159": "annar_4_06.wav", "160": "titon_3_06.wav", "161": "geniusturtle_7_07.wav", "162": "fdps_2_12.wav", "163": "annar_2_02.wav", "164": "Kenshin_4_02.wav", "165": "amy_10_06.wav", "166": "leon_1_05.wav", "167": "bobon_4_04.wav", "168": "jmzen_3_06.wav", "169": "stool_3_03.wav", "170": "annar_1_02.wav", "171": "fdps_1_04.wav", "172": "Ani_1_02.wav", "173": "amy_12_05.wav", "174": "stool_3_08.wav", "175": "yifen_1_08.wav", "176": "khair_1_06.wav", "177": "abjones_5_09.wav", "178": "bug_5_03.wav", "179": "bug_1_10.wav", "180": "amy_3_03.wav", "181": "annar_2_08.wav", "182": "jmzen_2_08.wav", "183": "leon_1_12.wav", "184": "davidson_5_07.wav", "185": "stool_4_07.wav", "186": "ariel_1_01.wav", "187": "abjones_1_01.wav", "188": "leon_3_13.wav", "189": "amy_8_03.wav", "190": "annar_1_08.wav", "191": "yifen_2_08.wav", "192": "davidson_5_06.wav", "193": "fdps_3_07.wav", "194": "leon_3_11.wav", "195": "annar_3_01.wav", "196": "bug_3_04.wav", "197": "amy_1_05.wav", "198": "Kenshin_5_03.wav", "199": "amy_16_06.wav"}}
Recently, I evaluate crepe on MIR-1K dataset using the open model. The step_size=20, corresponding to MIR-1K label. And transfer MIR-1K pitch label to frequency using f = np.power(2, (m-69)/12)*440. However, the performance is not very well. Is there something bug in my code.