diff --git a/annotations_filtered/g-2hB5Kd5aM_filtered.json b/annotations_filtered/g-2hB5Kd5aM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d99216720907ffee9f680504c368f15de931c4b9 --- /dev/null +++ b/annotations_filtered/g-2hB5Kd5aM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 11.01], [15.0, 24.98], [29.0, 32.04], [34.0, 35.07], [35.0, 36.36], [39.0, 46.18], [48.0, 52.66], [54.0, 54.68], [56.0, 64.3], [71.0, 107.16], [110.0, 110.51], [112.0, 116.24]], "keep_status": [true, false, false, false, false, true, true, false, false, false, false, false], "silence_prob": [30.36, 32.15, 34.63, 0.0, 0.0, 31.23, 30.74, 0.0, 30.0, 0.0, 0.0, 94.52], "audiomae_on_audioset": [[["music", 17.07], ["synthesizer", 15.61], ["distortion", 13.93]], [["sidetone", 42.31], ["speech", 29.62], ["hum", 6.64]], [["music", 88.73], ["electronic music", 1.39], ["techno", 1.35]], null, null, [["synthesizer", 33.37], ["music", 12.68], ["noise", 10.48]], [["music", 46.83], ["noise", 13.69], ["synthesizer", 9.47]], null, [["speech", 64.72], ["music", 11.57], ["sidetone", 4.79]], null, null, null], "duration": [5.01, 9.98, 3.04, 1.07, 1.36, 7.18, 4.66, 0.68, 8.3, 36.16, 0.51, 4.24]} \ No newline at end of file diff --git a/annotations_filtered/g-GJDgd7D8k_filtered.json b/annotations_filtered/g-GJDgd7D8k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..071106c16374f27f13e339c9f00c6bab6db9d03d --- /dev/null +++ b/annotations_filtered/g-GJDgd7D8k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 15.62], [17.0, 20.14], [23.0, 24.68], [27.0, 27.51], [30.0, 31.53], [33.0, 34.1], [37.0, 57.64], [58.0, 69.25], [70.0, 101.07], [105.0, 105.85], [109.0, 108.84], [115.0, 121.54], [126.0, 127.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 99.99, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.62, 3.14, 1.68, 0.51, 1.53, 1.1, 20.64, 11.25, 31.07, 0.85, -0.16, 6.54, 1.58]} \ No newline at end of file diff --git a/annotations_filtered/g-P53rME1xE_filtered.json b/annotations_filtered/g-P53rME1xE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..325543291279276b233c62135ea017bed55c7f02 --- /dev/null +++ b/annotations_filtered/g-P53rME1xE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 73.94], [78.0, 122.93]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [48.94, 44.93]} \ No newline at end of file diff --git a/annotations_filtered/g-Yufp_dafk_filtered.json b/annotations_filtered/g-Yufp_dafk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/g-Yufp_dafk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/g-g4vCbZsDM_filtered.json b/annotations_filtered/g-g4vCbZsDM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..33b3f40fe45d0e0c399e3830e9885c07a1a6715c --- /dev/null +++ b/annotations_filtered/g-g4vCbZsDM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.48], [7.0, 7.1], [10.0, 10.84], [12.0, 15.72], [16.0, 27.84], [28.0, 30.38], [42.0, 44.09], [45.0, 46.26], [48.0, 48.0], [48.0, 48.78], [50.0, 49.69], [51.0, 104.33], [105.0, 115.5], [117.0, 121.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.97, 90.43, 58.98, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 52.33, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.48, 0.1, 0.84, 3.72, 11.84, 2.38, 2.09, 1.26, 0.0, 0.78, -0.31, 53.33, 10.5, 4.95]} \ No newline at end of file diff --git a/annotations_filtered/g-gebDSBFkY_filtered.json b/annotations_filtered/g-gebDSBFkY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..21c45e7942354605ab1ced53d127f136e74041fa --- /dev/null +++ b/annotations_filtered/g-gebDSBFkY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 33.88], [36.0, 36.05], [40.0, 48.32], [49.0, 73.94], [75.0, 75.83], [77.0, 81.55], [84.0, 88.92]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 30.05, 30.64, 0.0, 57.09, 60.98], "audiomae_on_audioset": [null, null, [["speech", 44.19], ["music", 19.6], ["shatter", 10.21]], [["speech", 64.12], ["music", 7.08], ["sidetone", 5.98]], null, null, null], "duration": [-0.12, 0.05, 8.32, 24.94, 0.83, 4.55, 4.92]} \ No newline at end of file diff --git a/annotations_filtered/g-uc5_QEmuM_filtered.json b/annotations_filtered/g-uc5_QEmuM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2928a9004df1175c666526417116d3dcd848eca1 --- /dev/null +++ b/annotations_filtered/g-uc5_QEmuM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.55], [7.0, 7.69], [10.0, 10.52], [17.0, 19.7], [25.0, 25.73], [28.0, 28.27], [31.0, 33.66], [35.0, 36.04], [40.0, 40.36], [44.0, 68.99], [80.0, 79.98], [80.0, 85.19], [89.0, 92.82], [94.0, 95.34], [98.0, 102.41], [103.0, 108.16], [112.0, 119.85]], "keep_status": [false, false, false, true, false, false, true, false, false, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 29.76, 0.0, 0.0, 35.94, 0.0, 0.0, 28.7, 0.0, 28.67, 28.79, 0.0, 29.34, 28.81, 28.83], "audiomae_on_audioset": [null, null, null, [["cattle, bovinae", 18.03], ["music", 16.66], ["moo", 16.44]], null, null, [["music", 57.61], ["synthesizer", 2.97], ["didgeridoo", 2.95]], null, null, [["music", 79.17], ["crowd", 4.78], ["electronic music", 1.58]], null, [["music", 67.11], ["didgeridoo", 7.88], ["rattle (instrument)", 2.77]], [["music", 59.65], ["didgeridoo", 7.01], ["motorcycle", 2.71]], null, [["music", 89.27], ["didgeridoo", 3.33], ["musical instrument", 0.92]], [["music", 52.33], ["throbbing", 6.19], ["didgeridoo", 5.6]], [["music", 85.62], ["ska", 1.64], ["musical instrument", 0.89]]], "duration": [0.55, 0.69, 0.52, 2.7, 0.73, 0.27, 2.66, 1.04, 0.36, 24.99, -0.02, 5.19, 3.82, 1.34, 4.41, 5.16, 7.85]} \ No newline at end of file diff --git a/annotations_filtered/g05Ja_89tOg_filtered.json b/annotations_filtered/g05Ja_89tOg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9cdd2b62d9281543728ad56643e9804bfddeb26 --- /dev/null +++ b/annotations_filtered/g05Ja_89tOg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.53], [4.0, 4.19], [5.0, 15.11], [15.0, 15.87], [19.0, 19.9], [23.0, 23.38], [25.0, 29.61], [35.0, 41.74], [44.0, 44.9], [47.0, 54.65], [56.0, 56.79], [66.0, 66.16], [67.0, 67.71], [68.0, 72.03], [74.0, 93.26], [94.0, 99.69], [102.0, 101.82], [104.0, 106.98], [108.0, 109.8], [111.0, 112.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 44.55, 0.0, 0.0, 0.0, 61.77, 86.09, 0.0, 35.18, 0.0, 0.0, 0.0, 99.56, 74.29, 100.0, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 86.76], ["sidetone", 2.94], ["radio", 1.92]], null, null, null, null, null, null, [["speech", 87.84], ["sidetone", 3.44], ["stomach rumble", 0.71]], null, null, null, null, null, null, null, null, null, null], "duration": [0.53, 0.19, 10.11, 0.87, 0.9, 0.38, 4.61, 6.74, 0.9, 7.65, 0.79, 0.16, 0.71, 4.03, 19.26, 5.69, -0.18, 2.98, 1.8, 1.55]} \ No newline at end of file diff --git a/annotations_filtered/g0AMLVSBfSs_filtered.json b/annotations_filtered/g0AMLVSBfSs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..038664adabf11d6b05cadb40463ec9e65d062c21 --- /dev/null +++ b/annotations_filtered/g0AMLVSBfSs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.45], [3.0, 3.3], [6.0, 5.85], [13.0, 13.46], [25.0, 25.17], [28.0, 28.36], [29.0, 29.71], [39.0, 39.48]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.45, 0.3, -0.15, 0.46, 0.17, 0.36, 0.71, 0.48]} \ No newline at end of file diff --git a/annotations_filtered/g0CFQF54ePo_filtered.json b/annotations_filtered/g0CFQF54ePo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c061ccfc37236196374a5c03231491d32c2a556 --- /dev/null +++ b/annotations_filtered/g0CFQF54ePo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.46], [8.0, 8.21], [9.0, 9.98], [24.0, 24.53], [25.0, 26.65], [27.0, 29.56], [33.0, 33.93], [35.0, 35.33], [38.0, 37.98], [52.0, 53.0], [53.0, 54.04], [81.0, 84.1], [110.0, 113.51], [114.0, 113.61], [114.0, 114.1], [116.0, 119.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 78.04, 0.0, 0.0, 0.0, 0.0, 0.0, 34.46, 34.41, 0.0, 0.0, 58.38], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 30.92], ["moo", 27.83], ["speech", 13.68]], [["speech", 27.68], ["vehicle", 7.9], ["livestock, farm animals, working animals", 7.68]], null, null, null], "duration": [0.46, 0.21, 0.98, 0.53, 1.65, 2.56, 0.93, 0.33, -0.02, 1.0, 1.04, 3.1, 3.51, -0.39, 0.1, 3.1]} \ No newline at end of file diff --git a/annotations_filtered/g0HwVyKSC_8_filtered.json b/annotations_filtered/g0HwVyKSC_8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0cfb3c3ce0f1112baed1c8bfae77c9a6ebbf8d35 --- /dev/null +++ b/annotations_filtered/g0HwVyKSC_8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.3], [10.0, 10.57], [13.0, 49.65], [51.0, 51.12], [54.0, 53.89], [62.0, 63.09], [66.0, 66.73], [69.0, 69.55], [71.0, 71.36], [72.0, 73.63], [75.0, 76.06], [84.0, 84.54], [91.0, 90.91], [96.0, 96.28], [102.0, 102.79], [108.0, 108.33], [110.0, 110.24], [112.0, 117.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.78], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.3, 0.57, 36.65, 0.12, -0.11, 1.09, 0.73, 0.55, 0.36, 1.63, 1.06, 0.54, -0.09, 0.28, 0.79, 0.33, 0.24, 5.76]} \ No newline at end of file diff --git a/annotations_filtered/g0TZztZJGRo_filtered.json b/annotations_filtered/g0TZztZJGRo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84b2fc6088bf764de9817eebdf6fbe3281e15c99 --- /dev/null +++ b/annotations_filtered/g0TZztZJGRo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 29.37], [31.0, 31.48], [32.0, 35.61], [36.0, 67.85]], "keep_status": [true, false, true, false], "silence_prob": [33.59, 0.0, 28.31, 0.0], "audiomae_on_audioset": [[["music", 23.98], ["buzz", 17.16], ["electric shaver, electric razor", 14.06]], null, [["music", 55.46], ["speech", 6.77], ["burst, pop", 3.35]], null], "duration": [9.37, 0.48, 3.61, 31.85]} \ No newline at end of file diff --git a/annotations_filtered/g0UV6ug96c0_filtered.json b/annotations_filtered/g0UV6ug96c0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..508a68fd454c30af4be1ea39af496f59a7c1bf58 --- /dev/null +++ b/annotations_filtered/g0UV6ug96c0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.16], [17.0, 18.47], [21.0, 25.27], [26.0, 26.35], [31.0, 36.64], [56.0, 56.54], [65.0, 65.01], [67.0, 78.44], [83.0, 83.57], [99.0, 100.16]], "keep_status": [true, false, false, false, false, false, false, false, false, false], "silence_prob": [31.35, 0.0, 34.03, 0.0, 31.48, 0.0, 0.0, 29.7, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 29.28], ["mains hum", 20.55], ["hum", 13.42]], null, [["speech", 43.76], ["sidetone", 32.84], ["radio", 5.56]], null, [["speech", 68.53], ["vehicle", 9.25], ["car", 2.11]], null, null, [["speech", 74.1], ["explosion", 6.04], ["music", 5.66]], null, null], "duration": [3.16, 1.47, 4.27, 0.35, 5.64, 0.54, 0.01, 11.44, 0.57, 1.16]} \ No newline at end of file diff --git a/annotations_filtered/g0j2dVuhr6s_filtered.json b/annotations_filtered/g0j2dVuhr6s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f649884b3725129c5ae166abf3302df0f55082a --- /dev/null +++ b/annotations_filtered/g0j2dVuhr6s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.92], [6.0, 9.73], [12.0, 13.36], [16.0, 17.0], [20.0, 19.95], [26.0, 26.69], [28.0, 29.74], [30.0, 31.18], [32.0, 32.75], [34.0, 34.77], [35.0, 37.17], [40.0, 40.24], [42.0, 42.99], [45.0, 46.92], [49.0, 50.3], [53.0, 58.31], [60.0, 60.64], [62.0, 63.59], [66.0, 67.56], [68.0, 69.18], [71.0, 70.68], [73.0, 73.62], [80.0, 80.49], [85.0, 87.83], [92.0, 92.01], [95.0, 95.66], [107.0, 114.57], [120.0, 123.01], [124.0, 124.77], [126.0, 126.06]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 29.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.92, 0.0, 0.0, 0.0, 0.0, 62.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.54, 0.0, 0.0, 38.56, 39.28, 0.0, 0.0], "audiomae_on_audioset": [null, [["busy signal", 39.56], ["sine wave", 15.52], ["sidetone", 14.66]], null, null, null, null, null, null, null, null, [["speech", 48.88], ["music", 19.45], ["sidetone", 18.04]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 9.28], ["music", 8.59], ["mains hum", 6.5]], [["firecracker", 18.58], ["noise", 17.84], ["fireworks", 6.37]], null, null], "duration": [0.92, 3.73, 1.36, 1.0, -0.05, 0.69, 1.74, 1.18, 0.75, 0.77, 2.17, 0.24, 0.99, 1.92, 1.3, 5.31, 0.64, 1.59, 1.56, 1.18, -0.32, 0.62, 0.49, 2.83, 0.01, 0.66, 7.57, 3.01, 0.77, 0.06]} \ No newline at end of file diff --git a/annotations_filtered/g0mHVE8ebqA_filtered.json b/annotations_filtered/g0mHVE8ebqA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..82902593951562932b4739b6d7548ae828dec03a --- /dev/null +++ b/annotations_filtered/g0mHVE8ebqA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.45], [7.0, 7.03], [8.0, 10.98], [13.0, 13.26], [15.0, 16.75], [19.0, 20.73], [29.0, 29.89], [31.0, 32.05], [41.0, 43.14], [49.0, 48.96], [59.0, 61.77], [64.0, 65.65], [67.0, 67.69], [70.0, 75.41], [77.0, 77.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.68, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.45, 0.03, 2.98, 0.26, 1.75, 1.73, 0.89, 1.05, 2.14, -0.04, 2.77, 1.65, 0.69, 5.41, 0.6]} \ No newline at end of file diff --git a/annotations_filtered/g0nhEzoCkJo_filtered.json b/annotations_filtered/g0nhEzoCkJo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e190ef944fd23ed6d514d2488a68ba4c4c280a26 --- /dev/null +++ b/annotations_filtered/g0nhEzoCkJo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[89.0, 93.16], [94.0, 114.67], [117.0, 117.75], [119.0, 122.08], [123.0, 129.0], [130.0, 131.28]], "keep_status": [true, true, false, true, false, false], "silence_prob": [38.51, 32.24, 0.0, 29.39, 55.89, 0.0], "audiomae_on_audioset": [[["whale vocalization", 13.65], ["livestock, farm animals, working animals", 11.27], ["music", 10.4]], [["music", 27.56], ["cattle, bovinae", 14.43], ["livestock, farm animals, working animals", 14.33]], null, [["mosquito", 22.21], ["insect", 18.74], ["fly, housefly", 16.96]], null, null], "duration": [4.16, 20.67, 0.75, 3.08, 6.0, 1.28]} \ No newline at end of file diff --git a/annotations_filtered/g0yYxO89lQA_filtered.json b/annotations_filtered/g0yYxO89lQA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a46f1ce8b98165b7e98f403fbb1284e9de1b1efe --- /dev/null +++ b/annotations_filtered/g0yYxO89lQA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 23.33], [43.0, 43.34], [44.0, 44.39], [48.0, 84.99], [85.0, 86.29], [90.0, 90.9], [97.0, 98.25], [101.0, 100.99], [118.0, 118.08], [121.0, 122.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [65.32, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [3.33, 0.34, 0.39, 36.99, 1.29, 0.9, 1.25, -0.01, 0.08, 1.22]} \ No newline at end of file diff --git a/annotations_filtered/g1JAILio6-s_filtered.json b/annotations_filtered/g1JAILio6-s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..523f5dcbd9cb852b4856d91c6c4f6b6bdc4f2174 --- /dev/null +++ b/annotations_filtered/g1JAILio6-s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.14], [51.0, 52.02], [54.0, 57.75], [66.0, 69.13], [72.0, 74.82], [76.0, 122.47]], "keep_status": [false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 29.89, 36.25, 70.16, 0.0], "audiomae_on_audioset": [null, null, [["hum", 36.79], ["mains hum", 34.25], ["speech", 12.33]], [["whale vocalization", 39.87], ["hum", 8.25], ["music", 6.86]], null, null], "duration": [0.14, 1.02, 3.75, 3.13, 2.82, 46.47]} \ No newline at end of file diff --git a/annotations_filtered/g1jO4_HQQX4_filtered.json b/annotations_filtered/g1jO4_HQQX4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..952fc6a3e384303fcfc8aa7cf9ccd8691b2a028f --- /dev/null +++ b/annotations_filtered/g1jO4_HQQX4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.35], [9.0, 12.9], [21.0, 21.29], [25.0, 25.76], [28.0, 28.32], [39.0, 39.63], [41.0, 41.89], [42.0, 43.6], [45.0, 45.47], [46.0, 62.29], [67.0, 67.24], [74.0, 87.1], [88.0, 93.07]], "keep_status": [false, true, false, false, false, false, false, false, false, true, false, true, true], "silence_prob": [0.0, 31.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.48, 0.0, 29.71, 28.67], "audiomae_on_audioset": [null, [["hum", 31.29], ["speech", 11.97], ["music", 9.27]], null, null, null, null, null, null, null, [["music", 46.74], ["hum", 10.28], ["throbbing", 9.32]], null, [["hum", 30.43], ["mains hum", 15.89], ["speech", 12.65]], [["fly, housefly", 33.14], ["mosquito", 11.65], ["whack, thwack", 10.69]]], "duration": [0.35, 3.9, 0.29, 0.76, 0.32, 0.63, 0.89, 1.6, 0.47, 16.29, 0.24, 13.1, 5.07]} \ No newline at end of file diff --git a/annotations_filtered/g1lpI9wZtiI_filtered.json b/annotations_filtered/g1lpI9wZtiI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..31a2e1d60acb30b2c088989b156325f0b3784cce --- /dev/null +++ b/annotations_filtered/g1lpI9wZtiI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 15.36], [20.0, 28.56], [31.0, 48.39], [52.0, 53.32], [58.0, 58.08], [72.0, 84.74], [86.0, 173.25]], "keep_status": [false, false, false, false, false, true, false], "silence_prob": [29.85, 31.44, 64.75, 0.0, 0.0, 35.16, 0.0], "audiomae_on_audioset": [[["music", 43.07], ["hum", 25.29], ["mains hum", 13.43]], [["hum", 40.97], ["mains hum", 20.74], ["music", 11.19]], null, null, null, [["music", 44.82], ["theremin", 19.12], ["didgeridoo", 2.72]], null], "duration": [9.36, 8.56, 17.39, 1.32, 0.08, 12.74, 87.25]} \ No newline at end of file diff --git a/annotations_filtered/g1r-B5ZGZWY_filtered.json b/annotations_filtered/g1r-B5ZGZWY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17099f8c58832901c850c1ac20ff7a04d8c7695a --- /dev/null +++ b/annotations_filtered/g1r-B5ZGZWY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[51.0, 51.44], [52.0, 52.73], [54.0, 54.23], [55.0, 56.29], [57.0, 59.0], [60.0, 66.29], [68.0, 89.51], [91.0, 119.03], [120.0, 138.47], [139.0, 140.8], [143.0, 143.02], [144.0, 145.1], [148.0, 148.53], [154.0, 154.5], [157.0, 164.22], [175.0, 188.94], [190.0, 196.55], [197.0, 198.36], [201.0, 201.75]], "keep_status": [false, false, false, false, false, true, true, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 87.74, 32.56, 32.42, 32.89, 80.11, 0.0, 0.0, 0.0, 0.0, 0.0, 38.98, 35.96, 93.13, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 25.45], ["music", 18.08], ["throbbing", 17.42]], [["music", 33.56], ["speech", 25.97], ["buzz", 4.36]], [["music", 31.59], ["throbbing", 30.15], ["hum", 17.59]], null, null, null, null, null, null, [["music", 57.22], ["speech", 9.47], ["frog", 2.85]], [["music", 64.38], ["speech", 12.64], ["bleat", 2.03]], null, null, null], "duration": [0.44, 0.73, 0.23, 1.29, 2.0, 6.29, 21.51, 28.03, 18.47, 1.8, 0.02, 1.1, 0.53, 0.5, 7.22, 13.94, 6.55, 1.36, 0.75]} \ No newline at end of file diff --git a/annotations_filtered/g2atr8aQ0zg_filtered.json b/annotations_filtered/g2atr8aQ0zg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a0b8370741e1df80ce5a457e718b281a87b67c82 --- /dev/null +++ b/annotations_filtered/g2atr8aQ0zg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.74], [6.0, 7.4], [10.0, 12.11], [17.0, 18.77], [19.0, 20.36], [22.0, 24.21], [30.0, 30.57], [33.0, 35.06], [36.0, 37.98], [39.0, 40.73], [42.0, 45.0], [46.0, 48.27], [53.0, 54.19], [55.0, 54.8], [63.0, 63.02], [67.0, 68.98], [72.0, 72.45], [73.0, 73.2], [76.0, 76.57], [83.0, 84.77], [86.0, 86.41], [88.0, 88.84], [91.0, 91.25], [94.0, 97.29], [98.0, 97.82], [101.0, 102.15], [103.0, 106.66], [110.0, 115.69], [117.0, 117.41], [123.0, 126.91], [127.0, 129.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.99, 0.0, 0.0, 94.37, 0.0, 84.25, 0.0, 0.0, 99.84, 93.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.48, 0.0, 0.0, 90.43, 99.26, 0.0, 85.17, 69.61], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.74, 1.4, 2.11, 1.77, 1.36, 2.21, 0.57, 2.06, 1.98, 1.73, 3.0, 2.27, 1.19, -0.2, 0.02, 1.98, 0.45, 0.2, 0.57, 1.77, 0.41, 0.84, 0.25, 3.29, -0.18, 1.15, 3.66, 5.69, 0.41, 3.91, 2.34]} \ No newline at end of file diff --git a/annotations_filtered/g2dAymk715E_filtered.json b/annotations_filtered/g2dAymk715E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..385835099296a6ce1ce465b8ab62afab98c62667 --- /dev/null +++ b/annotations_filtered/g2dAymk715E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.91], [14.0, 14.94], [27.0, 33.02], [35.0, 36.56], [38.0, 39.06], [45.0, 45.79], [55.0, 55.56], [67.0, 73.04], [76.0, 80.87], [83.0, 83.03], [86.0, 87.1], [106.0, 106.79], [122.0, 122.88], [138.0, 139.4], [151.0, 151.56], [154.0, 158.14], [160.0, 161.23], [166.0, 165.87], [174.0, 174.38]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 42.08, 0.0, 0.0, 0.0, 0.0, 34.13, 42.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.94, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["sidetone", 64.55], ["speech", 28.04], ["hum", 1.24]], null, null, null, null, [["speech", 48.5], ["whack, thwack", 22.07], ["thunk", 12.64]], [["speech", 19.26], ["hum", 7.64], ["fart", 7.14]], null, null, null, null, null, null, null, null, null, null], "duration": [-0.09, 0.94, 6.02, 1.56, 1.06, 0.79, 0.56, 6.04, 4.87, 0.03, 1.1, 0.79, 0.88, 1.4, 0.56, 4.14, 1.23, -0.13, 0.38]} \ No newline at end of file diff --git a/annotations_filtered/g2h8xRzMxtA_filtered.json b/annotations_filtered/g2h8xRzMxtA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e405806e799e5284f0516e9ef61939a1134b80d --- /dev/null +++ b/annotations_filtered/g2h8xRzMxtA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.87], [10.0, 10.5], [13.0, 14.23], [16.0, 16.17], [17.0, 17.47], [23.0, 24.46], [26.0, 34.69], [36.0, 39.09], [40.0, 41.35], [42.0, 42.35], [43.0, 45.3], [47.0, 48.0], [51.0, 51.46], [59.0, 60.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.05, 98.19, 0.0, 0.0, 98.01, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.87, 0.5, 1.23, 0.17, 0.47, 1.46, 8.69, 3.09, 1.35, 0.35, 2.3, 1.0, 0.46, 1.96]} \ No newline at end of file diff --git a/annotations_filtered/g2iWVWVSb6Q_filtered.json b/annotations_filtered/g2iWVWVSb6Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f2819670de5305f1daca56be0d2fe1c92fb81cf --- /dev/null +++ b/annotations_filtered/g2iWVWVSb6Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 24.49], [31.0, 31.36], [32.0, 32.49], [34.0, 34.43], [36.0, 37.15], [37.0, 38.87], [43.0, 43.56], [53.0, 54.06], [55.0, 55.58], [63.0, 64.4], [65.0, 64.94], [74.0, 73.99], [82.0, 83.24], [84.0, 83.96], [85.0, 85.33], [86.0, 97.53], [101.0, 101.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [93.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.96, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.49, 0.36, 0.49, 0.43, 1.15, 1.87, 0.56, 1.06, 0.58, 1.4, -0.06, -0.01, 1.24, -0.04, 0.33, 11.53, 0.75]} \ No newline at end of file diff --git a/annotations_filtered/g2tNQ_6-kpg_filtered.json b/annotations_filtered/g2tNQ_6-kpg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0b0018c51301ba55612032f5ac37fb6e43a11421 --- /dev/null +++ b/annotations_filtered/g2tNQ_6-kpg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.22], [7.0, 8.13], [10.0, 11.3], [13.0, 14.25], [15.0, 15.75], [17.0, 25.17], [26.0, 29.74], [30.0, 33.71], [36.0, 40.58], [42.0, 43.75], [44.0, 46.38], [47.0, 49.72], [51.0, 51.85], [55.0, 57.15], [59.0, 60.76], [62.0, 62.5], [63.0, 63.76], [65.0, 65.42], [67.0, 72.66], [75.0, 85.16], [86.0, 91.52], [92.0, 91.57], [92.0, 96.47], [98.0, 100.35], [101.0, 104.48], [107.0, 107.74], [109.0, 110.76], [113.0, 112.94], [114.0, 115.5], [117.0, 123.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [72.9, 0.0, 0.0, 0.0, 0.0, 65.67, 66.15, 59.15, 78.38, 0.0, 65.55, 53.65, 0.0, 82.43, 0.0, 0.0, 0.0, 0.0, 55.18, 53.1, 61.67, 0.0, 44.84, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 41.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 21.25], ["noise", 12.27], ["hum", 11.54]], null, null, null, null, null, null, [["noise", 35.53], ["speech", 11.33], ["music", 7.73]]], "duration": [2.22, 1.13, 1.3, 1.25, 0.75, 8.17, 3.74, 3.71, 4.58, 1.75, 2.38, 2.72, 0.85, 2.15, 1.76, 0.5, 0.76, 0.42, 5.66, 10.16, 5.52, -0.43, 4.47, 2.35, 3.48, 0.74, 1.76, -0.06, 1.5, 6.69]} \ No newline at end of file diff --git a/annotations_filtered/g3D2eGiLoeI_filtered.json b/annotations_filtered/g3D2eGiLoeI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e287aec50b6f774cc84b05f8606e5caf459d777 --- /dev/null +++ b/annotations_filtered/g3D2eGiLoeI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 36.73], [39.0, 53.43], [55.0, 55.16], [56.0, 63.29], [67.0, 68.57], [76.0, 77.08], [78.0, 78.92], [85.0, 86.48], [88.0, 88.94], [90.0, 92.11], [93.0, 95.54], [98.0, 98.76], [99.0, 100.77], [101.0, 102.74], [104.0, 106.19]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [75.55, 33.94, 0.0, 99.62, 0.0, 0.0, 0.0, 0.0, 0.0, 99.91, 99.99, 0.0, 0.0, 0.0, 66.15], "audiomae_on_audioset": [null, [["speech", 51.88], ["fart", 5.09], ["aircraft", 3.92]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [25.73, 14.43, 0.16, 7.29, 1.57, 1.08, 0.92, 1.48, 0.94, 2.11, 2.54, 0.76, 1.77, 1.74, 2.19]} \ No newline at end of file diff --git a/annotations_filtered/g3E69dpurZA_filtered.json b/annotations_filtered/g3E69dpurZA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7318646d79f5bd4b0f442dcd3bbda19b82fef6c4 --- /dev/null +++ b/annotations_filtered/g3E69dpurZA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.07], [17.0, 17.44], [17.0, 21.95]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 32.71], "audiomae_on_audioset": [null, null, [["speech", 75.89], ["sidetone", 7.95], ["radio", 2.05]]], "duration": [0.07, 0.44, 4.95]} \ No newline at end of file diff --git a/annotations_filtered/g3FFfmWvyAk_filtered.json b/annotations_filtered/g3FFfmWvyAk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd5564e4ba36e03e2b4082da5e40325057dcd75a --- /dev/null +++ b/annotations_filtered/g3FFfmWvyAk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.48], [9.0, 10.45], [11.0, 11.99], [18.0, 19.45], [22.0, 24.16], [27.0, 27.18], [28.0, 30.7], [38.0, 39.5], [43.0, 50.48], [51.0, 53.27], [54.0, 61.7], [63.0, 63.41], [64.0, 64.49], [71.0, 71.64], [72.0, 74.31], [98.0, 99.47], [111.0, 111.05], [114.0, 114.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 65.2, 0.0, 68.15, 99.94, 80.29, 0.0, 0.0, 0.0, 86.27, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.48, 1.45, 0.99, 1.45, 2.16, 0.18, 2.7, 1.5, 7.48, 2.27, 7.7, 0.41, 0.49, 0.64, 2.31, 1.47, 0.05, 0.64]} \ No newline at end of file diff --git a/annotations_filtered/g3WSsm57iVM_filtered.json b/annotations_filtered/g3WSsm57iVM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..06546f538eb4feb7aacb53807b6952da5ba52096 --- /dev/null +++ b/annotations_filtered/g3WSsm57iVM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 13.56], [16.0, 21.1], [22.0, 23.46], [26.0, 27.6], [29.0, 34.37], [35.0, 39.04], [41.0, 40.85], [44.0, 44.56], [46.0, 48.02], [49.0, 51.33], [52.0, 65.3], [66.0, 70.12], [72.0, 72.35], [73.0, 79.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [94.95, 100.0, 0.0, 0.0, 94.07, 90.08, 0.0, 0.0, 99.94, 99.97, 99.96, 98.51, 0.0, 91.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [11.56, 5.1, 1.46, 1.6, 5.37, 4.04, -0.15, 0.56, 2.02, 2.33, 13.3, 4.12, 0.35, 6.49]} \ No newline at end of file diff --git a/annotations_filtered/g3WtvzmKCQQ_filtered.json b/annotations_filtered/g3WtvzmKCQQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..284b544334600d720de640b759edd11077486c8e --- /dev/null +++ b/annotations_filtered/g3WtvzmKCQQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.61], [4.0, 11.82], [15.0, 17.15], [18.0, 18.49], [20.0, 21.44], [23.0, 25.98], [28.0, 30.3], [32.0, 33.13], [36.0, 37.23], [39.0, 40.49], [42.0, 42.23], [45.0, 47.01], [47.0, 47.97], [49.0, 50.94], [53.0, 52.91], [54.0, 54.48], [55.0, 55.46], [56.0, 57.99], [59.0, 62.45], [63.0, 63.61], [65.0, 66.02], [68.0, 76.6], [77.0, 78.02], [82.0, 83.84], [86.0, 86.49], [91.0, 93.85], [95.0, 97.53], [99.0, 99.1], [102.0, 104.82]], "keep_status": [false, true, true, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, true, false, false, true], "silence_prob": [0.0, 42.13, 41.83, 0.0, 0.0, 38.42, 40.4, 0.0, 0.0, 0.0, 0.0, 40.57, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.34, 0.0, 0.0, 29.54, 0.0, 0.0, 0.0, 44.29, 42.37, 0.0, 37.91], "audiomae_on_audioset": [null, [["noise", 12.06], ["synthesizer", 11.57], ["hum", 10.32]], [["hum", 17.08], ["rumble", 11.86], ["mains hum", 6.18]], null, null, [["speech", 38.41], ["hum", 19.53], ["mains hum", 9.47]], [["music", 15.18], ["hum", 13.02], ["effects unit", 8.83]], null, null, null, null, [["hum", 55.08], ["mains hum", 17.07], ["throbbing", 9.93]], null, null, null, null, null, null, [["hum", 37.61], ["mains hum", 14.15], ["noise", 8.63]], null, null, [["music", 43.38], ["guitar", 10.65], ["musical instrument", 7.22]], null, null, null, [["hum", 32.47], ["throbbing", 25.86], ["whale vocalization", 11.31]], [["speech", 27.79], ["whale vocalization", 23.29], ["sidetone", 19.44]], null, [["throbbing", 33.47], ["hum", 24.13], ["music", 6.43]]], "duration": [0.61, 7.82, 2.15, 0.49, 1.44, 2.98, 2.3, 1.13, 1.23, 1.49, 0.23, 2.01, 0.97, 1.94, -0.09, 0.48, 0.46, 1.99, 3.45, 0.61, 1.02, 8.6, 1.02, 1.84, 0.49, 2.85, 2.53, 0.1, 2.82]} \ No newline at end of file diff --git a/annotations_filtered/g3a9qZnTzJQ_filtered.json b/annotations_filtered/g3a9qZnTzJQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c1a22e47712e2e625e36111c8f9bbad231732ea1 --- /dev/null +++ b/annotations_filtered/g3a9qZnTzJQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.21], [7.0, 9.78], [13.0, 13.24], [20.0, 26.33], [28.0, 41.84], [48.0, 48.03], [51.0, 50.67], [52.0, 53.1], [59.0, 63.09], [65.0, 64.79], [67.0, 67.04], [69.0, 83.56], [84.0, 85.04], [86.0, 88.1], [89.0, 94.71], [95.0, 96.04], [97.0, 122.25], [123.0, 122.94], [124.0, 134.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, true], "silence_prob": [0.0, 68.8, 0.0, 59.86, 59.33, 0.0, 0.0, 0.0, 78.55, 0.0, 0.0, 79.94, 0.0, 46.72, 33.45, 0.0, 34.25, 0.0, 34.56], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 59.14], ["ambient music", 11.19], ["electronic music", 6.99]], [["speech", 17.56], ["groan", 14.67], ["music", 13.32]], null, [["buzz", 17.09], ["fly, housefly", 12.75], ["speech", 11.45]], null, [["speech", 38.99], ["music", 19.22], ["thump, thud", 4.81]]], "duration": [1.21, 2.78, 0.24, 6.33, 13.84, 0.03, -0.33, 1.1, 4.09, -0.21, 0.04, 14.56, 1.04, 2.1, 5.71, 1.04, 25.25, -0.06, 10.59]} \ No newline at end of file diff --git a/annotations_filtered/g3hYbDHwBJY_filtered.json b/annotations_filtered/g3hYbDHwBJY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e4c0e7f725ea73418a82d87b0cc8b08946c42837 --- /dev/null +++ b/annotations_filtered/g3hYbDHwBJY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 21.17], [23.0, 25.24], [33.0, 39.26], [39.0, 47.17], [48.0, 49.52], [51.0, 51.12], [58.0, 58.19], [60.0, 61.25], [62.0, 62.46], [63.0, 63.49], [102.0, 109.02], [110.0, 110.3]], "keep_status": [false, true, true, false, false, false, false, false, false, false, true, false], "silence_prob": [30.62, 33.11, 30.32, 52.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.59, 0.0], "audiomae_on_audioset": [[["music", 51.76], ["speech", 19.34], ["fly, housefly", 7.84]], [["music", 41.48], ["speech", 10.56], ["hum", 10.39]], [["throbbing", 24.33], ["hum", 14.73], ["music", 8.76]], null, null, null, null, null, null, null, [["hum", 30.97], ["throbbing", 13.7], ["mains hum", 8.89]], null], "duration": [9.17, 2.24, 6.26, 8.17, 1.52, 0.12, 0.19, 1.25, 0.46, 0.49, 7.02, 0.3]} \ No newline at end of file diff --git a/annotations_filtered/g3jImb6V4wI_filtered.json b/annotations_filtered/g3jImb6V4wI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0b1b0baf49115f4a906e6dbcade5bf344f0400c6 --- /dev/null +++ b/annotations_filtered/g3jImb6V4wI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.57], [8.0, 11.26], [20.0, 20.41], [24.0, 24.95], [26.0, 28.81], [32.0, 33.03], [35.0, 34.89], [36.0, 36.54], [38.0, 38.11], [40.0, 41.37], [42.0, 42.96], [45.0, 47.83], [48.0, 48.59], [50.0, 51.54], [57.0, 60.76], [61.0, 62.21], [63.0, 63.29], [65.0, 65.99], [67.0, 67.66], [68.0, 67.91], [69.0, 69.67], [73.0, 74.61], [75.0, 76.18], [93.0, 95.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 47.7, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.99, 0.0, 0.0, 58.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.99], "audiomae_on_audioset": [null, [["speech", 73.29], ["synthesizer", 6.01], ["music", 3.61]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 22.04], ["bass guitar", 13.79], ["guitar", 12.38]]], "duration": [0.57, 3.26, 0.41, 0.95, 2.81, 1.03, -0.11, 0.54, 0.11, 1.37, 0.96, 2.83, 0.59, 1.54, 3.76, 1.21, 0.29, 0.99, 0.66, -0.09, 0.67, 1.61, 1.18, 2.18]} \ No newline at end of file diff --git a/annotations_filtered/g3kYdbqIwBE_filtered.json b/annotations_filtered/g3kYdbqIwBE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f0d0fd94c14d15f02076da9481dd9372e9500123 --- /dev/null +++ b/annotations_filtered/g3kYdbqIwBE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.33], [17.0, 18.25], [21.0, 25.22], [35.0, 36.39], [49.0, 51.8], [55.0, 55.51], [64.0, 64.35], [68.0, 68.45], [88.0, 88.89], [90.0, 90.93]], "keep_status": [false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 39.5, 0.0, 33.62, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["mosquito", 23.43], ["fly, housefly", 17.39], ["insect", 12.71]], null, [["boing", 73.83], ["speech", 8.73], ["cattle, bovinae", 2.73]], null, null, null, null, null], "duration": [0.33, 1.25, 4.22, 1.39, 2.8, 0.51, 0.35, 0.45, 0.89, 0.93]} \ No newline at end of file diff --git a/annotations_filtered/g3svdzmBtic_filtered.json b/annotations_filtered/g3svdzmBtic_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2d4eac829b04020dfa321551de41348c915e3595 --- /dev/null +++ b/annotations_filtered/g3svdzmBtic_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 39.75], [42.0, 61.38], [67.0, 71.66], [75.0, 115.2], [118.0, 125.42], [126.0, 127.5], [134.0, 138.25], [143.0, 142.67], [155.0, 159.68], [168.0, 173.3]], "keep_status": [true, true, true, false, false, false, true, false, true, true], "silence_prob": [28.88, 29.03, 29.95, 0.0, 30.08, 0.0, 29.42, 0.0, 29.37, 28.8], "audiomae_on_audioset": [[["speech", 37.51], ["fly, housefly", 13.03], ["music", 8.41]], [["music", 28.02], ["speech", 18.53], ["hum", 13.12]], [["speech", 46.15], ["music", 9.43], ["fart", 6.15]], null, [["music", 52.08], ["theremin", 22.94], ["scary music", 5.13]], null, [["hum", 30.47], ["mains hum", 21.69], ["music", 12.3]], null, [["mosquito", 23.02], ["speech", 19.58], ["fly, housefly", 12.74]], [["music", 46.9], ["speech", 4.63], ["musical instrument", 2.89]]], "duration": [12.75, 19.38, 4.66, 40.2, 7.42, 1.5, 4.25, -0.33, 4.68, 5.3]} \ No newline at end of file diff --git a/annotations_filtered/g425SDBoDBI_filtered.json b/annotations_filtered/g425SDBoDBI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c28410c3efc7e15a20cea07cd77dbf69a8a9ee75 --- /dev/null +++ b/annotations_filtered/g425SDBoDBI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.57], [9.0, 9.48], [15.0, 15.58], [18.0, 20.6], [24.0, 25.19], [29.0, 29.22], [31.0, 31.68], [32.0, 32.88], [40.0, 42.28], [44.0, 45.5], [58.0, 58.35], [60.0, 60.0], [61.0, 61.53], [62.0, 63.26], [64.0, 64.52], [65.0, 65.5], [66.0, 67.34], [68.0, 69.55], [73.0, 76.06], [80.0, 80.32], [82.0, 86.95], [92.0, 92.58], [97.0, 96.77], [104.0, 104.45], [105.0, 105.88], [107.0, 201.11], [203.0, 205.34], [207.0, 208.26], [208.0, 211.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [59.59, 0.0, 0.0, 63.64, 0.0, 0.0, 0.0, 0.0, 75.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.07, 0.0, 40.62, 0.0, 0.0, 0.0, 0.0, 0.0, 39.63, 0.0, 31.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 48.9], ["throbbing", 13.75], ["hum", 9.29]], null, null, null, null, null, [["music", 43.05], ["ambient music", 12.78], ["hum", 9.34]], null, [["music", 40.59], ["ambient music", 14.58], ["gong", 7.39]]], "duration": [2.57, 0.48, 0.58, 2.6, 1.19, 0.22, 0.68, 0.88, 2.28, 1.5, 0.35, 0.0, 0.53, 1.26, 0.52, 0.5, 1.34, 1.55, 3.06, 0.32, 4.95, 0.58, -0.23, 0.45, 0.88, 94.11, 2.34, 1.26, 3.67]} \ No newline at end of file diff --git a/annotations_filtered/g46IxT3MGP8_filtered.json b/annotations_filtered/g46IxT3MGP8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..851fc609ab0f21cd5b74b976e53c64d0e5d2a9ec --- /dev/null +++ b/annotations_filtered/g46IxT3MGP8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 29.07], [30.0, 53.45], [54.0, 54.21], [54.0, 56.46], [57.0, 58.5], [59.0, 60.39], [62.0, 62.13], [63.0, 65.69], [67.0, 68.49], [72.0, 72.49], [80.0, 80.37], [81.0, 81.89], [83.0, 84.08], [88.0, 96.01], [97.0, 98.44], [102.0, 103.84], [105.0, 105.36], [106.0, 106.91], [109.0, 109.21], [111.0, 112.51], [114.0, 116.13], [117.0, 117.95], [119.0, 119.74]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [57.81, 35.73, 0.0, 52.92, 0.0, 0.0, 0.0, 59.59, 0.0, 0.0, 0.0, 0.0, 0.0, 41.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.46, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 47.29], ["hum", 10.87], ["throbbing", 6.81]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 28.58], ["music", 17.53], ["hum", 4.76]], null, null, null, null, null, null, null, null, null], "duration": [25.07, 23.45, 0.21, 2.46, 1.5, 1.39, 0.13, 2.69, 1.49, 0.49, 0.37, 0.89, 1.08, 8.01, 1.44, 1.84, 0.36, 0.91, 0.21, 1.51, 2.13, 0.95, 0.74]} \ No newline at end of file diff --git a/annotations_filtered/g4FOpeshqA8_filtered.json b/annotations_filtered/g4FOpeshqA8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..30c00d7e8698efbe8b1346813cccb70d4bd5b4d0 --- /dev/null +++ b/annotations_filtered/g4FOpeshqA8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.7], [6.0, 8.95], [11.0, 12.65], [15.0, 17.98], [19.0, 20.34], [22.0, 22.82], [36.0, 36.29], [49.0, 49.37], [51.0, 51.33], [56.0, 56.98], [58.0, 60.39], [65.0, 66.19], [72.0, 73.01], [82.0, 85.16], [89.0, 90.86], [94.0, 95.2], [97.0, 98.27], [104.0, 105.02], [111.0, 112.83], [116.0, 117.91], [120.0, 122.25], [124.0, 126.94], [129.0, 131.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 91.13, 0.0, 68.41, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.42, 0.0, 0.0, 67.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.17, 52.22, 50.56], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 73.36], ["synthesizer", 5.3], ["electronic music", 3.06]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.7, 2.95, 1.65, 2.98, 1.34, 0.82, 0.29, 0.37, 0.33, 0.98, 2.39, 1.19, 1.01, 3.16, 1.86, 1.2, 1.27, 1.02, 1.83, 1.91, 2.25, 2.94, 2.04]} \ No newline at end of file diff --git a/annotations_filtered/g4v51XeJnkw_filtered.json b/annotations_filtered/g4v51XeJnkw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..89e7e7362bf6a199a661d4ede368fe32214fdefa --- /dev/null +++ b/annotations_filtered/g4v51XeJnkw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.9], [3.0, 6.08], [6.0, 8.83], [10.0, 22.84], [25.0, 30.33], [31.0, 35.16], [37.0, 40.95], [41.0, 41.35], [42.0, 47.44], [48.0, 48.95], [49.0, 54.43], [55.0, 57.25], [59.0, 60.78], [62.0, 63.39], [64.0, 64.69], [66.0, 85.29], [91.0, 91.17], [93.0, 94.09], [98.0, 99.0], [104.0, 105.04], [108.0, 110.69], [111.0, 111.67], [115.0, 116.43], [119.0, 119.77], [121.0, 123.55]], "keep_status": [false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 49.4, 96.17, 39.57, 71.57, 30.88, 33.54, 0.0, 94.66, 0.0, 75.39, 53.16, 0.0, 0.0, 0.0, 42.67, 0.0, 0.0, 0.0, 0.0, 79.41, 0.0, 0.0, 0.0, 92.97], "audiomae_on_audioset": [null, [["music", 30.28], ["speech", 25.91], ["thunk", 8.08]], null, [["speech", 70.65], ["whack, thwack", 3.03], ["sidetone", 2.84]], null, [["fly, housefly", 40.98], ["mosquito", 13.44], ["speech", 6.86]], [["speech", 78.23], ["echo", 2.16], ["music", 1.63]], null, null, null, null, null, null, null, null, [["music", 65.04], ["speech", 8.52], ["throbbing", 4.89]], null, null, null, null, null, null, null, null, null], "duration": [0.9, 3.08, 2.83, 12.84, 5.33, 4.16, 3.95, 0.35, 5.44, 0.95, 5.43, 2.25, 1.78, 1.39, 0.69, 19.29, 0.17, 1.09, 1.0, 1.04, 2.69, 0.67, 1.43, 0.77, 2.55]} \ No newline at end of file diff --git a/annotations_filtered/g5-KsABvVzU_filtered.json b/annotations_filtered/g5-KsABvVzU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e8e2501e85c33a48197d6c613abc72904b985320 --- /dev/null +++ b/annotations_filtered/g5-KsABvVzU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.38], [4.0, 6.25], [7.0, 9.27], [9.0, 11.16], [13.0, 13.88], [15.0, 16.44], [18.0, 18.45], [20.0, 24.46], [26.0, 26.86], [28.0, 39.53], [40.0, 47.95], [51.0, 55.93], [58.0, 61.91], [67.0, 68.28], [70.0, 70.65], [79.0, 98.44], [100.0, 104.55], [106.0, 121.96], [123.0, 125.44], [128.0, 132.98], [134.0, 135.46], [139.0, 141.08], [146.0, 147.61], [151.0, 150.94], [152.0, 169.35], [171.0, 171.26], [171.0, 174.51]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 89.01, 98.51, 0.0, 0.0, 0.0, 45.72, 0.0, 50.31, 75.88, 96.42, 82.43, 0.0, 0.0, 53.34, 100.0, 62.07, 75.72, 67.51, 0.0, 50.41, 0.0, 0.0, 41.16, 0.0, 35.94], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["stomach rumble", 50.44], ["whale vocalization", 7.97], ["burping, eructation", 5.1]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 54.8], ["throbbing", 12.29], ["hum", 5.3]], null, [["speech", 54.32], ["whale vocalization", 13.08], ["music", 6.62]]], "duration": [1.38, 2.25, 2.27, 2.16, 0.88, 1.44, 0.45, 4.46, 0.86, 11.53, 7.95, 4.93, 3.91, 1.28, 0.65, 19.44, 4.55, 15.96, 2.44, 4.98, 1.46, 2.08, 1.61, -0.06, 17.35, 0.26, 3.51]} \ No newline at end of file diff --git a/annotations_filtered/g511NYTRiOE_filtered.json b/annotations_filtered/g511NYTRiOE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..61e13f1de9afbf806e0d2115222bb2e2d5f87e8b --- /dev/null +++ b/annotations_filtered/g511NYTRiOE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 5.97], [6.0, 7.52], [8.0, 12.38], [13.0, 14.07], [15.0, 16.6], [17.0, 17.2], [17.0, 29.94], [32.0, 35.94], [37.0, 39.7], [40.0, 42.65], [45.0, 46.77], [50.0, 54.08], [59.0, 60.59], [61.0, 63.81], [65.0, 67.78], [68.0, 69.89], [83.0, 85.46], [90.0, 93.39], [95.0, 95.61], [98.0, 98.14], [99.0, 99.42], [101.0, 101.65], [104.0, 105.09], [114.0, 113.9], [122.0, 127.3], [128.0, 131.63], [132.0, 134.22], [135.0, 136.0], [138.0, 140.29], [146.0, 147.28], [151.0, 151.75], [154.0, 154.08], [169.0, 168.59], [169.0, 169.87], [190.0, 189.94], [192.0, 191.91], [196.0, 196.57], [198.0, 198.68], [201.0, 201.99], [203.0, 203.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [68.67, 0.0, 62.78, 0.0, 0.0, 0.0, 55.89, 97.92, 96.54, 59.07, 0.0, 98.8, 0.0, 98.66, 47.5, 0.0, 96.04, 74.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.48, 97.22, 39.54, 0.0, 35.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 53.62], ["speech", 19.83], ["sine wave", 5.3]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 57.49], ["hum", 11.99], ["throbbing", 5.89]], null, [["music", 28.54], ["musical instrument", 21.74], ["drum", 10.62]], null, null, null, null, null, null, null, null, null, null, null], "duration": [4.97, 1.52, 4.38, 1.07, 1.6, 0.2, 12.94, 3.94, 2.7, 2.65, 1.77, 4.08, 1.59, 2.81, 2.78, 1.89, 2.46, 3.39, 0.61, 0.14, 0.42, 0.65, 1.09, -0.1, 5.3, 3.63, 2.22, 1.0, 2.29, 1.28, 0.75, 0.08, -0.41, 0.87, -0.06, -0.09, 0.57, 0.68, 0.99, 0.23]} \ No newline at end of file diff --git a/annotations_filtered/g5AixBKy7b4_filtered.json b/annotations_filtered/g5AixBKy7b4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a2f7ebc9fb74327de0e69f98ef994008945f9d0 --- /dev/null +++ b/annotations_filtered/g5AixBKy7b4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.72], [6.0, 5.81], [14.0, 15.38], [21.0, 23.94], [26.0, 27.92], [30.0, 33.34], [35.0, 36.41], [38.0, 39.23], [40.0, 41.39], [44.0, 52.89], [53.0, 54.73], [57.0, 59.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 65.2, 0.0, 75.88, 0.0, 0.0, 0.0, 40.07, 0.0, 98.51], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 63.66], ["speech", 12.24], ["synthesizer", 7.32]], null, null], "duration": [0.72, -0.19, 1.38, 2.94, 1.92, 3.34, 1.41, 1.23, 1.39, 8.89, 1.73, 2.12]} \ No newline at end of file diff --git a/annotations_filtered/g5Y-PN_duno_filtered.json b/annotations_filtered/g5Y-PN_duno_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..34eceeed4cd388f58c8f99bd48adaf336c8a57e5 --- /dev/null +++ b/annotations_filtered/g5Y-PN_duno_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.37], [16.0, 17.88], [23.0, 23.21], [24.0, 25.25], [26.0, 27.31], [29.0, 30.77], [32.0, 33.54], [36.0, 36.73], [39.0, 39.04], [43.0, 43.7], [45.0, 46.31], [48.0, 49.77], [52.0, 53.92], [55.0, 54.73], [56.0, 56.2], [61.0, 61.72], [64.0, 65.15], [69.0, 69.99], [74.0, 77.65], [80.0, 81.55], [82.0, 82.43], [86.0, 86.95], [89.0, 88.94], [92.0, 93.39], [95.0, 95.35], [98.0, 98.49], [103.0, 104.55], [108.0, 111.64], [113.0, 114.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.31, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.37, 1.88, 0.21, 1.25, 1.31, 1.77, 1.54, 0.73, 0.04, 0.7, 1.31, 1.77, 1.92, -0.27, 0.2, 0.72, 1.15, 0.99, 3.65, 1.55, 0.43, 0.95, -0.06, 1.39, 0.35, 0.49, 1.55, 3.64, 1.83]} \ No newline at end of file diff --git a/annotations_filtered/g5e3qoREpuA_filtered.json b/annotations_filtered/g5e3qoREpuA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f7011d7e7ab47e75f306c8b0f35ff34dd305e3d --- /dev/null +++ b/annotations_filtered/g5e3qoREpuA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.5], [5.0, 12.19], [13.0, 14.99], [16.0, 18.99], [19.0, 21.05], [22.0, 22.45], [23.0, 24.44], [26.0, 27.77], [32.0, 32.58], [34.0, 34.7], [42.0, 48.49], [50.0, 52.1], [55.0, 55.41], [56.0, 68.61], [72.0, 87.54], [90.0, 95.88], [97.0, 97.53], [98.0, 99.86], [108.0, 141.03], [146.0, 147.55], [150.0, 161.2], [162.0, 162.53], [163.0, 163.83], [165.0, 165.96], [167.0, 168.34], [168.0, 168.4], [168.0, 170.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 56.86, 0.0, 68.8, 55.18, 0.0, 0.0, 0.0, 0.0, 0.0, 90.78, 57.48, 0.0, 33.01, 31.1, 30.8, 0.0, 0.0, 0.0, 0.0, 39.19, 0.0, 0.0, 0.0, 0.0, 0.0, 35.03], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 28.15], ["mains hum", 17.68], ["sidetone", 15.13]], [["speech", 35.94], ["music", 13.31], ["outside, rural or natural", 6.25]], [["music", 47.52], ["theremin", 15.54], ["musical instrument", 6.38]], null, null, null, null, [["music", 42.7], ["didgeridoo", 10.29], ["wind instrument, woodwind instrument", 6.0]], null, null, null, null, null, [["livestock, farm animals, working animals", 19.14], ["cattle, bovinae", 15.99], ["moo", 13.49]]], "duration": [0.5, 7.19, 1.99, 2.99, 2.05, 0.45, 1.44, 1.77, 0.58, 0.7, 6.49, 2.1, 0.41, 12.61, 15.54, 5.88, 0.53, 1.86, 33.03, 1.55, 11.2, 0.53, 0.83, 0.96, 1.34, 0.4, 2.06]} \ No newline at end of file diff --git a/annotations_filtered/g5lJIy5IcWc_filtered.json b/annotations_filtered/g5lJIy5IcWc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..326111c773836c9bfa8caadcfead1243a0b2ebd8 --- /dev/null +++ b/annotations_filtered/g5lJIy5IcWc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 20.31], [23.0, 24.43], [27.0, 27.48], [31.0, 31.19], [33.0, 33.56], [38.0, 37.99], [39.0, 41.15], [47.0, 48.1], [48.0, 52.08], [55.0, 56.2], [57.0, 57.86], [58.0, 58.67], [61.0, 67.61], [72.0, 72.94], [76.0, 81.62], [88.0, 88.38], [88.0, 88.5], [92.0, 92.38], [106.0, 107.15], [114.0, 114.39], [117.0, 120.53], [121.0, 121.51], [123.0, 123.45], [123.0, 125.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [54.1, 0.0, 0.0, 0.0, 0.0, 0.0, 57.81, 0.0, 61.97, 0.0, 0.0, 0.0, 70.86, 0.0, 53.4, 0.0, 0.0, 0.0, 0.0, 0.0, 50.46, 0.0, 0.0, 53.91], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [15.31, 1.43, 0.48, 0.19, 0.56, -0.01, 2.15, 1.1, 4.08, 1.2, 0.86, 0.67, 6.61, 0.94, 5.62, 0.38, 0.5, 0.38, 1.15, 0.39, 3.53, 0.51, 0.45, 2.0]} \ No newline at end of file diff --git a/annotations_filtered/g5m411zcNA4_filtered.json b/annotations_filtered/g5m411zcNA4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5369bbc5d34d83d74f8cdbad192278d112c17960 --- /dev/null +++ b/annotations_filtered/g5m411zcNA4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.74], [4.0, 10.98], [12.0, 15.6], [16.0, 18.45], [19.0, 20.31], [21.0, 22.99], [25.0, 26.22], [27.0, 29.34], [30.0, 31.58], [32.0, 33.84], [35.0, 36.05], [37.0, 37.93], [40.0, 42.65], [43.0, 44.83], [45.0, 46.62], [48.0, 48.78], [51.0, 51.49], [53.0, 53.96], [55.0, 63.86], [67.0, 67.54], [70.0, 70.44], [72.0, 74.41], [75.0, 78.09]], "keep_status": [false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 84.43, 65.44, 46.75, 0.0, 0.0, 0.0, 46.5, 0.0, 0.0, 0.0, 0.0, 38.2, 0.0, 0.0, 0.0, 0.0, 0.0, 58.81, 0.0, 0.0, 66.15, 35.33], "audiomae_on_audioset": [null, null, null, [["hum", 15.06], ["owl", 8.68], ["mains hum", 7.11]], null, null, null, [["music", 37.81], ["gong", 11.17], ["synthesizer", 5.72]], null, null, null, null, [["speech", 53.87], ["radio", 9.98], ["sidetone", 6.54]], null, null, null, null, null, null, null, null, null, [["hum", 24.27], ["sidetone", 16.88], ["whale vocalization", 8.59]]], "duration": [0.74, 6.98, 3.6, 2.45, 1.31, 1.99, 1.22, 2.34, 1.58, 1.84, 1.05, 0.93, 2.65, 1.83, 1.62, 0.78, 0.49, 0.96, 8.86, 0.54, 0.44, 2.41, 3.09]} \ No newline at end of file diff --git a/annotations_filtered/g6DnsZvudTI_filtered.json b/annotations_filtered/g6DnsZvudTI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..63002ff5e4247fb49c980b55888c5f7481299124 --- /dev/null +++ b/annotations_filtered/g6DnsZvudTI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.76], [17.0, 21.95], [25.0, 28.0], [29.0, 50.06], [53.0, 54.23], [58.0, 61.25]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 79.94, 33.06, 69.47, 0.0, 72.75], "audiomae_on_audioset": [null, null, [["thunk", 53.01], ["speech", 28.62], ["telephone", 2.35]], null, null, null], "duration": [0.76, 4.95, 3.0, 21.06, 1.23, 3.25]} \ No newline at end of file diff --git a/annotations_filtered/g6mF_yokyiA_filtered.json b/annotations_filtered/g6mF_yokyiA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..12a8b2de25b7d0f8fcb6a130ee273e66f8b203d3 --- /dev/null +++ b/annotations_filtered/g6mF_yokyiA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.83], [25.0, 25.3], [28.0, 29.29], [35.0, 35.19], [41.0, 42.04], [44.0, 44.02], [49.0, 50.45], [51.0, 51.63]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.83, 0.3, 1.29, 0.19, 1.04, 0.02, 1.45, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/g6sSw9vrO0s_filtered.json b/annotations_filtered/g6sSw9vrO0s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e700ecefc383628d78b52d04395f2a19564c024 --- /dev/null +++ b/annotations_filtered/g6sSw9vrO0s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.04], [6.0, 22.38], [23.0, 39.51], [43.0, 49.76], [57.0, 57.75], [59.0, 59.1], [70.0, 70.21], [72.0, 72.57]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.42, 35.91, 53.4, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 35.25], ["throbbing", 21.32], ["hum", 19.38]], [["music", 83.44], ["throbbing", 2.29], ["hum", 1.97]], null, null, null, null, null], "duration": [0.04, 16.38, 16.51, 6.76, 0.75, 0.1, 0.21, 0.57]} \ No newline at end of file diff --git a/annotations_filtered/g7QBS0O7gT0_filtered.json b/annotations_filtered/g7QBS0O7gT0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..82fe8fa5fe61b7aab5072fb53abde58464eb69b6 --- /dev/null +++ b/annotations_filtered/g7QBS0O7gT0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.57], [11.0, 13.17], [17.0, 19.01], [22.0, 22.44], [25.0, 26.38], [35.0, 37.61], [38.0, 45.13], [48.0, 49.15], [50.0, 62.67], [64.0, 65.25], [67.0, 71.74], [74.0, 76.87], [88.0, 93.58], [96.0, 96.74], [100.0, 104.77], [105.0, 104.82], [108.0, 107.89], [109.0, 113.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.99, 90.43, 0.0, 0.0, 84.62, 99.52, 0.0, 45.88, 0.0, 37.58, 37.56, 59.42, 0.0, 68.02, 0.0, 0.0, 60.7], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 57.13], ["didgeridoo", 10.32], ["fly, housefly", 3.17]], null, [["vehicle", 11.84], ["music", 9.46], ["speech", 7.06]], [["fly, housefly", 25.06], ["insect", 22.99], ["whale vocalization", 22.65]], null, null, null, null, null, null], "duration": [0.57, 2.17, 2.01, 0.44, 1.38, 2.61, 7.13, 1.15, 12.67, 1.25, 4.74, 2.87, 5.58, 0.74, 4.77, -0.18, -0.11, 4.88]} \ No newline at end of file diff --git a/annotations_filtered/g7bQ7ynurn8_filtered.json b/annotations_filtered/g7bQ7ynurn8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b8623a008a7afdd3a293c9a7ede0f138820626dc --- /dev/null +++ b/annotations_filtered/g7bQ7ynurn8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.83], [16.0, 18.52], [19.0, 22.17], [27.0, 27.75], [32.0, 33.57], [42.0, 44.96], [50.0, 51.44], [54.0, 54.4], [58.0, 57.97], [60.0, 62.43], [64.0, 64.67]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 59.86, 33.65, 0.0, 0.0, 29.74, 0.0, 0.0, 0.0, 31.11, 0.0], "audiomae_on_audioset": [null, null, [["music", 59.93], ["guitar", 6.3], ["musical instrument", 6.21]], null, null, [["music", 88.43], ["rock music", 1.15], ["musical instrument", 0.85]], null, null, null, [["music", 34.36], ["didgeridoo", 20.89], ["synthesizer", 7.97]], null], "duration": [0.83, 2.52, 3.17, 0.75, 1.57, 2.96, 1.44, 0.4, -0.03, 2.43, 0.67]} \ No newline at end of file diff --git a/annotations_filtered/g7yAbv_u-FA_filtered.json b/annotations_filtered/g7yAbv_u-FA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d7c613999ab54a45196209a53b09b8e113d4ff70 --- /dev/null +++ b/annotations_filtered/g7yAbv_u-FA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[47.0, 48.32], [75.0, 74.98], [87.0, 87.99], [95.0, 95.79], [97.0, 98.02], [105.0, 106.17], [110.0, 110.19], [111.0, 111.77], [112.0, 116.26], [117.0, 118.77], [120.0, 121.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.47, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [1.32, -0.02, 0.99, 0.79, 1.02, 1.17, 0.19, 0.77, 4.26, 1.77, 1.0]} \ No newline at end of file diff --git a/annotations_filtered/g8YFtf6tfRg_filtered.json b/annotations_filtered/g8YFtf6tfRg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..74acafd81e7daef79d00d1eaf3fb101a2f0d8fc0 --- /dev/null +++ b/annotations_filtered/g8YFtf6tfRg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.22], [24.0, 23.72], [24.0, 25.24], [26.0, 27.11], [28.0, 31.06], [33.0, 33.93], [36.0, 37.44], [41.0, 41.94], [45.0, 45.57], [52.0, 53.01], [56.0, 57.42], [59.0, 60.62], [63.0, 63.49], [65.0, 66.18], [67.0, 69.53], [71.0, 73.06], [75.0, 77.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 90.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.79, 70.72, 68.41], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.22, -0.28, 1.24, 1.11, 3.06, 0.93, 1.44, 0.94, 0.57, 1.01, 1.42, 1.62, 0.49, 1.18, 2.53, 2.06, 2.95]} \ No newline at end of file diff --git a/annotations_filtered/g8fheDIG_RA_filtered.json b/annotations_filtered/g8fheDIG_RA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8d7dd2990f858f55594b23dd4f3b1baa388fa5e7 --- /dev/null +++ b/annotations_filtered/g8fheDIG_RA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.48], [8.0, 9.21], [17.0, 18.74], [26.0, 26.99], [29.0, 29.46], [74.0, 74.49], [79.0, 80.4], [82.0, 82.32], [89.0, 89.94], [95.0, 94.69], [97.0, 109.43], [112.0, 111.99], [112.0, 112.51], [128.0, 128.14], [136.0, 136.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.17, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 58.65], ["clarinet", 13.24], ["musical instrument", 4.46]], null, null, null, null], "duration": [0.48, 1.21, 1.74, 0.99, 0.46, 0.49, 1.4, 0.32, 0.94, -0.31, 12.43, -0.01, 0.51, 0.14, 0.32]} \ No newline at end of file diff --git a/annotations_filtered/g8hPeRFRiHY_filtered.json b/annotations_filtered/g8hPeRFRiHY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ccc394846fe809222cf5ac47d7c45ec8582dd17 --- /dev/null +++ b/annotations_filtered/g8hPeRFRiHY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.8], [6.0, 7.25], [8.0, 8.61], [11.0, 12.6], [16.0, 17.46], [23.0, 24.06], [26.0, 25.74], [28.0, 28.26], [31.0, 31.77], [33.0, 34.08], [35.0, 35.55], [37.0, 38.48], [41.0, 42.47], [46.0, 46.65], [48.0, 65.64], [66.0, 72.91], [74.0, 74.68], [77.0, 78.65], [79.0, 92.67], [96.0, 98.39], [99.0, 101.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true], "silence_prob": [39.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.71, 33.49, 0.0, 0.0, 46.02, 69.34, 40.48], "audiomae_on_audioset": [[["moo", 37.02], ["cattle, bovinae", 35.33], ["livestock, farm animals, working animals", 20.26]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 59.74], ["cattle, bovinae", 4.51], ["moo", 3.62]], null, null, [["music", 56.46], ["theremin", 11.32], ["bleat", 9.11]], null, [["didgeridoo", 19.03], ["music", 13.75], ["throbbing", 7.44]]], "duration": [2.8, 1.25, 0.61, 1.6, 1.46, 1.06, -0.26, 0.26, 0.77, 1.08, 0.55, 1.48, 1.47, 0.65, 17.64, 6.91, 0.68, 1.65, 13.67, 2.39, 2.92]} \ No newline at end of file diff --git a/annotations_filtered/g8nPKVElb88_filtered.json b/annotations_filtered/g8nPKVElb88_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52bd991ab1f7699cbd5993f1876fe800f10d02ac --- /dev/null +++ b/annotations_filtered/g8nPKVElb88_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.21], [6.0, 9.29], [12.0, 13.04], [15.0, 17.27], [19.0, 19.45], [21.0, 22.87], [27.0, 27.33], [28.0, 31.38], [32.0, 32.88], [41.0, 41.99], [46.0, 47.71], [58.0, 57.94], [58.0, 58.31], [65.0, 68.12], [68.0, 69.36], [75.0, 76.27], [77.0, 79.41], [83.0, 82.97], [84.0, 85.29], [89.0, 92.26], [98.0, 97.8], [99.0, 99.12], [102.0, 103.05], [104.0, 114.51], [115.0, 116.51], [121.0, 122.37], [123.0, 126.49], [130.0, 131.85]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 48.44, 0.0, 46.61, 0.0, 0.0, 0.0, 36.42, 0.0, 0.0, 0.0, 0.0, 0.0, 36.32, 0.0, 0.0, 66.27, 0.0, 0.0, 39.99, 0.0, 0.0, 0.0, 43.77, 0.0, 0.0, 56.48, 0.0], "audiomae_on_audioset": [null, [["speech", 24.97], ["music", 24.17], ["synthesizer", 7.89]], null, [["music", 11.56], ["speech", 11.38], ["moo", 6.87]], null, null, null, [["music", 40.78], ["speech", 25.73], ["synthesizer", 5.09]], null, null, null, null, null, [["music", 45.55], ["speech", 22.33], ["synthesizer", 4.19]], null, null, null, null, null, [["music", 51.8], ["speech", 18.4], ["thunk", 5.44]], null, null, null, [["music", 71.99], ["throbbing", 5.83], ["hum", 3.63]], null, null, null, null], "duration": [0.21, 3.29, 1.04, 2.27, 0.45, 1.87, 0.33, 3.38, 0.88, 0.99, 1.71, -0.06, 0.31, 3.12, 1.36, 1.27, 2.41, -0.03, 1.29, 3.26, -0.2, 0.12, 1.05, 10.51, 1.51, 1.37, 3.49, 1.85]} \ No newline at end of file diff --git a/annotations_filtered/g8pt9OoaPlY_filtered.json b/annotations_filtered/g8pt9OoaPlY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f5d8c25ccf9af345223455f1db38faba1b734b5b --- /dev/null +++ b/annotations_filtered/g8pt9OoaPlY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.5], [4.0, 6.08], [8.0, 10.88], [16.0, 26.06], [33.0, 33.54], [35.0, 35.18], [40.0, 45.52], [48.0, 50.35], [56.0, 72.6], [74.0, 74.33], [75.0, 75.47], [76.0, 76.87], [78.0, 80.72], [84.0, 101.12], [102.0, 103.72], [107.0, 115.06]], "keep_status": [false, true, true, true, false, false, false, false, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 46.12, 28.83, 28.72, 0.0, 0.0, 28.97, 28.87, 29.49, 0.0, 0.0, 0.0, 31.0, 29.73, 0.0, 29.37], "audiomae_on_audioset": [null, [["speech", 34.59], ["music", 18.02], ["sidetone", 14.17]], [["music", 39.76], ["burst, pop", 7.14], ["whack, thwack", 5.48]], [["music", 20.02], ["whip", 15.59], ["speech", 12.58]], null, null, [["music", 42.08], ["speech", 35.95], ["sidetone", 5.74]], [["music", 46.48], ["speech", 24.86], ["sound effect", 2.21]], [["sonar", 28.78], ["music", 21.29], ["gong", 10.37]], null, null, null, [["foghorn", 44.64], ["music", 28.15], ["speech", 13.91]], [["speech", 53.34], ["whack, thwack", 10.04], ["groan", 4.98]], null, [["music", 59.76], ["breaking", 9.06], ["speech", 4.58]]], "duration": [0.5, 2.08, 2.88, 10.06, 0.54, 0.18, 5.52, 2.35, 16.6, 0.33, 0.47, 0.87, 2.72, 17.12, 1.72, 8.06]} \ No newline at end of file diff --git a/annotations_filtered/g92cHdRbgag_filtered.json b/annotations_filtered/g92cHdRbgag_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43b5d4b21ede60466161d62f4033e1795e89492a --- /dev/null +++ b/annotations_filtered/g92cHdRbgag_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 23.92], [25.0, 29.0], [32.0, 36.59], [39.0, 39.18], [42.0, 68.52], [69.0, 69.72], [70.0, 70.61], [72.0, 72.37], [75.0, 76.0], [78.0, 78.49], [79.0, 81.65], [87.0, 88.59], [89.0, 90.0], [91.0, 92.26], [95.0, 95.69], [97.0, 98.51], [101.0, 104.45], [106.0, 109.11]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.84, 92.8, 100.0, 0.0, 37.18, 0.0, 0.0, 0.0, 0.0, 0.0, 96.89, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 64.07], "audiomae_on_audioset": [null, null, null, null, [["livestock, farm animals, working animals", 18.45], ["speech", 15.7], ["cattle, bovinae", 13.08]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.92, 4.0, 4.59, 0.18, 26.52, 0.72, 0.61, 0.37, 1.0, 0.49, 2.65, 1.59, 1.0, 1.26, 0.69, 1.51, 3.45, 3.11]} \ No newline at end of file diff --git a/annotations_filtered/g95ZXrh2oK4_filtered.json b/annotations_filtered/g95ZXrh2oK4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c8fa620feaf03cd76d2451b5ded41859a8c2aa18 --- /dev/null +++ b/annotations_filtered/g95ZXrh2oK4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.95], [8.0, 15.08], [16.0, 17.61], [19.0, 27.35], [28.0, 28.53], [32.0, 33.12], [36.0, 37.39], [38.0, 39.38], [40.0, 44.63], [45.0, 61.21], [64.0, 65.13], [67.0, 68.76], [74.0, 75.68], [78.0, 79.29], [81.0, 81.41], [82.0, 82.83], [84.0, 85.53], [90.0, 90.31], [93.0, 94.14], [95.0, 96.58], [98.0, 98.27], [100.0, 101.34], [103.0, 124.09], [126.0, 126.22], [126.0, 128.58], [130.0, 138.2], [142.0, 142.65], [145.0, 146.64], [149.0, 155.95], [167.0, 171.66], [174.0, 178.73], [181.0, 201.02]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false], "silence_prob": [73.97, 39.94, 0.0, 93.13, 0.0, 0.0, 0.0, 0.0, 80.46, 87.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.0, 0.0, 52.22, 40.71, 0.0, 0.0, 37.84, 33.17, 32.72, 33.26], "audiomae_on_audioset": [null, [["moo", 19.51], ["cattle, bovinae", 19.28], ["livestock, farm animals, working animals", 10.26]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 44.4], ["double bass", 3.87], ["musical instrument", 3.61]], null, null, [["music", 60.85], ["double bass", 4.44], ["musical instrument", 3.73]], [["music", 62.07], ["musical instrument", 6.24], ["guitar", 4.53]], [["music", 75.16], ["musical instrument", 4.44], ["plucked string instrument", 2.57]], [["music", 81.1], ["double bass", 1.93], ["musical instrument", 1.23]]], "duration": [2.95, 7.08, 1.61, 8.35, 0.53, 1.12, 1.39, 1.38, 4.63, 16.21, 1.13, 1.76, 1.68, 1.29, 0.41, 0.83, 1.53, 0.31, 1.14, 1.58, 0.27, 1.34, 21.09, 0.22, 2.58, 8.2, 0.65, 1.64, 6.95, 4.66, 4.73, 20.02]} \ No newline at end of file diff --git a/annotations_filtered/g9GBuciv20A_filtered.json b/annotations_filtered/g9GBuciv20A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f7f0c6797e6d320feb7d7122c0ec1a98fb91a7f --- /dev/null +++ b/annotations_filtered/g9GBuciv20A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.82], [13.0, 17.12], [19.0, 23.55], [26.0, 29.79], [34.0, 37.4], [38.0, 43.7], [49.0, 49.49], [53.0, 53.38], [55.0, 56.67], [57.0, 58.6], [60.0, 61.64], [76.0, 92.57], [93.0, 95.25], [97.0, 97.71], [103.0, 102.96], [106.0, 105.66], [115.0, 116.07], [135.0, 135.09], [138.0, 140.43], [159.0, 159.0], [160.0, 159.98], [178.0, 178.26], [184.0, 184.3], [187.0, 187.79], [190.0, 190.09], [192.0, 196.64], [197.0, 196.67], [197.0, 196.7], [197.0, 196.74], [197.0, 196.77], [197.0, 196.8], [197.0, 196.84], [197.0, 196.87], [197.0, 196.91]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 39.54, 50.16, 46.68, 51.99, 50.26, 0.0, 0.0, 0.0, 0.0, 0.0, 41.78, 39.38, 0.0, 0.0, 0.0, 0.0, 0.0, 43.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 36.92], ["speech", 21.37], ["synthesizer", 6.12]], null, [["music", 66.35], ["musical instrument", 4.82], ["sampler", 2.61]], null, null, null, null, null, null, null, [["music", 50.62], ["musical instrument", 6.19], ["speech", 4.89]], [["music", 45.47], ["boing", 7.9], ["effects unit", 6.88]], null, null, null, null, null, [["music", 33.78], ["drum machine", 30.62], ["dubstep", 6.33]], null, null, null, null, null, null, [["cattle, bovinae", 19.78], ["moo", 18.39], ["music", 9.9]], null, null, null, null, null, null, null, null], "duration": [1.82, 4.12, 4.55, 3.79, 3.4, 5.7, 0.49, 0.38, 1.67, 1.6, 1.64, 16.57, 2.25, 0.71, -0.04, -0.34, 1.07, 0.09, 2.43, 0.0, -0.02, 0.26, 0.3, 0.79, 0.09, 4.64, -0.33, -0.3, -0.26, -0.23, -0.2, -0.16, -0.13, -0.09]} \ No newline at end of file diff --git a/annotations_filtered/g9S5GndUhko_filtered.json b/annotations_filtered/g9S5GndUhko_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa13fb79062e7e2937c3624a1634c0b907cd385a --- /dev/null +++ b/annotations_filtered/g9S5GndUhko_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[158.0, 157.94], [158.0, 170.31]], "keep_status": [false, true], "silence_prob": [0.0, 28.15], "audiomae_on_audioset": [null, [["music", 52.27], ["drum and bass", 10.79], ["electronic music", 5.9]]], "duration": [-0.06, 12.31]} \ No newline at end of file diff --git a/annotations_filtered/g9U0df6KJiA_filtered.json b/annotations_filtered/g9U0df6KJiA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7fe686e795af9ef776be5cfa2d7042225581d753 --- /dev/null +++ b/annotations_filtered/g9U0df6KJiA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.63], [25.0, 42.06], [46.0, 58.65], [63.0, 64.0], [67.0, 77.43], [80.0, 95.25], [99.0, 109.02], [114.0, 116.5], [117.0, 130.45]], "keep_status": [false, false, true, false, false, false, true, false, true], "silence_prob": [32.9, 31.62, 29.74, 0.0, 29.79, 29.64, 30.32, 33.3, 30.49], "audiomae_on_audioset": [[["boing", 68.3], ["music", 18.32], ["whack, thwack", 3.85]], [["speech", 60.11], ["music", 9.85], ["whack, thwack", 5.77]], [["music", 41.29], ["hum", 14.41], ["cacophony", 11.3]], null, [["music", 62.8], ["throbbing", 9.31], ["hum", 8.81]], [["hum", 31.43], ["music", 27.92], ["throbbing", 16.3]], [["hum", 29.85], ["music", 25.89], ["speech", 11.63]], [["music", 30.35], ["speech", 22.24], ["hum", 19.4]], [["music", 34.98], ["hum", 9.17], ["buzz", 7.7]]], "duration": [2.63, 17.06, 12.65, 1.0, 10.43, 15.25, 10.02, 2.5, 13.45]} \ No newline at end of file diff --git a/annotations_filtered/g9d1TR6Lb9g_filtered.json b/annotations_filtered/g9d1TR6Lb9g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4087d6ef78fd6cfcf435cd22e2117e130574f210 --- /dev/null +++ b/annotations_filtered/g9d1TR6Lb9g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 49.89], [52.0, 51.95], [52.0, 55.36], [59.0, 73.13], [74.0, 73.94], [74.0, 84.94], [85.0, 172.29]], "keep_status": [false, false, true, true, false, true, false], "silence_prob": [31.37, 0.0, 29.96, 31.36, 0.0, 30.89, 0.0], "audiomae_on_audioset": [[["music", 65.38], ["speech", 8.9], ["breaking", 3.23]], null, [["music", 21.57], ["cacophony", 19.1], ["noise", 13.15]], [["music", 25.53], ["speech", 25.02], ["hum", 13.49]], null, [["music", 25.77], ["hum", 25.3], ["mains hum", 16.29]], null], "duration": [15.89, -0.05, 3.36, 14.13, -0.06, 10.94, 87.29]} \ No newline at end of file diff --git a/annotations_filtered/g9hEJv2uZLM_filtered.json b/annotations_filtered/g9hEJv2uZLM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1fa0267ed529846b6b8d926eea30e4d8d23cf564 --- /dev/null +++ b/annotations_filtered/g9hEJv2uZLM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 32.66], [38.0, 40.32], [41.0, 46.65], [47.0, 48.98], [50.0, 50.97], [51.0, 52.93], [57.0, 87.1], [89.0, 89.19], [96.0, 101.95], [102.0, 102.54]], "keep_status": [false, false, true, false, false, false, false, false, true, false], "silence_prob": [30.85, 30.31, 30.38, 0.0, 0.0, 0.0, 0.0, 0.0, 33.8, 0.0], "audiomae_on_audioset": [[["music", 55.67], ["didgeridoo", 19.12], ["speech", 10.12]], [["didgeridoo", 43.87], ["music", 23.97], ["cattle, bovinae", 2.32]], [["music", 47.81], ["animal", 4.94], ["speech", 3.3]], null, null, null, null, null, [["breaking", 44.97], ["glass", 18.74], ["livestock, farm animals, working animals", 5.02]], null], "duration": [6.66, 2.32, 5.65, 1.98, 0.97, 1.93, 30.1, 0.19, 5.95, 0.54]} \ No newline at end of file diff --git a/annotations_filtered/g9vPtCW9pJ8_filtered.json b/annotations_filtered/g9vPtCW9pJ8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..20b81ded26c23bb08331483421421a08939a8b60 --- /dev/null +++ b/annotations_filtered/g9vPtCW9pJ8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.89], [5.0, 5.71], [8.0, 8.72], [16.0, 16.65], [20.0, 29.49], [42.0, 51.33], [51.0, 51.87], [52.0, 51.97], [56.0, 58.36], [61.0, 71.36], [75.0, 83.12], [84.0, 105.9], [111.0, 115.96], [118.0, 118.49], [124.0, 126.27]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 39.64, 31.0, 0.0, 0.0, 74.44, 33.65, 39.41, 33.34, 31.29, 0.0, 36.93], "audiomae_on_audioset": [null, null, null, null, [["music", 22.02], ["fly, housefly", 20.7], ["hum", 11.92]], [["music", 63.01], ["speech", 18.99], ["hum", 2.99]], null, null, null, [["music", 67.22], ["speech", 5.15], ["synthesizer", 4.06]], [["music", 63.53], ["didgeridoo", 8.57], ["musical instrument", 4.98]], [["music", 43.82], ["double bass", 5.64], ["cello", 5.25]], [["music", 52.73], ["theremin", 18.58], ["didgeridoo", 2.31]], null, [["music", 43.05], ["hum", 9.17], ["mains hum", 4.78]]], "duration": [0.89, 0.71, 0.72, 0.65, 9.49, 9.33, 0.87, -0.03, 2.36, 10.36, 8.12, 21.9, 4.96, 0.49, 2.27]} \ No newline at end of file diff --git a/annotations_filtered/gA-VU0mczSI_filtered.json b/annotations_filtered/gA-VU0mczSI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e05c546cb74cfae35d4600a9c83536c1c6af2c73 --- /dev/null +++ b/annotations_filtered/gA-VU0mczSI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 16.82], [18.0, 20.46], [21.0, 22.49], [23.0, 57.16], [57.0, 57.94], [59.0, 68.67], [69.0, 70.92], [73.0, 73.82], [79.0, 80.91], [89.0, 92.1], [92.0, 92.82], [93.0, 92.94], [93.0, 96.52], [97.0, 108.9], [111.0, 114.54], [117.0, 122.77]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, true], "silence_prob": [42.69, 60.6, 0.0, 0.0, 0.0, 33.04, 0.0, 0.0, 0.0, 29.88, 0.0, 0.0, 31.07, 48.06, 53.34, 49.27], "audiomae_on_audioset": [[["civil defense siren", 53.47], ["music", 11.42], ["siren", 8.35]], null, null, null, null, [["music", 35.47], ["theremin", 11.86], ["speech", 10.85]], null, null, null, [["cattle, bovinae", 50.46], ["moo", 18.74], ["livestock, farm animals, working animals", 12.01]], null, null, [["speech", 46.46], ["music", 7.22], ["hum", 5.99]], [["music", 59.89], ["frog", 11.18], ["croak", 8.37]], null, [["music", 44.51], ["theremin", 7.58], ["musical instrument", 4.67]]], "duration": [9.82, 2.46, 1.49, 34.16, 0.94, 9.67, 1.92, 0.82, 1.91, 3.1, 0.82, -0.06, 3.52, 11.9, 3.54, 5.77]} \ No newline at end of file diff --git a/annotations_filtered/gA0u3Iir0CU_filtered.json b/annotations_filtered/gA0u3Iir0CU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1915720bfaf3ca5f5dcfb48cb6b23840a43d31ff --- /dev/null +++ b/annotations_filtered/gA0u3Iir0CU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 16.71], [21.0, 23.11], [28.0, 69.97], [70.0, 70.24], [70.0, 70.38], [70.0, 95.35], [96.0, 97.46], [98.0, 111.64], [112.0, 138.79], [139.0, 167.16]], "keep_status": [true, true, false, false, false, false, false, false, true, false], "silence_prob": [32.0, 31.07, 0.0, 0.0, 0.0, 44.46, 0.0, 48.82, 36.9, 74.6], "audiomae_on_audioset": [[["throbbing", 28.97], ["hum", 17.53], ["speech", 14.49]], [["music", 24.53], ["hum", 20.1], ["throbbing", 14.74]], null, null, null, [["throbbing", 39.18], ["hum", 37.5], ["music", 10.05]], null, [["hum", 45.3], ["throbbing", 44.8], ["heart sounds, heartbeat", 3.47]], [["speech", 37.2], ["hum", 10.61], ["throbbing", 4.92]], null], "duration": [3.71, 2.11, 41.97, 0.24, 0.38, 25.35, 1.46, 13.64, 26.79, 28.16]} \ No newline at end of file diff --git a/annotations_filtered/gA3wJRuClks_filtered.json b/annotations_filtered/gA3wJRuClks_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d1616f23a9787ea6296cc2e9813112973b3454a5 --- /dev/null +++ b/annotations_filtered/gA3wJRuClks_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.71], [11.0, 11.5], [13.0, 13.09], [14.0, 14.74], [19.0, 19.57], [21.0, 26.84], [27.0, 27.77], [28.0, 28.95], [30.0, 30.28], [32.0, 31.8], [34.0, 34.57], [35.0, 39.61], [43.0, 43.48], [48.0, 48.1], [49.0, 49.81], [51.0, 50.99], [51.0, 51.6], [53.0, 54.8], [57.0, 57.77], [58.0, 58.45], [60.0, 60.13], [61.0, 61.3], [63.0, 63.14], [67.0, 67.42], [69.0, 69.18], [71.0, 70.71], [72.0, 72.22], [74.0, 74.93], [75.0, 75.64], [79.0, 79.41], [87.0, 88.08], [92.0, 92.82], [94.0, 94.2], [96.0, 97.23], [101.0, 101.93], [114.0, 114.78], [117.0, 117.42], [119.0, 119.2], [121.0, 121.53], [123.0, 124.04], [126.0, 126.32], [127.0, 130.49], [132.0, 133.07], [135.0, 135.57], [139.0, 139.23], [140.0, 141.07], [142.0, 142.3], [144.0, 144.19], [145.0, 144.96], [148.0, 150.18], [151.0, 151.04], [152.0, 152.88], [154.0, 155.71], [156.0, 157.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 80.11, 0.0, 0.0, 0.0, 0.0, 0.0, 62.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.71, 0.5, 0.09, 0.74, 0.57, 5.84, 0.77, 0.95, 0.28, -0.2, 0.57, 4.61, 0.48, 0.1, 0.81, -0.01, 0.6, 1.8, 0.77, 0.45, 0.13, 0.3, 0.14, 0.42, 0.18, -0.29, 0.22, 0.93, 0.64, 0.41, 1.08, 0.82, 0.2, 1.23, 0.93, 0.78, 0.42, 0.2, 0.53, 1.04, 0.32, 3.49, 1.07, 0.57, 0.23, 1.07, 0.3, 0.19, -0.04, 2.18, 0.04, 0.88, 1.71, 1.77]} \ No newline at end of file diff --git a/annotations_filtered/gA8z3Yk3wWc_filtered.json b/annotations_filtered/gA8z3Yk3wWc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e5144e6afc9f619151cd0dd611d7d52049549452 --- /dev/null +++ b/annotations_filtered/gA8z3Yk3wWc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.66], [3.0, 11.35], [16.0, 16.7], [20.0, 20.55], [27.0, 27.51], [28.0, 28.49], [30.0, 31.19], [32.0, 33.3], [35.0, 35.88], [38.0, 39.07], [40.0, 40.96], [45.0, 46.74], [47.0, 46.84], [52.0, 53.11], [54.0, 55.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 38.19], ["buzz", 25.28], ["didgeridoo", 12.36]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.66, 8.35, 0.7, 0.55, 0.51, 0.49, 1.19, 1.3, 0.88, 1.07, 0.96, 1.74, -0.16, 1.11, 1.59]} \ No newline at end of file diff --git a/annotations_filtered/gAKiWvjfCiQ_filtered.json b/annotations_filtered/gAKiWvjfCiQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..28d59716965daf6a3c0f013d6a224d4c86c3d81e --- /dev/null +++ b/annotations_filtered/gAKiWvjfCiQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.11], [11.0, 12.5], [14.0, 15.08], [16.0, 20.41], [25.0, 25.79], [28.0, 29.22], [30.0, 30.77], [32.0, 34.99], [37.0, 37.96], [39.0, 40.46], [45.0, 46.23], [49.0, 50.11], [51.0, 56.15], [58.0, 60.35], [62.0, 62.31], [63.0, 63.61], [64.0, 66.48], [69.0, 69.47], [70.0, 71.1], [72.0, 74.6], [78.0, 79.1], [84.0, 83.71], [87.0, 92.11], [93.0, 92.94]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [46.57, 0.0, 0.0, 40.99, 0.0, 0.0, 0.0, 61.27, 0.0, 0.0, 0.0, 0.0, 44.99, 45.52, 0.0, 0.0, 32.67, 0.0, 0.0, 44.18, 0.0, 0.0, 30.76, 0.0], "audiomae_on_audioset": [[["music", 32.53], ["musical instrument", 10.55], ["brass instrument", 8.86]], null, null, [["music", 69.1], ["synthesizer", 9.63], ["musical instrument", 4.41]], null, null, null, null, null, null, null, null, [["music", 56.99], ["theremin", 12.59], ["synthesizer", 8.42]], [["theremin", 57.83], ["music", 22.54], ["synthesizer", 6.39]], null, null, [["music", 54.69], ["speech", 11.26], ["synthesizer", 4.22]], null, null, [["music", 32.69], ["speech", 24.43], ["synthesizer", 6.76]], null, null, [["music", 53.27], ["speech", 20.66], ["musical instrument", 2.86]], null], "duration": [2.11, 1.5, 1.08, 4.41, 0.79, 1.22, 0.77, 2.99, 0.96, 1.46, 1.23, 1.11, 5.15, 2.35, 0.31, 0.61, 2.48, 0.47, 1.1, 2.6, 1.1, -0.29, 5.11, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/gAM2Q7Sqlbk_filtered.json b/annotations_filtered/gAM2Q7Sqlbk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5a561810bc5e55d623a9d79e0411e1aa814f502a --- /dev/null +++ b/annotations_filtered/gAM2Q7Sqlbk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.75], [8.0, 9.12], [30.0, 30.89], [41.0, 44.27], [54.0, 54.57], [55.0, 59.32], [65.0, 65.38], [69.0, 71.63], [74.0, 77.55], [78.0, 83.07], [83.0, 87.57], [95.0, 106.08], [107.0, 107.94], [112.0, 112.67], [115.0, 115.05], [116.0, 123.33], [125.0, 126.81], [127.0, 128.61]], "keep_status": [false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 35.57, 0.0, 50.81, 0.0, 74.92, 61.67, 52.68, 30.66, 46.22, 0.0, 0.0, 0.0, 98.36, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 33.8], ["noise", 12.84], ["fart", 9.67]], null, null, null, null, null, null, [["speech", 28.61], ["music", 28.16], ["hum", 8.36]], [["speech", 77.96], ["sidetone", 4.39], ["telephone", 2.72]], null, null, null, null, null, null], "duration": [1.75, 1.12, 0.89, 3.27, 0.57, 4.32, 0.38, 2.63, 3.55, 5.07, 4.57, 11.08, 0.94, 0.67, 0.05, 7.33, 1.81, 1.61]} \ No newline at end of file diff --git a/annotations_filtered/gAWrAQp7pWQ_filtered.json b/annotations_filtered/gAWrAQp7pWQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e9b119c66a3bd40b408d17b291b6ecf797a0015 --- /dev/null +++ b/annotations_filtered/gAWrAQp7pWQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.74], [26.0, 33.91], [37.0, 38.91], [48.0, 49.5], [57.0, 82.48], [85.0, 94.93], [98.0, 101.41], [104.0, 106.56], [109.0, 110.52], [116.0, 117.15], [118.0, 118.59], [122.0, 125.47], [127.0, 129.93], [135.0, 139.13], [144.0, 148.41]], "keep_status": [false, true, false, false, false, false, true, true, false, false, false, true, false, true, true], "silence_prob": [0.0, 38.58, 0.0, 0.0, 33.77, 38.42, 39.38, 47.39, 0.0, 0.0, 0.0, 44.07, 57.72, 35.33, 35.18], "audiomae_on_audioset": [null, [["insect", 22.68], ["fly, housefly", 18.83], ["music", 11.01]], null, null, [["music", 60.1], ["hum", 9.8], ["throbbing", 5.75]], [["hum", 33.81], ["throbbing", 30.88], ["music", 11.59]], [["music", 58.63], ["theremin", 6.12], ["musical instrument", 3.47]], [["music", 46.05], ["frog", 9.58], ["didgeridoo", 7.79]], null, null, null, [["mosquito", 21.5], ["music", 18.81], ["fly, housefly", 17.69]], null, [["music", 26.39], ["fly, housefly", 9.57], ["insect", 7.65]], [["music", 47.26], ["synthesizer", 11.01], ["musical instrument", 10.53]]], "duration": [0.74, 7.91, 1.91, 1.5, 25.48, 9.93, 3.41, 2.56, 1.52, 1.15, 0.59, 3.47, 2.93, 4.13, 4.41]} \ No newline at end of file diff --git a/annotations_filtered/gAmo3FcaovM_filtered.json b/annotations_filtered/gAmo3FcaovM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..83c6d3e033e7771a002d6a786d06332749115cde --- /dev/null +++ b/annotations_filtered/gAmo3FcaovM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 38.1], [38.0, 48.03], [48.0, 77.92], [79.0, 78.92], [79.0, 79.68], [81.0, 82.38], [88.0, 103.77], [106.0, 112.72], [115.0, 118.25]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.77, 29.64, 0.0, 0.0, 0.0, 67.51, 32.14, 28.71], "audiomae_on_audioset": [null, [["music", 61.81], ["scary music", 22.13], ["soundtrack music", 3.27]], [["music", 70.75], ["throbbing", 13.02], ["hum", 4.62]], null, null, null, null, [["music", 46.4], ["speech", 18.89], ["whack, thwack", 9.34]], [["music", 66.9], ["didgeridoo", 2.06], ["sound effect", 1.85]]], "duration": [30.1, 10.03, 29.92, -0.08, 0.68, 1.38, 15.77, 6.72, 3.25]} \ No newline at end of file diff --git a/annotations_filtered/gB1LgDhJQMI_filtered.json b/annotations_filtered/gB1LgDhJQMI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce1434d4198d68be7bd25f776f0d1cc3f90489c8 --- /dev/null +++ b/annotations_filtered/gB1LgDhJQMI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.65], [1.0, 0.72], [1.0, 0.75], [1.0, 1.65], [3.0, 3.47], [4.0, 4.62], [5.0, 5.58], [7.0, 7.72], [8.0, 8.83], [11.0, 10.88], [17.0, 16.95], [17.0, 17.05], [17.0, 17.39], [21.0, 22.25], [23.0, 27.8], [30.0, 35.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.86, 34.37], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 54.06], ["speech", 22.86], ["musical instrument", 1.11]], [["music", 77.98], ["fart", 2.73], ["theremin", 2.31]]], "duration": [-0.35, -0.28, -0.25, 0.65, 0.47, 0.62, 0.58, 0.72, 0.83, -0.12, -0.05, 0.05, 0.39, 1.25, 4.8, 5.51]} \ No newline at end of file diff --git a/annotations_filtered/gBdbUMTXKIA_filtered.json b/annotations_filtered/gBdbUMTXKIA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..838f37130402f6ec0fce12cccbc9bed52831e643 --- /dev/null +++ b/annotations_filtered/gBdbUMTXKIA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[88.0, 88.5], [90.0, 114.84], [117.0, 126.0], [126.0, 126.23], [126.0, 126.72], [127.0, 127.68], [130.0, 130.06]], "keep_status": [false, true, false, false, false, false, false], "silence_prob": [0.0, 33.93, 38.62, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["cattle, bovinae", 20.39], ["moo", 20.21], ["whale vocalization", 17.59]], [["speech", 64.96], ["whale vocalization", 16.27], ["noise", 4.38]], null, null, null, null], "duration": [0.5, 24.84, 9.0, 0.23, 0.72, 0.68, 0.06]} \ No newline at end of file diff --git a/annotations_filtered/gBxaGB65TB8_filtered.json b/annotations_filtered/gBxaGB65TB8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bda34f701433e8f7b0c8aede9a4b941524c67ebe --- /dev/null +++ b/annotations_filtered/gBxaGB65TB8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 82.78], [83.0, 128.17]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [68.78, 45.17]} \ No newline at end of file diff --git a/annotations_filtered/gC672314kEU_filtered.json b/annotations_filtered/gC672314kEU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2aaced5c502d1ac40c0bc7f0c4f88cfdfa5da6a3 --- /dev/null +++ b/annotations_filtered/gC672314kEU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.65], [17.0, 17.68], [23.0, 23.09], [29.0, 29.22], [32.0, 32.59], [36.0, 40.0], [47.0, 47.87], [49.0, 63.39], [65.0, 65.26], [67.0, 66.78], [69.0, 70.78], [74.0, 73.99], [75.0, 84.72], [88.0, 87.94], [91.0, 90.8], [92.0, 92.38], [96.0, 97.8], [102.0, 102.66], [103.0, 103.37], [106.0, 105.85], [108.0, 116.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 77.03, 0.0, 44.93, 0.0, 0.0, 0.0, 0.0, 75.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.85], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 44.21], ["music", 28.04], ["hum", 4.4]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 64.05], ["throbbing", 7.48], ["hum", 5.86]]], "duration": [0.65, 0.68, 0.09, 0.22, 0.59, 4.0, 0.87, 14.39, 0.26, -0.22, 1.78, -0.01, 9.72, -0.06, -0.2, 0.38, 1.8, 0.66, 0.37, -0.15, 8.26]} \ No newline at end of file diff --git a/annotations_filtered/gC6gD7Qzry8_filtered.json b/annotations_filtered/gC6gD7Qzry8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e4aca73613a494db29d430c00a73f0ff912b189b --- /dev/null +++ b/annotations_filtered/gC6gD7Qzry8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 55.71], [58.0, 60.0], [60.0, 61.13], [70.0, 70.56], [79.0, 79.1], [86.0, 87.44], [104.0, 103.77], [111.0, 114.89], [117.0, 128.51], [131.0, 131.94], [134.0, 135.11], [140.0, 145.2], [146.0, 148.76], [151.0, 151.01], [152.0, 155.01], [159.0, 159.29], [161.0, 161.38], [162.0, 196.3]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 94.37, 0.0, 0.0, 0.0, 0.0, 0.0, 40.16, 57.81, 0.0, 0.0, 99.95, 92.15, 0.0, 68.28, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 30.63], ["sidetone", 14.02], ["hum", 11.68]], null, null, null, null, null, null, null, null, null, null], "duration": [41.71, 2.0, 1.13, 0.56, 0.1, 1.44, -0.23, 3.89, 11.51, 0.94, 1.11, 5.2, 2.76, 0.01, 3.01, 0.29, 0.38, 34.3]} \ No newline at end of file diff --git a/annotations_filtered/gCE5175IkoY_filtered.json b/annotations_filtered/gCE5175IkoY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d5a05026df8684a7cdcd41d48779b6829a691b67 --- /dev/null +++ b/annotations_filtered/gCE5175IkoY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 22.35], [29.0, 32.16], [42.0, 42.85], [45.0, 121.56], [123.0, 130.11], [133.0, 133.73], [149.0, 152.25], [158.0, 158.94], [178.0, 179.9]], "keep_status": [false, true, false, false, false, false, false, false, false], "silence_prob": [54.3, 43.74, 0.0, 0.0, 32.28, 0.0, 61.47, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 39.2], ["speech", 17.17], ["musical instrument", 5.29]], null, null, [["music", 84.72], ["musical instrument", 3.11], ["synthesizer", 2.07]], null, null, null, null], "duration": [10.35, 3.16, 0.85, 76.56, 7.11, 0.73, 3.25, 0.94, 1.9]} \ No newline at end of file diff --git a/annotations_filtered/gCFBkXA374Y_filtered.json b/annotations_filtered/gCFBkXA374Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8f62955a96be594f40d842625d5813e4a4c389dc --- /dev/null +++ b/annotations_filtered/gCFBkXA374Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.34], [12.0, 27.73], [34.0, 64.57], [67.0, 78.76]], "keep_status": [false, true, false, false], "silence_prob": [0.0, 32.97, 0.0, 31.9], "audiomae_on_audioset": [null, [["speech", 28.25], ["clang", 24.35], ["ding", 13.6]], null, [["hum", 44.89], ["mains hum", 32.33], ["throbbing", 12.72]]], "duration": [1.34, 15.73, 30.57, 11.76]} \ No newline at end of file diff --git a/annotations_filtered/gCHCR0wZclg_filtered.json b/annotations_filtered/gCHCR0wZclg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..376d2396f3b184a7a152d436574c7958d35fbbf8 --- /dev/null +++ b/annotations_filtered/gCHCR0wZclg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.5], [8.0, 9.46], [13.0, 17.59], [19.0, 21.57], [23.0, 25.95], [29.0, 30.32], [31.0, 32.76], [34.0, 35.73], [38.0, 38.77], [42.0, 42.72], [51.0, 52.24], [61.0, 61.33], [62.0, 62.72], [65.0, 66.21], [67.0, 67.78], [71.0, 71.39], [73.0, 73.01], [79.0, 78.76], [86.0, 86.48], [105.0, 106.69], [110.0, 116.04], [117.0, 118.07], [130.0, 130.54], [132.0, 132.73], [138.0, 139.65], [141.0, 142.57], [143.0, 144.31], [145.0, 146.5], [150.0, 151.66], [153.0, 152.91], [164.0, 172.94], [178.0, 178.46], [180.0, 182.63], [186.0, 187.51], [201.0, 204.94], [205.0, 205.44]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 97.33, 98.99, 41.32, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.09, 0.0, 99.8, 0.0, 29.33, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 49.49], ["hiccup", 5.92], ["chirp tone", 4.83]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 37.75], ["livestock, farm animals, working animals", 28.18], ["moo", 19.55]], null, null, null, [["speech", 66.86], ["crowd", 7.34], ["outside, urban or manmade", 2.94]], null], "duration": [0.5, 1.46, 4.59, 2.57, 2.95, 1.32, 1.76, 1.73, 0.77, 0.72, 1.24, 0.33, 0.72, 1.21, 0.78, 0.39, 0.01, -0.24, 0.48, 1.69, 6.04, 1.07, 0.54, 0.73, 1.65, 1.57, 1.31, 1.5, 1.66, -0.09, 8.94, 0.46, 2.63, 1.51, 3.94, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/gCdXiOssbM0_filtered.json b/annotations_filtered/gCdXiOssbM0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..46516a430bfb5d56a9b1f80a570bf67b655d20e7 --- /dev/null +++ b/annotations_filtered/gCdXiOssbM0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.5], [4.0, 7.96], [8.0, 8.7], [10.0, 10.71], [13.0, 14.07], [18.0, 19.45], [20.0, 20.93], [22.0, 22.71], [23.0, 23.46], [30.0, 30.2], [36.0, 45.01], [46.0, 45.99], [48.0, 49.32], [52.0, 52.81], [55.0, 56.19], [58.0, 58.94], [62.0, 63.04], [66.0, 66.85], [68.0, 68.28], [70.0, 73.18], [73.0, 79.27], [80.0, 83.34], [84.0, 88.91], [90.0, 89.92], [93.0, 93.58], [95.0, 95.52], [97.0, 97.8], [99.0, 99.39], [104.0, 106.64], [113.0, 113.93], [118.0, 129.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.7, 80.11, 99.62, 44.9, 0.0, 0.0, 0.0, 0.0, 0.0, 99.05, 0.0, 40.7], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 48.28], ["radio", 15.55], ["sidetone", 7.6]], null, null, null, null, null, null, null, [["speech", 45.82], ["electric shaver, electric razor", 16.13], ["explosion", 13.98]]], "duration": [1.5, 3.96, 0.7, 0.71, 1.07, 1.45, 0.93, 0.71, 0.46, 0.2, 9.01, -0.01, 1.32, 0.81, 1.19, 0.94, 1.04, 0.85, 0.28, 3.18, 6.27, 3.34, 4.91, -0.08, 0.58, 0.52, 0.8, 0.39, 2.64, 0.93, 11.51]} \ No newline at end of file diff --git a/annotations_filtered/gDOSJkcKPbo_filtered.json b/annotations_filtered/gDOSJkcKPbo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8a9c3c4306693699807d7bdc9e48f522e18b3145 --- /dev/null +++ b/annotations_filtered/gDOSJkcKPbo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.57], [6.0, 5.9], [7.0, 8.11], [12.0, 12.23], [13.0, 13.24], [15.0, 15.67], [20.0, 20.41], [23.0, 23.6], [25.0, 25.42], [26.0, 26.25], [27.0, 27.65], [31.0, 30.91], [35.0, 35.46], [36.0, 36.26], [43.0, 43.34], [48.0, 48.09], [58.0, 58.72], [60.0, 60.3], [69.0, 69.8], [73.0, 73.45], [77.0, 82.26], [83.0, 85.4], [97.0, 101.41], [106.0, 106.14], [114.0, 114.94], [119.0, 119.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.09, 47.46, 71.87, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 22.68], ["speech", 10.79], ["frog", 9.21]], [["speech", 50.64], ["radio", 12.04], ["sidetone", 8.2]], null, null, null, null], "duration": [0.57, -0.1, 1.11, 0.23, 0.24, 0.67, 0.41, 0.6, 0.42, 0.25, 0.65, -0.09, 0.46, 0.26, 0.34, 0.09, 0.72, 0.3, 0.8, 0.45, 5.26, 2.4, 4.41, 0.14, 0.94, 0.42]} \ No newline at end of file diff --git a/annotations_filtered/gDPJG9FP3iM_filtered.json b/annotations_filtered/gDPJG9FP3iM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd82778675541676888aa779886d285ce1d88965 --- /dev/null +++ b/annotations_filtered/gDPJG9FP3iM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.13], [8.0, 9.42], [12.0, 14.88], [15.0, 20.76], [27.0, 37.37], [40.0, 57.37], [58.0, 59.05], [61.0, 61.64], [64.0, 65.5], [66.0, 69.92], [72.0, 71.85], [75.0, 77.6], [80.0, 82.48], [84.0, 88.5], [94.0, 94.39], [101.0, 105.73], [107.0, 109.14], [110.0, 112.18], [114.0, 119.25], [120.0, 120.9], [122.0, 125.22], [126.0, 128.09], [132.0, 138.67], [140.0, 140.75], [142.0, 146.47], [148.0, 148.14], [149.0, 158.52], [161.0, 164.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [67.51, 0.0, 52.8, 30.11, 30.83, 53.72, 0.0, 0.0, 0.0, 54.43, 0.0, 67.25, 60.6, 71.43, 0.0, 54.7, 75.07, 62.99, 73.67, 0.0, 75.88, 95.51, 60.23, 0.0, 73.21, 0.0, 50.56, 52.45], "audiomae_on_audioset": [null, null, null, [["speech", 62.5], ["music", 12.81], ["outside, rural or natural", 5.75]], [["hum", 39.85], ["mains hum", 26.83], ["music", 17.4]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.13, 1.42, 2.88, 5.76, 10.37, 17.37, 1.05, 0.64, 1.5, 3.92, -0.15, 2.6, 2.48, 4.5, 0.39, 4.73, 2.14, 2.18, 5.25, 0.9, 3.22, 2.09, 6.67, 0.75, 4.47, 0.14, 9.52, 3.44]} \ No newline at end of file diff --git a/annotations_filtered/gDSrAm2CKdU_filtered.json b/annotations_filtered/gDSrAm2CKdU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe43afa6b1f40b2b1f2c3bc6be9051123a375646 --- /dev/null +++ b/annotations_filtered/gDSrAm2CKdU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.73], [7.0, 7.4], [8.0, 9.05], [12.0, 12.04], [33.0, 34.08], [55.0, 56.73], [58.0, 58.29], [58.0, 58.99], [60.0, 60.96], [67.0, 67.02], [78.0, 79.14], [82.0, 82.97], [84.0, 84.35], [89.0, 91.37], [97.0, 97.63], [99.0, 100.06], [101.0, 101.28], [102.0, 101.92], [103.0, 104.53], [105.0, 105.85], [107.0, 108.45], [110.0, 111.15], [113.0, 114.0], [115.0, 115.89], [131.0, 131.13], [139.0, 138.99], [156.0, 157.22], [159.0, 159.44], [161.0, 162.67], [164.0, 164.83], [166.0, 165.92], [167.0, 167.71], [169.0, 169.64], [175.0, 175.02], [181.0, 182.44], [186.0, 185.92], [187.0, 189.92], [191.0, 192.42], [194.0, 195.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.46, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.73, 0.4, 1.05, 0.04, 1.08, 1.73, 0.29, 0.99, 0.96, 0.02, 1.14, 0.97, 0.35, 2.37, 0.63, 1.06, 0.28, -0.08, 1.53, 0.85, 1.45, 1.15, 1.0, 0.89, 0.13, -0.01, 1.22, 0.44, 1.67, 0.83, -0.08, 0.71, 0.64, 0.02, 1.44, -0.08, 2.92, 1.42, 1.17]} \ No newline at end of file diff --git a/annotations_filtered/gDVyEzQNvhU_filtered.json b/annotations_filtered/gDVyEzQNvhU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1586c8b9225bec467d2482bfdea40075f8c8b0a5 --- /dev/null +++ b/annotations_filtered/gDVyEzQNvhU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.98], [6.0, 7.42], [8.0, 8.28], [15.0, 17.02], [19.0, 19.18], [19.0, 52.84], [53.0, 55.93], [58.0, 65.7], [67.0, 73.68], [76.0, 82.07], [84.0, 89.04], [90.0, 111.1], [113.0, 113.09], [119.0, 129.47]], "keep_status": [false, false, false, true, false, false, false, true, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 48.35, 0.0, 0.0, 30.06, 30.18, 30.0, 30.15, 32.35, 31.08, 0.0, 31.09], "audiomae_on_audioset": [null, null, null, [["music", 24.76], ["didgeridoo", 6.88], ["effects unit", 5.61]], null, null, [["music", 60.87], ["speech", 11.26], ["dubstep", 4.76]], [["music", 44.38], ["whack, thwack", 16.92], ["whip", 6.39]], [["music", 42.54], ["livestock, farm animals, working animals", 15.27], ["cattle, bovinae", 9.04]], [["speech", 30.55], ["music", 18.75], ["whack, thwack", 8.15]], [["music", 69.83], ["throbbing", 5.83], ["electronic music", 2.33]], [["music", 46.33], ["throbbing", 31.78], ["hum", 7.38]], null, [["music", 46.49], ["carnatic music", 15.5], ["musical instrument", 9.85]]], "duration": [0.98, 1.42, 0.28, 2.02, 0.18, 33.84, 2.93, 7.7, 6.68, 6.07, 5.04, 21.1, 0.09, 10.47]} \ No newline at end of file diff --git a/annotations_filtered/gDtB0Sr8sbY_filtered.json b/annotations_filtered/gDtB0Sr8sbY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b4b7027e30634d2ea558808f205c3037cfc6059 --- /dev/null +++ b/annotations_filtered/gDtB0Sr8sbY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.53], [17.0, 18.22], [19.0, 20.07], [22.0, 25.25], [29.0, 30.47], [33.0, 43.48], [45.0, 127.31], [127.0, 127.45], [127.0, 127.58], [130.0, 142.69], [153.0, 154.52], [158.0, 161.08], [170.0, 172.37], [176.0, 176.42], [184.0, 186.0]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, true, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 38.03, 0.0, 37.05, 0.0, 0.0, 0.0, 45.62, 0.0, 37.58, 31.02, 0.0, 32.78], "audiomae_on_audioset": [null, null, null, [["speech", 57.7], ["radio", 16.75], ["sidetone", 5.67]], null, [["livestock, farm animals, working animals", 28.08], ["animal", 9.69], ["cattle, bovinae", 8.82]], null, null, null, [["music", 61.02], ["effects unit", 6.21], ["synthesizer", 5.21]], null, [["speech", 14.53], ["music", 14.53], ["inside, small room", 6.52]], [["frog", 25.32], ["whale vocalization", 18.57], ["speech", 17.06]], null, [["whale vocalization", 30.11], ["cattle, bovinae", 13.33], ["moo", 10.47]]], "duration": [0.53, 1.22, 1.07, 3.25, 1.47, 10.48, 82.31, 0.45, 0.58, 12.69, 1.52, 3.08, 2.37, 0.42, 2.0]} \ No newline at end of file diff --git a/annotations_filtered/gEC1WbYzZYk_filtered.json b/annotations_filtered/gEC1WbYzZYk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a74131ca28e41f127377b68c7ba7e7653fd42ccf --- /dev/null +++ b/annotations_filtered/gEC1WbYzZYk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.32], [18.0, 18.5], [20.0, 23.73], [26.0, 26.7], [42.0, 42.55], [43.0, 46.04], [46.0, 47.07], [52.0, 52.76], [54.0, 55.71], [62.0, 73.43], [74.0, 79.79], [84.0, 85.24], [87.0, 86.7], [93.0, 119.45], [120.0, 119.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 32.64, 0.0, 0.0, 34.13, 0.0, 0.0, 0.0, 28.56, 29.27, 0.0, 0.0, 28.55, 0.0], "audiomae_on_audioset": [null, null, [["speech", 35.79], ["music", 29.38], ["throbbing", 5.97]], null, null, [["music", 58.62], ["speech", 6.76], ["didgeridoo", 4.72]], null, null, null, [["music", 53.45], ["speech", 32.43], ["musical instrument", 1.33]], [["speech", 53.54], ["music", 28.29], ["outside, rural or natural", 3.64]], null, null, [["whale vocalization", 44.21], ["music", 23.83], ["brass instrument", 6.36]], null], "duration": [0.32, 0.5, 3.73, 0.7, 0.55, 3.04, 1.07, 0.76, 1.71, 11.43, 5.79, 1.24, -0.3, 26.45, -0.09]} \ No newline at end of file diff --git a/annotations_filtered/gEdTciZtW4o_filtered.json b/annotations_filtered/gEdTciZtW4o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2af781808ef87cab3ccf72588ed4d5e367e58ceb --- /dev/null +++ b/annotations_filtered/gEdTciZtW4o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.38], [6.0, 9.88], [12.0, 29.96], [34.0, 34.64], [35.0, 44.27], [46.0, 87.02], [90.0, 91.98], [92.0, 92.5], [93.0, 93.43], [94.0, 95.08], [97.0, 98.41], [100.0, 100.75], [103.0, 122.86], [124.0, 130.6], [131.0, 159.49], [160.0, 160.64], [165.0, 181.8], [187.0, 187.73], [189.0, 190.17]], "keep_status": [false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 97.64, 35.57, 0.0, 36.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.5, 94.95, 96.17, 0.0, 32.46, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["insect", 27.75], ["fly, housefly", 21.57], ["electric shaver, electric razor", 11.71]], null, [["speech", 34.29], ["music", 12.57], ["glass", 9.25]], null, null, null, null, null, null, null, [["mains hum", 44.14], ["hum", 23.98], ["insect", 6.61]], null, null, null, [["music", 27.69], ["hum", 18.93], ["mains hum", 5.52]], null, null], "duration": [1.38, 3.88, 17.96, 0.64, 9.27, 41.02, 1.98, 0.5, 0.43, 1.08, 1.41, 0.75, 19.86, 6.6, 28.49, 0.64, 16.8, 0.73, 1.17]} \ No newline at end of file diff --git a/annotations_filtered/gEhB7HuQk7M_filtered.json b/annotations_filtered/gEhB7HuQk7M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a0932a66c0f2ec901f1227a49a8ecfaa2c53a53 --- /dev/null +++ b/annotations_filtered/gEhB7HuQk7M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.24], [2.0, 2.51], [13.0, 13.2], [30.0, 30.28], [32.0, 34.69], [36.0, 38.4], [39.0, 42.55], [49.0, 50.63], [51.0, 51.88], [54.0, 55.05], [58.0, 62.13], [72.0, 72.71], [74.0, 77.21], [83.0, 85.41], [99.0, 99.71], [101.0, 103.22], [112.0, 112.31], [119.0, 121.24], [127.0, 127.75], [130.0, 129.83], [132.0, 132.58], [134.0, 134.76], [136.0, 136.49], [141.0, 141.0], [143.0, 144.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 95.78, 78.55, 40.92, 0.0, 0.0, 0.0, 39.12, 0.0, 42.69, 53.16, 0.0, 42.24, 0.0, 36.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 60.97], ["musical instrument", 11.31], ["boing", 5.41]], null, null, null, [["music", 54.27], ["theremin", 25.44], ["musical instrument", 2.98]], null, [["music", 37.44], ["speech", 8.65], ["animal", 4.59]], null, null, [["music", 31.85], ["musical instrument", 6.63], ["speech", 6.18]], null, [["speech", 31.14], ["boing", 16.65], ["moo", 8.51]], null, null, null, null, null, null, null], "duration": [0.24, 0.51, 0.2, 0.28, 2.69, 2.4, 3.55, 1.63, 0.88, 1.05, 4.13, 0.71, 3.21, 2.41, 0.71, 2.22, 0.31, 2.24, 0.75, -0.17, 0.58, 0.76, 0.49, 0.0, 1.76]} \ No newline at end of file diff --git a/annotations_filtered/gEqHJ1tomnk_filtered.json b/annotations_filtered/gEqHJ1tomnk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f8b64c713ff4e7559a2795f03ab27915974168da --- /dev/null +++ b/annotations_filtered/gEqHJ1tomnk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.83], [15.0, 15.52], [17.0, 17.83], [21.0, 30.28], [31.0, 35.65], [37.0, 40.14], [44.0, 45.17], [46.0, 56.03], [57.0, 63.41], [66.0, 68.34], [70.0, 75.39], [76.0, 79.03], [80.0, 84.75], [88.0, 91.45], [96.0, 97.04], [98.0, 104.18], [105.0, 113.32], [114.0, 115.64], [117.0, 118.57], [121.0, 123.01], [124.0, 125.42], [127.0, 127.23]], "keep_status": [false, false, false, true, true, true, false, false, true, true, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 40.06, 39.34, 34.27, 0.0, 34.53, 37.36, 44.32, 46.72, 38.06, 57.89, 86.45, 0.0, 88.64, 78.55, 0.0, 0.0, 68.93, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["sidetone", 23.42], ["fly, housefly", 15.82], ["sine wave", 11.51]], [["music", 49.84], ["hum", 9.67], ["mains hum", 6.39]], [["fly, housefly", 21.37], ["insect", 20.24], ["sidetone", 10.95]], null, [["music", 67.9], ["electronic music", 4.26], ["hum", 3.27]], [["music", 50.4], ["theremin", 10.03], ["musical instrument", 4.17]], [["music", 40.41], ["cello", 4.44], ["musical instrument", 4.06]], [["mains hum", 28.03], ["music", 15.41], ["fly, housefly", 12.72]], [["speech", 38.27], ["mains hum", 9.72], ["music", 7.43]], null, null, null, null, null, null, null, null, null, null], "duration": [1.83, 0.52, 0.83, 9.28, 4.65, 3.14, 1.17, 10.03, 6.41, 2.34, 5.39, 3.03, 4.75, 3.45, 1.04, 6.18, 8.32, 1.64, 1.57, 2.01, 1.42, 0.23]} \ No newline at end of file diff --git a/annotations_filtered/gEq_wldXBww_filtered.json b/annotations_filtered/gEq_wldXBww_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d587673261a6e1da293ce6ebdafd2e8dc04855fc --- /dev/null +++ b/annotations_filtered/gEq_wldXBww_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.29], [5.0, 5.07], [6.0, 6.67], [14.0, 14.79], [19.0, 19.87], [22.0, 22.47], [25.0, 25.41], [28.0, 28.48], [30.0, 30.77], [45.0, 45.94], [63.0, 63.31], [70.0, 73.4], [77.0, 79.02], [86.0, 86.31], [87.0, 94.2], [95.0, 97.31], [98.0, 100.72], [102.0, 103.52], [105.0, 106.84], [110.0, 110.56], [111.0, 115.53], [116.0, 116.46], [117.0, 125.61], [126.0, 148.98], [149.0, 150.18], [152.0, 152.15], [153.0, 156.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.67, 84.8, 0.0, 49.82, 52.51, 43.77, 0.0, 0.0, 0.0, 49.92, 0.0, 52.68, 38.55, 0.0, 0.0, 32.1], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 49.3], ["hum", 5.49], ["harp", 5.29]], null, [["speech", 36.59], ["music", 30.44], ["musical instrument", 2.67]], null, null, null, [["speech", 35.64], ["hum", 13.21], ["music", 7.76]], null, null, [["music", 55.85], ["hum", 10.51], ["speech", 8.59]], null, null, [["music", 42.33], ["throbbing", 16.2], ["speech", 13.12]]], "duration": [0.29, 0.07, 0.67, 0.79, 0.87, 0.47, 0.41, 0.48, 0.77, 0.94, 0.31, 3.4, 2.02, 0.31, 7.2, 2.31, 2.72, 1.52, 1.84, 0.56, 4.53, 0.46, 8.61, 22.98, 1.18, 0.15, 3.46]} \ No newline at end of file diff --git a/annotations_filtered/gEygOJWaMk0_filtered.json b/annotations_filtered/gEygOJWaMk0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cefcb0ae94dbcef887b11ecdb9b7e92228732ab8 --- /dev/null +++ b/annotations_filtered/gEygOJWaMk0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.16], [6.0, 8.4], [10.0, 10.89], [12.0, 13.09], [20.0, 20.98], [21.0, 23.3], [24.0, 25.71], [29.0, 30.33], [32.0, 32.37], [33.0, 33.56], [37.0, 38.85], [40.0, 41.42], [43.0, 44.81], [46.0, 46.92], [49.0, 50.8], [53.0, 53.76], [57.0, 57.15], [58.0, 62.36], [64.0, 66.06], [67.0, 69.04], [73.0, 74.61], [75.0, 76.89], [79.0, 79.49], [81.0, 84.89], [88.0, 95.0], [96.0, 97.6], [100.0, 101.34], [102.0, 113.02]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [47.43, 99.4, 0.0, 0.0, 0.0, 37.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.52, 98.01, 84.8, 0.0, 0.0, 0.0, 60.51, 92.8, 0.0, 0.0, 45.49], "audiomae_on_audioset": [[["speech", 32.7], ["sidetone", 21.87], ["music", 11.19]], null, null, null, null, [["speech", 59.59], ["tuning fork", 6.39], ["dial tone", 5.37]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 37.59], ["speech", 20.16], ["singing bowl", 16.0]]], "duration": [2.16, 2.4, 0.89, 1.09, 0.98, 2.3, 1.71, 1.33, 0.37, 0.56, 1.85, 1.42, 1.81, 0.92, 1.8, 0.76, 0.15, 4.36, 2.06, 2.04, 1.61, 1.89, 0.49, 3.89, 7.0, 1.6, 1.34, 11.02]} \ No newline at end of file diff --git a/annotations_filtered/gFES6-SLD_s_filtered.json b/annotations_filtered/gFES6-SLD_s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/gFES6-SLD_s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/gFJT9ziRAUI_filtered.json b/annotations_filtered/gFJT9ziRAUI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7d1804cb69dc634d1fe2b6389307e366c9140f6 --- /dev/null +++ b/annotations_filtered/gFJT9ziRAUI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.71], [16.0, 17.36], [19.0, 65.15], [68.0, 69.99], [72.0, 71.85], [74.0, 75.49], [78.0, 90.86], [95.0, 98.91], [99.0, 101.78], [104.0, 104.62], [106.0, 108.09], [115.0, 115.86], [119.0, 120.75], [121.0, 121.34], [125.0, 125.58], [130.0, 130.71], [131.0, 135.41], [139.0, 151.41], [157.0, 156.78], [158.0, 159.17], [160.0, 164.76], [167.0, 167.91], [170.0, 170.75]], "keep_status": [true, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, true, true, false, false, true, false, false], "silence_prob": [35.41, 0.0, 0.0, 0.0, 0.0, 0.0, 30.82, 31.07, 34.18, 0.0, 48.48, 0.0, 0.0, 0.0, 0.0, 0.0, 31.16, 29.76, 0.0, 0.0, 29.38, 0.0, 0.0], "audiomae_on_audioset": [[["music", 39.89], ["throbbing", 14.45], ["speech", 12.78]], null, null, null, null, null, [["speech", 35.56], ["music", 21.52], ["whack, thwack", 10.17]], [["speech", 35.2], ["music", 31.93], ["throbbing", 7.35]], [["speech", 42.78], ["music", 16.19], ["aircraft", 5.77]], null, [["mains hum", 58.71], ["hum", 23.44], ["speech", 4.59]], null, null, null, null, null, [["music", 40.42], ["throbbing", 8.01], ["hum", 5.63]], [["music", 43.18], ["speech", 11.5], ["hum", 9.54]], null, null, [["music", 39.82], ["throbbing", 6.89], ["electronic music", 5.61]], null, null], "duration": [5.71, 1.36, 46.15, 1.99, -0.15, 1.49, 12.86, 3.91, 2.78, 0.62, 2.09, 0.86, 1.75, 0.34, 0.58, 0.71, 4.41, 12.41, -0.22, 1.17, 4.76, 0.91, 0.75]} \ No newline at end of file diff --git a/annotations_filtered/gFKba_Esjt0_filtered.json b/annotations_filtered/gFKba_Esjt0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cdce13a8460de45c9d488bd21c64f78acaa45d0f --- /dev/null +++ b/annotations_filtered/gFKba_Esjt0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [6.0, 6.56], [11.0, 12.65], [14.0, 14.35], [16.0, 17.49], [21.0, 22.01], [23.0, 24.98], [27.0, 27.35], [31.0, 31.8], [34.0, 38.01], [40.0, 43.34], [44.0, 52.98], [54.0, 56.02], [58.0, 59.14], [61.0, 61.8], [64.0, 64.02], [65.0, 65.77], [69.0, 70.78], [72.0, 73.55], [75.0, 76.37], [78.0, 78.8], [81.0, 82.59], [84.0, 84.48], [86.0, 86.44], [88.0, 88.43], [90.0, 90.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.92, 66.76, 53.47, 41.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 48.15], ["horse", 8.22], ["animal", 6.67]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 0.56, 1.65, 0.35, 1.49, 1.01, 1.98, 0.35, 0.8, 4.01, 3.34, 8.98, 2.02, 1.14, 0.8, 0.02, 0.77, 1.78, 1.55, 1.37, 0.8, 1.59, 0.48, 0.44, 0.43, 0.29]} \ No newline at end of file diff --git a/annotations_filtered/gFX14TEiBOw_filtered.json b/annotations_filtered/gFX14TEiBOw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d5d14dd2a3d4d8f94aa464ba447a63a19f3f868 --- /dev/null +++ b/annotations_filtered/gFX14TEiBOw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.01], [5.0, 5.24], [16.0, 16.58], [38.0, 38.52], [48.0, 49.06], [73.0, 74.33], [95.0, 97.6], [99.0, 101.58], [103.0, 103.18], [103.0, 103.42], [105.0, 104.9], [108.0, 108.55], [110.0, 110.46], [110.0, 110.54], [111.0, 156.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.43, 96.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.01, 0.24, 0.58, 0.52, 1.06, 1.33, 2.6, 2.58, 0.18, 0.42, -0.1, 0.55, 0.46, 0.54, 45.64]} \ No newline at end of file diff --git a/annotations_filtered/gFocZQa78ho_filtered.json b/annotations_filtered/gFocZQa78ho_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d8db7b574fbe70752524b6ae0c02cdd9e08d64c --- /dev/null +++ b/annotations_filtered/gFocZQa78ho_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 19.2], [20.0, 22.89], [23.0, 25.15], [25.0, 40.98], [46.0, 47.9], [49.0, 51.85], [54.0, 54.9], [61.0, 64.98], [66.0, 66.21], [70.0, 86.8], [89.0, 90.19], [97.0, 98.64], [100.0, 99.87], [108.0, 112.11], [113.0, 113.91], [118.0, 118.93], [120.0, 126.96], [130.0, 134.74], [135.0, 136.66], [164.0, 165.45]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 28.79, 28.71, 30.13, 0.0, 31.54, 0.0, 32.43, 0.0, 32.08, 0.0, 0.0, 0.0, 39.05, 0.0, 0.0, 34.71, 35.95, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 65.81], ["electronic music", 6.21], ["whale vocalization", 4.26]], [["music", 78.31], ["musical instrument", 2.84], ["electronic music", 1.36]], [["music", 82.65], ["brass instrument", 4.17], ["musical instrument", 3.06]], null, [["music", 66.53], ["foghorn", 3.74], ["theremin", 3.21]], null, [["music", 31.12], ["cacophony", 5.86], ["fly, housefly", 5.51]], null, [["music", 59.66], ["speech", 6.72], ["crowd", 6.1]], null, null, null, [["music", 42.0], ["throbbing", 15.82], ["hum", 12.77]], null, null, [["music", 60.66], ["throbbing", 3.67], ["trombone", 3.37]], [["music", 64.54], ["foghorn", 10.45], ["throbbing", 3.03]], null, null], "duration": [1.2, 2.89, 2.15, 15.98, 1.9, 2.85, 0.9, 3.98, 0.21, 16.8, 1.19, 1.64, -0.13, 4.11, 0.91, 0.93, 6.96, 4.74, 1.66, 1.45]} \ No newline at end of file diff --git a/annotations_filtered/gG1XmKlqhIU_filtered.json b/annotations_filtered/gG1XmKlqhIU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d18561eb8c44c1c4d4285921b16518ea760ff91f --- /dev/null +++ b/annotations_filtered/gG1XmKlqhIU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 25.25], [26.0, 31.4], [35.0, 46.08], [48.0, 54.21], [55.0, 83.29], [85.0, 86.86], [90.0, 95.72], [100.0, 120.26], [122.0, 133.54], [137.0, 139.4], [147.0, 149.57], [151.0, 155.48]], "keep_status": [false, false, true, false, true, false, true, false, true, false, true, true], "silence_prob": [100.0, 43.1, 30.66, 29.99, 30.25, 0.0, 31.1, 31.16, 29.69, 39.63, 49.87, 38.64], "audiomae_on_audioset": [null, [["speech", 85.29], ["snicker", 3.41], ["telephone", 1.85]], [["hum", 40.11], ["throbbing", 18.88], ["music", 10.32]], [["speech", 45.52], ["sidetone", 22.92], ["music", 12.5]], [["music", 54.59], ["speech", 6.84], ["throbbing", 3.39]], null, [["speech", 41.84], ["music", 19.14], ["explosion", 7.84]], [["music", 34.38], ["speech", 27.53], ["boing", 22.76]], [["music", 28.11], ["noise", 14.96], ["explosion", 12.25]], [["speech", 60.1], ["music", 10.79], ["sidetone", 4.3]], [["music", 49.52], ["speech", 7.92], ["musical instrument", 6.15]], [["hum", 21.77], ["speech", 18.36], ["music", 15.97]]], "duration": [2.25, 5.4, 11.08, 6.21, 28.29, 1.86, 5.72, 20.26, 11.54, 2.4, 2.57, 4.48]} \ No newline at end of file diff --git a/annotations_filtered/gG5kz32ot20_filtered.json b/annotations_filtered/gG5kz32ot20_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..94ae91204310d8d312d8490a7b3233304b690cf2 --- /dev/null +++ b/annotations_filtered/gG5kz32ot20_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.98], [5.0, 7.11], [9.0, 9.73], [11.0, 11.23], [17.0, 17.59], [24.0, 24.87], [29.0, 29.61], [31.0, 31.58], [33.0, 33.25], [39.0, 39.07], [41.0, 41.59], [42.0, 43.28], [47.0, 48.14], [51.0, 51.39], [52.0, 52.49], [56.0, 56.51], [58.0, 58.97], [61.0, 62.09], [67.0, 68.93], [69.0, 70.6], [71.0, 71.58], [74.0, 74.29], [77.0, 77.06], [81.0, 82.27], [83.0, 84.79], [86.0, 88.47], [90.0, 90.37], [92.0, 93.39], [96.0, 96.65], [99.0, 99.98], [102.0, 101.98], [104.0, 104.11], [107.0, 107.15], [112.0, 115.21], [117.0, 118.23], [120.0, 120.21], [126.0, 126.86], [129.0, 129.51], [131.0, 132.98], [135.0, 137.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.98, 2.11, 0.73, 0.23, 0.59, 0.87, 0.61, 0.58, 0.25, 0.07, 0.59, 1.28, 1.14, 0.39, 0.49, 0.51, 0.97, 1.09, 1.93, 1.6, 0.58, 0.29, 0.06, 1.27, 1.79, 2.47, 0.37, 1.39, 0.65, 0.98, -0.02, 0.11, 0.15, 3.21, 1.23, 0.21, 0.86, 0.51, 1.98, 2.37]} \ No newline at end of file diff --git a/annotations_filtered/gGKNhGbPp6Y_filtered.json b/annotations_filtered/gGKNhGbPp6Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5a4ac5fbb8c954ae42c87e7b8384898eecb0a79f --- /dev/null +++ b/annotations_filtered/gGKNhGbPp6Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.33], [12.0, 12.11], [12.0, 12.73], [14.0, 14.42], [16.0, 17.58], [19.0, 19.55], [39.0, 39.56]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [1.33, 0.11, 0.73, 0.42, 1.58, 0.55, 0.56]} \ No newline at end of file diff --git a/annotations_filtered/gGxrQOUaM_E_filtered.json b/annotations_filtered/gGxrQOUaM_E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2cde336705d88e717a85cc290305c0ed473c1e2b --- /dev/null +++ b/annotations_filtered/gGxrQOUaM_E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 20.28], [24.0, 25.84], [27.0, 35.95], [37.0, 48.1], [55.0, 55.27], [60.0, 60.44], [69.0, 70.04], [72.0, 87.98], [89.0, 97.68], [100.0, 129.96]], "keep_status": [true, false, false, false, false, false, false, false, true, false], "silence_prob": [34.49, 0.0, 37.69, 37.74, 0.0, 0.0, 0.0, 37.82, 33.72, 33.21], "audiomae_on_audioset": [[["fly, housefly", 28.14], ["insect", 21.05], ["speech", 17.78]], null, [["music", 81.14], ["funny music", 1.75], ["didgeridoo", 1.13]], [["music", 83.62], ["singing", 1.8], ["middle eastern music", 1.7]], null, null, null, [["music", 79.1], ["middle eastern music", 3.6], ["folk music", 2.37]], [["music", 23.24], ["speech", 15.9], ["mosquito", 6.15]], [["cattle, bovinae", 37.48], ["livestock, farm animals, working animals", 31.97], ["moo", 30.01]]], "duration": [12.28, 1.84, 8.95, 11.1, 0.27, 0.44, 1.04, 15.98, 8.68, 29.96]} \ No newline at end of file diff --git a/annotations_filtered/gH1kstAfb5g_filtered.json b/annotations_filtered/gH1kstAfb5g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..31b56773e734e3ba0b67170235308e7d6b3b38b6 --- /dev/null +++ b/annotations_filtered/gH1kstAfb5g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 14.81], [17.0, 16.78], [19.0, 21.14], [21.0, 21.17], [22.0, 23.97], [35.0, 35.13], [36.0, 36.1], [37.0, 37.32], [44.0, 50.89], [52.0, 52.39], [56.0, 56.3], [63.0, 75.57], [83.0, 98.71], [100.0, 100.9], [101.0, 100.97], [101.0, 101.04], [101.0, 103.6], [104.0, 103.87], [104.0, 106.2], [108.0, 114.25], [115.0, 116.29]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 89.19, 0.0, 0.0, 0.0, 0.0, 0.0, 35.59, 0.0, 0.0, 29.84, 29.18, 0.0, 0.0, 0.0, 29.56, 0.0, 28.83, 38.71, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 44.97], ["fart", 11.01], ["fly, housefly", 9.93]], null, null, [["music", 62.63], ["speech", 10.72], ["boing", 9.12]], [["music", 70.02], ["speech", 9.71], ["cacophony", 2.37]], null, null, null, [["music", 89.59], ["boing", 0.6], ["funny music", 0.47]], null, [["music", 81.69], ["throbbing", 2.1], ["boing", 1.26]], [["music", 31.07], ["didgeridoo", 10.47], ["gong", 7.41]], null], "duration": [-0.19, -0.22, 2.14, 0.17, 1.97, 0.13, 0.1, 0.32, 6.89, 0.39, 0.3, 12.57, 15.71, 0.9, -0.03, 0.04, 2.6, -0.13, 2.2, 6.25, 1.29]} \ No newline at end of file diff --git a/annotations_filtered/gH4dw-S1esk_filtered.json b/annotations_filtered/gH4dw-S1esk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f8c54c652094f2e8ce88ce0f088e7d9faa9edff --- /dev/null +++ b/annotations_filtered/gH4dw-S1esk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 80.27], [81.0, 82.24], [87.0, 95.12], [97.0, 104.63], [106.0, 106.44], [106.0, 150.58], [153.0, 175.73]], "keep_status": [false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 30.96, 29.0, 0.0, 0.0, 28.16], "audiomae_on_audioset": [null, null, [["livestock, farm animals, working animals", 31.3], ["speech", 11.21], ["cattle, bovinae", 8.39]], [["music", 50.54], ["mains hum", 11.78], ["hum", 11.71]], null, null, [["music", 59.18], ["speech", 13.67], ["musical instrument", 2.75]]], "duration": [76.27, 1.24, 8.12, 7.63, 0.44, 44.58, 22.73]} \ No newline at end of file diff --git a/annotations_filtered/gHAJY34g-LY_filtered.json b/annotations_filtered/gHAJY34g-LY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5689bf284b5defc6e01b5f07f4d085feda98f615 --- /dev/null +++ b/annotations_filtered/gHAJY34g-LY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 14.96], [15.0, 15.96], [19.0, 26.25], [27.0, 37.59], [38.0, 77.33]], "keep_status": [false, false, false, false, false], "silence_prob": [61.67, 0.0, 60.98, 74.44, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [3.96, 0.96, 7.25, 10.59, 39.33]} \ No newline at end of file diff --git a/annotations_filtered/gHJwn_JEazA_filtered.json b/annotations_filtered/gHJwn_JEazA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eccfac2a197778a74d2f389e89344b7db25c15ac --- /dev/null +++ b/annotations_filtered/gHJwn_JEazA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.44], [8.0, 18.2], [19.0, 24.83], [25.0, 26.11], [27.0, 28.63], [31.0, 31.67], [34.0, 34.64], [37.0, 37.56], [38.0, 39.5], [41.0, 48.57], [49.0, 49.69], [50.0, 51.44], [52.0, 53.03], [53.0, 56.67], [58.0, 59.37], [60.0, 61.4], [63.0, 64.02], [65.0, 66.88], [70.0, 72.52], [73.0, 73.82], [75.0, 75.84], [76.0, 80.45], [81.0, 82.09], [83.0, 85.56], [87.0, 88.21], [91.0, 91.18], [92.0, 92.33], [94.0, 94.59], [96.0, 99.06], [100.0, 103.23], [103.0, 103.35], [103.0, 104.55], [105.0, 105.36], [106.0, 110.3], [117.0, 120.82], [122.0, 124.04], [126.0, 126.96], [128.0, 131.72]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [35.39, 38.46, 85.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.1, 0.0, 0.0, 0.0, 35.77, 0.0, 0.0, 0.0, 0.0, 99.56, 0.0, 0.0, 46.19, 0.0, 54.97, 0.0, 0.0, 0.0, 0.0, 89.36, 49.31, 0.0, 0.0, 0.0, 42.37, 57.81, 99.96, 0.0, 55.53], "audiomae_on_audioset": [[["speech", 35.73], ["music", 9.14], ["moo", 5.34]], [["speech", 12.83], ["hum", 11.09], ["music", 10.76]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 59.07], ["radio", 7.98], ["music", 4.93]], null, null, null, null, null, null, null, [["speech", 33.56], ["music", 27.15], ["hum", 4.26]], null, null, null, null, null, null, null, [["music", 43.25], ["hum", 6.24], ["throbbing", 4.96]], null, null, null, [["music", 39.2], ["speech", 21.78], ["synthesizer", 10.0]], null, null, null, null], "duration": [2.44, 10.2, 5.83, 1.11, 1.63, 0.67, 0.64, 0.56, 1.5, 7.57, 0.69, 1.44, 1.03, 3.67, 1.37, 1.4, 1.02, 1.88, 2.52, 0.82, 0.84, 4.45, 1.09, 2.56, 1.21, 0.18, 0.33, 0.59, 3.06, 3.23, 0.35, 1.55, 0.36, 4.3, 3.82, 2.04, 0.96, 3.72]} \ No newline at end of file diff --git a/annotations_filtered/gHQV6AMclGA_filtered.json b/annotations_filtered/gHQV6AMclGA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42e99ab7765a7ad09c82bac2f9f43bddfc09846d --- /dev/null +++ b/annotations_filtered/gHQV6AMclGA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.87], [6.0, 6.66], [7.0, 8.31], [10.0, 12.43], [15.0, 16.85], [17.0, 18.52], [19.0, 19.95], [22.0, 23.52], [24.0, 25.98], [28.0, 29.91], [30.0, 35.85], [37.0, 42.18], [48.0, 48.68], [50.0, 52.12], [56.0, 58.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 98.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.25, 94.81, 0.0, 92.64, 96.17], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.87, 0.66, 1.31, 2.43, 1.85, 1.52, 0.95, 1.52, 1.98, 1.91, 5.85, 5.18, 0.68, 2.12, 2.6]} \ No newline at end of file diff --git a/annotations_filtered/gHWnmlpmub4_filtered.json b/annotations_filtered/gHWnmlpmub4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84b88ad2e783dc2426c2894e6a48ce18d28df20a --- /dev/null +++ b/annotations_filtered/gHWnmlpmub4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 34.5], [39.0, 40.37], [43.0, 44.91], [45.0, 47.04], [48.0, 49.84], [50.0, 50.99], [52.0, 51.87], [53.0, 57.96], [59.0, 61.25], [62.0, 63.96], [66.0, 67.91], [70.0, 71.34], [72.0, 74.83], [83.0, 96.13], [96.0, 97.12], [99.0, 99.91], [106.0, 116.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 99.62, 0.0, 0.0, 0.0, 100.0, 84.07, 0.0, 0.0, 0.0, 98.27, 100.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.5, 1.37, 1.91, 2.04, 1.84, 0.99, -0.13, 4.96, 2.25, 1.96, 1.91, 1.34, 2.83, 13.13, 1.12, 0.91, 10.53]} \ No newline at end of file diff --git a/annotations_filtered/gHf9n0jhBdk_filtered.json b/annotations_filtered/gHf9n0jhBdk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b830797d5d9771b094eec25843dd927a94c56879 --- /dev/null +++ b/annotations_filtered/gHf9n0jhBdk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.36], [2.0, 2.19], [6.0, 5.95], [6.0, 6.91], [9.0, 9.48], [13.0, 14.77], [17.0, 16.98], [18.0, 20.6], [22.0, 25.34]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 93.91], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.36, 0.19, -0.05, 0.91, 0.48, 1.77, -0.02, 2.6, 3.34]} \ No newline at end of file diff --git a/annotations_filtered/gHfRl_ZjHj8_filtered.json b/annotations_filtered/gHfRl_ZjHj8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ff3357cc0f34adbbc43902bbeceff27691abc0b0 --- /dev/null +++ b/annotations_filtered/gHfRl_ZjHj8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.62], [11.0, 11.04], [12.0, 13.29], [15.0, 16.41], [29.0, 41.81], [44.0, 44.59], [46.0, 46.52], [47.0, 47.7], [49.0, 49.18], [53.0, 53.64], [54.0, 56.86], [58.0, 57.96], [59.0, 59.9], [60.0, 63.86], [66.0, 65.8], [68.0, 73.52], [76.0, 76.0], [79.0, 94.56], [100.0, 109.88], [111.0, 130.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 63.74, 0.0, 0.0, 0.0, 0.0, 0.0, 83.7, 0.0, 0.0, 56.7, 0.0, 58.72, 0.0, 62.89, 60.7, 45.52], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 40.74], ["speech", 36.84], ["hum", 3.79]]], "duration": [0.62, 0.04, 1.29, 1.41, 12.81, 0.59, 0.52, 0.7, 0.18, 0.64, 2.86, -0.04, 0.9, 3.86, -0.2, 5.52, 0.0, 15.56, 9.88, 19.13]} \ No newline at end of file diff --git a/annotations_filtered/gHfTsIMdlPg_filtered.json b/annotations_filtered/gHfTsIMdlPg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6dc3fdf4247c83cf0d624f9a59682ee3f3ae647f --- /dev/null +++ b/annotations_filtered/gHfTsIMdlPg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 10.07], [11.0, 12.7], [13.0, 13.27], [14.0, 17.73], [18.0, 17.76], [22.0, 22.64], [24.0, 25.69], [32.0, 32.59], [43.0, 43.33], [65.0, 66.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 96.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [4.07, 1.7, 0.27, 3.73, -0.24, 0.64, 1.69, 0.59, 0.33, 1.73]} \ No newline at end of file diff --git a/annotations_filtered/gI1_6ob3hio_filtered.json b/annotations_filtered/gI1_6ob3hio_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..14f866b76ec2472042daa92c2d57ab06b237a2cf --- /dev/null +++ b/annotations_filtered/gI1_6ob3hio_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.35], [8.0, 12.56], [16.0, 16.17], [18.0, 20.34], [26.0, 26.27], [30.0, 31.7], [34.0, 36.41], [38.0, 38.96], [40.0, 40.59], [48.0, 49.99], [65.0, 65.75], [67.0, 67.85], [70.0, 70.77], [76.0, 76.01], [82.0, 85.94], [87.0, 88.26], [90.0, 90.75], [92.0, 92.99], [98.0, 100.55], [102.0, 103.23], [105.0, 105.09], [110.0, 114.08], [116.0, 116.48], [117.0, 117.04], [123.0, 124.39], [126.0, 126.52], [130.0, 130.11], [131.0, 131.28], [133.0, 132.68], [133.0, 133.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.52, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.35, 4.56, 0.17, 2.34, 0.27, 1.7, 2.41, 0.96, 0.59, 1.99, 0.75, 0.85, 0.77, 0.01, 3.94, 1.26, 0.75, 0.99, 2.55, 1.23, 0.09, 4.08, 0.48, 0.04, 1.39, 0.52, 0.11, 0.28, -0.32, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/gIGtDdiHlA8_filtered.json b/annotations_filtered/gIGtDdiHlA8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..970ac8069718eaba13757546a4ecf0f4efcf50d2 --- /dev/null +++ b/annotations_filtered/gIGtDdiHlA8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 29.37], [33.0, 55.92], [56.0, 104.75], [106.0, 139.5], [140.0, 141.05], [143.0, 143.19], [144.0, 153.84], [156.0, 167.7], [170.0, 197.6], [198.0, 198.21], [199.0, 199.81], [201.0, 201.6], [202.0, 202.32], [203.0, 203.42], [204.0, 204.01], [205.0, 206.07], [206.0, 206.61]], "keep_status": [true, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [39.98, 63.42, 0.0, 0.0, 0.0, 0.0, 30.71, 31.28, 31.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 31.89], ["speech", 18.07], ["noise", 14.81]], null, null, null, null, null, [["animal", 46.19], ["bow-wow", 17.02], ["dog", 12.32]], [["sidetone", 15.81], ["buzz", 12.44], ["music", 7.96]], [["gurgling", 11.87], ["rain on surface", 9.68], ["rain", 8.51]], null, null, null, null, null, null, null, null], "duration": [29.37, 22.92, 48.75, 33.5, 1.05, 0.19, 9.84, 11.7, 27.6, 0.21, 0.81, 0.6, 0.32, 0.42, 0.01, 1.07, 0.61]} \ No newline at end of file diff --git a/annotations_filtered/gILsE7uSUkA_filtered.json b/annotations_filtered/gILsE7uSUkA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7bf2e3a54ed92ae3c7166f126c440b7f960e5f36 --- /dev/null +++ b/annotations_filtered/gILsE7uSUkA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.47], [27.0, 27.55], [33.0, 35.11], [44.0, 45.05], [52.0, 52.39]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 60.7, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [0.47, 0.55, 2.11, 1.05, 0.39]} \ No newline at end of file diff --git a/annotations_filtered/gIZ64_sZbCY_filtered.json b/annotations_filtered/gIZ64_sZbCY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73d14f094cdb352f9a1274bb94caa2ad62699fda --- /dev/null +++ b/annotations_filtered/gIZ64_sZbCY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.43], [5.0, 5.02], [5.0, 9.71], [15.0, 27.51], [28.0, 36.22], [40.0, 43.93], [47.0, 47.6], [59.0, 60.52], [64.0, 64.72], [66.0, 67.73], [75.0, 76.01], [78.0, 79.78], [82.0, 97.44], [98.0, 102.63], [103.0, 104.55], [108.0, 126.64], [128.0, 130.91], [132.0, 133.54], [145.0, 145.84]], "keep_status": [false, false, true, true, true, true, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 35.01, 37.28, 36.42, 40.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.7, 64.75, 0.0, 42.02, 34.2, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["livestock, farm animals, working animals", 33.93], ["fart", 12.09], ["cattle, bovinae", 6.92]], [["music", 56.16], ["speech", 8.23], ["smash, crash", 3.44]], [["speech", 44.28], ["crack", 7.61], ["music", 7.05]], [["speech", 19.11], ["fart", 13.33], ["thunk", 8.17]], null, null, null, null, null, null, null, null, null, [["music", 40.29], ["didgeridoo", 13.32], ["theremin", 5.65]], [["music", 25.39], ["speech", 15.36], ["sheep", 3.04]], null, null], "duration": [0.43, 0.02, 4.71, 12.51, 8.22, 3.93, 0.6, 1.52, 0.72, 1.73, 1.01, 1.78, 15.44, 4.63, 1.55, 18.64, 2.91, 1.54, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/gIaqrkn0ymo_filtered.json b/annotations_filtered/gIaqrkn0ymo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..514e2057a476dfc66c3369ecb61165db33c8ce43 --- /dev/null +++ b/annotations_filtered/gIaqrkn0ymo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 11.96], [14.0, 14.45], [20.0, 20.28], [37.0, 38.53], [53.0, 53.25], [54.0, 53.74], [69.0, 69.21], [80.0, 83.91], [87.0, 88.21], [92.0, 92.13], [113.0, 114.71], [117.0, 120.29], [122.0, 123.69], [125.0, 125.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.88, 0.0, 0.0, 0.0, 35.38, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 60.19], ["music", 24.58], ["sidetone", 2.46]], null, null], "duration": [-0.04, 0.45, 0.28, 1.53, 0.25, -0.26, 0.21, 3.91, 1.21, 0.13, 1.71, 3.29, 1.69, 0.51]} \ No newline at end of file diff --git a/annotations_filtered/gIdOE4SoDfU_filtered.json b/annotations_filtered/gIdOE4SoDfU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8b436d82f9874f438c1d68d4b977635500ad9f3a --- /dev/null +++ b/annotations_filtered/gIdOE4SoDfU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.64], [6.0, 6.67], [9.0, 9.81], [13.0, 13.8], [18.0, 18.49], [22.0, 23.11], [25.0, 26.72], [28.0, 29.64], [32.0, 34.45], [35.0, 36.15], [43.0, 44.73], [46.0, 47.07], [48.0, 54.95], [56.0, 57.21], [59.0, 59.75], [63.0, 63.98], [68.0, 68.84], [70.0, 70.41], [72.0, 71.69], [77.0, 77.89], [82.0, 83.96], [89.0, 90.59], [92.0, 94.22], [96.0, 97.56], [100.0, 102.49], [104.0, 109.0], [111.0, 117.1], [118.0, 119.43], [121.0, 121.9], [124.0, 125.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.73, 0.0, 0.0, 0.0, 73.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.07, 0.0, 90.6, 77.7, 87.74, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.64, 0.67, 0.81, 0.8, 0.49, 1.11, 1.72, 1.64, 2.45, 1.15, 1.73, 1.07, 6.95, 1.21, 0.75, 0.98, 0.84, 0.41, -0.31, 0.89, 1.96, 1.59, 2.22, 1.56, 2.49, 5.0, 6.1, 1.43, 0.9, 1.64]} \ No newline at end of file diff --git a/annotations_filtered/gJCMd15eaW8_filtered.json b/annotations_filtered/gJCMd15eaW8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41931c35640e70bb44654ab213674c2bc1d46d90 --- /dev/null +++ b/annotations_filtered/gJCMd15eaW8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.8], [12.0, 23.36], [26.0, 67.78], [68.0, 67.95], [68.0, 71.34], [74.0, 74.92], [78.0, 107.5]], "keep_status": [false, false, false, false, true, false, true], "silence_prob": [99.78, 99.21, 0.0, 0.0, 40.93, 0.0, 32.19], "audiomae_on_audioset": [null, null, null, null, [["whale vocalization", 32.12], ["hum", 17.64], ["speech", 6.42]], null, [["hum", 19.02], ["music", 17.52], ["speech", 8.69]]], "duration": [2.8, 11.36, 41.78, -0.05, 3.34, 0.92, 29.5]} \ No newline at end of file diff --git a/annotations_filtered/gJDpyQ1Efto_filtered.json b/annotations_filtered/gJDpyQ1Efto_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..654115c39eaddc40334354b13d938a4c82e4a992 --- /dev/null +++ b/annotations_filtered/gJDpyQ1Efto_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 17.1], [17.0, 19.33], [24.0, 25.39], [30.0, 34.69], [35.0, 35.26], [36.0, 38.1], [47.0, 48.95], [56.0, 58.82], [70.0, 71.32], [72.0, 73.2], [80.0, 80.86], [95.0, 95.69], [96.0, 96.99], [98.0, 98.85], [104.0, 103.99], [105.0, 105.04], [105.0, 105.51], [111.0, 113.83], [115.0, 116.73], [121.0, 121.56], [122.0, 122.55]], "keep_status": [false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [31.73, 32.85, 0.0, 38.52, 0.0, 33.57, 0.0, 30.32, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.81, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 53.18], ["speech", 20.0], ["boing", 8.21]], [["music", 31.74], ["didgeridoo", 14.1], ["clarinet", 11.03]], null, [["music", 49.03], ["brass instrument", 13.75], ["trombone", 9.8]], null, [["music", 45.79], ["speech", 12.34], ["saxophone", 7.61]], null, [["music", 40.2], ["speech", 35.05], ["musical instrument", 5.29]], null, null, null, null, null, null, null, null, null, [["echo", 14.78], ["wild animals", 9.78], ["speech", 7.63]], null, null, null], "duration": [4.1, 2.33, 1.39, 4.69, 0.26, 2.1, 1.95, 2.82, 1.32, 1.2, 0.86, 0.69, 0.99, 0.85, -0.01, 0.04, 0.51, 2.83, 1.73, 0.56, 0.55]} \ No newline at end of file diff --git a/annotations_filtered/gJOWAISZDhs_filtered.json b/annotations_filtered/gJOWAISZDhs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ad108ade3f8033724794733895076b5f3cb675f --- /dev/null +++ b/annotations_filtered/gJOWAISZDhs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[66.0, 66.45], [70.0, 88.59], [89.0, 88.62], [89.0, 89.26], [97.0, 97.95], [99.0, 100.89], [104.0, 103.52], [104.0, 104.79], [106.0, 114.27], [119.0, 128.82]], "keep_status": [false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 39.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.3, 42.93], "audiomae_on_audioset": [null, [["didgeridoo", 42.46], ["music", 22.45], ["throbbing", 17.02]], null, null, null, null, null, null, [["hum", 15.16], ["speech", 10.84], ["stomach rumble", 7.39]], [["music", 68.89], ["musical instrument", 7.42], ["synthesizer", 6.42]]], "duration": [0.45, 18.59, -0.38, 0.26, 0.95, 1.89, -0.48, 0.79, 8.27, 9.82]} \ No newline at end of file diff --git a/annotations_filtered/gJ_cx3AmCuI_filtered.json b/annotations_filtered/gJ_cx3AmCuI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..245cfc3530310cda001cadc54d986d5f7d0b2f1d --- /dev/null +++ b/annotations_filtered/gJ_cx3AmCuI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.45], [10.0, 11.03], [15.0, 17.85], [20.0, 26.91], [30.0, 32.32], [33.0, 36.41], [37.0, 45.5], [47.0, 49.64], [54.0, 55.21], [56.0, 57.86], [61.0, 68.5], [70.0, 71.74], [76.0, 77.7], [82.0, 83.08], [84.0, 83.91], [85.0, 84.87], [86.0, 90.0], [94.0, 93.8], [94.0, 94.41], [97.0, 96.99], [104.0, 105.76], [107.0, 106.98], [108.0, 110.42], [112.0, 118.49], [127.0, 127.6], [129.0, 132.12], [137.0, 137.27], [139.0, 145.93], [147.0, 148.39], [149.0, 151.12], [153.0, 153.13], [153.0, 153.93], [155.0, 155.38], [156.0, 156.63], [157.0, 158.13], [159.0, 159.31], [159.0, 159.85], [164.0, 167.95], [169.0, 170.8]], "keep_status": [false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, true, false, true, false, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 67.13, 31.12, 32.98, 38.0, 37.75, 36.8, 0.0, 0.0, 33.68, 0.0, 0.0, 0.0, 0.0, 0.0, 33.11, 0.0, 0.0, 0.0, 0.0, 0.0, 31.02, 30.32, 0.0, 31.63, 0.0, 34.73, 0.0, 59.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.12, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 72.34], ["throbbing", 6.26], ["music", 6.24]], [["speech", 54.47], ["music", 17.55], ["radio", 2.06]], [["crushing", 24.75], ["crack", 16.3], ["speech", 11.95]], [["music", 37.99], ["speech", 22.72], ["synthesizer", 7.66]], [["speech", 40.72], ["music", 20.26], ["croak", 11.88]], null, null, [["speech", 56.81], ["music", 9.06], ["synthesizer", 5.6]], null, null, null, null, null, [["speech", 28.75], ["radio", 12.37], ["music", 7.16]], null, null, null, null, null, [["music", 23.25], ["grunt", 11.88], ["fart", 11.5]], [["grunt", 18.96], ["music", 9.29], ["animal", 9.13]], null, [["speech", 17.74], ["music", 6.82], ["grunt", 5.76]], null, [["music", 20.74], ["hum", 18.35], ["mains hum", 14.94]], null, null, null, null, null, null, null, null, null, [["music", 34.95], ["speech", 14.19], ["hum", 10.63]], null], "duration": [1.45, 1.03, 2.85, 6.91, 2.32, 3.41, 8.5, 2.64, 1.21, 1.86, 7.5, 1.74, 1.7, 1.08, -0.09, -0.13, 4.0, -0.2, 0.41, -0.01, 1.76, -0.02, 2.42, 6.49, 0.6, 3.12, 0.27, 6.93, 1.39, 2.12, 0.13, 0.93, 0.38, 0.63, 1.13, 0.31, 0.85, 3.95, 1.8]} \ No newline at end of file diff --git a/annotations_filtered/gJvoeKHjuvE_filtered.json b/annotations_filtered/gJvoeKHjuvE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0fb1624f0f66be872ffdc89b8303aaab0fdecdfc --- /dev/null +++ b/annotations_filtered/gJvoeKHjuvE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.94], [11.0, 13.0], [14.0, 17.14], [18.0, 18.87], [23.0, 26.4], [29.0, 30.08], [35.0, 35.67], [39.0, 39.58], [40.0, 41.42], [42.0, 46.6], [55.0, 56.89], [60.0, 61.69], [65.0, 72.3], [73.0, 73.89], [77.0, 77.19], [82.0, 81.92], [92.0, 97.63], [100.0, 103.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true], "silence_prob": [0.0, 50.36, 52.27, 0.0, 45.65, 0.0, 0.0, 0.0, 0.0, 33.32, 0.0, 0.0, 36.67, 0.0, 0.0, 0.0, 35.23, 36.65], "audiomae_on_audioset": [null, null, null, null, [["music", 80.37], ["bass guitar", 1.73], ["ding-dong", 1.09]], null, null, null, null, [["boing", 47.88], ["speech", 15.07], ["music", 14.97]], null, null, [["music", 24.75], ["effects unit", 7.19], ["boing", 6.64]], null, null, null, [["music", 35.72], ["speech", 31.98], ["boing", 4.45]], [["moo", 40.88], ["cattle, bovinae", 17.64], ["livestock, farm animals, working animals", 7.66]]], "duration": [1.94, 2.0, 3.14, 0.87, 3.4, 1.08, 0.67, 0.58, 1.42, 4.6, 1.89, 1.69, 7.3, 0.89, 0.19, -0.08, 5.63, 3.03]} \ No newline at end of file diff --git a/annotations_filtered/gJyibprvYQk_filtered.json b/annotations_filtered/gJyibprvYQk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ddbda98e511e8e3f06fe2d42e0b92ba929f4e8f2 --- /dev/null +++ b/annotations_filtered/gJyibprvYQk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 15.04], [18.0, 21.74], [27.0, 30.06], [32.0, 32.85], [39.0, 40.05], [41.0, 43.77], [44.0, 45.72], [47.0, 48.34], [50.0, 50.82], [54.0, 56.12], [60.0, 65.01], [66.0, 68.81], [70.0, 92.5], [93.0, 96.89], [98.0, 100.4], [101.0, 106.3], [107.0, 112.4], [114.0, 114.44], [119.0, 122.4]], "keep_status": [false, false, true, false, false, false, false, false, false, true, true, true, true, false, false, false, false, false, false], "silence_prob": [93.13, 34.25, 31.49, 0.0, 0.0, 65.44, 0.0, 0.0, 0.0, 38.27, 35.62, 39.28, 36.06, 52.39, 57.48, 60.14, 54.5, 0.0, 85.9], "audiomae_on_audioset": [null, [["music", 60.59], ["hum", 5.28], ["theremin", 4.96]], [["music", 46.44], ["speech", 17.92], ["mains hum", 3.51]], null, null, null, null, null, null, [["speech", 22.89], ["music", 20.06], ["didgeridoo", 14.78]], [["music", 45.46], ["speech", 7.81], ["theremin", 6.31]], [["music", 41.81], ["sheep", 8.76], ["bleat", 8.46]], [["music", 36.54], ["synthesizer", 12.74], ["ambient music", 9.79]], null, null, null, null, null, null], "duration": [2.04, 3.74, 3.06, 0.85, 1.05, 2.77, 1.72, 1.34, 0.82, 2.12, 5.01, 2.81, 22.5, 3.89, 2.4, 5.3, 5.4, 0.44, 3.4]} \ No newline at end of file diff --git a/annotations_filtered/gK06H6EpKP4_filtered.json b/annotations_filtered/gK06H6EpKP4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e896f0ac384c2e0621f74c13999794cb495c9b89 --- /dev/null +++ b/annotations_filtered/gK06H6EpKP4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.99], [7.0, 8.21], [9.0, 12.63], [13.0, 14.67], [19.0, 24.12], [25.0, 26.82], [28.0, 35.23], [36.0, 44.24], [45.0, 47.12], [53.0, 53.81], [64.0, 66.07], [71.0, 71.83], [73.0, 74.07], [83.0, 87.18], [92.0, 92.16], [93.0, 95.81], [98.0, 98.96], [100.0, 99.89], [104.0, 104.52], [105.0, 105.66], [114.0, 114.34], [115.0, 115.91], [118.0, 118.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 95.09, 0.0, 91.3, 0.0, 47.23, 70.3, 91.81, 0.0, 99.16, 0.0, 0.0, 81.17, 0.0, 82.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["breaking", 44.33], ["thunk", 15.42], ["whack, thwack", 11.92]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.99, 1.21, 3.63, 1.67, 5.12, 1.82, 7.23, 8.24, 2.12, 0.81, 2.07, 0.83, 1.07, 4.18, 0.16, 2.81, 0.96, -0.11, 0.52, 0.66, 0.34, 0.91, 0.07]} \ No newline at end of file diff --git a/annotations_filtered/gK6JyAanVNE_filtered.json b/annotations_filtered/gK6JyAanVNE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7af846a6fa957f36868cde733411e0cb51f5a45e --- /dev/null +++ b/annotations_filtered/gK6JyAanVNE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.36], [13.0, 14.01], [14.0, 15.31], [20.0, 19.95], [20.0, 34.06], [47.0, 57.35], [58.0, 58.6], [62.0, 65.96], [66.0, 66.06], [66.0, 66.11], [66.0, 66.21], [66.0, 74.38], [79.0, 82.21], [86.0, 89.16], [95.0, 97.28], [105.0, 107.82], [109.0, 109.41], [111.0, 111.87], [115.0, 118.08], [122.0, 125.69], [127.0, 130.57], [133.0, 133.59]], "keep_status": [true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, true, true, true, false], "silence_prob": [31.56, 0.0, 0.0, 0.0, 29.95, 30.54, 0.0, 29.7, 0.0, 0.0, 0.0, 29.89, 30.17, 30.58, 30.43, 30.41, 0.0, 0.0, 37.84, 35.24, 30.72, 0.0], "audiomae_on_audioset": [[["music", 24.94], ["throbbing", 13.85], ["electronic music", 9.61]], null, null, null, [["music", 79.95], ["electronic music", 3.69], ["shout", 1.49]], [["music", 72.25], ["speech", 10.91], ["didgeridoo", 2.62]], null, [["music", 41.6], ["boing", 10.59], ["cattle, bovinae", 6.36]], null, null, null, [["cattle, bovinae", 31.89], ["music", 26.67], ["moo", 19.86]], [["music", 56.31], ["sidetone", 8.8], ["speech", 6.77]], [["music", 44.7], ["fly, housefly", 15.48], ["mosquito", 10.31]], [["music", 51.64], ["speech", 18.37], ["musical instrument", 2.66]], [["music", 27.8], ["livestock, farm animals, working animals", 15.25], ["cattle, bovinae", 11.11]], null, null, [["music", 37.58], ["frog", 9.58], ["croak", 8.98]], [["music", 54.0], ["theremin", 6.31], ["musical instrument", 3.49]], [["music", 23.36], ["cattle, bovinae", 11.62], ["moo", 9.67]], null], "duration": [2.36, 1.01, 1.31, -0.05, 14.06, 10.35, 0.6, 3.96, 0.06, 0.11, 0.21, 8.38, 3.21, 3.16, 2.28, 2.82, 0.41, 0.87, 3.08, 3.69, 3.57, 0.59]} \ No newline at end of file diff --git a/annotations_filtered/gKGOG-Pr81E_filtered.json b/annotations_filtered/gKGOG-Pr81E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dc8d7b137ef7d8b7ebfa7a8dafd6f653737073c0 --- /dev/null +++ b/annotations_filtered/gKGOG-Pr81E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.36], [3.0, 3.43], [6.0, 7.08], [11.0, 12.04], [13.0, 13.41], [15.0, 15.96], [19.0, 19.84], [22.0, 22.23], [23.0, 23.48], [24.0, 25.47], [26.0, 26.87], [28.0, 28.58], [29.0, 35.26], [37.0, 37.35], [38.0, 38.5], [46.0, 46.41], [49.0, 49.59], [51.0, 51.51], [53.0, 53.67], [57.0, 56.89], [58.0, 60.07], [65.0, 81.72], [82.0, 83.0], [89.0, 90.0], [91.0, 91.88], [92.0, 100.87], [102.0, 103.42], [104.0, 105.58], [109.0, 120.16], [122.0, 122.81], [125.0, 125.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.0, 33.32, 0.0, 0.0, 0.0, 36.09, 0.0, 0.0, 33.68, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 78.72], ["clip-clop", 4.99], ["animal", 4.75]], null, null, null, null, null, null, null, null, [["music", 47.16], ["foghorn", 8.24], ["speech", 8.14]], null, null, null, [["music", 48.55], ["speech", 13.36], ["hum", 5.33]], null, null, [["speech", 40.18], ["music", 32.62], ["wind instrument, woodwind instrument", 4.76]], null, null], "duration": [0.36, 0.43, 1.08, 1.04, 0.41, 0.96, 0.84, 0.23, 0.48, 1.47, 0.87, 0.58, 6.26, 0.35, 0.5, 0.41, 0.59, 0.51, 0.67, -0.11, 2.07, 16.72, 1.0, 1.0, 0.88, 8.87, 1.42, 1.58, 11.16, 0.81, 0.39]} \ No newline at end of file diff --git a/annotations_filtered/gKGmO34XgMU_filtered.json b/annotations_filtered/gKGmO34XgMU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b88c1d03ec8e67e2395ab3575f88f2203f7e738 --- /dev/null +++ b/annotations_filtered/gKGmO34XgMU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.96], [10.0, 12.56], [16.0, 16.92], [18.0, 17.96], [32.0, 33.86], [35.0, 35.83], [41.0, 42.23], [43.0, 43.56], [45.0, 45.12], [53.0, 53.05], [54.0, 54.31], [55.0, 55.27], [57.0, 60.84], [62.0, 61.94], [64.0, 63.76], [64.0, 64.44], [65.0, 65.5], [67.0, 67.39], [68.0, 68.4], [69.0, 73.5], [76.0, 75.96], [77.0, 77.55], [84.0, 84.75], [85.0, 86.17], [87.0, 87.4], [89.0, 88.8], [92.0, 96.09], [97.0, 97.53], [99.0, 99.4], [101.0, 101.14], [103.0, 103.2], [105.0, 107.08], [108.0, 108.41], [110.0, 109.75], [114.0, 113.71], [118.0, 119.04], [121.0, 123.48], [124.0, 131.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.76, 0.0, 0.0, 0.0, 0.0, 64.18, 0.0, 0.0, 0.0, 0.0, 42.69, 50.21], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 86.19], ["sidetone", 3.83], ["radio", 2.21]], null, null, null, null, null, null, [["speech", 50.12], ["fart", 38.36], ["radio", 1.79]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 61.03], ["sidetone", 18.48], ["dial tone", 8.34]], null], "duration": [1.96, 2.56, 0.92, -0.04, 1.86, 0.83, 1.23, 0.56, 0.12, 0.05, 0.31, 0.27, 3.84, -0.06, -0.24, 0.44, 0.5, 0.39, 0.4, 4.5, -0.04, 0.55, 0.75, 1.17, 0.4, -0.2, 4.09, 0.53, 0.4, 0.14, 0.2, 2.08, 0.41, -0.25, -0.29, 1.04, 2.48, 7.63]} \ No newline at end of file diff --git a/annotations_filtered/gKJerAxfSzw_filtered.json b/annotations_filtered/gKJerAxfSzw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0e54e0e4b0289ca7f829ad53c6f3c72f4ee4673 --- /dev/null +++ b/annotations_filtered/gKJerAxfSzw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 52.27], [52.0, 53.08], [53.0, 54.6], [56.0, 56.57], [58.0, 58.08], [60.0, 65.8], [66.0, 67.26], [70.0, 73.4], [74.0, 74.55], [76.0, 78.51], [79.0, 83.57], [84.0, 85.82], [87.0, 87.42], [89.0, 89.01], [90.0, 90.85], [91.0, 93.39], [94.0, 95.35], [98.0, 98.88], [100.0, 102.25], [110.0, 110.37], [116.0, 117.12], [127.0, 127.97], [128.0, 128.07], [128.0, 134.1], [135.0, 136.95], [138.0, 140.44], [142.0, 143.26], [146.0, 154.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 60.14, 0.0, 56.25, 0.0, 51.99, 66.76, 0.0, 0.0, 0.0, 0.0, 32.21, 0.0, 0.0, 49.73, 0.0, 0.0, 0.0, 0.0, 33.66, 0.0, 32.48, 0.0, 37.25], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 51.35], ["music", 14.93], ["didgeridoo", 6.53]], null, null, [["hum", 33.3], ["throbbing", 29.4], ["music", 13.41]], null, null, null, null, [["hum", 29.67], ["throbbing", 20.32], ["music", 18.97]], null, [["music", 72.48], ["speech", 8.52], ["didgeridoo", 6.6]], null, [["music", 58.69], ["theremin", 6.04], ["musical instrument", 3.6]]], "duration": [36.27, 1.08, 1.6, 0.57, 0.08, 5.8, 1.26, 3.4, 0.55, 2.51, 4.57, 1.82, 0.42, 0.01, 0.85, 2.39, 1.35, 0.88, 2.25, 0.37, 1.12, 0.97, 0.07, 6.1, 1.95, 2.44, 1.26, 8.87]} \ No newline at end of file diff --git a/annotations_filtered/gKY3ShRZPkA_filtered.json b/annotations_filtered/gKY3ShRZPkA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..896264eb638b02593c97a8931f07420264d4b99e --- /dev/null +++ b/annotations_filtered/gKY3ShRZPkA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.59], [8.0, 9.9], [10.0, 22.99], [24.0, 28.11], [29.0, 47.31], [48.0, 49.35], [52.0, 52.59], [53.0, 53.15], [53.0, 53.69], [54.0, 54.84]], "keep_status": [false, false, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 42.67, 35.75, 33.09, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 72.3], ["fart", 11.32], ["didgeridoo", 5.11]], [["music", 40.47], ["theremin", 6.25], ["didgeridoo", 4.55]], [["music", 56.22], ["explosion", 8.04], ["burst, pop", 2.79]], null, null, null, null, null], "duration": [0.59, 1.9, 12.99, 4.11, 18.31, 1.35, 0.59, 0.15, 0.69, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/gKpPQ6SqHvQ_filtered.json b/annotations_filtered/gKpPQ6SqHvQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..34a0b70e109e79477688a22b2abe263249632287 --- /dev/null +++ b/annotations_filtered/gKpPQ6SqHvQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.13], [4.0, 5.19], [10.0, 9.88], [11.0, 11.62], [15.0, 15.84], [18.0, 18.62], [20.0, 19.92], [22.0, 22.55], [25.0, 25.03], [26.0, 26.45], [36.0, 36.07], [38.0, 38.13], [39.0, 39.23], [40.0, 40.59], [42.0, 43.12], [43.0, 43.73], [45.0, 44.83], [49.0, 48.74], [51.0, 51.83], [53.0, 54.58], [55.0, 57.7], [59.0, 61.32], [62.0, 63.64], [65.0, 65.31], [67.0, 67.63], [69.0, 69.63], [71.0, 71.76], [73.0, 73.09], [74.0, 74.65], [81.0, 81.65], [89.0, 89.68], [90.0, 91.66], [94.0, 103.01], [104.0, 105.54], [107.0, 107.47], [112.0, 113.19], [115.0, 115.06], [128.0, 128.01], [128.0, 128.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [94.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.97, 95.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 32.46], ["cattle, bovinae", 20.04], ["moo", 17.9]], null, null, null, null, null, null, null, null, null, null, null, [["music", 58.06], ["timpani", 13.37], ["musical instrument", 11.57]], null, null, null, null, null, null], "duration": [2.13, 1.19, -0.12, 0.62, 0.84, 0.62, -0.08, 0.55, 0.03, 0.45, 0.07, 0.13, 0.23, 0.59, 1.12, 0.73, -0.17, -0.26, 0.83, 1.58, 2.7, 2.32, 1.64, 0.31, 0.63, 0.63, 0.76, 0.09, 0.65, 0.65, 0.68, 1.66, 9.01, 1.54, 0.47, 1.19, 0.06, 0.01, 0.93]} \ No newline at end of file diff --git a/annotations_filtered/gL17bwbFDAI_filtered.json b/annotations_filtered/gL17bwbFDAI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c0815d0dbf161d063f1b0f57eef70959fc142b4b --- /dev/null +++ b/annotations_filtered/gL17bwbFDAI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.05], [2.0, 3.62], [5.0, 5.29], [6.0, 8.63], [9.0, 9.96], [10.0, 12.99], [15.0, 15.65], [17.0, 17.41], [18.0, 18.82], [20.0, 22.22], [23.0, 27.24], [29.0, 29.27], [29.0, 31.45], [34.0, 36.02], [37.0, 38.35], [39.0, 41.1], [41.0, 41.89], [44.0, 44.14], [45.0, 51.29], [52.0, 54.77], [55.0, 57.3], [59.0, 61.28], [64.0, 66.53], [67.0, 69.62], [71.0, 73.31], [76.0, 78.36], [80.0, 124.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 89.19, 0.0, 0.0, 0.0, 52.16, 99.99, 0.0, 99.9, 99.99, 0.0, 99.99, 0.0, 0.0, 100.0, 98.36, 95.23, 88.83, 99.76, 86.64, 96.17, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.05, 1.62, 0.29, 2.63, 0.96, 2.99, 0.65, 0.41, 0.82, 2.22, 4.24, 0.27, 2.45, 2.02, 1.35, 2.1, 0.89, 0.14, 6.29, 2.77, 2.3, 2.28, 2.53, 2.62, 2.31, 2.36, 44.7]} \ No newline at end of file diff --git a/annotations_filtered/gL3mN-UpSyQ_filtered.json b/annotations_filtered/gL3mN-UpSyQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..34fe5ea283f213cc1577d2a65326f08286f048ad --- /dev/null +++ b/annotations_filtered/gL3mN-UpSyQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.47], [20.0, 22.0], [24.0, 49.28], [51.0, 62.65], [64.0, 63.86], [64.0, 64.98], [65.0, 80.1], [81.0, 81.53], [83.0, 106.22], [108.0, 111.3]], "keep_status": [false, false, false, true, false, false, true, false, true, true], "silence_prob": [0.0, 32.89, 35.74, 32.38, 0.0, 0.0, 37.54, 0.0, 33.15, 33.07], "audiomae_on_audioset": [null, [["speech", 90.42], ["inside, small room", 1.76], ["radio", 1.29]], [["livestock, farm animals, working animals", 32.01], ["cattle, bovinae", 29.27], ["moo", 12.96]], [["livestock, farm animals, working animals", 20.43], ["sheep", 19.47], ["whack, thwack", 15.3]], null, null, [["frog", 14.31], ["whack, thwack", 12.52], ["speech", 7.61]], null, [["speech", 33.36], ["electric shaver, electric razor", 6.49], ["whack, thwack", 4.78]], [["cash register", 17.28], ["noise", 12.3], ["music", 6.75]]], "duration": [0.47, 2.0, 25.28, 11.65, -0.14, 0.98, 15.1, 0.53, 23.22, 3.3]} \ No newline at end of file diff --git a/annotations_filtered/gLB9F9QftwM_filtered.json b/annotations_filtered/gLB9F9QftwM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..290064ab4305aa30b6bf052d713bb0a0c252a7e8 --- /dev/null +++ b/annotations_filtered/gLB9F9QftwM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 17.64], [20.0, 20.78], [21.0, 23.13], [29.0, 29.27], [39.0, 39.73], [45.0, 45.96], [47.0, 48.0], [51.0, 51.24], [52.0, 52.32], [54.0, 59.73], [60.0, 61.38], [62.0, 81.95], [85.0, 87.81], [105.0, 105.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [89.54, 0.0, 99.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.97, 0.0, 34.51, 34.22, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 79.99], ["theremin", 9.1], ["chant", 1.32]], [["music", 54.49], ["theremin", 8.9], ["musical instrument", 6.53]], null], "duration": [2.64, 0.78, 2.13, 0.27, 0.73, 0.96, 1.0, 0.24, 0.32, 5.73, 1.38, 19.95, 2.81, 0.75]} \ No newline at end of file diff --git a/annotations_filtered/gLD9INIOo00_filtered.json b/annotations_filtered/gLD9INIOo00_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6516675953921ccdb98781e0385d763d0982af84 --- /dev/null +++ b/annotations_filtered/gLD9INIOo00_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 44.12], [46.0, 48.78], [53.0, 83.22], [84.0, 94.61], [95.0, 106.73]], "keep_status": [false, false, false, false, false], "silence_prob": [31.22, 32.92, 0.0, 29.57, 31.4], "audiomae_on_audioset": [[["music", 83.43], ["scary music", 3.51], ["sound effect", 1.48]], [["music", 73.77], ["hum", 6.67], ["mains hum", 4.55]], null, [["speech", 41.03], ["explosion", 35.85], ["burst, pop", 5.36]], [["music", 82.21], ["didgeridoo", 4.17], ["buzz", 1.87]]], "duration": [8.12, 2.78, 30.22, 10.61, 11.73]} \ No newline at end of file diff --git a/annotations_filtered/gLLgGSdfy3I_filtered.json b/annotations_filtered/gLLgGSdfy3I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/gLLgGSdfy3I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/gLYTObRhcSY_filtered.json b/annotations_filtered/gLYTObRhcSY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fedcf940d4ec9acd9d2ab5940e504d50ef7bfea0 --- /dev/null +++ b/annotations_filtered/gLYTObRhcSY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 5.54], [6.0, 5.64], [6.0, 6.02], [6.0, 6.05], [6.0, 6.08], [7.0, 8.19], [10.0, 10.96], [13.0, 14.18], [15.0, 14.93], [26.0, 26.76], [30.0, 31.35], [34.0, 34.57], [38.0, 38.33], [41.0, 41.57], [44.0, 46.53], [49.0, 50.48], [51.0, 52.29], [55.0, 54.75], [56.0, 55.81], [57.0, 57.5], [59.0, 59.49], [60.0, 61.52], [63.0, 63.93], [68.0, 67.81], [69.0, 69.5], [73.0, 73.4], [79.0, 79.73], [86.0, 86.48], [96.0, 96.04], [102.0, 102.32], [110.0, 110.86], [136.0, 136.36]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [49.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 32.7], ["theremin", 20.17], ["synthesizer", 8.48]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 46.75], ["radio", 3.84], ["animal", 3.25]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.54, -0.36, 0.02, 0.05, 0.08, 1.19, 0.96, 1.18, -0.07, 0.76, 1.35, 0.57, 0.33, 0.57, 2.53, 1.48, 1.29, -0.25, -0.19, 0.5, 0.49, 1.52, 0.93, -0.19, 0.5, 0.4, 0.73, 0.48, 0.04, 0.32, 0.86, 0.36]} \ No newline at end of file diff --git a/annotations_filtered/gM4-jiKNuIs_filtered.json b/annotations_filtered/gM4-jiKNuIs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dafab16f8476ffe0f5cace12f6c33584c4a4f1ea --- /dev/null +++ b/annotations_filtered/gM4-jiKNuIs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.11], [7.0, 7.42], [9.0, 9.93], [13.0, 13.8], [16.0, 28.97], [30.0, 30.82], [32.0, 34.96], [35.0, 39.18], [41.0, 41.61], [43.0, 44.07], [47.0, 47.48], [49.0, 55.43], [60.0, 61.35], [62.0, 65.42], [67.0, 68.82], [69.0, 70.63], [76.0, 79.1], [80.0, 81.75], [83.0, 84.3], [86.0, 86.51], [90.0, 91.44], [93.0, 93.36], [94.0, 96.01], [101.0, 101.68]], "keep_status": [true, false, false, false, false, false, true, true, false, false, false, true, false, true, false, false, true, false, false, false, false, false, true, false], "silence_prob": [34.44, 0.0, 0.0, 0.0, 36.13, 0.0, 36.97, 37.85, 0.0, 0.0, 0.0, 36.91, 0.0, 39.07, 0.0, 0.0, 37.01, 0.0, 0.0, 0.0, 0.0, 0.0, 39.28, 0.0], "audiomae_on_audioset": [[["music", 25.46], ["ambient music", 11.85], ["electronic music", 8.76]], null, null, null, [["music", 58.13], ["theremin", 17.37], ["whale vocalization", 9.67]], null, [["whale vocalization", 26.11], ["music", 22.29], ["speech", 13.31]], [["speech", 23.77], ["hum", 19.47], ["mains hum", 9.99]], null, null, null, [["music", 50.13], ["foghorn", 8.66], ["hum", 6.03]], null, [["hum", 11.45], ["whale vocalization", 8.22], ["music", 7.7]], null, null, [["hum", 30.08], ["music", 12.58], ["mains hum", 10.13]], null, null, null, null, null, [["music", 38.22], ["speech", 17.51], ["hum", 2.8]], null], "duration": [2.11, 0.42, 0.93, 0.8, 12.97, 0.82, 2.96, 4.18, 0.61, 1.07, 0.48, 6.43, 1.35, 3.42, 1.82, 1.63, 3.1, 1.75, 1.3, 0.51, 1.44, 0.36, 2.01, 0.68]} \ No newline at end of file diff --git a/annotations_filtered/gM8trQSURdg_filtered.json b/annotations_filtered/gM8trQSURdg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eb1b1d31dbc05b9597d8ff1bc5b4ee8a3baab584 --- /dev/null +++ b/annotations_filtered/gM8trQSURdg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.95], [6.0, 8.31], [10.0, 13.12], [14.0, 18.03], [19.0, 23.09], [25.0, 27.9], [32.0, 32.68], [34.0, 41.54], [42.0, 43.33], [48.0, 50.25], [52.0, 53.38], [55.0, 56.52], [62.0, 63.98], [67.0, 68.81], [71.0, 74.04], [77.0, 78.26], [80.0, 80.42], [81.0, 82.88], [91.0, 91.94], [93.0, 95.23], [97.0, 98.54], [100.0, 101.83], [107.0, 108.5], [113.0, 113.95], [115.0, 115.59], [131.0, 131.09], [139.0, 139.95], [144.0, 146.26], [148.0, 149.81], [153.0, 154.84], [162.0, 163.17], [166.0, 167.73], [168.0, 169.69], [171.0, 174.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 100.0, 100.0, 99.97, 99.99, 0.0, 99.21, 0.0, 86.45, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 99.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.37], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.95, 2.31, 3.12, 4.03, 4.09, 2.9, 0.68, 7.54, 1.33, 2.25, 1.38, 1.52, 1.98, 1.81, 3.04, 1.26, 0.42, 1.88, 0.94, 2.23, 1.54, 1.83, 1.5, 0.95, 0.59, 0.09, 0.95, 2.26, 1.81, 1.84, 1.17, 1.73, 1.69, 3.16]} \ No newline at end of file diff --git a/annotations_filtered/gMBEqbV0mw4_filtered.json b/annotations_filtered/gMBEqbV0mw4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fdab985f07720f5f290b50f74028222bb0338e39 --- /dev/null +++ b/annotations_filtered/gMBEqbV0mw4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 12.65], [17.0, 17.05], [49.0, 49.77], [51.0, 51.27]], "keep_status": [false, false, false, false], "silence_prob": [31.6, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["thunk", 71.84], ["speech", 14.2], ["whack, thwack", 5.51]], null, null, null], "duration": [3.65, 0.05, 0.77, 0.27]} \ No newline at end of file diff --git a/annotations_filtered/gMCgkXpEOIY_filtered.json b/annotations_filtered/gMCgkXpEOIY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d819d2866f174c216ccab57c811ef4bf4af0b17 --- /dev/null +++ b/annotations_filtered/gMCgkXpEOIY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.66], [12.0, 21.93], [26.0, 26.74], [28.0, 32.21], [33.0, 35.87], [37.0, 53.08], [54.0, 53.79], [56.0, 57.5], [63.0, 63.17], [64.0, 64.74], [68.0, 69.62], [71.0, 71.78], [72.0, 73.58], [76.0, 77.36], [81.0, 81.73], [83.0, 91.23], [93.0, 93.68], [96.0, 98.39], [102.0, 102.63], [104.0, 105.24], [107.0, 107.6], [110.0, 137.35], [139.0, 140.61], [158.0, 158.58], [159.0, 161.64], [164.0, 165.55], [166.0, 167.36], [169.0, 169.05], [172.0, 172.27], [176.0, 182.75], [191.0, 190.63], [192.0, 200.15], [201.0, 201.78], [204.0, 204.53]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 36.51, 0.0, 47.9, 98.8, 63.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.94, 0.0, 99.52, 0.0, 0.0, 0.0, 32.23, 0.0, 0.0, 99.84, 0.0, 0.0, 0.0, 0.0, 38.74, 0.0, 72.9, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 41.5], ["fly, housefly", 16.55], ["insect", 5.69]], null, [["theremin", 79.49], ["music", 13.41], ["musical instrument", 1.25]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 94.16], ["cough", 2.8], ["noise", 0.52]], null, null, null, null, null, [["vehicle", 24.34], ["buzz", 17.39], ["race car, auto racing", 11.85]], null, null, null, null, null, null, null, [["snicker", 35.39], ["laughter", 33.03], ["baby laughter", 8.02]], null, null, null, null], "duration": [0.66, 9.93, 0.74, 4.21, 2.87, 16.08, -0.21, 1.5, 0.17, 0.74, 1.62, 0.78, 1.58, 1.36, 0.73, 8.23, 0.68, 2.39, 0.63, 1.24, 0.6, 27.35, 1.61, 0.58, 2.64, 1.55, 1.36, 0.05, 0.27, 6.75, -0.37, 8.15, 0.78, 0.53]} \ No newline at end of file diff --git a/annotations_filtered/gMPr9rchJMs_filtered.json b/annotations_filtered/gMPr9rchJMs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6121e17dce18d2e0f56d6ce5bba22afa87d60139 --- /dev/null +++ b/annotations_filtered/gMPr9rchJMs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.16], [5.0, 5.85], [9.0, 10.64], [12.0, 12.18], [14.0, 15.52], [17.0, 17.19], [20.0, 20.22], [21.0, 23.95], [25.0, 27.63], [30.0, 30.37], [35.0, 36.24], [38.0, 40.32], [46.0, 45.91], [48.0, 47.93], [52.0, 52.81], [56.0, 56.02], [64.0, 65.47], [73.0, 72.72], [78.0, 78.88], [85.0, 85.28], [87.0, 87.72], [89.0, 89.13], [90.0, 90.27], [94.0, 93.88], [100.0, 103.01], [105.0, 106.34], [113.0, 113.02], [116.0, 118.12], [120.0, 122.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 98.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.26, 0.0, 0.0, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.16, 0.85, 1.64, 0.18, 1.52, 0.19, 0.22, 2.95, 2.63, 0.37, 1.24, 2.32, -0.09, -0.07, 0.81, 0.02, 1.47, -0.28, 0.88, 0.28, 0.72, 0.13, 0.27, -0.12, 3.01, 1.34, 0.02, 2.12, 2.07]} \ No newline at end of file diff --git a/annotations_filtered/gMdTl2R354A_filtered.json b/annotations_filtered/gMdTl2R354A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..10c67be9fa6959c90f2002195bbcc3e7416698de --- /dev/null +++ b/annotations_filtered/gMdTl2R354A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.38], [44.0, 45.0], [52.0, 53.22], [68.0, 67.91], [70.0, 70.97], [83.0, 83.07], [86.0, 86.95], [91.0, 91.89], [93.0, 94.91], [102.0, 104.4], [111.0, 110.94], [120.0, 120.65], [123.0, 124.7], [127.0, 128.48], [138.0, 138.55], [157.0, 157.98], [167.0, 168.05], [174.0, 175.59], [209.0, 210.56], [213.0, 213.14], [235.0, 236.21], [237.0, 238.17], [239.0, 241.64], [244.0, 246.27]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.52, 34.26], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["didgeridoo", 14.64], ["speech", 11.17], ["music", 7.17]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 63.49], ["hum", 5.57], ["busy signal", 5.49]], [["music", 32.48], ["musical instrument", 17.54], ["hum", 12.84]]], "duration": [0.38, 1.0, 1.22, -0.09, 0.97, 0.07, 0.95, 0.89, 1.91, 2.4, -0.06, 0.65, 1.7, 1.48, 0.55, 0.98, 1.05, 1.59, 1.56, 0.14, 1.21, 1.17, 2.64, 2.27]} \ No newline at end of file diff --git a/annotations_filtered/gN1BjYlhKvc_filtered.json b/annotations_filtered/gN1BjYlhKvc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bda7237fe1888836a65ad99b9ebdba5e8a325458 --- /dev/null +++ b/annotations_filtered/gN1BjYlhKvc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.33], [10.0, 10.07], [11.0, 11.97], [15.0, 15.23], [16.0, 18.17], [20.0, 21.71], [28.0, 28.51], [30.0, 31.24], [34.0, 35.19], [39.0, 58.58], [62.0, 61.86], [63.0, 70.71], [73.0, 77.62], [78.0, 84.03], [85.0, 132.56], [134.0, 134.2], [135.0, 136.88], [138.0, 139.68], [141.0, 141.91], [145.0, 146.15], [148.0, 149.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 59.96, 0.0, 0.0, 0.0, 0.0, 30.84, 0.0, 30.66, 30.88, 31.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 44.39], ["throbbing", 25.61], ["hum", 10.34]], null, [["music", 55.77], ["electronic music", 9.94], ["throbbing", 7.06]], [["music", 43.15], ["throbbing", 24.43], ["hum", 9.48]], [["music", 42.5], ["throbbing", 12.96], ["hum", 12.82]], null, null, null, null, null, null, null], "duration": [1.33, 0.07, 0.97, 0.23, 2.17, 1.71, 0.51, 1.24, 1.19, 19.58, -0.14, 7.71, 4.62, 6.03, 47.56, 0.2, 1.88, 1.68, 0.91, 1.15, 1.84]} \ No newline at end of file diff --git a/annotations_filtered/gN2ZP-q_qpc_filtered.json b/annotations_filtered/gN2ZP-q_qpc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b65cf4d057e3d55e32b3db8be9686c3717c330c0 --- /dev/null +++ b/annotations_filtered/gN2ZP-q_qpc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.87], [13.0, 13.49], [15.0, 15.08], [17.0, 17.71], [19.0, 19.68], [21.0, 21.84], [24.0, 25.47], [27.0, 28.81], [33.0, 34.52], [38.0, 38.48], [40.0, 39.83], [41.0, 42.13], [43.0, 43.44], [44.0, 45.13], [46.0, 47.24], [55.0, 56.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.87, 0.49, 0.08, 0.71, 0.68, 0.84, 1.47, 1.81, 1.52, 0.48, -0.17, 1.13, 0.44, 1.13, 1.24, 1.59]} \ No newline at end of file diff --git a/annotations_filtered/gNCAj7eS07I_filtered.json b/annotations_filtered/gNCAj7eS07I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..85190263732aad6e0dab2fe8c178626af5678840 --- /dev/null +++ b/annotations_filtered/gNCAj7eS07I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 21.3], [29.0, 30.75], [32.0, 34.26], [40.0, 41.44], [43.0, 44.41], [48.0, 47.92], [49.0, 50.14], [53.0, 53.32], [54.0, 54.58], [63.0, 65.84], [76.0, 79.89], [86.0, 89.38], [95.0, 98.63], [100.0, 101.78]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [45.43, 0.0, 38.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.55, 55.31, 63.1, 48.74, 0.0], "audiomae_on_audioset": [[["whale vocalization", 17.3], ["fly, housefly", 16.47], ["animal", 9.52]], null, [["whale vocalization", 21.94], ["hum", 12.99], ["music", 8.41]], null, null, null, null, null, null, null, null, null, [["speech", 58.61], ["music", 22.14], ["hum", 1.79]], null], "duration": [6.3, 1.75, 2.26, 1.44, 1.41, -0.08, 1.14, 0.32, 0.58, 2.84, 3.89, 3.38, 3.63, 1.78]} \ No newline at end of file diff --git a/annotations_filtered/gNCkFkii-tA_filtered.json b/annotations_filtered/gNCkFkii-tA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..602a8045f794eb87741eb5b733be4a254f78c68d --- /dev/null +++ b/annotations_filtered/gNCkFkii-tA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.85], [7.0, 7.57], [9.0, 10.17], [15.0, 15.45], [18.0, 20.41], [24.0, 27.28], [29.0, 31.46], [38.0, 45.89], [48.0, 50.25], [55.0, 55.54], [56.0, 56.56], [58.0, 60.25], [64.0, 64.76], [65.0, 66.02], [75.0, 79.08], [82.0, 86.46], [86.0, 86.51], [94.0, 99.12], [107.0, 108.28], [113.0, 113.56], [116.0, 116.85], [125.0, 126.55], [129.0, 131.08]], "keep_status": [false, false, false, false, true, false, true, false, false, false, false, true, false, false, true, true, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 38.66, 33.57, 35.29, 34.89, 30.43, 0.0, 0.0, 30.35, 0.0, 0.0, 29.04, 30.72, 0.0, 30.5, 0.0, 0.0, 0.0, 0.0, 34.07], "audiomae_on_audioset": [null, null, null, null, [["speech", 44.04], ["sidetone", 17.38], ["rumble", 7.13]], [["whale vocalization", 36.97], ["speech", 31.21], ["stomach rumble", 10.89]], [["speech", 20.89], ["creak", 11.1], ["animal", 8.19]], [["speech", 48.91], ["mains hum", 15.18], ["hum", 13.98]], [["sidetone", 40.96], ["speech", 22.93], ["radio", 11.66]], null, null, [["music", 27.16], ["whale vocalization", 17.43], ["hum", 3.85]], null, null, [["whale vocalization", 29.7], ["hum", 13.32], ["throbbing", 10.32]], [["throbbing", 20.43], ["speech", 18.2], ["hum", 14.15]], null, [["speech", 47.43], ["car", 8.44], ["vehicle", 6.77]], null, null, null, null, [["music", 67.67], ["musical instrument", 6.2], ["synthesizer", 3.58]]], "duration": [0.85, 0.57, 1.17, 0.45, 2.41, 3.28, 2.46, 7.89, 2.25, 0.54, 0.56, 2.25, 0.76, 1.02, 4.08, 4.46, 0.51, 5.12, 1.28, 0.56, 0.85, 1.55, 2.08]} \ No newline at end of file diff --git a/annotations_filtered/gNEB3vRczjA_filtered.json b/annotations_filtered/gNEB3vRczjA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41c5d12bbb95fbd345905265a7687715c9c2706d --- /dev/null +++ b/annotations_filtered/gNEB3vRczjA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.56], [6.0, 11.79], [19.0, 22.13], [24.0, 25.22], [25.0, 26.49], [30.0, 39.63], [44.0, 65.3], [67.0, 70.33], [71.0, 71.76], [73.0, 90.66], [95.0, 103.96], [106.0, 106.78], [108.0, 109.86], [111.0, 120.36], [122.0, 133.74]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, true, true], "silence_prob": [0.0, 31.09, 93.29, 0.0, 0.0, 51.5, 33.4, 36.54, 0.0, 29.82, 29.66, 0.0, 0.0, 29.26, 29.72], "audiomae_on_audioset": [null, [["speech", 55.94], ["explosion", 8.67], ["hum", 6.79]], null, null, null, null, [["music", 39.92], ["hum", 23.29], ["throbbing", 20.67]], [["speech", 21.35], ["music", 14.7], ["hum", 9.52]], null, [["speech", 36.34], ["music", 31.19], ["breaking", 5.84]], [["smash, crash", 64.24], ["breaking", 8.72], ["speech", 5.22]], null, null, [["music", 35.91], ["vehicle", 13.72], ["car", 6.07]], [["music", 21.57], ["noise", 10.07], ["buzz", 8.59]]], "duration": [1.56, 5.79, 3.13, 1.22, 1.49, 9.63, 21.3, 3.33, 0.76, 17.66, 8.96, 0.78, 1.86, 9.36, 11.74]} \ No newline at end of file diff --git a/annotations_filtered/gNGmuLYwd3o_filtered.json b/annotations_filtered/gNGmuLYwd3o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..07f3b216b2d10994f68c53de9c8c0b72724c5bf8 --- /dev/null +++ b/annotations_filtered/gNGmuLYwd3o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.96], [10.0, 11.04], [12.0, 13.07], [14.0, 15.33], [17.0, 17.51], [21.0, 21.44], [22.0, 22.91], [26.0, 27.03]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [60.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [3.96, 1.04, 1.07, 1.33, 0.51, 0.44, 0.91, 1.03]} \ No newline at end of file diff --git a/annotations_filtered/gNSs_gF1T_Q_filtered.json b/annotations_filtered/gNSs_gF1T_Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3139d3ff478868b4008c5d81d16a3858c5c0e360 --- /dev/null +++ b/annotations_filtered/gNSs_gF1T_Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.58], [5.0, 6.94], [7.0, 7.16], [8.0, 9.37], [10.0, 10.42], [13.0, 14.23], [35.0, 34.87], [35.0, 37.1], [43.0, 44.37], [45.0, 46.04], [50.0, 52.08], [54.0, 54.38], [61.0, 61.42], [72.0, 73.25], [93.0, 93.56], [99.0, 99.17], [100.0, 100.85], [102.0, 102.88], [104.0, 105.09], [105.0, 108.38], [109.0, 111.7], [112.0, 114.35], [118.0, 118.52], [120.0, 120.26], [124.0, 125.42], [127.0, 129.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.11, 0.0, 0.0, 74.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.68, 100.0, 94.66, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.58, 1.94, 0.16, 1.37, 0.42, 1.23, -0.13, 2.1, 1.37, 1.04, 2.08, 0.38, 0.42, 1.25, 0.56, 0.17, 0.85, 0.88, 1.09, 3.38, 2.7, 2.35, 0.52, 0.26, 1.42, 2.41]} \ No newline at end of file diff --git a/annotations_filtered/gNbqn47rt3M_filtered.json b/annotations_filtered/gNbqn47rt3M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c83cd3d2085304d2b09b7d1aa2fd68f1d870a49e --- /dev/null +++ b/annotations_filtered/gNbqn47rt3M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.88], [13.0, 13.54], [39.0, 55.81], [79.0, 79.59], [82.0, 81.65], [84.0, 84.35], [87.0, 88.59], [90.0, 93.99], [95.0, 96.7], [108.0, 109.92], [114.0, 114.51], [119.0, 119.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 33.69, 0.0, 0.0, 0.0, 0.0, 77.2, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 81.47], ["psychedelic rock", 1.11], ["musical instrument", 0.79]], null, null, null, null, null, null, null, null, null], "duration": [0.88, 0.54, 16.81, 0.59, -0.35, 0.35, 1.59, 3.99, 1.7, 1.92, 0.51, 0.31]} \ No newline at end of file diff --git a/annotations_filtered/gO6qemCFhEU_filtered.json b/annotations_filtered/gO6qemCFhEU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fbc7bb37dabd592a750932d6dfa60e8df66315c9 --- /dev/null +++ b/annotations_filtered/gO6qemCFhEU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.23], [6.0, 6.59], [10.0, 36.41], [38.0, 39.73], [42.0, 42.63], [43.0, 43.9], [45.0, 46.03], [47.0, 49.91], [50.0, 53.37], [54.0, 64.22], [70.0, 73.95], [75.0, 78.26], [79.0, 80.5], [81.0, 82.24], [83.0, 83.15], [85.0, 85.02], [86.0, 88.33], [89.0, 98.24], [99.0, 111.42], [112.0, 111.55], [112.0, 112.46], [113.0, 128.38], [132.0, 133.95], [135.0, 136.53], [148.0, 156.39], [157.0, 158.43]], "keep_status": [false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 41.93, 0.0, 0.0, 0.0, 0.0, 41.34, 40.73, 37.92, 82.97, 85.17, 0.0, 0.0, 0.0, 0.0, 71.72, 38.9, 36.48, 0.0, 0.0, 38.36, 0.0, 0.0, 33.12, 0.0], "audiomae_on_audioset": [null, null, [["music", 44.39], ["speech", 10.45], ["musical instrument", 7.13]], null, null, null, null, [["music", 66.45], ["theremin", 5.59], ["wind instrument, woodwind instrument", 3.93]], [["music", 35.17], ["theremin", 23.36], ["wind instrument, woodwind instrument", 8.95]], [["music", 48.34], ["wind instrument, woodwind instrument", 16.85], ["speech", 9.21]], null, null, null, null, null, null, null, [["music", 33.3], ["whale vocalization", 19.37], ["wind instrument, woodwind instrument", 13.21]], [["music", 37.18], ["wind instrument, woodwind instrument", 25.57], ["musical instrument", 9.72]], null, null, [["music", 45.12], ["theremin", 22.23], ["musical instrument", 10.59]], null, null, [["music", 34.05], ["clarinet", 27.0], ["wind instrument, woodwind instrument", 13.47]], null], "duration": [1.23, 0.59, 26.41, 1.73, 0.63, 0.9, 1.03, 2.91, 3.37, 10.22, 3.95, 3.26, 1.5, 1.24, 0.15, 0.02, 2.33, 9.24, 12.42, -0.45, 0.46, 15.38, 1.95, 1.53, 8.39, 1.43]} \ No newline at end of file diff --git a/annotations_filtered/gOJJm_cSRds_filtered.json b/annotations_filtered/gOJJm_cSRds_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ebacf7a5a49a7c1eb2a34879c10d67a59aeaf45d --- /dev/null +++ b/annotations_filtered/gOJJm_cSRds_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[52.0, 76.33], [77.0, 94.14], [96.0, 123.26], [124.0, 133.07], [135.0, 136.39], [137.0, 139.36], [140.0, 141.05], [147.0, 173.2], [176.0, 206.0]], "keep_status": [true, true, true, true, false, true, false, true, true], "silence_prob": [30.31, 30.42, 31.3, 32.76, 0.0, 41.03, 0.0, 30.66, 31.42], "audiomae_on_audioset": [[["sound effect", 22.47], ["reverberation", 10.37], ["echo", 9.59]], [["effects unit", 15.08], ["music", 13.99], ["noise", 12.02]], [["noise", 15.31], ["music", 13.03], ["sound effect", 11.1]], [["speech", 43.9], ["radio", 18.1], ["sidetone", 4.25]], null, [["sidetone", 50.92], ["music", 8.96], ["radio", 6.31]], null, [["music", 27.26], ["synthesizer", 14.73], ["effects unit", 8.13]], [["speech", 38.46], ["effects unit", 6.45], ["music", 5.6]]], "duration": [24.33, 17.14, 27.26, 9.07, 1.39, 2.36, 1.05, 26.2, 30.0]} \ No newline at end of file diff --git a/annotations_filtered/gOb8HH2oKcE_filtered.json b/annotations_filtered/gOb8HH2oKcE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e20d10cd68d0964d52f970af4ac5f99b76bc137e --- /dev/null +++ b/annotations_filtered/gOb8HH2oKcE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.55], [4.0, 4.9], [7.0, 8.99], [11.0, 12.11], [13.0, 13.41], [14.0, 14.55], [15.0, 16.07], [18.0, 21.83], [22.0, 26.37], [28.0, 28.88], [31.0, 33.35], [34.0, 35.75], [36.0, 40.44], [42.0, 43.97], [44.0, 46.79], [50.0, 54.85], [56.0, 58.67], [60.0, 62.21], [63.0, 64.66], [67.0, 69.48], [83.0, 93.82], [95.0, 96.03], [96.0, 96.43], [97.0, 99.17], [101.0, 103.92], [106.0, 107.38], [108.0, 109.93], [111.0, 112.58], [116.0, 118.47], [121.0, 124.36], [126.0, 127.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 99.48, 0.0, 99.97, 0.0, 99.95, 0.0, 87.74, 100.0, 99.62, 99.97, 0.0, 96.54, 100.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 100.0, 99.76, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.55, 0.9, 1.99, 1.11, 0.41, 0.55, 1.07, 3.83, 4.37, 0.88, 2.35, 1.75, 4.44, 1.97, 2.79, 4.85, 2.67, 2.21, 1.66, 2.48, 10.82, 1.03, 0.43, 2.17, 2.92, 1.38, 1.93, 1.58, 2.47, 3.36, 1.55]} \ No newline at end of file diff --git a/annotations_filtered/gOy7KDtN3mc_filtered.json b/annotations_filtered/gOy7KDtN3mc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c68378db1f8fca09f2a117b2894943ca96f9f217 --- /dev/null +++ b/annotations_filtered/gOy7KDtN3mc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 5.41], [7.0, 7.5], [10.0, 10.83], [13.0, 14.89], [16.0, 18.28], [19.0, 21.59], [23.0, 22.94], [24.0, 24.49], [27.0, 27.18], [33.0, 36.15], [38.0, 40.05], [43.0, 43.11], [47.0, 50.26], [51.0, 52.74], [53.0, 84.89]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [49.87, 0.0, 0.0, 0.0, 70.16, 87.19, 0.0, 0.0, 0.0, 60.79, 33.3, 0.0, 31.36, 0.0, 0.0], "audiomae_on_audioset": [[["music", 48.4], ["speech", 9.25], ["drum", 4.57]], null, null, null, null, null, null, null, null, null, [["music", 40.67], ["pulse", 7.45], ["mains hum", 5.53]], null, [["speech", 47.56], ["fart", 25.41], ["explosion", 4.47]], null, null], "duration": [4.41, 0.5, 0.83, 1.89, 2.28, 2.59, -0.06, 0.49, 0.18, 3.15, 2.05, 0.11, 3.26, 1.74, 31.89]} \ No newline at end of file diff --git a/annotations_filtered/gP2sCE166o4_filtered.json b/annotations_filtered/gP2sCE166o4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9272fc42663f130f2c7690ec4aec95111c6b3c79 --- /dev/null +++ b/annotations_filtered/gP2sCE166o4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.25], [4.0, 4.08], [5.0, 4.9], [8.0, 8.51], [9.0, 11.38], [12.0, 13.91], [16.0, 16.7], [18.0, 18.28], [20.0, 21.84], [24.0, 24.88], [26.0, 28.05], [29.0, 29.13], [30.0, 30.62]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 38.14, 0.0, 0.0, 0.0, 0.0, 0.0, 33.35, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 39.86], ["eruption", 10.46], ["vehicle", 7.01]], null, null, null, null, null, [["speech", 68.87], ["sidetone", 7.0], ["white noise", 3.08]], null, null], "duration": [0.25, 0.08, -0.1, 0.51, 2.38, 1.91, 0.7, 0.28, 1.84, 0.88, 2.05, 0.13, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/gP8_w1J5raY_filtered.json b/annotations_filtered/gP8_w1J5raY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc2f2695084fe7092237c157750b2507b542be9e --- /dev/null +++ b/annotations_filtered/gP8_w1J5raY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.62], [1.0, 0.73], [16.0, 17.42], [18.0, 19.33], [21.0, 21.86], [23.0, 24.88], [26.0, 27.57], [29.0, 29.78], [32.0, 32.02], [34.0, 35.23], [36.0, 36.39], [45.0, 45.3], [46.0, 46.85], [50.0, 51.41], [55.0, 55.54], [56.0, 57.75], [58.0, 59.22], [62.0, 62.36], [64.0, 64.74], [65.0, 64.91], [65.0, 67.85], [69.0, 70.02], [76.0, 76.18], [78.0, 78.78], [87.0, 89.28], [91.0, 94.53], [98.0, 97.9], [99.0, 100.41], [102.0, 102.27], [104.0, 106.44], [109.0, 109.32], [110.0, 110.84], [112.0, 111.97], [116.0, 116.33], [124.0, 126.47], [129.0, 129.63], [131.0, 131.57], [134.0, 135.95], [138.0, 138.87], [144.0, 144.42], [146.0, 147.38], [149.0, 150.53], [151.0, 151.63], [154.0, 155.75], [160.0, 174.36], [177.0, 177.47], [178.0, 178.63], [179.0, 179.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.2, 0.0, 0.0, 0.0, 63.31, 56.55, 0.0, 0.0, 0.0, 67.63, 0.0, 0.0, 0.0, 0.0, 48.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.16, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 46.47], ["speech", 15.13], ["synthesizer", 3.24]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 64.08], ["didgeridoo", 4.68], ["speech", 3.76]], null, null, null, null, null, null, null, null, null, [["music", 58.28], ["musical instrument", 4.73], ["didgeridoo", 4.49]], null, null, null], "duration": [0.62, -0.27, 1.42, 1.33, 0.86, 1.88, 1.57, 0.78, 0.02, 1.23, 0.39, 0.3, 0.85, 1.41, 0.54, 1.75, 1.22, 0.36, 0.74, -0.09, 2.85, 1.02, 0.18, 0.78, 2.28, 3.53, -0.1, 1.41, 0.27, 2.44, 0.32, 0.84, -0.03, 0.33, 2.47, 0.63, 0.57, 1.95, 0.87, 0.42, 1.38, 1.53, 0.63, 1.75, 14.36, 0.47, 0.63, 0.02]} \ No newline at end of file diff --git a/annotations_filtered/gPAI19a84KU_filtered.json b/annotations_filtered/gPAI19a84KU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0544fa8591782c6f6c265209c67a9f69ef973111 --- /dev/null +++ b/annotations_filtered/gPAI19a84KU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.03], [8.0, 8.88], [13.0, 16.66], [18.0, 32.7], [33.0, 33.84], [34.0, 34.99], [40.0, 42.08], [44.0, 48.44], [49.0, 52.52], [54.0, 75.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.99, 53.72, 0.0, 0.0, 98.1, 99.26, 95.51, 99.31], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [1.03, 0.88, 3.66, 14.7, 0.84, 0.99, 2.08, 4.44, 3.52, 21.07]} \ No newline at end of file diff --git a/annotations_filtered/gPJFxEvmHpQ_filtered.json b/annotations_filtered/gPJFxEvmHpQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02ae43f335342554fda7d7a3024ef5725a6180a4 --- /dev/null +++ b/annotations_filtered/gPJFxEvmHpQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[132.0, 135.62], [137.0, 138.03], [142.0, 142.23], [145.0, 146.25], [151.0, 160.84]], "keep_status": [true, false, false, false, true], "silence_prob": [42.84, 0.0, 0.0, 0.0, 39.88], "audiomae_on_audioset": [[["music", 26.6], ["synthesizer", 11.01], ["sine wave", 7.9]], null, null, null, [["music", 30.3], ["speech", 29.08], ["synthesizer", 10.39]]], "duration": [3.62, 1.03, 0.23, 1.25, 9.84]} \ No newline at end of file diff --git a/annotations_filtered/gP_GbzDWoY0_filtered.json b/annotations_filtered/gP_GbzDWoY0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b1746e8f00212c7e0c9bf764a45cdd0bb2423be7 --- /dev/null +++ b/annotations_filtered/gP_GbzDWoY0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.68], [9.0, 9.59], [10.0, 10.59], [11.0, 11.72], [13.0, 16.07], [20.0, 20.16], [23.0, 23.53], [25.0, 26.25], [28.0, 28.0], [34.0, 34.77], [39.0, 40.15], [72.0, 72.57], [94.0, 95.76], [99.0, 99.05], [100.0, 100.25], [104.0, 104.35], [115.0, 115.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.68, 0.59, 0.59, 0.72, 3.07, 0.16, 0.53, 1.25, 0.0, 0.77, 1.15, 0.57, 1.76, 0.05, 0.25, 0.35, 0.79]} \ No newline at end of file diff --git a/annotations_filtered/gPadm1Ql1Is_filtered.json b/annotations_filtered/gPadm1Ql1Is_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5876a4460277e846262839f59373824a9a1632e3 --- /dev/null +++ b/annotations_filtered/gPadm1Ql1Is_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.05], [4.0, 5.44], [7.0, 8.24], [11.0, 12.95], [14.0, 18.66], [24.0, 26.16], [28.0, 30.08], [32.0, 32.54], [36.0, 36.41], [42.0, 42.03], [46.0, 47.36], [50.0, 50.55], [53.0, 58.83], [60.0, 61.33], [64.0, 64.32], [64.0, 79.56], [81.0, 85.89], [89.0, 90.69], [92.0, 100.95], [103.0, 104.3], [106.0, 106.76], [116.0, 117.17], [120.0, 121.22], [122.0, 124.26], [125.0, 126.72], [130.0, 132.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [92.8, 0.0, 0.0, 0.0, 99.93, 99.65, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.96, 0.0, 0.0, 86.82, 37.1, 0.0, 32.99, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 94.66], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 37.13], ["mains hum", 23.64], ["music", 8.69]], null, [["speech", 44.71], ["animal", 21.0], ["clip-clop", 17.28]], null, null, null, null, null, null, null], "duration": [2.05, 1.44, 1.24, 1.95, 4.66, 2.16, 2.08, 0.54, 0.41, 0.03, 1.36, 0.55, 5.83, 1.33, 0.32, 15.56, 4.89, 1.69, 8.95, 1.3, 0.76, 1.17, 1.22, 2.26, 1.72, 2.33]} \ No newline at end of file diff --git a/annotations_filtered/gPv4C6gIdOo_filtered.json b/annotations_filtered/gPv4C6gIdOo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b873148ac60ec14f733d5f43aa37c5e7ed321e0 --- /dev/null +++ b/annotations_filtered/gPv4C6gIdOo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.27], [28.0, 31.75], [32.0, 33.91], [35.0, 36.73], [40.0, 42.38], [44.0, 45.67], [54.0, 54.45], [63.0, 63.49], [65.0, 66.58], [67.0, 68.07], [73.0, 73.35], [75.0, 75.1], [76.0, 76.74], [83.0, 83.46], [86.0, 86.7], [87.0, 88.26], [93.0, 93.41], [106.0, 106.61], [108.0, 109.09], [112.0, 114.15], [115.0, 118.37], [121.0, 121.53], [123.0, 122.98]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 39.63, 0.0, 0.0, 38.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.23, 36.75, 0.0, 0.0], "audiomae_on_audioset": [null, [["mains hum", 42.5], ["hum", 37.77], ["white noise", 2.38]], null, null, [["hum", 35.29], ["mains hum", 11.52], ["bee, wasp, etc.", 4.13]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 26.62], ["insect", 8.89], ["mains hum", 8.29]], [["speech", 21.18], ["hum", 15.64], ["sine wave", 15.13]], null, null], "duration": [0.27, 3.75, 1.91, 1.73, 2.38, 1.67, 0.45, 0.49, 1.58, 1.07, 0.35, 0.1, 0.74, 0.46, 0.7, 1.26, 0.41, 0.61, 1.09, 2.15, 3.37, 0.53, -0.02]} \ No newline at end of file diff --git a/annotations_filtered/gQ3YdU0WlPw_filtered.json b/annotations_filtered/gQ3YdU0WlPw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b7c225d2bb4da8e8cf18d88263a6d806af6ef90 --- /dev/null +++ b/annotations_filtered/gQ3YdU0WlPw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.8], [13.0, 19.28], [30.0, 33.74], [45.0, 44.91], [45.0, 46.43], [48.0, 49.2], [50.0, 52.05], [54.0, 69.47], [75.0, 86.41], [87.0, 87.96], [89.0, 90.15], [91.0, 93.24], [97.0, 98.63], [101.0, 101.66], [102.0, 103.5], [105.0, 106.24]], "keep_status": [false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 41.91, 34.56, 0.0, 0.0, 0.0, 81.0, 38.52, 67.0, 0.0, 0.0, 81.89, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 32.36], ["music", 21.77], ["hum", 6.31]], [["mains hum", 34.65], ["hum", 33.38], ["music", 15.9]], null, null, null, null, [["music", 30.67], ["theremin", 13.43], ["speech", 12.9]], null, null, null, null, null, null, null, null], "duration": [0.8, 6.28, 3.74, -0.09, 1.43, 1.2, 2.05, 15.47, 11.41, 0.96, 1.15, 2.24, 1.63, 0.66, 1.5, 1.24]} \ No newline at end of file diff --git a/annotations_filtered/gQ48-nl8wwc_filtered.json b/annotations_filtered/gQ48-nl8wwc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a872c78a25fc7072da5f930c59781d548eccf5b8 --- /dev/null +++ b/annotations_filtered/gQ48-nl8wwc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.05], [4.0, 12.63], [15.0, 22.23], [25.0, 60.51], [64.0, 66.87], [68.0, 68.17], [70.0, 70.88], [72.0, 75.0], [84.0, 84.94], [91.0, 92.37], [99.0, 99.25], [101.0, 114.64]], "keep_status": [false, false, true, false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 29.99, 29.95, 0.0, 48.19, 0.0, 0.0, 33.99, 0.0, 0.0, 0.0, 31.58], "audiomae_on_audioset": [null, [["music", 69.51], ["fart", 5.42], ["speech", 2.79]], [["music", 37.46], ["speech", 15.57], ["vehicle", 7.59]], null, [["hum", 25.17], ["music", 19.35], ["throbbing", 10.63]], null, null, [["whale vocalization", 24.62], ["speech", 16.99], ["hum", 5.7]], null, null, null, [["music", 72.48], ["speech", 4.37], ["synthesizer", 3.78]]], "duration": [1.05, 8.63, 7.23, 35.51, 2.87, 0.17, 0.88, 3.0, 0.94, 1.37, 0.25, 13.64]} \ No newline at end of file diff --git a/annotations_filtered/gQ5KDSBMFRU_filtered.json b/annotations_filtered/gQ5KDSBMFRU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..27c3c979771484ddca6f3b46f292e7e5c8f034ab --- /dev/null +++ b/annotations_filtered/gQ5KDSBMFRU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.8], [2.0, 2.49], [4.0, 5.19], [6.0, 12.83], [17.0, 18.2], [20.0, 20.93], [24.0, 26.13], [28.0, 29.56], [31.0, 33.47], [36.0, 36.46], [38.0, 41.22], [41.0, 41.91], [42.0, 42.8], [44.0, 44.81], [46.0, 49.22], [50.0, 50.63], [53.0, 53.65], [55.0, 54.95], [58.0, 60.54], [62.0, 62.82], [67.0, 68.94], [71.0, 72.77], [74.0, 77.04], [79.0, 79.12], [80.0, 80.99], [84.0, 85.21], [89.0, 90.39], [92.0, 92.85], [96.0, 96.23], [96.0, 100.41], [100.0, 103.06], [106.0, 106.73], [108.0, 110.96], [113.0, 115.05], [116.0, 119.82], [121.0, 127.52], [130.0, 131.25], [132.0, 133.15], [136.0, 136.66], [138.0, 140.22], [145.0, 146.2], [149.0, 151.24], [154.0, 154.68], [157.0, 159.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 96.04, 0.0, 0.0, 99.97, 0.0, 96.42, 0.0, 79.24, 0.0, 0.0, 0.0, 99.9, 0.0, 0.0, 0.0, 96.66, 0.0, 0.0, 0.0, 95.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.0, 99.26, 0.0, 99.94, 100.0, 86.82, 99.65, 0.0, 0.0, 0.0, 99.26, 0.0, 94.95, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.2, 0.49, 1.19, 6.83, 1.2, 0.93, 2.13, 1.56, 2.47, 0.46, 3.22, 0.91, 0.8, 0.81, 3.22, 0.63, 0.65, -0.05, 2.54, 0.82, 1.94, 1.77, 3.04, 0.12, 0.99, 1.21, 1.39, 0.85, 0.23, 4.41, 3.06, 0.73, 2.96, 2.05, 3.82, 6.52, 1.25, 1.15, 0.66, 2.22, 1.2, 2.24, 0.68, 2.73]} \ No newline at end of file diff --git a/annotations_filtered/gQATrdAXELg_filtered.json b/annotations_filtered/gQATrdAXELg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea760fb48498da72c699bf772ca317d016f9c046 --- /dev/null +++ b/annotations_filtered/gQATrdAXELg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.21], [1.0, 25.52], [27.0, 46.53], [47.0, 48.49], [50.0, 50.9], [54.0, 54.77], [60.0, 62.21], [63.0, 103.59], [104.0, 110.0], [115.0, 115.64], [116.0, 116.97], [118.0, 133.07], [135.0, 134.97], [137.0, 137.62], [142.0, 143.68], [145.0, 145.96], [146.0, 146.1], [147.0, 150.84], [153.0, 155.29]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 30.41, 30.04, 0.0, 0.0, 0.0, 42.48, 0.0, 59.15, 0.0, 0.0, 31.03, 0.0, 0.0, 0.0, 0.0, 0.0, 28.54, 36.91], "audiomae_on_audioset": [null, [["music", 54.36], ["speech", 14.99], ["hum", 4.69]], [["music", 48.24], ["hum", 15.78], ["mains hum", 10.68]], null, null, null, [["helicopter", 15.42], ["vehicle", 11.92], ["hum", 8.78]], null, null, null, null, [["music", 63.4], ["speech", 7.4], ["throbbing", 6.9]], null, null, null, null, null, [["music", 40.65], ["eruption", 13.57], ["explosion", 8.63]], [["music", 56.5], ["ambient music", 6.11], ["scary music", 4.11]]], "duration": [0.21, 24.52, 19.53, 1.49, 0.9, 0.77, 2.21, 40.59, 6.0, 0.64, 0.97, 15.07, -0.03, 0.62, 1.68, 0.96, 0.1, 3.84, 2.29]} \ No newline at end of file diff --git a/annotations_filtered/gQMtp2WxEA4_filtered.json b/annotations_filtered/gQMtp2WxEA4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe069e9fcdc8099d7f8e3397d47fdb78570aabe4 --- /dev/null +++ b/annotations_filtered/gQMtp2WxEA4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.26], [5.0, 5.1], [6.0, 7.74], [16.0, 15.75], [18.0, 19.53], [26.0, 26.43], [29.0, 29.62], [32.0, 32.68], [52.0, 56.89], [66.0, 66.78], [70.0, 70.66], [97.0, 98.1], [101.0, 104.7], [134.0, 134.99], [153.0, 159.07], [165.0, 169.94], [173.0, 177.35], [180.0, 179.91]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, true, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.81, 0.0, 0.0, 0.0, 46.97, 0.0, 42.6, 31.5, 30.95, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["grunt", 53.87], ["fart", 6.97], ["animal", 5.01]], null, null, null, [["speech", 11.33], ["music", 8.4], ["bleat", 7.48]], null, [["music", 16.68], ["speech", 12.94], ["didgeridoo", 12.29]], [["music", 79.12], ["didgeridoo", 4.25], ["musical instrument", 3.74]], [["music", 58.02], ["foghorn", 9.23], ["trombone", 8.39]], null], "duration": [0.26, 0.1, 1.74, -0.25, 1.53, 0.43, 0.62, 0.68, 4.89, 0.78, 0.66, 1.1, 3.7, 0.99, 6.07, 4.94, 4.35, -0.09]} \ No newline at end of file diff --git a/annotations_filtered/gQNFCRom7c0_filtered.json b/annotations_filtered/gQNFCRom7c0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ba7df57a7d1e7df69f26fea8f27a48fc1d5f467 --- /dev/null +++ b/annotations_filtered/gQNFCRom7c0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.99], [8.0, 7.92], [10.0, 14.4], [16.0, 16.21], [21.0, 22.42], [24.0, 26.65], [28.0, 31.11], [31.0, 41.52], [42.0, 41.55], [42.0, 41.59], [42.0, 41.62], [42.0, 45.28], [46.0, 45.94], [46.0, 49.54], [51.0, 51.46], [54.0, 55.0], [56.0, 58.26], [61.0, 68.18], [74.0, 75.88], [79.0, 78.87], [79.0, 78.95], [89.0, 90.86], [93.0, 92.8], [93.0, 93.43], [94.0, 96.85], [99.0, 101.83], [117.0, 118.23], [121.0, 124.23], [126.0, 125.74], [128.0, 128.92], [129.0, 131.73], [132.0, 133.51], [134.0, 135.19], [135.0, 142.89], [144.0, 145.12]], "keep_status": [false, false, true, false, false, true, true, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 42.04, 0.0, 0.0, 41.91, 37.57, 42.24, 0.0, 0.0, 0.0, 45.43, 0.0, 39.7, 0.0, 0.0, 37.99, 40.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.8, 49.31, 0.0, 40.97, 0.0, 0.0, 40.28, 0.0, 0.0, 39.4, 0.0], "audiomae_on_audioset": [null, null, [["music", 49.18], ["musical instrument", 7.22], ["guitar", 7.17]], null, null, [["music", 53.33], ["electric piano", 3.97], ["keyboard (musical)", 3.34]], [["music", 40.45], ["musical instrument", 9.35], ["plucked string instrument", 7.37]], [["music", 78.81], ["musical instrument", 6.79], ["keyboard (musical)", 2.11]], null, null, null, [["music", 52.15], ["speech", 9.91], ["keyboard (musical)", 5.56]], null, [["music", 37.13], ["harp", 6.75], ["pizzicato", 5.27]], null, null, [["music", 65.01], ["musical instrument", 7.08], ["plucked string instrument", 4.44]], [["music", 65.27], ["musical instrument", 5.53], ["double bass", 4.98]], null, null, null, null, null, null, [["music", 49.34], ["musical instrument", 15.84], ["piano", 5.44]], [["music", 72.97], ["didgeridoo", 8.22], ["musical instrument", 5.2]], null, [["music", 43.4], ["musical instrument", 19.46], ["piano", 15.99]], null, null, [["music", 49.95], ["musical instrument", 10.78], ["double bass", 7.67]], null, null, [["music", 50.78], ["musical instrument", 11.46], ["plucked string instrument", 7.21]], null], "duration": [1.99, -0.08, 4.4, 0.21, 1.42, 2.65, 3.11, 10.52, -0.45, -0.41, -0.38, 3.28, -0.06, 3.54, 0.46, 1.0, 2.26, 7.18, 1.88, -0.13, -0.05, 1.86, -0.2, 0.43, 2.85, 2.83, 1.23, 3.23, -0.26, 0.92, 2.73, 1.51, 1.19, 7.89, 1.12]} \ No newline at end of file diff --git a/annotations_filtered/gQO9bgOLhmg_filtered.json b/annotations_filtered/gQO9bgOLhmg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..806adc9577dd85bd1fe8bbc2f0fc1f09741cd290 --- /dev/null +++ b/annotations_filtered/gQO9bgOLhmg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.9], [6.0, 6.37], [9.0, 16.87], [22.0, 29.27], [31.0, 35.07], [36.0, 36.68], [38.0, 38.55], [39.0, 40.14], [42.0, 44.24], [51.0, 52.02], [53.0, 58.83], [61.0, 62.41], [64.0, 65.82], [67.0, 69.47], [72.0, 116.13], [117.0, 136.07], [138.0, 138.82], [143.0, 146.82], [148.0, 152.32]], "keep_status": [false, false, true, true, true, false, false, false, true, false, true, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 38.45, 31.12, 43.23, 0.0, 0.0, 0.0, 30.75, 0.0, 30.87, 0.0, 0.0, 34.53, 0.0, 30.75, 0.0, 57.48, 37.41], "audiomae_on_audioset": [null, null, [["speech", 26.89], ["hum", 21.71], ["mains hum", 17.79]], [["hum", 23.38], ["mains hum", 20.36], ["music", 16.6]], [["music", 38.03], ["hum", 11.93], ["throbbing", 11.49]], null, null, null, [["speech", 25.2], ["vehicle", 13.51], ["mains hum", 7.98]], null, [["music", 31.5], ["hum", 14.44], ["mains hum", 8.69]], null, null, [["music", 55.86], ["throbbing", 9.0], ["hum", 6.28]], null, [["music", 28.38], ["hum", 17.58], ["speech", 10.76]], null, null, [["hum", 30.31], ["speech", 18.34], ["mains hum", 14.1]]], "duration": [0.9, 0.37, 7.87, 7.27, 4.07, 0.68, 0.55, 1.14, 2.24, 1.02, 5.83, 1.41, 1.82, 2.47, 44.13, 19.07, 0.82, 3.82, 4.32]} \ No newline at end of file diff --git a/annotations_filtered/gQgdweybPwk_filtered.json b/annotations_filtered/gQgdweybPwk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c820bbc6371a85007b9a948bbb12577eb7db9fa9 --- /dev/null +++ b/annotations_filtered/gQgdweybPwk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.45], [5.0, 5.58], [6.0, 6.76], [8.0, 9.69], [16.0, 17.2], [22.0, 22.82], [23.0, 23.09], [23.0, 23.14], [23.0, 23.23], [23.0, 23.4], [23.0, 23.75], [24.0, 23.97], [26.0, 29.02], [31.0, 32.64], [33.0, 33.83], [43.0, 54.53], [56.0, 56.83], [62.0, 62.5], [66.0, 66.58], [94.0, 97.07], [100.0, 99.84], [105.0, 105.16], [109.0, 111.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.53, 0.0, 0.0, 40.04, 0.0, 0.0, 0.0, 37.32, 0.0, 0.0, 38.31], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 75.27], ["radio", 4.29], ["noise", 3.27]], null, null, [["speech", 85.92], ["animal", 3.02], ["electric shaver, electric razor", 2.42]], null, null, null, [["moo", 23.67], ["livestock, farm animals, working animals", 20.37], ["cattle, bovinae", 19.28]], null, null, [["music", 28.39], ["moo", 13.13], ["livestock, farm animals, working animals", 11.52]]], "duration": [0.45, 0.58, 0.76, 1.69, 1.2, 0.82, 0.09, 0.14, 0.23, 0.4, 0.75, -0.03, 3.02, 1.64, 0.83, 11.53, 0.83, 0.5, 0.58, 3.07, -0.16, 0.16, 2.45]} \ No newline at end of file diff --git a/annotations_filtered/gQubL9r0qAQ_filtered.json b/annotations_filtered/gQubL9r0qAQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9eba92c5ca3ccaa0474c5a3c580604cf773f79d7 --- /dev/null +++ b/annotations_filtered/gQubL9r0qAQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.45], [5.0, 9.95], [11.0, 12.01], [14.0, 19.48], [21.0, 23.87], [25.0, 32.73], [33.0, 39.56], [40.0, 41.39], [43.0, 43.12], [45.0, 46.92], [47.0, 50.67], [51.0, 54.57], [55.0, 57.5], [58.0, 81.33], [82.0, 84.35], [86.0, 93.39], [95.0, 97.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 68.93, 0.0, 58.55, 67.76, 62.89, 48.91, 0.0, 0.0, 0.0, 61.97, 50.51, 46.02, 69.47, 63.53, 65.79, 73.51], "audiomae_on_audioset": [null, null, null, null, null, null, [["sidetone", 92.24], ["hum", 1.51], ["sine wave", 1.51]], null, null, null, null, null, [["sidetone", 49.2], ["speech", 28.11], ["hum", 7.55]], null, null, null, null], "duration": [1.45, 4.95, 1.01, 5.48, 2.87, 7.73, 6.56, 1.39, 0.12, 1.92, 3.67, 3.57, 2.5, 23.33, 2.35, 7.39, 2.9]} \ No newline at end of file diff --git a/annotations_filtered/gQwpd1247J8_filtered.json b/annotations_filtered/gQwpd1247J8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b9dc4743f6149ad534f173f9dfee55928f5e7b8b --- /dev/null +++ b/annotations_filtered/gQwpd1247J8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.77], [11.0, 12.07], [12.0, 12.9], [19.0, 19.13], [25.0, 33.25], [35.0, 35.06], [36.0, 37.25], [41.0, 41.74], [42.0, 42.72], [44.0, 73.36], [74.0, 74.04], [76.0, 83.37], [86.0, 95.44], [99.0, 102.84], [103.0, 106.84], [107.0, 114.25], [115.0, 130.18], [131.0, 130.94]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 37.37, 0.0, 0.0, 0.0, 0.0, 33.31, 0.0, 35.8, 34.89, 100.0, 100.0, 99.44, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 39.4], ["moo", 28.7], ["cattle, bovinae", 14.5]], null, null, null, null, [["music", 41.03], ["speech", 13.76], ["fly, housefly", 8.2]], null, [["music", 28.96], ["speech", 25.64], ["foghorn", 4.66]], [["music", 42.23], ["speech", 17.87], ["quack", 9.78]], null, null, null, null, null], "duration": [0.77, 1.07, 0.9, 0.13, 8.25, 0.06, 1.25, 0.74, 0.72, 29.36, 0.04, 7.37, 9.44, 3.84, 3.84, 7.25, 15.18, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/gRBOrpdfsiM_filtered.json b/annotations_filtered/gRBOrpdfsiM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe8ac76c5a75691fdbf275690fcbd91743639952 --- /dev/null +++ b/annotations_filtered/gRBOrpdfsiM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.58], [16.0, 30.77], [32.0, 34.5], [35.0, 42.08], [43.0, 47.22], [53.0, 53.65], [55.0, 55.48], [56.0, 58.75], [62.0, 63.14], [64.0, 64.91], [69.0, 68.88], [70.0, 70.83], [77.0, 78.56], [79.0, 79.05], [80.0, 82.97], [85.0, 86.8], [88.0, 89.73], [90.0, 94.58], [96.0, 97.65], [98.0, 98.63], [99.0, 101.24]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.79, 36.06, 46.22, 40.06, 56.1, 0.0, 0.0, 66.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.64, 0.0, 0.0, 97.83, 0.0, 0.0, 94.95], "audiomae_on_audioset": [[["speech", 65.33], ["music", 12.2], ["boing", 10.9]], [["mains hum", 26.31], ["hum", 24.58], ["music", 17.38]], [["music", 36.09], ["throbbing", 12.77], ["hum", 7.72]], [["shatter", 32.06], ["music", 28.51], ["speech", 26.34]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.58, 14.77, 2.5, 7.08, 4.22, 0.65, 0.48, 2.75, 1.14, 0.91, -0.12, 0.83, 1.56, 0.05, 2.97, 1.8, 1.73, 4.58, 1.65, 0.63, 2.24]} \ No newline at end of file diff --git a/annotations_filtered/gRLpvojaVBM_filtered.json b/annotations_filtered/gRLpvojaVBM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1ce43928198fc05ccc8b744f9e58bbc45edd7d41 --- /dev/null +++ b/annotations_filtered/gRLpvojaVBM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.21], [7.0, 7.97], [10.0, 12.09], [14.0, 16.21], [23.0, 23.38], [25.0, 25.62], [30.0, 31.92], [34.0, 33.69], [36.0, 36.36], [37.0, 54.82], [58.0, 58.65], [60.0, 62.14], [65.0, 77.79], [81.0, 81.46], [83.0, 83.29], [85.0, 85.13], [86.0, 92.94], [93.0, 98.86], [99.0, 98.9], [100.0, 100.75], [101.0, 114.51], [118.0, 119.6], [120.0, 120.46], [121.0, 123.13], [124.0, 124.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 99.88, 0.0, 99.78, 99.68, 0.0, 0.0, 0.0, 99.97, 54.63, 0.0, 0.0, 44.69, 0.0, 0.0, 96.04, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 48.72], ["speech", 15.13], ["boing", 5.33]], null, null, null, null], "duration": [0.21, 0.97, 2.09, 2.21, 0.38, 0.62, 1.92, -0.31, 0.36, 17.82, 0.65, 2.14, 12.79, 0.46, 0.29, 0.13, 6.94, 5.86, -0.1, 0.75, 13.51, 1.6, 0.46, 2.13, 0.07]} \ No newline at end of file diff --git a/annotations_filtered/gRNkQRhMUiE_filtered.json b/annotations_filtered/gRNkQRhMUiE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c2c190f8f4fa72164224515f267c3b637256503 --- /dev/null +++ b/annotations_filtered/gRNkQRhMUiE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.37], [8.0, 12.26], [14.0, 16.77], [18.0, 20.06], [21.0, 22.15], [22.0, 24.83], [27.0, 27.72], [28.0, 29.07], [30.0, 32.58], [36.0, 38.7], [41.0, 42.16], [43.0, 43.9], [46.0, 46.41], [49.0, 50.04], [50.0, 52.03], [54.0, 55.02], [55.0, 56.61], [62.0, 64.22], [66.0, 66.02], [69.0, 70.82], [73.0, 75.61], [76.0, 79.27], [80.0, 88.91]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, true, false, false, true, true, true], "silence_prob": [63.31, 58.72, 60.6, 64.07, 0.0, 42.91, 0.0, 0.0, 79.94, 84.62, 0.0, 0.0, 0.0, 0.0, 47.94, 0.0, 0.0, 42.6, 0.0, 0.0, 34.47, 35.1, 31.03], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 31.54], ["hum", 11.63], ["mains hum", 9.73]], null, null, null, null, null, null, null, null, [["speech", 29.29], ["chirp tone", 11.09], ["music", 9.09]], null, null, [["music", 45.93], ["theremin", 6.26], ["musical instrument", 5.7]], null, null, [["music", 36.38], ["synthesizer", 18.23], ["musical instrument", 7.82]], [["music", 25.59], ["mains hum", 20.05], ["speech", 17.11]], [["music", 50.22], ["cello", 7.94], ["foghorn", 7.9]]], "duration": [2.37, 4.26, 2.77, 2.06, 1.15, 2.83, 0.72, 1.07, 2.58, 2.7, 1.16, 0.9, 0.41, 1.04, 2.03, 1.02, 1.61, 2.22, 0.02, 1.82, 2.61, 3.27, 8.91]} \ No newline at end of file diff --git a/annotations_filtered/gRP3sdjszlQ_filtered.json b/annotations_filtered/gRP3sdjszlQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..360380962c4eed01698851764b80421759784a3f --- /dev/null +++ b/annotations_filtered/gRP3sdjszlQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.87], [22.0, 27.62], [28.0, 27.8], [28.0, 34.28], [44.0, 47.19], [50.0, 50.14], [52.0, 53.0], [54.0, 61.99], [71.0, 72.12], [73.0, 75.74], [78.0, 79.2], [83.0, 84.72], [87.0, 91.79], [100.0, 104.87], [110.0, 114.59], [119.0, 120.36], [128.0, 136.04], [138.0, 143.33], [145.0, 146.97], [147.0, 151.38]], "keep_status": [true, false, false, true, true, false, false, true, false, false, false, false, true, true, true, false, true, true, false, true], "silence_prob": [40.62, 34.04, 0.0, 35.27, 32.97, 0.0, 0.0, 30.12, 0.0, 33.3, 0.0, 0.0, 31.55, 30.49, 32.43, 0.0, 31.49, 30.26, 0.0, 33.19], "audiomae_on_audioset": [[["music", 48.35], ["speech", 5.05], ["boing", 3.22]], [["music", 52.9], ["speech", 19.22], ["thunk", 2.68]], null, [["music", 43.69], ["thunk", 8.05], ["sound effect", 7.73]], [["music", 15.56], ["speech", 12.49], ["boing", 9.37]], null, null, [["fly, housefly", 20.69], ["music", 15.85], ["mosquito", 11.35]], null, [["speech", 36.68], ["music", 31.75], ["effects unit", 4.77]], null, null, [["livestock, farm animals, working animals", 17.46], ["cattle, bovinae", 15.42], ["mosquito", 10.14]], [["music", 40.7], ["boing", 7.72], ["cacophony", 6.16]], [["music", 25.38], ["speech", 11.84], ["musical instrument", 3.14]], null, [["music", 24.6], ["speech", 18.53], ["mosquito", 12.27]], [["music", 33.13], ["throbbing", 5.7], ["fart", 4.53]], null, [["music", 57.19], ["musical instrument", 8.15], ["synthesizer", 3.2]]], "duration": [2.87, 5.62, -0.2, 6.28, 3.19, 0.14, 1.0, 7.99, 1.12, 2.74, 1.2, 1.72, 4.79, 4.87, 4.59, 1.36, 8.04, 5.33, 1.97, 4.38]} \ No newline at end of file diff --git a/annotations_filtered/gRadASOF2m0_filtered.json b/annotations_filtered/gRadASOF2m0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e055617c93a3b439d7df4e04f153727628e76b33 --- /dev/null +++ b/annotations_filtered/gRadASOF2m0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[43.0, 52.83], [53.0, 52.86], [56.0, 59.17], [66.0, 65.79], [67.0, 67.88], [68.0, 69.36], [75.0, 75.64], [80.0, 80.0], [80.0, 80.49], [81.0, 81.77], [83.0, 84.32], [89.0, 88.87], [95.0, 95.55], [103.0, 104.45], [105.0, 106.66]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [34.37, 0.0, 66.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 62.28], ["speech", 5.06], ["musical instrument", 1.67]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [9.83, -0.14, 3.17, -0.21, 0.88, 1.36, 0.64, 0.0, 0.49, 0.77, 1.32, -0.13, 0.55, 1.45, 1.66]} \ No newline at end of file diff --git a/annotations_filtered/gRxu0ooBrPE_filtered.json b/annotations_filtered/gRxu0ooBrPE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7504b1134ff29eeab613ddfb06f1e37c18754590 --- /dev/null +++ b/annotations_filtered/gRxu0ooBrPE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 11.55], [12.0, 15.8], [18.0, 19.8], [21.0, 22.52], [24.0, 25.79], [27.0, 29.32], [30.0, 31.83], [33.0, 35.65], [38.0, 39.65], [43.0, 45.12], [47.0, 49.0], [52.0, 52.71], [54.0, 55.04], [58.0, 59.59], [63.0, 64.59], [65.0, 68.0], [69.0, 70.71], [72.0, 74.63], [76.0, 78.21], [81.0, 81.33], [83.0, 84.94], [85.0, 87.15], [88.0, 91.3], [93.0, 94.91], [96.0, 99.39], [102.0, 106.0], [107.0, 110.56], [112.0, 114.76], [116.0, 120.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 96.77, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 98.27, 0.0, 100.0, 100.0, 0.0, 0.0, 100.0, 100.0, 0.0, 100.0, 100.0, 100.0, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.55, 3.8, 1.8, 1.52, 1.79, 2.32, 1.83, 2.65, 1.65, 2.12, 2.0, 0.71, 1.04, 1.59, 1.59, 3.0, 1.71, 2.63, 2.21, 0.33, 1.94, 2.15, 3.3, 1.91, 3.39, 4.0, 3.56, 2.76, 4.38]} \ No newline at end of file diff --git a/annotations_filtered/gRyEkrwnyaI_filtered.json b/annotations_filtered/gRyEkrwnyaI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..47fab7fd6bff0f37428ed6fff66de60b6488e3f3 --- /dev/null +++ b/annotations_filtered/gRyEkrwnyaI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.88], [9.0, 9.31], [12.0, 12.68], [14.0, 14.07], [15.0, 15.43], [17.0, 17.15], [22.0, 24.14], [26.0, 25.95], [33.0, 33.91], [36.0, 37.0], [42.0, 42.52], [44.0, 44.0], [58.0, 63.05], [64.0, 64.94], [72.0, 72.32], [73.0, 73.6], [78.0, 79.81], [81.0, 87.69], [90.0, 90.9], [95.0, 99.05], [103.0, 105.22], [109.0, 112.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.34, 0.0, 0.0, 0.0, 0.0, 0.0, 32.46, 0.0, 0.0, 0.0, 0.0, 51.39, 0.0, 33.28, 32.06, 32.11], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 73.68], ["throbbing", 5.19], ["scary music", 2.57]], null, null, null, null, null, [["speech", 58.88], ["music", 12.48], ["whale vocalization", 2.8]], null, null, null, null, null, null, [["music", 36.26], ["theremin", 32.07], ["didgeridoo", 3.6]], [["music", 50.72], ["speech", 4.61], ["boing", 2.71]], [["music", 58.47], ["cacophony", 3.44], ["synthesizer", 2.02]]], "duration": [0.88, 0.31, 0.68, 0.07, 0.43, 0.15, 2.14, -0.05, 0.91, 1.0, 0.52, 0.0, 5.05, 0.94, 0.32, 0.6, 1.81, 6.69, 0.9, 4.05, 2.22, 3.67]} \ No newline at end of file diff --git a/annotations_filtered/gRzjSsXw9PU_filtered.json b/annotations_filtered/gRzjSsXw9PU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..493c233464158422e563ae17bee4ed7395849859 --- /dev/null +++ b/annotations_filtered/gRzjSsXw9PU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.93], [10.0, 15.25], [21.0, 25.14], [26.0, 27.11], [28.0, 29.17], [32.0, 37.77], [38.0, 38.72], [40.0, 40.71], [42.0, 42.2], [43.0, 51.49], [56.0, 57.18], [57.0, 57.59], [58.0, 60.67], [62.0, 63.9], [67.0, 72.05], [75.0, 76.49], [79.0, 79.34], [80.0, 79.68], [80.0, 83.86], [84.0, 89.11], [93.0, 93.73], [97.0, 96.84], [101.0, 108.14], [113.0, 130.62]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 56.33, 42.81, 0.0, 0.0, 65.44, 0.0, 0.0, 0.0, 68.54, 0.0, 0.0, 80.29, 0.0, 97.11, 0.0, 0.0, 0.0, 58.98, 36.31, 0.0, 0.0, 31.01, 31.75], "audiomae_on_audioset": [null, null, [["music", 23.21], ["noise", 18.34], ["hum", 6.84]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 56.16], ["speech", 22.35], ["fart", 9.0]], null, null, [["boing", 14.29], ["animal", 14.05], ["speech", 11.95]], [["boing", 16.2], ["whack, thwack", 14.41], ["speech", 11.69]]], "duration": [0.93, 5.25, 4.14, 1.11, 1.17, 5.77, 0.72, 0.71, 0.2, 8.49, 1.18, 0.59, 2.67, 1.9, 5.05, 1.49, 0.34, -0.32, 3.86, 5.11, 0.73, -0.16, 7.14, 17.62]} \ No newline at end of file diff --git a/annotations_filtered/gS56O-aHEMs_filtered.json b/annotations_filtered/gS56O-aHEMs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..36c669f20dbb91f8e25a96d8997157870ed20843 --- /dev/null +++ b/annotations_filtered/gS56O-aHEMs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 23.95], [30.0, 35.13], [37.0, 51.06], [54.0, 60.83], [62.0, 64.62], [65.0, 87.79], [89.0, 89.45], [91.0, 91.59]], "keep_status": [true, true, true, true, true, true, false, false], "silence_prob": [46.68, 30.32, 42.55, 32.04, 35.3, 32.03, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 47.4], ["sonar", 9.94], ["sine wave", 7.33]], [["music", 39.67], ["hum", 8.22], ["synthesizer", 7.12]], [["hum", 32.36], ["music", 17.27], ["sonar", 15.2]], [["hum", 34.09], ["mains hum", 21.3], ["explosion", 7.52]], [["speech", 38.29], ["music", 8.08], ["whale vocalization", 6.12]], [["speech", 49.1], ["animal", 10.87], ["vehicle", 4.68]], null, null], "duration": [18.95, 5.13, 14.06, 6.83, 2.62, 22.79, 0.45, 0.59]} \ No newline at end of file diff --git a/annotations_filtered/gS6ibQuZIS8_filtered.json b/annotations_filtered/gS6ibQuZIS8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f2673a9e770f66e17780fa918b1e2dd37ab68744 --- /dev/null +++ b/annotations_filtered/gS6ibQuZIS8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[45.0, 47.9], [49.0, 56.2], [59.0, 82.39]], "keep_status": [false, false, true], "silence_prob": [44.01, 95.37, 36.48], "audiomae_on_audioset": [[["music", 50.47], ["whale vocalization", 15.98], ["ambient music", 3.81]], null, [["music", 29.94], ["whale vocalization", 10.88], ["theremin", 10.36]]], "duration": [2.9, 7.2, 23.39]} \ No newline at end of file diff --git a/annotations_filtered/gSG9bZu1NtM_filtered.json b/annotations_filtered/gSG9bZu1NtM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e5c265f3bd61dd6785c07ea1ee562dd48bab5f31 --- /dev/null +++ b/annotations_filtered/gSG9bZu1NtM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.64], [4.0, 7.33], [9.0, 13.68], [20.0, 20.14], [23.0, 23.92], [25.0, 27.5], [29.0, 57.89], [59.0, 60.59], [66.0, 67.09], [68.0, 68.4], [70.0, 70.29], [71.0, 71.56], [72.0, 81.23], [83.0, 84.28], [86.0, 87.99], [90.0, 92.18], [96.0, 103.81], [106.0, 106.66], [110.0, 114.78], [118.0, 118.12], [122.0, 124.16], [131.0, 130.94], [133.0, 136.43], [137.0, 137.83], [140.0, 146.67], [150.0, 161.0], [164.0, 178.19]], "keep_status": [false, false, false, false, false, true, true, false, false, false, false, false, true, false, false, false, true, false, true, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 52.74, 51.6, 0.0, 0.0, 39.74, 33.99, 0.0, 0.0, 0.0, 0.0, 0.0, 31.36, 0.0, 0.0, 86.45, 31.63, 0.0, 34.67, 0.0, 35.51, 0.0, 33.19, 0.0, 31.96, 33.89, 32.52], "audiomae_on_audioset": [null, null, null, null, null, [["music", 46.8], ["musical instrument", 11.56], ["foghorn", 7.42]], [["whale vocalization", 25.95], ["speech", 23.25], ["noise", 13.49]], null, null, null, null, null, [["music", 48.02], ["speech", 17.33], ["thump, thud", 4.59]], null, null, null, [["music", 39.13], ["mains hum", 7.31], ["hum", 6.78]], null, [["music", 29.04], ["throbbing", 20.97], ["hum", 12.36]], null, [["music", 71.75], ["throbbing", 7.38], ["hum", 3.07]], null, [["music", 38.91], ["hum", 8.45], ["throbbing", 7.97]], null, [["music", 56.02], ["hum", 7.41], ["throbbing", 5.61]], [["hum", 37.85], ["throbbing", 28.02], ["music", 18.74]], [["hum", 46.71], ["music", 19.05], ["mains hum", 12.91]]], "duration": [0.64, 3.33, 4.68, 0.14, 0.92, 2.5, 28.89, 1.59, 1.09, 0.4, 0.29, 0.56, 9.23, 1.28, 1.99, 2.18, 7.81, 0.66, 4.78, 0.12, 2.16, -0.06, 3.43, 0.83, 6.67, 11.0, 14.19]} \ No newline at end of file diff --git a/annotations_filtered/gSZ82TOHWc0_filtered.json b/annotations_filtered/gSZ82TOHWc0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e6ef2889234d47070c29bad698536a98385b3668 --- /dev/null +++ b/annotations_filtered/gSZ82TOHWc0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.61], [13.0, 13.83], [21.0, 21.64], [45.0, 45.86], [46.0, 46.47], [48.0, 48.76], [49.0, 49.71], [50.0, 50.38], [51.0, 51.63], [55.0, 56.93], [78.0, 78.63], [80.0, 80.0], [85.0, 86.54], [90.0, 91.59], [99.0, 100.7], [112.0, 112.43], [113.0, 114.62], [115.0, 120.07], [121.0, 125.22], [127.0, 128.58], [130.0, 130.27], [133.0, 136.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.53, 79.41, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 36.62], ["music", 16.04], ["fart", 6.58]], null, null, null, null], "duration": [1.61, 0.83, 0.64, 0.86, 0.47, 0.76, 0.71, 0.38, 0.63, 1.93, 0.63, 0.0, 1.54, 1.59, 1.7, 0.43, 1.62, 5.07, 4.22, 1.58, 0.27, 3.53]} \ No newline at end of file diff --git a/annotations_filtered/gT7MQhe8gRE_filtered.json b/annotations_filtered/gT7MQhe8gRE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec24fae43ef41e48f583056adc6a2ef3a8640dc9 --- /dev/null +++ b/annotations_filtered/gT7MQhe8gRE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 11.97], [12.0, 62.8], [65.0, 68.55], [70.0, 84.94], [92.0, 92.16], [93.0, 94.09], [99.0, 99.32], [100.0, 101.51], [104.0, 104.75], [106.0, 106.52], [107.0, 109.56], [111.0, 111.87], [113.0, 113.75], [117.0, 133.62], [134.0, 136.48], [139.0, 141.29], [142.0, 161.15]], "keep_status": [false, false, true, true, false, false, false, false, false, false, true, false, false, true, false, false, true], "silence_prob": [46.68, 0.0, 39.91, 46.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.65, 0.0, 0.0, 31.09, 30.66, 29.88, 34.63], "audiomae_on_audioset": [[["speech", 73.26], ["music", 8.1], ["hum", 3.71]], null, [["music", 34.18], ["speech", 29.32], ["didgeridoo", 6.32]], [["music", 40.27], ["buzz", 6.66], ["male singing", 5.74]], null, null, null, null, null, null, [["music", 60.03], ["synthesizer", 2.82], ["singing", 2.74]], null, null, [["music", 51.69], ["cattle, bovinae", 8.72], ["moo", 7.05]], [["music", 38.19], ["didgeridoo", 35.59], ["synthesizer", 3.94]], [["moo", 42.55], ["cattle, bovinae", 33.51], ["livestock, farm animals, working animals", 13.39]], [["fly, housefly", 23.4], ["mosquito", 13.17], ["hum", 12.57]]], "duration": [8.97, 50.8, 3.55, 14.94, 0.16, 1.09, 0.32, 1.51, 0.75, 0.52, 2.56, 0.87, 0.75, 16.62, 2.48, 2.29, 19.15]} \ No newline at end of file diff --git a/annotations_filtered/gTAMKrPh1AE_filtered.json b/annotations_filtered/gTAMKrPh1AE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b7d1837c24ecab67cb86cdcbc9ce4789b17fe03b --- /dev/null +++ b/annotations_filtered/gTAMKrPh1AE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.81], [14.0, 18.3], [20.0, 21.29], [27.0, 28.8], [33.0, 37.66], [38.0, 41.81], [46.0, 46.58], [49.0, 49.86], [54.0, 62.5], [64.0, 65.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 50.06, 0.0, 0.0, 99.78, 99.4, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [1.81, 4.3, 1.29, 1.8, 4.66, 3.81, 0.58, 0.86, 8.5, 1.04]} \ No newline at end of file diff --git a/annotations_filtered/gTKpKBzd7jg_filtered.json b/annotations_filtered/gTKpKBzd7jg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..67b617af03180357a61d3f786039abec4596607b --- /dev/null +++ b/annotations_filtered/gTKpKBzd7jg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.53], [24.0, 24.34], [26.0, 26.33], [30.0, 30.35], [33.0, 32.78], [38.0, 41.03], [41.0, 60.07], [63.0, 69.7], [71.0, 71.66], [73.0, 73.43], [74.0, 74.6], [76.0, 77.8], [79.0, 79.93], [81.0, 86.51], [89.0, 89.63], [92.0, 92.38], [93.0, 93.7], [97.0, 97.93], [103.0, 104.97], [108.0, 110.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 88.1, 37.49, 61.87, 0.0, 0.0, 0.0, 0.0, 0.0, 96.42, 0.0, 0.0, 0.0, 0.0, 0.0, 98.93], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 80.63], ["didgeridoo", 6.62], ["theremin", 4.13]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.53, 0.34, 0.33, 0.35, -0.22, 3.03, 19.07, 6.7, 0.66, 0.43, 0.6, 1.8, 0.93, 5.51, 0.63, 0.38, 0.7, 0.93, 1.97, 2.0]} \ No newline at end of file diff --git a/annotations_filtered/gTLqDBbrmPM_filtered.json b/annotations_filtered/gTLqDBbrmPM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cbc9cdf68e19c485e81e2baefc77641a9be73861 --- /dev/null +++ b/annotations_filtered/gTLqDBbrmPM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [5.0, 21.74], [23.0, 27.48], [29.0, 29.79], [34.0, 35.8]], "keep_status": [false, true, false, false, false], "silence_prob": [0.0, 31.67, 61.87, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 43.95], ["explosion", 7.5], ["livestock, farm animals, working animals", 5.59]], null, null, null], "duration": [0.5, 16.74, 4.48, 0.79, 1.8]} \ No newline at end of file diff --git a/annotations_filtered/gTVoFCP1BLg_filtered.json b/annotations_filtered/gTVoFCP1BLg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..abf913347425359b71b7cc7f431dbf8ed976a10c --- /dev/null +++ b/annotations_filtered/gTVoFCP1BLg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.83], [15.0, 25.22], [30.0, 82.75], [85.0, 85.18]], "keep_status": [false, true, false, false], "silence_prob": [0.0, 32.53, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 42.29], ["musical instrument", 10.46], ["brass instrument", 5.87]], null, null], "duration": [0.83, 10.22, 52.75, 0.18]} \ No newline at end of file diff --git a/annotations_filtered/gTWo9oLJOWk_filtered.json b/annotations_filtered/gTWo9oLJOWk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9137de4cdbdcb0c55eb894c136a0ab623dfe65bb --- /dev/null +++ b/annotations_filtered/gTWo9oLJOWk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 72.57], [73.0, 73.45], [74.0, 146.72], [150.0, 151.12], [155.0, 155.29], [157.0, 157.6], [158.0, 159.71]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [43.57, 0.45, 72.72, 1.12, 0.29, 0.6, 1.71]} \ No newline at end of file diff --git a/annotations_filtered/gTakZ13l8xY_filtered.json b/annotations_filtered/gTakZ13l8xY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9bf2c089522e7bf118d64db09dc97cb3222dc947 --- /dev/null +++ b/annotations_filtered/gTakZ13l8xY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.47], [4.0, 4.23], [14.0, 14.89], [18.0, 18.57], [20.0, 20.38], [25.0, 25.74], [28.0, 28.41], [38.0, 38.79], [46.0, 46.3], [48.0, 48.68], [52.0, 54.65], [56.0, 56.37], [59.0, 60.24], [66.0, 67.56], [72.0, 73.18], [75.0, 75.2], [76.0, 77.35], [83.0, 83.13], [84.0, 86.37], [88.0, 88.7], [93.0, 92.8], [100.0, 99.98], [102.0, 102.79], [107.0, 107.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.08, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 17.05], ["throbbing", 12.74], ["speech", 7.43]], null, null, null, null, null, null, null, [["music", 35.8], ["whale vocalization", 9.83], ["hum", 6.49]], null, null, null, null, null], "duration": [0.47, 0.23, 0.89, 0.57, 0.38, 0.74, 0.41, 0.79, 0.3, 0.68, 2.65, 0.37, 1.24, 1.56, 1.18, 0.2, 1.35, 0.13, 2.37, 0.7, -0.2, -0.02, 0.79, 0.69]} \ No newline at end of file diff --git a/annotations_filtered/gTgm44dkSCY_filtered.json b/annotations_filtered/gTgm44dkSCY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d45a1b416f5ad8953a22e981c865314e2c70cd33 --- /dev/null +++ b/annotations_filtered/gTgm44dkSCY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.83], [4.0, 13.19], [15.0, 15.67], [19.0, 20.73], [22.0, 22.65], [23.0, 25.14], [34.0, 40.74], [43.0, 45.44], [46.0, 50.92], [52.0, 53.77], [56.0, 58.23], [60.0, 60.57], [62.0, 64.35], [66.0, 75.59], [76.0, 78.97], [80.0, 84.06], [86.0, 89.99], [95.0, 96.84], [97.0, 100.99], [109.0, 114.71], [115.0, 132.87], [134.0, 139.51], [142.0, 150.55], [152.0, 153.5], [155.0, 157.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.97, 0.0, 0.0, 0.0, 99.99, 99.97, 97.33, 91.64, 0.0, 100.0, 0.0, 99.92, 100.0, 99.85, 99.98, 100.0, 0.0, 92.31, 100.0, 99.93, 96.54, 100.0, 0.0, 98.01], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.83, 9.19, 0.67, 1.73, 0.65, 2.14, 6.74, 2.44, 4.92, 1.77, 2.23, 0.57, 2.35, 9.59, 2.97, 4.06, 3.99, 1.84, 3.99, 5.71, 17.87, 5.51, 8.55, 1.5, 2.59]} \ No newline at end of file diff --git a/annotations_filtered/gTt8yvw4MJE_filtered.json b/annotations_filtered/gTt8yvw4MJE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3bdab74c8d1af68307b989fca7ce1e88b32d7fab --- /dev/null +++ b/annotations_filtered/gTt8yvw4MJE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.32], [13.0, 16.04], [18.0, 20.85], [23.0, 23.8], [29.0, 29.1], [41.0, 41.28], [47.0, 49.44], [50.0, 49.62], [50.0, 51.39], [53.0, 55.83], [65.0, 65.45], [76.0, 77.09], [83.0, 82.97], [86.0, 88.03], [89.0, 91.84], [94.0, 95.44], [105.0, 106.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 100.0, 39.34, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 38.67, 0.0, 0.0, 0.0, 44.09, 44.23, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["stomach rumble", 30.71], ["speech", 28.24], ["crack", 12.79]], null, null, null, null, null, null, [["hum", 28.2], ["music", 26.8], ["throbbing", 16.47]], null, null, null, [["music", 37.17], ["throbbing", 19.28], ["hum", 15.5]], [["music", 29.17], ["hum", 19.18], ["speech", 7.7]], null, null], "duration": [1.32, 3.04, 2.85, 0.8, 0.1, 0.28, 2.44, -0.38, 1.39, 2.83, 0.45, 1.09, -0.03, 2.03, 2.84, 1.44, 1.15]} \ No newline at end of file diff --git a/annotations_filtered/gU886wmXhQo_filtered.json b/annotations_filtered/gU886wmXhQo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..577051a1e717400bb81775de2bb9efbbb0249b1d --- /dev/null +++ b/annotations_filtered/gU886wmXhQo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 34.99], [35.0, 36.32], [58.0, 58.7]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [0.99, 1.32, 0.7]} \ No newline at end of file diff --git a/annotations_filtered/gUKbFeHjYX8_filtered.json b/annotations_filtered/gUKbFeHjYX8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e59fe727db9e3c5a3368ac0ce71d2b4472564d3 --- /dev/null +++ b/annotations_filtered/gUKbFeHjYX8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.67], [12.0, 62.45], [65.0, 134.4], [135.0, 138.96], [142.0, 153.69]], "keep_status": [false, false, false, false, true], "silence_prob": [38.67, 0.0, 0.0, 59.96, 33.31], "audiomae_on_audioset": [[["music", 38.96], ["hum", 23.32], ["mains hum", 10.62]], null, null, null, [["music", 21.27], ["explosion", 16.32], ["rumble", 13.52]]], "duration": [2.67, 50.45, 69.4, 3.96, 11.69]} \ No newline at end of file diff --git a/annotations_filtered/gUeHamRZkSY_filtered.json b/annotations_filtered/gUeHamRZkSY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..89000d6cb04e750cded316431994c13c19fd6ee1 --- /dev/null +++ b/annotations_filtered/gUeHamRZkSY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 7.08], [9.0, 12.41], [15.0, 16.36], [17.0, 17.81], [21.0, 20.93], [21.0, 22.08], [24.0, 27.77], [29.0, 29.44], [32.0, 32.05], [36.0, 44.34], [46.0, 48.27], [49.0, 61.7], [64.0, 66.65], [67.0, 67.81], [70.0, 70.58], [72.0, 72.69], [73.0, 74.26], [81.0, 81.67], [83.0, 83.05], [84.0, 85.11], [86.0, 85.75], [91.0, 91.17], [97.0, 98.31], [100.0, 101.44], [102.0, 103.81], [116.0, 138.75], [143.0, 142.77], [150.0, 150.77], [154.0, 154.63], [157.0, 156.95]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [48.91, 47.2, 0.0, 0.0, 0.0, 0.0, 40.4, 0.0, 0.0, 82.07, 86.82, 92.15, 92.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.6, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["whale vocalization", 41.43], ["animal", 11.9], ["speech", 5.73]], [["music", 36.21], ["hum", 11.42], ["mains hum", 6.49]], null, null, null, null, [["sidetone", 36.9], ["speech", 29.69], ["mains hum", 10.2]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 40.44], ["speech", 14.68], ["animal", 6.6]], null, null, null, null], "duration": [6.08, 3.41, 1.36, 0.81, -0.07, 1.08, 3.77, 0.44, 0.05, 8.34, 2.27, 12.7, 2.65, 0.81, 0.58, 0.69, 1.26, 0.67, 0.05, 1.11, -0.25, 0.17, 1.31, 1.44, 1.81, 22.75, -0.23, 0.77, 0.63, -0.05]} \ No newline at end of file diff --git a/annotations_filtered/gUpkU0-pS3U_filtered.json b/annotations_filtered/gUpkU0-pS3U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..572c43ecb5883e4dba98e73f907ed13828c3ccad --- /dev/null +++ b/annotations_filtered/gUpkU0-pS3U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.06], [3.0, 5.61], [9.0, 9.61], [14.0, 18.06], [20.0, 21.32], [25.0, 30.25], [31.0, 32.81], [33.0, 34.94], [37.0, 38.01], [38.0, 42.67], [44.0, 45.82], [46.0, 49.1], [51.0, 51.29], [52.0, 54.77], [60.0, 62.02], [62.0, 62.6], [73.0, 86.54], [89.0, 91.12], [93.0, 95.27], [95.0, 95.49], [96.0, 97.55], [99.0, 118.44], [119.0, 124.6], [127.0, 128.41]], "keep_status": [false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, true, true, false], "silence_prob": [40.61, 44.49, 0.0, 41.89, 0.0, 67.0, 0.0, 0.0, 0.0, 43.93, 0.0, 59.68, 0.0, 74.76, 40.48, 0.0, 56.48, 47.82, 39.37, 0.0, 0.0, 42.84, 39.61, 0.0], "audiomae_on_audioset": [[["speech", 67.94], ["mains hum", 3.85], ["sidetone", 3.58]], [["speech", 30.22], ["hum", 22.0], ["mains hum", 20.11]], null, [["speech", 11.54], ["heart sounds, heartbeat", 11.24], ["hum", 7.47]], null, null, null, null, null, [["fly, housefly", 36.21], ["bee, wasp, etc.", 14.88], ["insect", 12.05]], null, null, null, null, [["chirp tone", 24.54], ["sine wave", 23.43], ["speech", 23.08]], null, null, [["sine wave", 40.48], ["chirp tone", 34.02], ["sidetone", 3.53]], [["speech", 60.32], ["hum", 3.63], ["sidetone", 3.02]], null, null, [["music", 32.09], ["speech", 12.74], ["synthesizer", 7.11]], [["music", 48.16], ["synthesizer", 6.97], ["electronic music", 4.54]], null], "duration": [2.06, 2.61, 0.61, 4.06, 1.32, 5.25, 1.81, 1.94, 1.01, 4.67, 1.82, 3.1, 0.29, 2.77, 2.02, 0.6, 13.54, 2.12, 2.27, 0.49, 1.55, 19.44, 5.6, 1.41]} \ No newline at end of file diff --git a/annotations_filtered/gUrSHyV7Opg_filtered.json b/annotations_filtered/gUrSHyV7Opg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b38940f6ff7d633efd66ff63af751a2bc6644eb8 --- /dev/null +++ b/annotations_filtered/gUrSHyV7Opg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.64], [5.0, 12.01], [25.0, 28.29], [33.0, 35.55], [43.0, 44.2], [65.0, 64.98], [69.0, 76.33], [81.0, 109.76]], "keep_status": [false, true, true, true, false, false, false, false], "silence_prob": [57.09, 44.99, 32.54, 32.44, 0.0, 0.0, 31.82, 30.14], "audiomae_on_audioset": [null, [["music", 34.69], ["effects unit", 21.87], ["musical instrument", 6.78]], [["music", 39.83], ["carnatic music", 22.77], ["mantra", 6.29]], [["music", 45.2], ["chant", 13.19], ["carnatic music", 8.53]], null, null, [["music", 65.93], ["theremin", 12.34], ["synthesizer", 2.53]], [["music", 76.91], ["crackle", 3.81], ["buzz", 2.65]]], "duration": [2.64, 7.01, 3.29, 2.55, 1.2, -0.02, 7.33, 28.76]} \ No newline at end of file diff --git a/annotations_filtered/gV6Y3OwR2n0_filtered.json b/annotations_filtered/gV6Y3OwR2n0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..27d6e127f09b8cac0d180181a0228e8ae6d12ebb --- /dev/null +++ b/annotations_filtered/gV6Y3OwR2n0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.24], [7.0, 11.8], [12.0, 14.52], [15.0, 17.41], [19.0, 22.86], [23.0, 96.11], [98.0, 98.74], [100.0, 101.43], [105.0, 105.41], [108.0, 108.68], [110.0, 111.06], [112.0, 113.86], [116.0, 116.95], [118.0, 118.94], [122.0, 122.69], [123.0, 124.24], [126.0, 125.95], [129.0, 129.66], [131.0, 132.65], [133.0, 152.66], [154.0, 156.02], [158.0, 158.46], [167.0, 167.14], [169.0, 169.59], [174.0, 174.68], [176.0, 177.03], [178.0, 179.07]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 93.45, 41.6, 52.27, 99.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.53, 82.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 45.21], ["hum", 6.72], ["fly, housefly", 5.24]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 63.61], ["synthesizer", 8.76], ["musical instrument", 4.97]], null, null, null, null, null, null, null], "duration": [1.24, 4.8, 2.52, 2.41, 3.86, 73.11, 0.74, 1.43, 0.41, 0.68, 1.06, 1.86, 0.95, 0.94, 0.69, 1.24, -0.05, 0.66, 1.65, 19.66, 2.02, 0.46, 0.14, 0.59, 0.68, 1.03, 1.07]} \ No newline at end of file diff --git a/annotations_filtered/gVdIiTE1ykg_filtered.json b/annotations_filtered/gVdIiTE1ykg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7dbff3b08e36792516677de853ec9e7cfb06e9c8 --- /dev/null +++ b/annotations_filtered/gVdIiTE1ykg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.28], [6.0, 6.89], [9.0, 10.02], [14.0, 14.96], [17.0, 17.95], [19.0, 18.87], [24.0, 25.08], [28.0, 28.22], [30.0, 31.68], [32.0, 34.2], [45.0, 46.65], [49.0, 49.82], [50.0, 53.22], [55.0, 56.46], [59.0, 59.24], [60.0, 66.18], [67.0, 78.22], [88.0, 88.42], [90.0, 91.76], [94.0, 95.22], [96.0, 97.7], [104.0, 125.02], [128.0, 129.51], [131.0, 131.5], [133.0, 137.0], [140.0, 144.63], [147.0, 149.22], [152.0, 153.05], [156.0, 157.64], [159.0, 161.91], [162.0, 163.83], [166.0, 168.44]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.86, 0.0, 0.0, 33.12, 0.0, 0.0, 31.22, 31.43, 0.0, 0.0, 0.0, 0.0, 32.68, 0.0, 0.0, 81.89, 31.97, 36.81, 0.0, 0.0, 63.64, 0.0, 93.91], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 37.01], ["speech", 21.22], ["bee, wasp, etc.", 5.05]], null, null, [["speech", 32.39], ["music", 27.8], ["hum", 9.44]], null, null, [["music", 52.38], ["hum", 8.99], ["speech", 6.01]], [["music", 72.07], ["synthesizer", 7.66], ["timpani", 2.98]], null, null, null, null, [["music", 82.3], ["hum", 1.58], ["thunk", 1.55]], null, null, null, [["clang", 22.5], ["ding", 18.18], ["gunshot, gunfire", 12.25]], [["speech", 63.36], ["breaking", 21.55], ["outside, rural or natural", 2.26]], null, null, null, null, null], "duration": [1.28, 0.89, 1.02, 0.96, 0.95, -0.13, 1.08, 0.22, 1.68, 2.2, 1.65, 0.82, 3.22, 1.46, 0.24, 6.18, 11.22, 0.42, 1.76, 1.22, 1.7, 21.02, 1.51, 0.5, 4.0, 4.63, 2.22, 1.05, 1.64, 2.91, 1.83, 2.44]} \ No newline at end of file diff --git a/annotations_filtered/gVseixK20cM_filtered.json b/annotations_filtered/gVseixK20cM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9403dfadb8ffb9b13015de754a11eb17dbb3e4e --- /dev/null +++ b/annotations_filtered/gVseixK20cM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.02], [11.0, 14.4], [16.0, 21.05], [22.0, 22.77], [31.0, 31.68], [36.0, 36.75], [39.0, 39.88], [44.0, 48.79], [50.0, 51.12], [52.0, 52.96], [56.0, 59.88], [63.0, 63.21], [64.0, 65.91], [77.0, 76.82], [82.0, 83.08], [98.0, 98.81], [105.0, 105.56], [106.0, 106.54], [108.0, 109.29], [117.0, 117.54], [123.0, 123.79], [129.0, 130.6]], "keep_status": [true, true, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [47.23, 43.48, 36.11, 0.0, 0.0, 0.0, 0.0, 41.58, 0.0, 0.0, 59.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 28.47], ["creak", 13.96], ["music", 9.31]], [["music", 21.95], ["bee, wasp, etc.", 10.93], ["livestock, farm animals, working animals", 6.97]], [["speech", 46.51], ["animal", 10.36], ["cowbell", 8.29]], null, null, null, null, [["music", 42.3], ["hum", 10.17], ["mains hum", 8.18]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.02, 3.4, 5.05, 0.77, 0.68, 0.75, 0.88, 4.79, 1.12, 0.96, 3.88, 0.21, 1.91, -0.18, 1.08, 0.81, 0.56, 0.54, 1.29, 0.54, 0.79, 1.6]} \ No newline at end of file diff --git a/annotations_filtered/gW-Os5mjbGM_filtered.json b/annotations_filtered/gW-Os5mjbGM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f1eaba31067e047502e06efbb3fbb70387b6fd9 --- /dev/null +++ b/annotations_filtered/gW-Os5mjbGM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.75], [13.0, 14.0], [16.0, 16.9], [18.0, 19.25], [44.0, 44.58], [48.0, 48.42], [58.0, 58.48], [66.0, 66.72], [69.0, 69.63]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.75, 1.0, 0.9, 1.25, 0.58, 0.42, 0.48, 0.72, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/gW3KZsBwQzw_filtered.json b/annotations_filtered/gW3KZsBwQzw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e303b66580d70eb4a876cf775abeb248c2bef34 --- /dev/null +++ b/annotations_filtered/gW3KZsBwQzw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.99], [5.0, 5.76], [8.0, 8.82], [10.0, 15.38], [16.0, 21.1], [24.0, 24.6], [26.0, 25.61], [26.0, 26.01], [29.0, 30.28], [32.0, 33.4], [36.0, 36.27], [47.0, 50.99], [54.0, 56.32], [58.0, 61.2], [70.0, 77.9], [79.0, 83.32], [85.0, 87.89], [88.0, 88.4], [91.0, 99.94], [103.0, 103.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 66.15, 87.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.98, 46.54, 37.76, 38.98, 33.72, 46.72, 0.0, 56.93, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 59.81], ["speech", 8.4], ["techno", 2.71]], [["speech", 27.28], ["music", 21.23], ["fart", 16.9]], [["music", 29.25], ["cattle, bovinae", 13.59], ["moo", 12.33]], [["speech", 19.38], ["throbbing", 19.36], ["hum", 16.29]], [["speech", 42.76], ["music", 12.36], ["synthesizer", 3.89]], null, null, null], "duration": [-0.01, 0.76, 0.82, 5.38, 5.1, 0.6, -0.39, 0.01, 1.28, 1.4, 0.27, 3.99, 2.32, 3.2, 7.9, 4.32, 2.89, 0.4, 8.94, 0.17]} \ No newline at end of file diff --git a/annotations_filtered/gW7ozVNSL8k_filtered.json b/annotations_filtered/gW7ozVNSL8k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2207c8e21162dd4fda648dd267654a6dd7058b2e --- /dev/null +++ b/annotations_filtered/gW7ozVNSL8k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.35], [7.0, 7.7], [14.0, 14.61], [15.0, 15.99], [24.0, 25.79], [26.0, 26.91], [31.0, 32.1], [35.0, 35.06], [36.0, 38.57], [41.0, 44.61], [46.0, 47.53], [53.0, 56.71], [64.0, 64.71], [68.0, 68.84], [70.0, 70.75], [71.0, 73.67], [75.0, 80.45], [81.0, 81.77], [83.0, 84.62], [86.0, 86.95], [88.0, 89.29], [95.0, 97.97], [104.0, 104.89], [105.0, 106.34], [112.0, 112.26], [113.0, 127.97], [129.0, 129.36], [138.0, 147.19], [149.0, 150.67]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.96, 42.46, 0.0, 80.11, 0.0, 0.0, 0.0, 60.32, 62.47, 0.0, 0.0, 0.0, 0.0, 31.05, 0.0, 0.0, 0.0, 42.55, 0.0, 37.52, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["whale vocalization", 49.71], ["speech", 8.28], ["mosquito", 5.58]], [["moo", 41.38], ["cattle, bovinae", 34.4], ["livestock, farm animals, working animals", 11.43]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 21.8], ["music", 12.84], ["fly, housefly", 9.61]], null, null, null, [["speech", 61.83], ["buzz", 7.13], ["sheep", 5.08]], null, [["music", 65.0], ["scary music", 12.55], ["whale vocalization", 6.1]], null], "duration": [0.35, 0.7, 0.61, 0.99, 1.79, 0.91, 1.1, 0.06, 2.57, 3.61, 1.53, 3.71, 0.71, 0.84, 0.75, 2.67, 5.45, 0.77, 1.62, 0.95, 1.29, 2.97, 0.89, 1.34, 0.26, 14.97, 0.36, 9.19, 1.67]} \ No newline at end of file diff --git a/annotations_filtered/gWB-uAtqUIs_filtered.json b/annotations_filtered/gWB-uAtqUIs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..675006dbeb7f0cc471992bfe90bc1eecc89a5a2e --- /dev/null +++ b/annotations_filtered/gWB-uAtqUIs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.52], [8.0, 8.09], [10.0, 10.32], [11.0, 12.38], [13.0, 14.71], [15.0, 15.7], [39.0, 40.91], [42.0, 44.88], [46.0, 50.33], [53.0, 54.9], [55.0, 57.87], [59.0, 61.65], [63.0, 64.18], [65.0, 65.48], [66.0, 76.81], [77.0, 86.05], [87.0, 88.55], [89.0, 91.91], [92.0, 96.72], [98.0, 99.33]], "keep_status": [false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.12, 60.89, 0.0, 36.27, 64.29, 0.0, 0.0, 59.77, 43.38, 0.0, 50.71, 41.38, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["burping, eructation", 26.06], ["hum", 23.36], ["mains hum", 17.63]], null, null, [["speech", 43.7], ["mains hum", 12.68], ["hum", 6.19]], null, null, null, null, [["mains hum", 37.12], ["hum", 29.64], ["speech", 13.01]], null, null, [["music", 23.77], ["hum", 17.53], ["mains hum", 13.85]], null], "duration": [0.52, 0.09, 0.32, 1.38, 1.71, 0.7, 1.91, 2.88, 4.33, 1.9, 2.87, 2.65, 1.18, 0.48, 10.81, 9.05, 1.55, 2.91, 4.72, 1.33]} \ No newline at end of file diff --git a/annotations_filtered/gWGhsJWFOrU_filtered.json b/annotations_filtered/gWGhsJWFOrU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/gWGhsJWFOrU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/gWHvF157sFI_filtered.json b/annotations_filtered/gWHvF157sFI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6a348c8fc320b925952f30781afb1ce39b867050 --- /dev/null +++ b/annotations_filtered/gWHvF157sFI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.51], [7.0, 7.72], [10.0, 10.44], [14.0, 15.9], [17.0, 17.74], [18.0, 18.86], [19.0, 19.8], [20.0, 20.71], [22.0, 23.11], [25.0, 25.32], [33.0, 33.24], [35.0, 35.48], [36.0, 36.09], [38.0, 38.69], [43.0, 44.9], [50.0, 56.69], [59.0, 59.07], [61.0, 61.82], [64.0, 65.13], [68.0, 68.39], [70.0, 75.1], [81.0, 81.23], [85.0, 86.37], [88.0, 87.93], [111.0, 169.48], [170.0, 170.19], [174.0, 176.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.07, 0.0, 0.0, 0.0, 0.0, 43.43, 0.0, 0.0, 0.0, 0.0, 0.0, 41.24], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 46.21], ["speech", 11.35], ["synthesizer", 7.14]], null, null, null, null, [["music", 58.25], ["synthesizer", 4.47], ["hum", 4.44]], null, null, null, null, null, [["music", 61.13], ["theremin", 8.67], ["bass guitar", 8.6]]], "duration": [0.51, 0.72, 0.44, 1.9, 0.74, 0.86, 0.8, 0.71, 1.11, 0.32, 0.24, 0.48, 0.09, 0.69, 1.9, 6.69, 0.07, 0.82, 1.13, 0.39, 5.1, 0.23, 1.37, -0.07, 58.48, 0.19, 2.79]} \ No newline at end of file diff --git a/annotations_filtered/gX57uKMrxp4_filtered.json b/annotations_filtered/gX57uKMrxp4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1676cc0758f7c7d1ccc0869bd5f9d9d020e1472d --- /dev/null +++ b/annotations_filtered/gX57uKMrxp4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.39], [7.0, 7.45], [9.0, 8.92], [12.0, 12.19], [39.0, 41.77], [43.0, 43.31], [45.0, 46.58], [50.0, 50.72], [53.0, 55.44], [58.0, 58.5], [67.0, 67.14], [71.0, 87.91], [89.0, 90.0], [93.0, 94.96], [105.0, 105.9], [108.0, 125.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 93.91, 0.0, 0.0, 86.45, 0.0, 0.0, 0.0, 92.15], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.39, 0.45, -0.08, 0.19, 2.77, 0.31, 1.58, 0.72, 2.44, 0.5, 0.14, 16.91, 1.0, 1.96, 0.9, 17.51]} \ No newline at end of file diff --git a/annotations_filtered/gXHhy4c4UZw_filtered.json b/annotations_filtered/gXHhy4c4UZw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd4855137ae7eb6d3d498b6ad16b60cae852d6d1 --- /dev/null +++ b/annotations_filtered/gXHhy4c4UZw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.1], [14.0, 14.61], [19.0, 20.11], [23.0, 23.11], [24.0, 24.66], [26.0, 26.52], [31.0, 30.99], [33.0, 33.54], [36.0, 36.88], [38.0, 38.58], [41.0, 41.98], [44.0, 45.5], [47.0, 48.95], [49.0, 50.87], [54.0, 56.96], [63.0, 63.04], [65.0, 65.53], [75.0, 75.95], [81.0, 84.35], [85.0, 86.21], [87.0, 88.16], [90.0, 90.96], [92.0, 92.96], [96.0, 96.47], [98.0, 98.96], [100.0, 100.95], [103.0, 103.49], [105.0, 106.44], [109.0, 110.89], [112.0, 112.77], [117.0, 116.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.64, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 75.23], ["didgeridoo", 7.03], ["sidetone", 4.78]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.1, 0.61, 1.11, 0.11, 0.66, 0.52, -0.01, 0.54, 0.88, 0.58, 0.98, 1.5, 1.95, 1.87, 2.96, 0.04, 0.53, 0.95, 3.35, 1.21, 1.16, 0.96, 0.96, 0.47, 0.96, 0.95, 0.49, 1.44, 1.89, 0.77, -0.3]} \ No newline at end of file diff --git a/annotations_filtered/gXQhdB1y674_filtered.json b/annotations_filtered/gXQhdB1y674_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ba41aeeb802d6c6647be80bd0d4c48f7e31d790 --- /dev/null +++ b/annotations_filtered/gXQhdB1y674_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.56], [5.0, 6.07], [8.0, 8.82], [9.0, 9.53], [10.0, 11.52], [22.0, 22.3], [31.0, 33.17], [34.0, 33.99], [35.0, 35.04]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.09, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.56, 1.07, 0.82, 0.53, 1.52, 0.3, 2.17, -0.01, 0.04]} \ No newline at end of file diff --git a/annotations_filtered/gXRw45jyIsE_filtered.json b/annotations_filtered/gXRw45jyIsE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..239dee8062bc6bcee2d33aa870f1407e36578274 --- /dev/null +++ b/annotations_filtered/gXRw45jyIsE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.48], [7.0, 8.07], [14.0, 14.28], [15.0, 15.8], [22.0, 22.42], [25.0, 25.2], [35.0, 35.88], [38.0, 38.47], [40.0, 40.36], [42.0, 44.83], [51.0, 51.44], [56.0, 55.93], [56.0, 57.21], [58.0, 59.1], [63.0, 64.08], [65.0, 65.31], [68.0, 68.88], [69.0, 69.97], [71.0, 71.63], [72.0, 76.3], [77.0, 77.14], [79.0, 80.01], [83.0, 83.52], [85.0, 85.5], [88.0, 88.47], [89.0, 90.0], [91.0, 91.5], [94.0, 95.05], [97.0, 98.96], [101.0, 101.9], [104.0, 104.72], [108.0, 109.7], [111.0, 111.77], [115.0, 115.6], [119.0, 120.01], [124.0, 127.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.48, 1.07, 0.28, 0.8, 0.42, 0.2, 0.88, 0.47, 0.36, 2.83, 0.44, -0.07, 1.21, 1.1, 1.08, 0.31, 0.88, 0.97, 0.63, 4.3, 0.14, 1.01, 0.52, 0.5, 0.47, 1.0, 0.5, 1.05, 1.96, 0.9, 0.72, 1.7, 0.77, 0.6, 1.01, 3.89]} \ No newline at end of file diff --git a/annotations_filtered/gXv4mbv8-cE_filtered.json b/annotations_filtered/gXv4mbv8-cE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a0066e8969c2122b01d1a3abad75dacbbd682f12 --- /dev/null +++ b/annotations_filtered/gXv4mbv8-cE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 15.2], [19.0, 23.8], [25.0, 25.93], [29.0, 34.43], [38.0, 39.43], [42.0, 44.78], [46.0, 46.57], [49.0, 49.74], [54.0, 55.07], [60.0, 60.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [47.12, 54.5, 0.0, 89.19, 0.0, 51.12, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["noise", 62.87], ["sidetone", 7.64], ["hum", 7.53]], null, null, null, null, null, null, null, null, null], "duration": [6.2, 4.8, 0.93, 5.43, 1.43, 2.78, 0.57, 0.74, 1.07, 0.47]} \ No newline at end of file diff --git a/annotations_filtered/gYdm3PIHyaM_filtered.json b/annotations_filtered/gYdm3PIHyaM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a665dba2e2bcf2af5b29e23aab1b742d3f72a063 --- /dev/null +++ b/annotations_filtered/gYdm3PIHyaM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 5.12], [18.0, 21.81], [22.0, 23.4], [26.0, 27.13], [27.0, 29.96], [31.0, 31.31], [33.0, 37.94], [38.0, 38.74], [40.0, 43.16], [49.0, 51.09], [52.0, 59.68], [63.0, 63.95], [64.0, 65.11], [67.0, 68.35], [69.0, 71.44], [76.0, 75.83], [76.0, 77.28], [78.0, 78.9], [80.0, 83.27], [84.0, 87.51], [89.0, 97.02], [103.0, 103.13], [105.0, 106.08], [107.0, 107.0], [108.0, 108.78], [112.0, 114.3], [121.0, 121.31], [128.0, 131.94], [135.0, 135.55], [137.0, 137.22], [139.0, 141.4], [143.0, 145.08]], "keep_status": [true, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.18, 37.22, 0.0, 0.0, 44.12, 0.0, 43.61, 0.0, 41.81, 47.86, 48.56, 0.0, 0.0, 0.0, 64.63, 0.0, 0.0, 0.0, 34.72, 91.47, 57.09, 0.0, 0.0, 0.0, 0.0, 66.51, 0.0, 79.41, 0.0, 0.0, 96.42, 80.11], "audiomae_on_audioset": [[["crowd", 16.53], ["hubbub, speech noise, speech babble", 9.7], ["mosquito", 9.12]], [["animal", 69.81], ["dog", 7.71], ["canidae, dogs, wolves", 4.57]], null, null, [["speech", 56.03], ["hum", 17.21], ["mains hum", 4.31]], null, [["speech", 68.54], ["animal", 4.64], ["fly, housefly", 3.99]], null, [["sidetone", 26.42], ["speech", 25.98], ["whale vocalization", 17.1]], [["speech", 29.57], ["music", 20.29], ["hum", 7.49]], [["music", 23.79], ["didgeridoo", 10.4], ["hiccup", 6.79]], null, null, null, null, null, null, null, [["cattle, bovinae", 44.79], ["moo", 31.18], ["livestock, farm animals, working animals", 18.22]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.12, 3.81, 1.4, 1.13, 2.96, 0.31, 4.94, 0.74, 3.16, 2.09, 7.68, 0.95, 1.11, 1.35, 2.44, -0.17, 1.28, 0.9, 3.27, 3.51, 8.02, 0.13, 1.08, 0.0, 0.78, 2.3, 0.31, 3.94, 0.55, 0.22, 2.4, 2.08]} \ No newline at end of file diff --git a/annotations_filtered/gZ-QU3KT1PE_filtered.json b/annotations_filtered/gZ-QU3KT1PE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..afcd6ca75ac335e554272139d1d8ee2f0f6d96a7 --- /dev/null +++ b/annotations_filtered/gZ-QU3KT1PE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.29], [2.0, 2.34], [3.0, 3.79], [4.0, 4.62], [6.0, 8.51], [9.0, 13.59], [15.0, 18.28], [20.0, 53.49], [55.0, 81.77], [83.0, 87.61], [91.0, 116.5], [117.0, 116.77], [117.0, 116.8], [117.0, 116.83], [119.0, 119.21], [123.0, 125.46], [126.0, 126.77], [130.0, 131.4], [134.0, 135.51], [136.0, 149.08], [155.0, 160.49]], "keep_status": [false, false, false, false, true, true, true, false, true, true, true, false, false, false, false, true, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 36.69, 40.47, 33.37, 0.0, 33.63, 31.63, 32.69, 0.0, 0.0, 0.0, 0.0, 46.61, 0.0, 0.0, 0.0, 33.35, 73.82], "audiomae_on_audioset": [null, null, null, null, [["aircraft", 19.51], ["music", 13.91], ["fixed-wing aircraft, airplane", 12.2]], [["mains hum", 25.7], ["hum", 22.01], ["music", 17.87]], [["speech", 12.67], ["grunt", 12.1], ["music", 9.53]], null, [["music", 38.88], ["throbbing", 21.33], ["hum", 7.97]], [["music", 32.35], ["hum", 15.05], ["mains hum", 10.48]], [["music", 29.44], ["hum", 25.44], ["throbbing", 11.5]], null, null, null, null, [["fly, housefly", 37.0], ["insect", 11.4], ["music", 9.06]], null, null, null, [["music", 45.96], ["fly, housefly", 6.23], ["throbbing", 5.62]], null], "duration": [0.29, 0.34, 0.79, 0.62, 2.51, 4.59, 3.28, 33.49, 26.77, 4.61, 25.5, -0.23, -0.2, -0.17, 0.21, 2.46, 0.77, 1.4, 1.51, 13.08, 5.49]} \ No newline at end of file diff --git a/annotations_filtered/gZ9nPV_stFA_filtered.json b/annotations_filtered/gZ9nPV_stFA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eeed48aa4cfb4bd051537bed261a05bd8f1ad155 --- /dev/null +++ b/annotations_filtered/gZ9nPV_stFA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.97], [8.0, 10.71], [12.0, 13.14], [14.0, 14.77], [15.0, 15.79], [17.0, 17.81], [19.0, 18.87], [22.0, 22.27], [24.0, 24.31], [25.0, 26.94], [31.0, 31.56], [33.0, 33.59], [35.0, 37.05], [42.0, 42.43], [44.0, 45.45], [48.0, 48.14], [50.0, 53.18], [55.0, 54.77], [60.0, 60.61], [67.0, 66.82], [74.0, 74.49], [76.0, 76.23], [86.0, 86.39], [88.0, 90.46], [97.0, 103.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 54.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.16, 0.0, 0.0, 0.0, 52.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.16, 55.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 61.03], ["speech", 5.06], ["fart", 3.24]], null], "duration": [1.97, 2.71, 1.14, 0.77, 0.79, 0.81, -0.13, 0.27, 0.31, 1.94, 0.56, 0.59, 2.05, 0.43, 1.45, 0.14, 3.18, -0.23, 0.61, -0.18, 0.49, 0.23, 0.39, 2.46, 6.71]} \ No newline at end of file diff --git a/annotations_filtered/gZXv9XswYM8_filtered.json b/annotations_filtered/gZXv9XswYM8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b72dc9c4f67eb208b209ed6f7cc9393a6c4f8d1 --- /dev/null +++ b/annotations_filtered/gZXv9XswYM8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.85], [3.0, 3.1], [6.0, 7.37], [19.0, 19.21], [28.0, 28.04], [32.0, 33.07], [40.0, 40.86], [42.0, 42.85], [51.0, 51.27], [52.0, 52.52], [56.0, 56.47], [58.0, 58.67], [59.0, 59.44], [61.0, 61.26], [63.0, 66.41], [67.0, 69.9], [77.0, 78.27], [81.0, 84.5], [87.0, 86.93], [87.0, 88.97], [89.0, 90.56], [91.0, 92.16], [95.0, 95.99], [97.0, 98.15], [105.0, 105.75], [122.0, 122.57], [124.0, 123.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 85.54, 0.0, 34.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 44.32], ["sidetone", 11.58], ["tuning fork", 8.17]], null, null, null, null, null, null, null, null, null], "duration": [-0.15, 0.1, 1.37, 0.21, 0.04, 1.07, 0.86, 0.85, 0.27, 0.52, 0.47, 0.67, 0.44, 0.26, 3.41, 2.9, 1.27, 3.5, -0.07, 1.97, 1.56, 1.16, 0.99, 1.15, 0.75, 0.57, -0.15]} \ No newline at end of file diff --git a/annotations_filtered/gZY_zy2hAHA_filtered.json b/annotations_filtered/gZY_zy2hAHA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0d80c3a5f9e44c9540e5f7b03eaa65b3a4826d0 --- /dev/null +++ b/annotations_filtered/gZY_zy2hAHA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.23], [11.0, 11.58], [12.0, 18.32], [20.0, 21.37], [23.0, 22.99], [24.0, 26.94], [31.0, 31.13], [32.0, 49.52], [51.0, 54.03], [56.0, 56.42], [62.0, 64.17], [80.0, 79.81], [83.0, 84.33], [85.0, 85.99], [91.0, 92.2], [95.0, 96.25], [107.0, 107.27], [109.0, 109.97], [114.0, 114.24], [122.0, 122.84]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 37.71, 0.0, 0.0, 35.95, 0.0, 32.7, 67.0, 0.0, 37.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 37.08], ["synthesizer", 6.19], ["hum", 5.17]], null, null, [["cattle, bovinae", 32.54], ["livestock, farm animals, working animals", 25.19], ["moo", 16.93]], null, [["music", 30.45], ["speech", 26.66], ["sidetone", 15.5]], null, null, [["music", 36.07], ["speech", 33.24], ["radio", 5.79]], null, null, null, null, null, null, null, null, null], "duration": [0.23, 0.58, 6.32, 1.37, -0.01, 2.94, 0.13, 17.52, 3.03, 0.42, 2.17, -0.19, 1.33, 0.99, 1.2, 1.25, 0.27, 0.97, 0.24, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/g_C56llGC1E_filtered.json b/annotations_filtered/g_C56llGC1E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cebd18ea90fcc7d37f39393642e288d4144d2509 --- /dev/null +++ b/annotations_filtered/g_C56llGC1E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.88], [7.0, 10.32], [15.0, 34.8], [50.0, 50.25], [58.0, 57.74], [58.0, 64.3], [68.0, 69.7], [74.0, 89.68], [94.0, 97.48], [100.0, 101.48], [108.0, 136.63], [144.0, 145.89], [150.0, 161.05], [169.0, 169.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 28.76, 32.72, 0.0, 0.0, 33.56, 0.0, 31.36, 31.6, 0.0, 36.26, 0.0, 31.59, 0.0], "audiomae_on_audioset": [null, [["music", 66.54], ["musical instrument", 9.95], ["carnatic music", 8.83]], [["music", 55.11], ["effects unit", 12.83], ["guitar", 7.53]], null, null, [["music", 71.09], ["theremin", 7.33], ["musical instrument", 4.26]], null, [["music", 78.42], ["theremin", 3.39], ["musical instrument", 2.94]], [["music", 71.87], ["electronic music", 1.72], ["musical instrument", 1.5]], null, [["music", 57.26], ["effects unit", 9.35], ["theremin", 6.5]], null, [["theremin", 55.98], ["music", 18.14], ["crowd", 3.39]], null], "duration": [1.88, 3.32, 19.8, 0.25, -0.26, 6.3, 1.7, 15.68, 3.48, 1.48, 28.63, 1.89, 11.05, 0.4]} \ No newline at end of file diff --git a/annotations_filtered/g_O0J66490k_filtered.json b/annotations_filtered/g_O0J66490k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/g_O0J66490k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/g_U9jZQ54LM_filtered.json b/annotations_filtered/g_U9jZQ54LM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17620120942835fa3a8c5d68eaac5c7b6da6fbe0 --- /dev/null +++ b/annotations_filtered/g_U9jZQ54LM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.71], [3.0, 4.67], [10.0, 10.17], [15.0, 15.16], [18.0, 25.76], [28.0, 47.76], [59.0, 59.19], [69.0, 69.09], [73.0, 73.63], [78.0, 77.73], [81.0, 89.06], [92.0, 92.04], [102.0, 106.15], [110.0, 116.11], [121.0, 121.22], [123.0, 125.46], [126.0, 131.55], [132.0, 133.2], [136.0, 136.27], [138.0, 139.28], [141.0, 141.44], [150.0, 149.91]], "keep_status": [false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.46, 32.02, 0.0, 0.0, 0.0, 0.0, 67.63, 0.0, 56.63, 59.96, 0.0, 58.38, 45.18, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["cattle, bovinae", 26.77], ["moo", 21.19], ["speech", 18.08]], [["music", 24.48], ["noise", 10.2], ["cacophony", 10.15]], null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 45.45], ["insect", 26.6], ["bee, wasp, etc.", 25.84]], null, null, null, null, null], "duration": [0.71, 1.67, 0.17, 0.16, 7.76, 19.76, 0.19, 0.09, 0.63, -0.27, 8.06, 0.04, 4.15, 6.11, 0.22, 2.46, 5.55, 1.2, 0.27, 1.28, 0.44, -0.09]} \ No newline at end of file diff --git a/annotations_filtered/g_fIDwoORl4_filtered.json b/annotations_filtered/g_fIDwoORl4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..79a1312a28d8c4331baa1870dcace4833f079a2d --- /dev/null +++ b/annotations_filtered/g_fIDwoORl4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.15], [10.0, 15.38], [16.0, 19.33], [21.0, 24.43], [26.0, 29.24], [30.0, 32.7], [35.0, 36.93], [39.0, 40.74], [46.0, 50.33], [51.0, 57.62], [59.0, 63.59], [65.0, 69.08], [70.0, 76.38], [77.0, 86.14], [87.0, 114.22], [116.0, 142.05], [143.0, 157.94], [159.0, 166.33], [167.0, 174.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [79.76, 61.18, 99.92, 92.97, 99.87, 64.41, 0.0, 0.0, 99.97, 72.16, 66.88, 88.46, 98.36, 95.91, 78.21, 81.71, 44.6, 77.87, 72.75], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 38.52], ["hum", 13.07], ["mains hum", 8.02]], null, null], "duration": [2.15, 5.38, 3.33, 3.43, 3.24, 2.7, 1.93, 1.74, 4.33, 6.62, 4.59, 4.08, 6.38, 9.14, 27.22, 26.05, 14.94, 7.33, 7.28]} \ No newline at end of file diff --git a/annotations_filtered/g_mjMjs_eFY_filtered.json b/annotations_filtered/g_mjMjs_eFY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e06ab74048bcba7d30ffbba54942ab0570a8dfd4 --- /dev/null +++ b/annotations_filtered/g_mjMjs_eFY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 14.82], [18.0, 20.58], [22.0, 23.62], [25.0, 76.52], [78.0, 78.11], [79.0, 81.16], [89.0, 89.16], [96.0, 96.16], [97.0, 97.41], [99.0, 99.39], [100.0, 100.36], [101.0, 102.81], [103.0, 108.38], [111.0, 110.78]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [33.05, 35.33, 0.0, 0.0, 0.0, 64.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.96, 0.0], "audiomae_on_audioset": [[["livestock, farm animals, working animals", 10.25], ["chuckle, chortle", 7.68], ["snicker", 6.64]], [["sonar", 19.19], ["hum", 15.53], ["mains hum", 7.3]], null, null, null, null, null, null, null, null, null, null, [["explosion", 34.53], ["speech", 17.13], ["burst, pop", 7.66]], null], "duration": [4.82, 2.58, 1.62, 51.52, 0.11, 2.16, 0.16, 0.16, 0.41, 0.39, 0.36, 1.81, 5.38, -0.22]} \ No newline at end of file diff --git a/annotations_filtered/g_wEMoy_wi0_filtered.json b/annotations_filtered/g_wEMoy_wi0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7fdd6be91165a026d60a571cbfacfa6ca3a15453 --- /dev/null +++ b/annotations_filtered/g_wEMoy_wi0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.08], [8.0, 12.83], [16.0, 18.96], [26.0, 36.91], [42.0, 44.63], [47.0, 49.72], [52.0, 55.26], [60.0, 60.18], [62.0, 62.83], [68.0, 69.48], [79.0, 79.15], [81.0, 82.21], [86.0, 86.9], [88.0, 90.49], [92.0, 95.98], [96.0, 98.14], [103.0, 108.04], [109.0, 112.78], [115.0, 117.51], [120.0, 122.12], [124.0, 127.01], [129.0, 153.52], [154.0, 153.94]], "keep_status": [false, false, true, true, true, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [99.95, 99.98, 44.55, 46.97, 37.8, 69.34, 50.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.88, 46.68, 53.1, 96.77, 85.17, 83.16, 84.43, 92.31, 65.79, 0.0], "audiomae_on_audioset": [null, null, [["speech", 17.04], ["noise", 9.06], ["hum", 8.57]], [["hiccup", 24.36], ["gasp", 18.65], ["groan", 13.95]], [["thunk", 44.6], ["glass", 14.41], ["arrow", 6.4]], null, null, null, null, null, null, null, null, [["sine wave", 32.05], ["chirp tone", 30.77], ["music", 4.31]], [["chink, clink", 27.58], ["speech", 10.8], ["cutlery, silverware", 6.07]], null, null, null, null, null, null, null, null], "duration": [4.08, 4.83, 2.96, 10.91, 2.63, 2.72, 3.26, 0.18, 0.83, 1.48, 0.15, 1.21, 0.9, 2.49, 3.98, 2.14, 5.04, 3.78, 2.51, 2.12, 3.01, 24.52, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/gacB8xCQ09s_filtered.json b/annotations_filtered/gacB8xCQ09s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c9a6ce124fc396f341cb51d1e90f336ee097ce94 --- /dev/null +++ b/annotations_filtered/gacB8xCQ09s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 9.76], [10.0, 16.14], [17.0, 20.31], [20.0, 20.34], [20.0, 20.38], [20.0, 20.66], [23.0, 31.62], [32.0, 32.36], [39.0, 52.1], [60.0, 64.2], [71.0, 77.52]], "keep_status": [false, true, true, false, false, false, false, false, false, false, true], "silence_prob": [47.05, 44.93, 40.88, 0.0, 0.0, 0.0, 58.55, 0.0, 60.05, 63.74, 49.4], "audiomae_on_audioset": [[["didgeridoo", 48.27], ["music", 32.14], ["musical instrument", 4.71]], [["music", 47.21], ["didgeridoo", 16.17], ["foghorn", 6.31]], [["boing", 28.15], ["music", 8.0], ["theremin", 7.6]], null, null, null, null, null, null, null, [["music", 22.53], ["boing", 14.88], ["speech", 11.77]]], "duration": [4.76, 6.14, 3.31, 0.34, 0.38, 0.66, 8.62, 0.36, 13.1, 4.2, 6.52]} \ No newline at end of file diff --git a/annotations_filtered/gaoMc6MgvNA_filtered.json b/annotations_filtered/gaoMc6MgvNA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..03c04cbc11afc865d0ff4e84c6727f6dff57ca45 --- /dev/null +++ b/annotations_filtered/gaoMc6MgvNA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.42], [12.0, 38.31], [39.0, 107.42], [113.0, 133.03]], "keep_status": [false, false, false, true], "silence_prob": [0.0, 50.61, 0.0, 28.03], "audiomae_on_audioset": [null, null, null, [["speech", 26.68], ["vehicle", 4.89], ["groan", 4.56]]], "duration": [0.42, 26.31, 68.42, 20.03]} \ No newline at end of file diff --git a/annotations_filtered/gap2gWQy77A_filtered.json b/annotations_filtered/gap2gWQy77A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..40a44b261b83d124c950325471b42848043e29ce --- /dev/null +++ b/annotations_filtered/gap2gWQy77A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.58], [16.0, 19.67], [20.0, 21.34], [22.0, 29.3], [33.0, 37.79], [40.0, 40.31], [41.0, 42.3], [45.0, 46.33], [47.0, 48.39], [50.0, 50.46], [53.0, 53.87], [56.0, 57.08], [58.0, 58.6], [60.0, 62.26], [74.0, 78.34], [79.0, 81.03], [82.0, 83.44], [84.0, 85.08], [104.0, 106.47], [111.0, 111.2], [113.0, 115.06], [118.0, 118.96], [119.0, 122.69], [124.0, 124.33], [128.0, 145.96]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, true, false, true, false, true], "silence_prob": [0.0, 32.54, 0.0, 29.88, 35.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.9, 45.05, 60.89, 0.0, 0.0, 35.33, 0.0, 29.1, 0.0, 30.85, 0.0, 28.14], "audiomae_on_audioset": [null, [["music", 22.4], ["throbbing", 21.93], ["hum", 13.4]], null, [["speech", 50.7], ["hum", 7.37], ["music", 5.67]], [["speech", 70.88], ["music", 14.13], ["sidetone", 3.72]], null, null, null, null, null, null, null, null, null, [["speech", 41.6], ["hum", 6.12], ["music", 6.06]], null, null, null, [["music", 32.06], ["hum", 27.89], ["mains hum", 9.21]], null, [["hum", 30.82], ["mains hum", 15.11], ["throbbing", 12.32]], null, [["music", 21.81], ["mains hum", 19.92], ["hum", 18.19]], null, [["music", 43.99], ["throbbing", 11.94], ["didgeridoo", 8.29]]], "duration": [1.58, 3.67, 1.34, 7.3, 4.79, 0.31, 1.3, 1.33, 1.39, 0.46, 0.87, 1.08, 0.6, 2.26, 4.34, 2.03, 1.44, 1.08, 2.47, 0.2, 2.06, 0.96, 3.69, 0.33, 17.96]} \ No newline at end of file diff --git a/annotations_filtered/gbEDjhLuPAs_filtered.json b/annotations_filtered/gbEDjhLuPAs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..21e85ae5391b942113822f0d0c2b52cf906670ce --- /dev/null +++ b/annotations_filtered/gbEDjhLuPAs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.74], [8.0, 8.23], [10.0, 10.4], [12.0, 13.24], [15.0, 15.87], [17.0, 20.87], [22.0, 22.99], [23.0, 31.5], [33.0, 37.59], [38.0, 38.91], [39.0, 69.45], [70.0, 70.66], [71.0, 125.76], [127.0, 127.31]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 44.04, 0.0, 60.6, 46.05, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 29.0], ["stomach rumble", 20.21], ["squish", 15.71]], null, null, [["sidetone", 54.1], ["mains hum", 15.5], ["hum", 11.7]], null, null, null, null, null], "duration": [1.74, 0.23, 0.4, 1.24, 0.87, 3.87, 0.99, 8.5, 4.59, 0.91, 30.45, 0.66, 54.76, 0.31]} \ No newline at end of file diff --git a/annotations_filtered/gbXZzvvp2uc_filtered.json b/annotations_filtered/gbXZzvvp2uc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a169971bec39ebd9b6fe66134048c1f2d6c17835 --- /dev/null +++ b/annotations_filtered/gbXZzvvp2uc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.49], [9.0, 16.98], [18.0, 19.43], [40.0, 41.74], [43.0, 43.77], [44.0, 45.27], [57.0, 62.04], [63.0, 65.13], [89.0, 90.66], [92.0, 93.07], [94.0, 106.05], [109.0, 109.56], [112.0, 112.55], [114.0, 114.69], [118.0, 118.83], [121.0, 121.32], [123.0, 126.67], [130.0, 131.23]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [43.74, 45.85, 0.0, 0.0, 0.0, 0.0, 37.21, 32.28, 0.0, 0.0, 35.87, 0.0, 0.0, 0.0, 0.0, 0.0, 52.22, 0.0], "audiomae_on_audioset": [[["creak", 14.37], ["throbbing", 8.46], ["hum", 7.72]], [["throbbing", 53.8], ["hum", 27.3], ["heart sounds, heartbeat", 8.28]], null, null, null, null, [["speech", 28.35], ["hum", 26.23], ["mains hum", 17.76]], [["speech", 62.87], ["radio", 12.35], ["vehicle", 4.01]], null, null, [["insect", 27.79], ["fly, housefly", 23.85], ["bee, wasp, etc.", 22.1]], null, null, null, null, null, null, null], "duration": [2.49, 7.98, 1.43, 1.74, 0.77, 1.27, 5.04, 2.13, 1.66, 1.07, 12.05, 0.56, 0.55, 0.69, 0.83, 0.32, 3.67, 1.23]} \ No newline at end of file diff --git a/annotations_filtered/gbbbs1uWxvo_filtered.json b/annotations_filtered/gbbbs1uWxvo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84dbd88f75b11c77722cdc7b1a4afde19219102b --- /dev/null +++ b/annotations_filtered/gbbbs1uWxvo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.53], [22.0, 22.89], [24.0, 28.17], [30.0, 31.11], [40.0, 40.83], [45.0, 46.03], [50.0, 49.81], [51.0, 51.68], [53.0, 54.28], [64.0, 63.98], [66.0, 69.18], [71.0, 72.5], [85.0, 85.5], [102.0, 102.91], [112.0, 114.08], [115.0, 116.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 64.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.17, 0.0, 0.0, 0.0, 67.76, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.53, 0.89, 4.17, 1.11, 0.83, 1.03, -0.19, 0.68, 1.28, -0.02, 3.18, 1.5, 0.5, 0.91, 2.08, 1.75]} \ No newline at end of file diff --git a/annotations_filtered/gboXDP4L4b0_filtered.json b/annotations_filtered/gboXDP4L4b0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ee4aa886bcd7e34cd1f8da0d3c623fb754ee0c2a --- /dev/null +++ b/annotations_filtered/gboXDP4L4b0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.68], [22.0, 31.97], [32.0, 40.88], [42.0, 42.52], [44.0, 44.76], [48.0, 48.88], [52.0, 52.73], [55.0, 54.7], [67.0, 67.83]], "keep_status": [false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 33.28, 37.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 32.47], ["throbbing", 12.99], ["hum", 8.84]], [["speech", 24.99], ["fly, housefly", 8.89], ["hum", 4.7]], null, null, null, null, null, null], "duration": [0.68, 9.97, 8.88, 0.52, 0.76, 0.88, 0.73, -0.3, 0.83]} \ No newline at end of file diff --git a/annotations_filtered/gbu88CKkEzI_filtered.json b/annotations_filtered/gbu88CKkEzI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..311c7fd41810252b2872743a5b3817b9f9013a58 --- /dev/null +++ b/annotations_filtered/gbu88CKkEzI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 6.93], [7.0, 13.91], [16.0, 16.65], [18.0, 19.14], [20.0, 20.98], [22.0, 22.74], [27.0, 28.93], [32.0, 32.51], [38.0, 38.91], [42.0, 45.42], [48.0, 48.32], [49.0, 50.4], [51.0, 62.04], [63.0, 62.92], [63.0, 69.67], [76.0, 79.07], [93.0, 100.82], [101.0, 102.57], [104.0, 104.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, false, false], "silence_prob": [0.0, 57.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.15, 0.0, 0.0, 33.73, 0.0, 38.28, 40.47, 39.44, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 48.24], ["boing", 5.15], ["buzz", 4.3]], null, [["thunk", 39.18], ["speech", 22.45], ["whack, thwack", 5.31]], [["speech", 35.56], ["music", 21.49], ["beatboxing", 2.64]], [["speech", 70.94], ["cattle, bovinae", 5.45], ["moo", 3.55]], null, null], "duration": [-0.07, 6.91, 0.65, 1.14, 0.98, 0.74, 1.93, 0.51, 0.91, 3.42, 0.32, 1.4, 11.04, -0.08, 6.67, 3.07, 7.82, 1.57, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/gcPY3RIvtCw_filtered.json b/annotations_filtered/gcPY3RIvtCw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b6df5faf994ef206edfefed274a3a4aa37fa3ef4 --- /dev/null +++ b/annotations_filtered/gcPY3RIvtCw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.54], [21.0, 23.41], [33.0, 34.08], [38.0, 38.28], [41.0, 43.14], [53.0, 53.62], [58.0, 57.96], [69.0, 69.25], [73.0, 74.36], [85.0, 86.85], [93.0, 99.05], [101.0, 102.73], [103.0, 103.71], [113.0, 114.17], [115.0, 115.05], [115.0, 119.77], [121.0, 123.23], [130.0, 133.37], [172.0, 175.07], [186.0, 187.19], [193.0, 215.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 35.57, 0.0, 0.0, 35.7, 0.0, 0.0, 0.0, 0.0, 0.0, 34.22, 0.0, 0.0, 0.0, 0.0, 31.56, 33.41, 31.28, 31.8, 0.0, 31.5], "audiomae_on_audioset": [null, [["music", 66.47], ["musical instrument", 3.12], ["electric piano", 2.13]], null, null, [["music", 63.35], ["musical instrument", 6.88], ["guitar", 6.01]], null, null, null, null, null, [["music", 74.88], ["theremin", 3.2], ["effects unit", 3.12]], null, null, null, null, [["music", 79.74], ["musical instrument", 4.06], ["guitar", 2.36]], [["music", 73.35], ["musical instrument", 3.69], ["guitar", 3.67]], [["music", 75.7], ["carnatic music", 2.27], ["musical instrument", 1.48]], [["music", 65.12], ["musical instrument", 5.31], ["guitar", 4.1]], null, [["music", 77.41], ["musical instrument", 2.44], ["guitar", 0.97]]], "duration": [0.54, 2.41, 1.08, 0.28, 2.14, 0.62, -0.04, 0.25, 1.36, 1.85, 6.05, 1.73, 0.71, 1.17, 0.05, 4.77, 2.23, 3.37, 3.07, 1.19, 22.49]} \ No newline at end of file diff --git a/annotations_filtered/gcZPWkNY6x8_filtered.json b/annotations_filtered/gcZPWkNY6x8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b6a95399a9d076c9d68c15395e7d806e5fe9a63 --- /dev/null +++ b/annotations_filtered/gcZPWkNY6x8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.81], [15.0, 19.04], [19.0, 19.08], [31.0, 31.4], [33.0, 33.32], [34.0, 34.26], [41.0, 40.73], [43.0, 43.5], [45.0, 46.09], [50.0, 50.16], [59.0, 60.44], [61.0, 61.11], [63.0, 64.34], [65.0, 65.48], [67.0, 67.61], [68.0, 77.3], [86.0, 93.7], [95.0, 97.07], [98.0, 100.7], [106.0, 109.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.07, 82.61, 99.99, 81.35, 90.95], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.81, 4.04, 0.08, 0.4, 0.32, 0.26, -0.27, 0.5, 1.09, 0.16, 1.44, 0.11, 1.34, 0.48, 0.61, 9.3, 7.7, 2.07, 2.7, 3.8]} \ No newline at end of file diff --git a/annotations_filtered/gcu30p7VEKI_filtered.json b/annotations_filtered/gcu30p7VEKI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1ab1d1e35fe13262a0778a46c0bfb9f0bbc54f7 --- /dev/null +++ b/annotations_filtered/gcu30p7VEKI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 8.9], [9.0, 9.34], [12.0, 13.14], [14.0, 15.11], [23.0, 24.26], [30.0, 41.1], [42.0, 71.47], [73.0, 73.6], [74.0, 74.51], [76.0, 76.05], [79.0, 79.0], [80.0, 107.94], [109.0, 118.44], [119.0, 118.94]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 40.38, 32.77, 0.0, 0.0, 0.0, 0.0, 31.6, 31.37, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 51.87], ["speech", 14.52], ["synthesizer", 5.35]], [["speech", 47.52], ["music", 13.33], ["hum", 5.8]], null, null, null, null, [["whack, thwack", 23.83], ["music", 17.91], ["speech", 13.19]], [["music", 66.53], ["speech", 13.34], ["didgeridoo", 1.77]], null], "duration": [-0.1, 0.34, 1.14, 1.11, 1.26, 11.1, 29.47, 0.6, 0.51, 0.05, 0.0, 27.94, 9.44, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/ge9ahoqNSLE_filtered.json b/annotations_filtered/ge9ahoqNSLE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0666161ae0ea57f63734944a91a99a27c2fb19bf --- /dev/null +++ b/annotations_filtered/ge9ahoqNSLE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 37.54], [39.0, 43.01], [46.0, 48.41], [51.0, 52.17], [54.0, 61.23]], "keep_status": [false, true, true, false, true], "silence_prob": [0.0, 30.83, 33.62, 0.0, 30.4], "audiomae_on_audioset": [null, [["music", 12.11], ["hum", 11.78], ["mains hum", 7.67]], [["music", 31.74], ["musical instrument", 6.66], ["theremin", 3.99]], null, [["brass instrument", 23.93], ["music", 21.48], ["foghorn", 19.26]]], "duration": [0.54, 4.01, 2.41, 1.17, 7.23]} \ No newline at end of file diff --git a/annotations_filtered/geGO_emEsqs_filtered.json b/annotations_filtered/geGO_emEsqs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c97edb74a86329e3721f29a55545aa4d84ca30d9 --- /dev/null +++ b/annotations_filtered/geGO_emEsqs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.62], [34.0, 34.21], [38.0, 38.15], [53.0, 53.01], [100.0, 101.6], [110.0, 109.88], [113.0, 113.31], [125.0, 125.41], [144.0, 144.0], [154.0, 154.99], [171.0, 171.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [0.62, 0.21, 0.15, 0.01, 1.6, -0.12, 0.31, 0.41, 0.0, 0.99, 0.46]} \ No newline at end of file diff --git a/annotations_filtered/geOqbM03Hf0_filtered.json b/annotations_filtered/geOqbM03Hf0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0799806fed4e09474340817df6cc2d05093e0599 --- /dev/null +++ b/annotations_filtered/geOqbM03Hf0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.37], [9.0, 9.51], [10.0, 12.51], [13.0, 14.34], [15.0, 15.69], [16.0, 17.86], [20.0, 20.76], [23.0, 24.04], [24.0, 25.22], [27.0, 30.97], [33.0, 32.86], [35.0, 35.72], [39.0, 39.75], [40.0, 43.68], [45.0, 46.53], [47.0, 48.09], [49.0, 53.99], [55.0, 56.1], [57.0, 62.46], [63.0, 63.64], [64.0, 64.79], [69.0, 69.5], [70.0, 73.58], [74.0, 76.27], [77.0, 82.56], [83.0, 85.53], [87.0, 87.35], [88.0, 89.28], [90.0, 96.6], [97.0, 98.37], [100.0, 101.16], [102.0, 103.59], [104.0, 107.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 93.6, 0.0, 0.0, 94.95, 0.0, 87.37, 0.0, 0.0, 0.0, 100.0, 99.91, 100.0, 100.0, 0.0, 0.0, 94.81, 0.0, 0.0, 0.0, 98.86], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.37, 0.51, 2.51, 1.34, 0.69, 1.86, 0.76, 1.04, 1.22, 3.97, -0.14, 0.72, 0.75, 3.68, 1.53, 1.09, 4.99, 1.1, 5.46, 0.64, 0.79, 0.5, 3.58, 2.27, 5.56, 2.53, 0.35, 1.28, 6.6, 1.37, 1.16, 1.59, 3.79]} \ No newline at end of file diff --git a/annotations_filtered/geh_Mu622SY_filtered.json b/annotations_filtered/geh_Mu622SY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ab4e9ed7993370b636bc4bc94ecdcb88719cb769 --- /dev/null +++ b/annotations_filtered/geh_Mu622SY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.83], [7.0, 7.77], [11.0, 12.26], [13.0, 14.39], [17.0, 19.48], [21.0, 23.23], [24.0, 28.04], [29.0, 30.33], [31.0, 34.94], [36.0, 37.89], [38.0, 39.18], [40.0, 44.47], [45.0, 48.02], [49.0, 87.71], [90.0, 125.05]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, true, true, false, false], "silence_prob": [89.72, 0.0, 0.0, 0.0, 45.27, 69.74, 50.76, 0.0, 49.13, 0.0, 0.0, 42.62, 40.66, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 22.73], ["bee, wasp, etc.", 12.43], ["mains hum", 11.46]], null, null, null, [["sidetone", 72.35], ["speech", 5.72], ["radio", 3.72]], null, null, [["hum", 27.93], ["mains hum", 13.55], ["noise", 9.15]], [["hum", 42.84], ["mains hum", 17.3], ["gong", 3.24]], null, null], "duration": [2.83, 0.77, 1.26, 1.39, 2.48, 2.23, 4.04, 1.33, 3.94, 1.89, 1.18, 4.47, 3.02, 38.71, 35.05]} \ No newline at end of file diff --git a/annotations_filtered/geiS49_p84Q_filtered.json b/annotations_filtered/geiS49_p84Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b839a511fd004d0a8bc3fb74183aa222e19bc3ae --- /dev/null +++ b/annotations_filtered/geiS49_p84Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.58], [9.0, 9.66], [11.0, 20.07], [21.0, 21.59], [23.0, 33.34], [39.0, 40.59], [49.0, 54.11], [55.0, 56.29], [59.0, 60.18], [61.0, 64.99], [71.0, 73.36], [74.0, 74.56], [78.0, 78.88], [81.0, 81.77], [83.0, 83.59], [84.0, 84.99], [90.0, 93.77], [101.0, 101.87], [106.0, 106.98], [111.0, 110.81], [115.0, 116.24], [119.0, 119.58], [120.0, 124.16], [128.0, 130.49], [133.0, 133.59], [138.0, 139.6], [142.0, 142.4], [144.0, 144.64], [154.0, 154.26], [168.0, 168.4]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 45.02, 0.0, 34.98, 0.0, 45.02, 0.0, 0.0, 35.2, 50.97, 0.0, 0.0, 0.0, 0.0, 0.0, 89.9, 0.0, 0.0, 0.0, 0.0, 0.0, 60.6, 68.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["buzz", 64.57], ["music", 9.09], ["hum", 2.83]], null, [["music", 44.0], ["effects unit", 8.51], ["musical instrument", 4.29]], null, [["music", 57.7], ["didgeridoo", 8.61], ["musical instrument", 8.51]], null, null, [["speech", 78.62], ["music", 2.29], ["inside, small room", 1.75]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.58, 0.66, 9.07, 0.59, 10.34, 1.59, 5.11, 1.29, 1.18, 3.99, 2.36, 0.56, 0.88, 0.77, 0.59, 0.99, 3.77, 0.87, 0.98, -0.19, 1.24, 0.58, 4.16, 2.49, 0.59, 1.6, 0.4, 0.64, 0.26, 0.4]} \ No newline at end of file diff --git a/annotations_filtered/geiub8WP_XE_filtered.json b/annotations_filtered/geiub8WP_XE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..54114841171d99b7bce4128e738afc7e054f1b5d --- /dev/null +++ b/annotations_filtered/geiub8WP_XE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.31], [9.0, 10.03], [13.0, 14.34], [17.0, 18.84], [25.0, 25.3], [26.0, 29.64], [32.0, 33.29], [35.0, 39.33], [41.0, 41.57], [43.0, 43.39], [47.0, 48.63], [50.0, 53.03], [53.0, 54.78], [57.0, 57.99], [59.0, 71.96], [75.0, 77.85], [87.0, 88.35], [93.0, 94.9], [96.0, 97.19], [99.0, 100.58], [103.0, 104.33], [107.0, 107.76], [109.0, 109.59], [115.0, 116.65], [118.0, 118.34], [119.0, 120.06], [122.0, 123.09], [128.0, 133.02], [134.0, 137.83], [139.0, 141.02], [143.0, 143.09], [145.0, 145.86], [150.0, 150.96], [171.0, 171.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 73.67, 0.0, 67.89, 0.0, 0.0, 0.0, 89.9, 0.0, 0.0, 45.95, 44.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.0, 75.23, 55.89, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 48.26], ["musical instrument", 7.38], ["buzz", 5.93]], [["music", 42.17], ["double bass", 9.58], ["cello", 9.42]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.31, 1.03, 1.34, 1.84, 0.3, 3.64, 1.29, 4.33, 0.57, 0.39, 1.63, 3.03, 1.78, 0.99, 12.96, 2.85, 1.35, 1.9, 1.19, 1.58, 1.33, 0.76, 0.59, 1.65, 0.34, 1.06, 1.09, 5.02, 3.83, 2.02, 0.09, 0.86, 0.96, 0.51]} \ No newline at end of file diff --git a/annotations_filtered/geoi6Sxyg7g_filtered.json b/annotations_filtered/geoi6Sxyg7g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4fb1ed733def18077144d1cea41d332d7f0255dc --- /dev/null +++ b/annotations_filtered/geoi6Sxyg7g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.16], [8.0, 10.27], [12.0, 18.15], [19.0, 22.52], [28.0, 30.1], [31.0, 38.64], [45.0, 46.03], [49.0, 50.13], [52.0, 53.33], [57.0, 59.29], [61.0, 61.92], [67.0, 69.33], [72.0, 77.18], [80.0, 81.68], [82.0, 82.75], [83.0, 87.59], [88.0, 91.29], [93.0, 95.05], [95.0, 97.31], [99.0, 103.25], [104.0, 106.93], [109.0, 109.56], [112.0, 112.04], [113.0, 116.56], [118.0, 123.26], [125.0, 129.05], [129.0, 131.19], [133.0, 153.84], [154.0, 157.01], [159.0, 161.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [89.01, 59.33, 81.71, 69.34, 98.36, 96.54, 0.0, 0.0, 0.0, 90.95, 0.0, 93.29, 96.66, 0.0, 0.0, 59.59, 87.0, 95.51, 51.28, 97.0, 76.86, 0.0, 0.0, 96.66, 95.91, 37.09, 32.02, 44.26, 45.95, 52.16], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 60.2], ["speech", 16.3], ["hum", 8.67]], [["speech", 42.85], ["sidetone", 34.72], ["telephone", 3.75]], [["hum", 44.3], ["mains hum", 43.48], ["speech", 2.15]], [["speech", 62.67], ["music", 7.75], ["hum", 4.96]], null], "duration": [2.16, 2.27, 6.15, 3.52, 2.1, 7.64, 1.03, 1.13, 1.33, 2.29, 0.92, 2.33, 5.18, 1.68, 0.75, 4.59, 3.29, 2.05, 2.31, 4.25, 2.93, 0.56, 0.04, 3.56, 5.26, 4.05, 2.19, 20.84, 3.01, 2.91]} \ No newline at end of file diff --git a/annotations_filtered/gfLw0KJ6bLI_filtered.json b/annotations_filtered/gfLw0KJ6bLI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce1bdd092cbc01fcffd2097f787d396f08922c18 --- /dev/null +++ b/annotations_filtered/gfLw0KJ6bLI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 10.25], [11.0, 11.5], [12.0, 12.6], [14.0, 14.52], [15.0, 16.01], [18.0, 18.33], [23.0, 29.32], [31.0, 33.35], [36.0, 37.62], [39.0, 41.82], [44.0, 44.37], [46.0, 46.62], [52.0, 52.25], [59.0, 59.19], [60.0, 68.3], [69.0, 70.58], [71.0, 73.75]], "keep_status": [false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, true], "silence_prob": [40.07, 0.0, 0.0, 0.0, 0.0, 0.0, 60.42, 35.44, 0.0, 37.51, 0.0, 0.0, 0.0, 0.0, 34.49, 0.0, 48.78], "audiomae_on_audioset": [[["music", 40.56], ["speech", 34.9], ["radio", 3.71]], null, null, null, null, null, null, [["animal", 17.73], ["music", 17.67], ["dog", 12.29]], null, [["hum", 13.04], ["radio", 12.2], ["music", 11.05]], null, null, null, null, [["music", 75.59], ["thunk", 2.89], ["speech", 2.06]], null, [["music", 30.53], ["radio", 16.79], ["didgeridoo", 6.88]]], "duration": [7.25, 0.5, 0.6, 0.52, 1.01, 0.33, 6.32, 2.35, 1.62, 2.82, 0.37, 0.62, 0.25, 0.19, 8.3, 1.58, 2.75]} \ No newline at end of file diff --git a/annotations_filtered/gfXns_cU8I8_filtered.json b/annotations_filtered/gfXns_cU8I8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..587c0100dfa0c15affcb1084bee7c3f697943ced --- /dev/null +++ b/annotations_filtered/gfXns_cU8I8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 17.44], [18.0, 17.64], [18.0, 37.13], [41.0, 53.27], [56.0, 56.13], [58.0, 59.9], [61.0, 65.72]], "keep_status": [true, false, false, true, false, false, false], "silence_prob": [29.01, 0.0, 29.26, 29.63, 0.0, 0.0, 30.16], "audiomae_on_audioset": [[["buzz", 22.66], ["music", 14.25], ["hum", 9.84]], null, [["mains hum", 46.87], ["hum", 24.66], ["noise", 4.11]], [["music", 34.66], ["hum", 13.97], ["buzz", 7.42]], null, null, [["fly, housefly", 36.81], ["insect", 31.54], ["mosquito", 6.61]]], "duration": [9.44, -0.36, 19.13, 12.27, 0.13, 1.9, 4.72]} \ No newline at end of file diff --git a/annotations_filtered/ggC1uf1QTjw_filtered.json b/annotations_filtered/ggC1uf1QTjw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1ad717d9ec9c2a13e2689385eb5ac6f4471155c5 --- /dev/null +++ b/annotations_filtered/ggC1uf1QTjw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.53], [9.0, 16.07], [18.0, 22.65], [28.0, 35.95], [38.0, 38.5], [40.0, 41.3], [42.0, 43.56], [47.0, 60.54], [64.0, 83.64], [86.0, 91.56], [92.0, 100.13], [101.0, 123.21], [125.0, 129.69], [135.0, 139.21], [141.0, 149.22], [151.0, 151.65], [152.0, 153.45], [154.0, 158.9], [159.0, 160.0], [162.0, 170.33], [173.0, 177.9], [179.0, 197.4], [199.0, 202.58]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 46.54, 33.42, 33.79, 0.0, 0.0, 0.0, 30.84, 33.09, 37.07, 79.59, 81.17, 75.72, 91.47, 79.59, 0.0, 0.0, 98.73, 0.0, 97.22, 90.43, 79.07, 93.6], "audiomae_on_audioset": [null, [["music", 63.61], ["theremin", 8.35], ["didgeridoo", 7.83]], [["breaking", 18.69], ["music", 17.74], ["hum", 16.1]], [["music", 69.66], ["didgeridoo", 3.76], ["theremin", 3.45]], null, null, null, [["music", 40.72], ["didgeridoo", 29.92], ["whack, thwack", 3.47]], [["music", 76.59], ["didgeridoo", 4.03], ["hum", 2.51]], [["theremin", 49.87], ["music", 33.78], ["musical instrument", 2.01]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.53, 7.07, 4.65, 7.95, 0.5, 1.3, 1.56, 13.54, 19.64, 5.56, 8.13, 22.21, 4.69, 4.21, 8.22, 0.65, 1.45, 4.9, 1.0, 8.33, 4.9, 18.4, 3.58]} \ No newline at end of file diff --git a/annotations_filtered/gh2apPe9pSI_filtered.json b/annotations_filtered/gh2apPe9pSI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..38a48ec23276e07c00002e6a4bfa9780435e8990 --- /dev/null +++ b/annotations_filtered/gh2apPe9pSI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.85], [15.0, 17.73], [19.0, 19.5], [22.0, 28.59], [32.0, 38.42]], "keep_status": [false, true, false, true, false], "silence_prob": [0.0, 36.9, 0.0, 42.04, 45.43], "audiomae_on_audioset": [null, [["music", 26.9], ["speech", 20.26], ["hum", 14.23]], null, [["mains hum", 28.86], ["music", 22.01], ["hum", 15.64]], [["speech", 38.1], ["music", 22.33], ["whale vocalization", 13.36]]], "duration": [0.85, 2.73, 0.5, 6.59, 6.42]} \ No newline at end of file diff --git a/annotations_filtered/ghDDdQxgXRw_filtered.json b/annotations_filtered/ghDDdQxgXRw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ff0ef335fdfd867d9bccaf7052d72f6e08f8464 --- /dev/null +++ b/annotations_filtered/ghDDdQxgXRw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[40.0, 58.9]], "keep_status": [false], "silence_prob": [37.41], "audiomae_on_audioset": [[["music", 58.46], ["bleat", 14.32], ["sheep", 6.47]]], "duration": [18.9]} \ No newline at end of file diff --git a/annotations_filtered/ghNPXViyQoU_filtered.json b/annotations_filtered/ghNPXViyQoU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb9f058b4d1aba93d1a06047292164605c6f8562 --- /dev/null +++ b/annotations_filtered/ghNPXViyQoU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.59], [4.0, 5.36], [15.0, 15.74], [18.0, 22.32], [26.0, 26.23], [29.0, 29.4], [31.0, 31.28], [36.0, 36.86], [41.0, 42.94], [50.0, 51.07], [54.0, 59.51], [60.0, 61.2], [64.0, 71.58], [73.0, 81.53], [86.0, 87.67], [88.0, 90.61]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 43.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.91, 0.0, 41.54, 38.58, 0.0, 53.22], "audiomae_on_audioset": [null, null, null, [["stomach rumble", 29.22], ["speech", 25.46], ["hum", 5.76]], null, null, null, null, null, null, [["mains hum", 41.07], ["hum", 38.25], ["crushing", 2.44]], null, [["hum", 72.59], ["mains hum", 21.1], ["throbbing", 2.7]], [["mains hum", 37.31], ["hum", 17.08], ["speech", 11.51]], null, null], "duration": [0.59, 1.36, 0.74, 4.32, 0.23, 0.4, 0.28, 0.86, 1.94, 1.07, 5.51, 1.2, 7.58, 8.53, 1.67, 2.61]} \ No newline at end of file diff --git a/annotations_filtered/ghQOllvR2cE_filtered.json b/annotations_filtered/ghQOllvR2cE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eaec5692dbffac95eb9aebbca893e2e3c2cb8506 --- /dev/null +++ b/annotations_filtered/ghQOllvR2cE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.32], [4.0, 5.14], [6.0, 6.47], [7.0, 8.01], [8.0, 9.04], [11.0, 19.35], [22.0, 21.93], [24.0, 24.17], [25.0, 26.64], [27.0, 30.21], [31.0, 32.78], [34.0, 35.29], [37.0, 37.72], [44.0, 56.54], [57.0, 60.94], [62.0, 62.29], [63.0, 64.79], [66.0, 66.43], [69.0, 72.49], [85.0, 84.81], [87.0, 87.59], [90.0, 90.46], [92.0, 94.8], [109.0, 109.22], [115.0, 114.96], [117.0, 117.22], [118.0, 118.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 39.98, 0.0, 0.0, 0.0, 42.06, 0.0, 0.0, 0.0, 99.48, 40.57, 0.0, 0.0, 0.0, 66.39, 0.0, 0.0, 0.0, 75.23, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 62.54], ["thunk", 17.4], ["radio", 4.9]], null, null, null, [["speech", 48.07], ["sidetone", 17.35], ["whack, thwack", 5.29]], null, null, null, null, [["sidetone", 43.29], ["chirp tone", 10.21], ["crushing", 8.79]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.32, 1.14, 0.47, 1.01, 1.04, 8.35, -0.07, 0.17, 1.64, 3.21, 1.78, 1.29, 0.72, 12.54, 3.94, 0.29, 1.79, 0.43, 3.49, -0.19, 0.59, 0.46, 2.8, 0.22, -0.04, 0.22, 0.3]} \ No newline at end of file diff --git a/annotations_filtered/ghUFMbHmw8s_filtered.json b/annotations_filtered/ghUFMbHmw8s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e342994547eae92c346f12d61650e7a5581a2239 --- /dev/null +++ b/annotations_filtered/ghUFMbHmw8s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.53], [2.0, 4.43], [7.0, 18.22], [42.0, 43.12], [51.0, 51.12], [52.0, 61.96], [62.0, 75.76], [76.0, 84.82], [85.0, 85.56], [91.0, 93.51], [95.0, 98.34], [104.0, 104.92], [122.0, 122.81], [125.0, 126.33], [143.0, 143.4], [144.0, 144.19], [169.0, 169.16], [174.0, 175.34], [194.0, 202.96], [204.0, 209.56], [210.0, 210.25], [213.0, 213.6], [217.0, 217.71], [219.0, 219.3], [221.0, 221.43], [228.0, 228.77]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 70.72, 30.79, 0.0, 0.0, 33.99, 32.84, 31.91, 0.0, 49.59, 49.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.59, 32.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["cattle, bovinae", 44.45], ["moo", 34.21], ["livestock, farm animals, working animals", 19.15]], null, null, [["music", 80.8], ["electronic music", 2.95], ["didgeridoo", 2.85]], [["whack, thwack", 21.98], ["music", 12.41], ["fly, housefly", 9.94]], [["speech", 18.81], ["groan", 8.57], ["moo", 7.38]], null, [["speech", 35.17], ["music", 34.86], ["boing", 8.62]], [["music", 64.57], ["synthesizer", 6.65], ["musical instrument", 5.76]], null, null, null, null, null, null, null, [["music", 29.15], ["noise", 15.72], ["hum", 12.44]], [["music", 24.39], ["crowd", 6.97], ["whale vocalization", 6.82]], null, null, null, null, null, null], "duration": [0.53, 2.43, 11.22, 1.12, 0.12, 9.96, 13.76, 8.82, 0.56, 2.51, 3.34, 0.92, 0.81, 1.33, 0.4, 0.19, 0.16, 1.34, 8.96, 5.56, 0.25, 0.6, 0.71, 0.3, 0.43, 0.77]} \ No newline at end of file diff --git a/annotations_filtered/ghZ6ntXQp3E_filtered.json b/annotations_filtered/ghZ6ntXQp3E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..87c6dd4e7dce1ccfe970e84947af0bfe8ae8fd0b --- /dev/null +++ b/annotations_filtered/ghZ6ntXQp3E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.97], [22.0, 22.5], [28.0, 29.78], [31.0, 31.43], [45.0, 45.32], [46.0, 47.22], [49.0, 49.82], [52.0, 57.94], [72.0, 74.06], [79.0, 80.1], [81.0, 82.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.45, 84.07, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 58.34], ["electronic music", 7.77], ["synthesizer", 4.34]], null, null, null], "duration": [0.97, 0.5, 1.78, 0.43, 0.32, 1.22, 0.82, 5.94, 2.06, 1.1, 1.53]} \ No newline at end of file diff --git a/annotations_filtered/ghew-s2zPjE_filtered.json b/annotations_filtered/ghew-s2zPjE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..65d93498244dd7d4bcff5eff67056aa06d2e0d46 --- /dev/null +++ b/annotations_filtered/ghew-s2zPjE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 17.95], [22.0, 22.11], [22.0, 27.58], [28.0, 28.8], [29.0, 31.5], [37.0, 37.35]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 34.74, 0.0, 31.2, 0.0], "audiomae_on_audioset": [null, null, [["theremin", 33.51], ["music", 26.3], ["shofar", 13.04]], null, [["theremin", 60.04], ["music", 29.31], ["wind instrument, woodwind instrument", 1.73]], null], "duration": [-0.05, 0.11, 5.58, 0.8, 2.5, 0.35]} \ No newline at end of file diff --git a/annotations_filtered/ghfqnmL0d_A_filtered.json b/annotations_filtered/ghfqnmL0d_A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a0959f9818bd6cee3781a6f68188bf0918d1cfa --- /dev/null +++ b/annotations_filtered/ghfqnmL0d_A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.77], [13.0, 15.03], [17.0, 17.83], [19.0, 19.77], [27.0, 28.65], [30.0, 35.26], [38.0, 62.21], [66.0, 66.85], [71.0, 70.8], [97.0, 97.83], [98.0, 97.87], [109.0, 116.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 47.82, 0.0, 0.0, 0.0, 34.06, 31.74, 0.0, 0.0, 0.0, 0.0, 35.7], "audiomae_on_audioset": [null, [["speech", 63.37], ["telephone", 7.94], ["radio", 6.21]], null, null, null, [["music", 59.61], ["boing", 12.8], ["didgeridoo", 3.35]], [["music", 88.53], ["musical instrument", 1.49], ["funny music", 1.4]], null, null, null, null, [["speech", 65.04], ["music", 17.89], ["radio", 9.26]]], "duration": [0.77, 2.03, 0.83, 0.77, 1.65, 5.26, 24.21, 0.85, -0.2, 0.83, -0.13, 7.48]} \ No newline at end of file diff --git a/annotations_filtered/ghn35eUPiIc_filtered.json b/annotations_filtered/ghn35eUPiIc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dde532d983f306a9efb2941b3a9bad7f12cac85d --- /dev/null +++ b/annotations_filtered/ghn35eUPiIc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.11], [12.0, 12.43], [16.0, 17.74], [18.0, 18.66], [20.0, 20.65], [25.0, 24.95], [28.0, 30.38], [58.0, 58.24], [61.0, 63.09], [64.0, 65.85], [70.0, 72.77], [73.0, 72.96], [80.0, 81.16], [82.0, 81.68], [82.0, 81.78], [82.0, 82.34], [97.0, 96.6], [97.0, 100.03], [102.0, 102.9], [104.0, 104.09], [105.0, 109.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.31, 0.0, 92.48, 0.0, 69.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.22, 0.0, 0.0, 51.28], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.11, 0.43, 1.74, 0.66, 0.65, -0.05, 2.38, 0.24, 2.09, 1.85, 2.77, -0.04, 1.16, -0.32, -0.22, 0.34, -0.4, 3.03, 0.9, 0.09, 4.32]} \ No newline at end of file diff --git a/annotations_filtered/ghpYpbgtLIs_filtered.json b/annotations_filtered/ghpYpbgtLIs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..928709402d50ee3ecc87c2550eba91f4029618fd --- /dev/null +++ b/annotations_filtered/ghpYpbgtLIs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.34], [12.0, 13.0], [16.0, 18.52], [21.0, 24.97], [26.0, 26.82], [28.0, 31.56], [39.0, 39.33], [40.0, 55.02], [59.0, 78.75], [80.0, 80.08], [83.0, 82.75], [85.0, 111.74], [115.0, 129.51]], "keep_status": [false, false, true, true, false, true, false, true, true, false, false, true, false], "silence_prob": [0.0, 0.0, 33.46, 33.15, 0.0, 36.14, 0.0, 31.72, 31.74, 0.0, 0.0, 32.05, 35.49], "audiomae_on_audioset": [null, null, [["speech", 29.02], ["music", 16.35], ["explosion", 3.18]], [["mosquito", 19.6], ["music", 17.33], ["throbbing", 9.4]], null, [["fly, housefly", 31.88], ["mosquito", 25.2], ["music", 11.05]], null, [["music", 50.47], ["throbbing", 9.03], ["speech", 8.77]], [["music", 34.58], ["throbbing", 14.25], ["speech", 9.97]], null, null, [["music", 35.19], ["throbbing", 13.55], ["motorcycle", 9.77]], [["cattle, bovinae", 45.02], ["moo", 29.56], ["livestock, farm animals, working animals", 16.69]]], "duration": [0.34, 1.0, 2.52, 3.97, 0.82, 3.56, 0.33, 15.02, 19.75, 0.08, -0.25, 26.74, 14.51]} \ No newline at end of file diff --git a/annotations_filtered/ghtGcGtVtho_filtered.json b/annotations_filtered/ghtGcGtVtho_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e110f71bdbb76cd056841fda764c7086d853ff2 --- /dev/null +++ b/annotations_filtered/ghtGcGtVtho_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.57], [5.0, 7.21], [8.0, 8.73], [10.0, 11.64], [14.0, 16.6], [18.0, 20.11], [22.0, 23.16], [25.0, 25.83], [27.0, 27.82], [30.0, 30.75], [37.0, 38.85], [40.0, 43.5], [44.0, 45.3], [47.0, 47.75], [50.0, 51.31], [54.0, 55.17], [57.0, 57.52], [61.0, 61.74], [63.0, 63.53], [64.0, 65.06], [69.0, 70.46], [71.0, 72.03], [74.0, 84.77], [86.0, 88.8], [91.0, 96.48], [97.0, 99.1], [100.0, 101.55], [103.0, 106.32], [107.0, 111.79]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.73, 0.0, 0.0, 42.51, 98.36, 0.0, 0.0, 0.0, 0.0, 0.0, 99.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.11, 71.43, 99.96, 99.82, 0.0, 88.83, 98.19], "audiomae_on_audioset": [null, null, null, null, [["moo", 18.17], ["grunt", 16.28], ["cattle, bovinae", 11.01]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.57, 2.21, 0.73, 1.64, 2.6, 2.11, 1.16, 0.83, 0.82, 0.75, 1.85, 3.5, 1.3, 0.75, 1.31, 1.17, 0.52, 0.74, 0.53, 1.06, 1.46, 1.03, 10.77, 2.8, 5.48, 2.1, 1.55, 3.32, 4.79]} \ No newline at end of file diff --git a/annotations_filtered/ghwBg2RgBJM_filtered.json b/annotations_filtered/ghwBg2RgBJM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3682586aa5f313bf73204739a8c71672e63b6b8c --- /dev/null +++ b/annotations_filtered/ghwBg2RgBJM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.44], [14.0, 16.87], [20.0, 20.53], [26.0, 25.96], [35.0, 45.25], [46.0, 47.46], [50.0, 52.93], [55.0, 78.51], [80.0, 80.54], [81.0, 81.62], [83.0, 83.17], [84.0, 86.21], [90.0, 91.29], [92.0, 93.16], [95.0, 99.37], [100.0, 102.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 85.54, 0.0, 0.0, 96.42, 0.0, 99.56, 99.44, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 90.95, 99.44], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.44, 2.87, 0.53, -0.04, 10.25, 1.46, 2.93, 23.51, 0.54, 0.62, 0.17, 2.21, 1.29, 1.16, 4.37, 2.07]} \ No newline at end of file diff --git a/annotations_filtered/gi9EwdK-6L4_filtered.json b/annotations_filtered/gi9EwdK-6L4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d1fe647d3c175c2ec899f0d9f037845f47e69f30 --- /dev/null +++ b/annotations_filtered/gi9EwdK-6L4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.83], [15.0, 16.14], [19.0, 21.46], [22.0, 29.24], [36.0, 36.41], [38.0, 38.01], [39.0, 41.32], [42.0, 45.22], [50.0, 50.65], [54.0, 53.74], [57.0, 58.11], [63.0, 64.05], [80.0, 88.6], [94.0, 96.65], [98.0, 97.58], [98.0, 97.88], [98.0, 99.5], [107.0, 107.4], [112.0, 113.56], [114.0, 115.26], [117.0, 119.57], [121.0, 137.66], [140.0, 142.11], [143.0, 145.15]], "keep_status": [false, false, false, true, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, true, true], "silence_prob": [0.0, 0.0, 94.52, 36.34, 0.0, 0.0, 40.81, 38.6, 0.0, 0.0, 0.0, 0.0, 31.09, 41.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.88, 33.04, 39.8, 30.73], "audiomae_on_audioset": [null, null, null, [["singing bowl", 29.06], ["music", 20.98], ["speech", 15.11]], null, null, [["speech", 32.79], ["music", 22.12], ["sidetone", 14.9]], [["didgeridoo", 49.06], ["music", 29.19], ["livestock, farm animals, working animals", 2.48]], null, null, null, null, [["hum", 24.61], ["mains hum", 23.62], ["music", 16.91]], [["music", 61.82], ["didgeridoo", 13.86], ["speech", 2.97]], null, null, null, null, null, null, null, [["hum", 22.06], ["gong", 22.03], ["music", 15.69]], [["music", 51.07], ["electronic music", 5.94], ["gong", 4.49]], [["speech", 44.32], ["boom", 11.91], ["gunshot, gunfire", 5.02]]], "duration": [1.83, 1.14, 2.46, 7.24, 0.41, 0.01, 2.32, 3.22, 0.65, -0.26, 1.11, 1.05, 8.6, 2.65, -0.42, -0.12, 1.5, 0.4, 1.56, 1.26, 2.57, 16.66, 2.11, 2.15]} \ No newline at end of file diff --git a/annotations_filtered/giGWC-o1mvw_filtered.json b/annotations_filtered/giGWC-o1mvw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b98f99cd4bd6c193295dd0236f94f46932c4779 --- /dev/null +++ b/annotations_filtered/giGWC-o1mvw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.63], [16.0, 18.03], [19.0, 78.34], [80.0, 81.7], [86.0, 95.94], [96.0, 97.82], [98.0, 111.57], [116.0, 121.24], [124.0, 133.51], [140.0, 140.22], [140.0, 149.66], [154.0, 155.46], [166.0, 167.64]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 40.09, 0.0, 0.0, 36.86, 0.0, 34.85, 32.1, 31.84, 0.0, 31.88, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 61.91], ["speech", 6.52], ["electronic music", 3.11]], null, null, [["speech", 32.18], ["mains hum", 17.37], ["hum", 13.74]], null, [["music", 35.15], ["speech", 31.51], ["didgeridoo", 17.95]], [["didgeridoo", 33.6], ["music", 32.76], ["mains hum", 9.82]], [["music", 68.88], ["crow", 10.81], ["caw", 6.19]], null, [["music", 58.04], ["speech", 16.04], ["scary music", 11.81]], null, null], "duration": [1.63, 2.03, 59.34, 1.7, 9.94, 1.82, 13.57, 5.24, 9.51, 0.22, 9.66, 1.46, 1.64]} \ No newline at end of file diff --git a/annotations_filtered/giajSDY8kCs_filtered.json b/annotations_filtered/giajSDY8kCs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..df14689e1a3248e379dfc1dcbb7f96ba6cc715d3 --- /dev/null +++ b/annotations_filtered/giajSDY8kCs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.33], [4.0, 4.41], [6.0, 6.61], [10.0, 10.25], [11.0, 12.7], [14.0, 15.82], [16.0, 23.35], [25.0, 26.55], [27.0, 29.51], [32.0, 32.02], [35.0, 36.41], [41.0, 41.5], [61.0, 62.72], [63.0, 65.47], [68.0, 71.29], [74.0, 74.82], [76.0, 76.45], [77.0, 77.95], [79.0, 80.92], [82.0, 84.5], [92.0, 96.87], [103.0, 106.24], [107.0, 108.95], [111.0, 111.99], [116.0, 126.22], [130.0, 130.96], [139.0, 140.27], [142.0, 142.65], [151.0, 152.69], [153.0, 154.47], [156.0, 159.12], [164.0, 163.88], [169.0, 170.36], [172.0, 172.23], [173.0, 173.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.0, 0.0, 54.3, 0.0, 0.0, 0.0, 0.0, 99.98, 94.07, 0.0, 0.0, 0.0, 0.0, 61.67, 68.93, 98.8, 0.0, 0.0, 94.95, 0.0, 0.0, 0.0, 0.0, 0.0, 61.97, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.33, 0.41, 0.61, 0.25, 1.7, 1.82, 7.35, 1.55, 2.51, 0.02, 1.41, 0.5, 1.72, 2.47, 3.29, 0.82, 0.45, 0.95, 1.92, 2.5, 4.87, 3.24, 1.95, 0.99, 10.22, 0.96, 1.27, 0.65, 1.69, 1.47, 3.12, -0.12, 1.36, 0.23, 0.03]} \ No newline at end of file diff --git a/annotations_filtered/gif34AkAFIg_filtered.json b/annotations_filtered/gif34AkAFIg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b264d845f429e229393bd25454726f0e40ab3154 --- /dev/null +++ b/annotations_filtered/gif34AkAFIg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.34], [10.0, 11.3], [16.0, 16.16], [17.0, 17.04], [17.0, 17.78], [30.0, 30.94], [32.0, 32.51], [38.0, 41.18], [47.0, 49.76], [52.0, 52.34], [55.0, 55.61], [57.0, 58.68], [60.0, 61.75], [63.0, 65.1], [69.0, 69.11], [71.0, 72.1], [73.0, 74.75], [76.0, 76.72], [78.0, 79.79], [82.0, 81.92], [83.0, 84.96]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.02, 39.69, 0.0, 0.0, 0.0, 0.0, 32.32, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["mains hum", 17.93], ["hum", 12.29], ["hiccup", 7.52]], [["hum", 11.06], ["eruption", 10.71], ["buzz", 8.87]], null, null, null, null, [["music", 10.35], ["hum", 10.04], ["speech", 8.15]], null, null, null, null, null, null, null], "duration": [0.34, 1.3, 0.16, 0.04, 0.78, 0.94, 0.51, 3.18, 2.76, 0.34, 0.61, 1.68, 1.75, 2.1, 0.11, 1.1, 1.75, 0.72, 1.79, -0.08, 1.96]} \ No newline at end of file diff --git a/annotations_filtered/gijYgnVD9vo_filtered.json b/annotations_filtered/gijYgnVD9vo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a0c53ab6fcdd91bc3eb88913ac19e270ac846665 --- /dev/null +++ b/annotations_filtered/gijYgnVD9vo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.48], [11.0, 12.48], [21.0, 22.76], [29.0, 28.92], [29.0, 35.95], [39.0, 41.23], [42.0, 51.43], [52.0, 53.18], [54.0, 54.58], [60.0, 60.4], [68.0, 69.08], [70.0, 70.98], [81.0, 86.85], [89.0, 97.68]], "keep_status": [false, false, false, false, true, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 48.19, 71.72, 47.08, 0.0, 0.0, 0.0, 0.0, 0.0, 66.63, 58.47], "audiomae_on_audioset": [null, null, null, null, [["music", 35.63], ["quack", 10.84], ["animal", 5.81]], null, [["animal", 35.29], ["music", 24.11], ["sheep", 9.06]], null, null, null, null, null, null, null], "duration": [1.48, 1.48, 1.76, -0.08, 6.95, 2.23, 9.43, 1.18, 0.58, 0.4, 1.08, 0.98, 5.85, 8.68]} \ No newline at end of file diff --git a/annotations_filtered/givOs4_nb-I_filtered.json b/annotations_filtered/givOs4_nb-I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c85e5d9d0e331c76a6d035d74d6176455aa4e4c8 --- /dev/null +++ b/annotations_filtered/givOs4_nb-I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 13.71], [21.0, 26.84], [30.0, 32.53], [38.0, 39.9], [43.0, 45.33], [48.0, 50.16], [51.0, 52.66], [54.0, 54.87]], "keep_status": [false, true, true, false, true, true, false, false], "silence_prob": [40.22, 43.61, 48.35, 0.0, 43.71, 44.32, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 59.26], ["hum", 11.12], ["mains hum", 6.07]], [["music", 28.21], ["hum", 21.07], ["throbbing", 12.22]], [["music", 36.91], ["speech", 14.36], ["synthesizer", 7.54]], null, [["hum", 23.67], ["music", 16.65], ["mains hum", 10.58]], [["music", 24.21], ["hum", 19.26], ["mains hum", 11.43]], null, null], "duration": [12.71, 5.84, 2.53, 1.9, 2.33, 2.16, 1.66, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/gj-Rl-cgKxM_filtered.json b/annotations_filtered/gj-Rl-cgKxM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c4488656f6997a9614df5bf27fabe52b5b93049 --- /dev/null +++ b/annotations_filtered/gj-Rl-cgKxM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 6.32], [9.0, 31.45], [31.0, 31.51], [32.0, 46.4], [47.0, 47.43], [49.0, 72.86], [76.0, 101.38], [104.0, 107.47], [110.0, 109.93], [115.0, 115.7], [119.0, 121.2]], "keep_status": [false, true, false, false, false, false, false, true, false, false, false], "silence_prob": [45.98, 35.86, 0.0, 33.95, 0.0, 35.97, 35.9, 39.74, 0.0, 0.0, 99.44], "audiomae_on_audioset": [[["mains hum", 57.21], ["hum", 39.07], ["speech", 0.78]], [["hum", 15.58], ["noise", 9.1], ["music", 7.33]], null, [["music", 77.56], ["musical instrument", 3.07], ["didgeridoo", 1.65]], null, [["music", 69.69], ["musical instrument", 5.86], ["guitar", 2.48]], [["music", 66.86], ["musical instrument", 5.76], ["trombone", 5.19]], [["cattle, bovinae", 25.66], ["moo", 19.09], ["speech", 17.48]], null, null, null], "duration": [5.32, 22.45, 0.51, 14.4, 0.43, 23.86, 25.38, 3.47, -0.07, 0.7, 2.2]} \ No newline at end of file diff --git a/annotations_filtered/gjWdFgV-Vz8_filtered.json b/annotations_filtered/gjWdFgV-Vz8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95b4c2fd65e218d76086f8ddb5d4d1fed5239f32 --- /dev/null +++ b/annotations_filtered/gjWdFgV-Vz8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.27], [22.0, 22.4], [31.0, 30.79], [36.0, 40.9], [46.0, 50.77], [61.0, 64.02], [65.0, 65.79], [66.0, 83.42]], "keep_status": [false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 33.59, 34.26, 34.18, 0.0, 34.28], "audiomae_on_audioset": [null, null, null, [["music", 69.16], ["guitar", 5.54], ["musical instrument", 4.12]], [["music", 65.52], ["musical instrument", 2.91], ["throbbing", 2.48]], [["music", 49.42], ["speech", 5.38], ["synthesizer", 4.83]], null, [["music", 77.31], ["musical instrument", 4.06], ["guitar", 2.69]]], "duration": [1.27, 0.4, -0.21, 4.9, 4.77, 3.02, 0.79, 17.42]} \ No newline at end of file diff --git a/annotations_filtered/gj_BH6Suku0_filtered.json b/annotations_filtered/gj_BH6Suku0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..50f5679b009fa7055fe66886cf2286ad05dbf5ed --- /dev/null +++ b/annotations_filtered/gj_BH6Suku0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.28], [9.0, 10.81], [12.0, 12.97], [16.0, 15.8], [38.0, 39.21], [41.0, 42.31], [46.0, 47.83], [52.0, 52.05], [59.0, 60.22], [67.0, 67.36], [88.0, 88.43], [92.0, 92.15], [99.0, 99.79], [103.0, 103.0], [105.0, 105.29], [108.0, 107.86], [127.0, 128.63], [131.0, 131.72], [140.0, 140.93], [146.0, 148.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [90.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.28, 1.81, 0.97, -0.2, 1.21, 1.31, 1.83, 0.05, 1.22, 0.36, 0.43, 0.15, 0.79, 0.0, 0.29, -0.14, 1.63, 0.72, 0.93, 2.34]} \ No newline at end of file diff --git a/annotations_filtered/gjjJePytKig_filtered.json b/annotations_filtered/gjjJePytKig_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..59ed6393b2e3da19a1b8e3a2636f3680bbd9bdad --- /dev/null +++ b/annotations_filtered/gjjJePytKig_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[89.0, 91.96], [93.0, 95.74], [96.0, 99.23], [100.0, 100.35], [101.0, 113.68], [114.0, 114.51], [115.0, 115.57], [116.0, 117.59], [120.0, 123.57], [124.0, 125.79], [129.0, 129.37], [131.0, 132.24], [135.0, 139.92], [141.0, 141.56], [142.0, 169.03], [170.0, 170.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.44, 95.37, 85.72, 0.0, 99.52, 0.0, 0.0, 0.0, 92.15, 0.0, 0.0, 0.0, 61.27, 0.0, 40.17, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 25.3], ["noise", 24.78], ["theremin", 20.77]], null], "duration": [2.96, 2.74, 3.23, 0.35, 12.68, 0.51, 0.57, 1.59, 3.57, 1.79, 0.37, 1.24, 4.92, 0.56, 27.03, 0.55]} \ No newline at end of file diff --git a/annotations_filtered/gjliVll3Uyw_filtered.json b/annotations_filtered/gjliVll3Uyw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..89db18ddadaba497a48acf2ad58fb226f7d9bf83 --- /dev/null +++ b/annotations_filtered/gjliVll3Uyw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 30.13], [31.0, 31.6], [33.0, 34.11], [36.0, 37.39], [38.0, 39.23], [41.0, 43.71], [46.0, 46.09], [49.0, 49.4], [53.0, 54.58], [55.0, 55.98], [58.0, 59.05], [60.0, 60.52], [63.0, 63.22], [65.0, 64.81], [66.0, 68.2], [69.0, 69.97], [77.0, 79.96], [82.0, 87.69]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 36.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.72, 0.0, 39.18, 36.38], "audiomae_on_audioset": [null, null, null, null, null, [["fart", 36.09], ["buzz", 7.47], ["fly, housefly", 7.39]], null, null, null, null, null, null, null, null, [["speech", 45.24], ["radio", 10.89], ["hum", 8.48]], null, [["frog", 11.27], ["hum", 10.83], ["noise", 7.93]], [["fly, housefly", 45.09], ["bee, wasp, etc.", 18.73], ["frog", 15.01]]], "duration": [1.13, 0.6, 1.11, 1.39, 1.23, 2.71, 0.09, 0.4, 1.58, 0.98, 1.05, 0.52, 0.22, -0.19, 2.2, 0.97, 2.96, 5.69]} \ No newline at end of file diff --git a/annotations_filtered/gjmt7I1OJfw_filtered.json b/annotations_filtered/gjmt7I1OJfw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d44217f613e3c80f021fa0135c2584d507fc0851 --- /dev/null +++ b/annotations_filtered/gjmt7I1OJfw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.03], [11.0, 13.15], [14.0, 14.94], [17.0, 18.08], [19.0, 19.99], [22.0, 22.47], [26.0, 26.65], [29.0, 29.15], [61.0, 61.37], [65.0, 65.55], [101.0, 106.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 41.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.71], "audiomae_on_audioset": [null, [["livestock, farm animals, working animals", 49.82], ["cattle, bovinae", 27.43], ["moo", 17.53]], null, null, null, null, null, null, null, null, null], "duration": [0.03, 2.15, 0.94, 1.08, 0.99, 0.47, 0.65, 0.15, 0.37, 0.55, 5.32]} \ No newline at end of file diff --git a/annotations_filtered/gjuizikJ2bk_filtered.json b/annotations_filtered/gjuizikJ2bk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f2ca4dd43c60773beb2355abb3f63e9f77f57c43 --- /dev/null +++ b/annotations_filtered/gjuizikJ2bk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 9.96], [15.0, 21.91], [23.0, 24.04], [27.0, 28.24], [30.0, 31.08], [33.0, 40.83], [47.0, 48.56], [50.0, 52.08], [54.0, 55.58], [58.0, 60.2], [66.0, 69.01], [72.0, 73.47], [76.0, 79.57], [82.0, 83.2], [84.0, 85.53], [87.0, 91.37], [93.0, 93.41], [95.0, 122.89], [125.0, 125.95], [127.0, 134.49], [136.0, 138.89], [141.0, 177.74]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [45.14, 54.17, 0.0, 0.0, 0.0, 70.44, 0.0, 61.57, 0.0, 65.2, 66.03, 0.0, 78.55, 0.0, 0.0, 44.78, 0.0, 55.39, 0.0, 51.99, 78.04, 0.0], "audiomae_on_audioset": [[["sine wave", 36.9], ["chirp tone", 18.55], ["hum", 6.03]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 39.04], ["mains hum", 27.98], ["music", 9.87]], null, null, null, null, null, null], "duration": [6.96, 6.91, 1.04, 1.24, 1.08, 7.83, 1.56, 2.08, 1.58, 2.2, 3.01, 1.47, 3.57, 1.2, 1.53, 4.37, 0.41, 27.89, 0.95, 7.49, 2.89, 36.74]} \ No newline at end of file diff --git a/annotations_filtered/gkGFvtW0CSE_filtered.json b/annotations_filtered/gkGFvtW0CSE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e40db6065323e54565e17d3c9a509bbb2e51fbc --- /dev/null +++ b/annotations_filtered/gkGFvtW0CSE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.44], [4.0, 7.05], [9.0, 24.75], [31.0, 95.35], [96.0, 107.62]], "keep_status": [false, true, false, false, false], "silence_prob": [0.0, 44.2, 40.38, 0.0, 30.67], "audiomae_on_audioset": [null, [["music", 47.85], ["didgeridoo", 9.77], ["musical instrument", 7.77]], [["music", 51.76], ["speech", 18.35], ["didgeridoo", 16.6]], null, [["music", 75.11], ["didgeridoo", 14.71], ["fart", 3.13]]], "duration": [1.44, 3.05, 15.75, 64.35, 11.62]} \ No newline at end of file diff --git a/annotations_filtered/gkJAPsQ2YHE_filtered.json b/annotations_filtered/gkJAPsQ2YHE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..be8b207cd10361366ca595887c6c2c3198308715 --- /dev/null +++ b/annotations_filtered/gkJAPsQ2YHE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.56], [21.0, 21.64], [26.0, 38.35], [40.0, 40.12], [44.0, 44.29], [47.0, 47.38], [48.0, 49.1]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 33.45, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 86.94], ["sidetone", 4.55], ["music", 1.75]], null, null, null, null], "duration": [1.56, 0.64, 12.35, 0.12, 0.29, 0.38, 1.1]} \ No newline at end of file diff --git a/annotations_filtered/gkfAyFT8xGc_filtered.json b/annotations_filtered/gkfAyFT8xGc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b6fa083177e60d7260c41afb26dbc786a7b8062f --- /dev/null +++ b/annotations_filtered/gkfAyFT8xGc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 25.05], [29.0, 30.23], [31.0, 32.34], [39.0, 39.43], [40.0, 65.69], [66.0, 67.41], [69.0, 75.88]], "keep_status": [false, false, false, false, false, false, true], "silence_prob": [34.74, 0.0, 0.0, 0.0, 40.81, 0.0, 49.0], "audiomae_on_audioset": [[["music", 69.55], ["synthesizer", 7.24], ["musical instrument", 6.31]], null, null, null, [["music", 34.75], ["speech", 28.0], ["synthesizer", 9.98]], null, [["mains hum", 38.84], ["hum", 12.69], ["chirp tone", 10.41]]], "duration": [24.05, 1.23, 1.34, 0.43, 25.69, 1.41, 6.88]} \ No newline at end of file diff --git a/annotations_filtered/gknobwKAStE_filtered.json b/annotations_filtered/gknobwKAStE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..859235439af397d85cc4362a557852fa0ba2514a --- /dev/null +++ b/annotations_filtered/gknobwKAStE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.36], [14.0, 14.84], [22.0, 22.79], [23.0, 32.63], [43.0, 43.17], [43.0, 43.24], [45.0, 48.49], [49.0, 52.88], [64.0, 64.54], [68.0, 68.3], [74.0, 74.46], [79.0, 79.25], [85.0, 86.81], [90.0, 90.78], [100.0, 99.98], [103.0, 103.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 45.69, 0.0, 0.0, 90.25, 46.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 62.81], ["boing", 4.25], ["synthesizer", 4.11]], null, null, null, [["music", 46.3], ["speech", 21.87], ["didgeridoo", 6.3]], null, null, null, null, null, null, null, null], "duration": [0.36, 0.84, 0.79, 9.63, 0.17, 0.24, 3.49, 3.88, 0.54, 0.3, 0.46, 0.25, 1.81, 0.78, -0.02, 0.18]} \ No newline at end of file diff --git a/annotations_filtered/glMgSCdK1xU_filtered.json b/annotations_filtered/glMgSCdK1xU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..94c6cf78a9ee52d879cf4b09caf1306655cd5ac9 --- /dev/null +++ b/annotations_filtered/glMgSCdK1xU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.01], [4.0, 5.1], [8.0, 10.62], [11.0, 12.92], [15.0, 16.24], [19.0, 20.48], [22.0, 22.42], [25.0, 27.11], [30.0, 30.52], [33.0, 35.46], [37.0, 37.47], [38.0, 38.38], [40.0, 43.51], [46.0, 48.56], [50.0, 52.54], [54.0, 55.0], [63.0, 64.61], [66.0, 67.95], [72.0, 72.89], [75.0, 76.45], [78.0, 79.12], [81.0, 83.57], [84.0, 85.99], [91.0, 91.27], [93.0, 93.51], [94.0, 97.58], [99.0, 100.06], [104.0, 106.76], [110.0, 112.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [93.45, 0.0, 99.1, 0.0, 0.0, 0.0, 0.0, 99.05, 0.0, 99.52, 0.0, 0.0, 99.16, 99.59, 93.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.28, 0.0, 0.0, 0.0, 90.08, 0.0, 77.53, 75.07], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.01, 1.1, 2.62, 1.92, 1.24, 1.48, 0.42, 2.11, 0.52, 2.46, 0.47, 0.38, 3.51, 2.56, 2.54, 1.0, 1.61, 1.95, 0.89, 1.45, 1.12, 2.57, 1.99, 0.27, 0.51, 3.58, 1.06, 2.76, 2.18]} \ No newline at end of file diff --git a/annotations_filtered/glNH68Iaa3E_filtered.json b/annotations_filtered/glNH68Iaa3E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dfe5b33c99bc59cef721a2bdccf7de32c8db3931 --- /dev/null +++ b/annotations_filtered/glNH68Iaa3E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.88], [9.0, 15.42], [17.0, 23.31], [24.0, 24.07], [27.0, 31.01], [35.0, 35.56], [37.0, 49.91], [53.0, 54.04], [56.0, 64.13], [66.0, 66.48], [67.0, 67.93], [70.0, 81.35], [82.0, 83.05], [84.0, 84.01], [85.0, 86.58], [90.0, 89.95], [91.0, 91.71], [94.0, 93.97], [95.0, 98.39], [101.0, 102.12], [103.0, 105.38], [108.0, 111.28], [112.0, 121.83], [130.0, 130.98], [133.0, 133.64], [135.0, 135.8], [138.0, 138.03], [142.0, 143.6], [146.0, 147.6], [153.0, 154.95], [158.0, 163.34], [165.0, 165.55], [167.0, 167.41], [167.0, 167.63]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 32.37, 30.81, 0.0, 29.16, 0.0, 30.07, 0.0, 29.23, 0.0, 0.0, 40.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.91, 0.0, 38.82, 34.36, 50.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.35, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["throbbing", 54.07], ["music", 21.66], ["hum", 16.63]], [["music", 44.8], ["speech", 28.88], ["throbbing", 4.45]], null, [["music", 61.48], ["cacophony", 7.7], ["musical instrument", 3.74]], null, [["speech", 28.16], ["throbbing", 19.47], ["music", 19.09]], null, [["speech", 46.16], ["music", 22.05], ["cacophony", 9.74]], null, null, [["music", 58.54], ["synthesizer", 16.26], ["sampler", 5.25]], null, null, null, null, null, null, null, null, [["music", 41.33], ["hum", 26.97], ["throbbing", 8.18]], [["music", 40.33], ["throbbing", 17.5], ["hum", 9.91]], null, null, null, null, null, null, null, null, [["music", 46.26], ["synthesizer", 10.14], ["throbbing", 5.75]], null, null, null], "duration": [1.88, 6.42, 6.31, 0.07, 4.01, 0.56, 12.91, 1.04, 8.13, 0.48, 0.93, 11.35, 1.05, 0.01, 1.58, -0.05, 0.71, -0.03, 3.39, 1.12, 2.38, 3.28, 9.83, 0.98, 0.64, 0.8, 0.03, 1.6, 1.6, 1.95, 5.34, 0.55, 0.41, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/gm-sqEK2InM_filtered.json b/annotations_filtered/gm-sqEK2InM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..698cd64d78a2456e701d9941b08ee0ef8bb8e862 --- /dev/null +++ b/annotations_filtered/gm-sqEK2InM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.43], [14.0, 15.77], [17.0, 17.32], [19.0, 19.21], [19.0, 30.64], [32.0, 33.44], [34.0, 62.97], [65.0, 66.48], [72.0, 73.63], [74.0, 74.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 93.29, 0.0, 96.17, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [1.43, 1.77, 0.32, 0.21, 11.64, 1.44, 28.97, 1.48, 1.63, 0.24]} \ No newline at end of file diff --git a/annotations_filtered/gm0I_zdgs8o_filtered.json b/annotations_filtered/gm0I_zdgs8o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d918513d26d880186f831d9c855ea7b61b9db030 --- /dev/null +++ b/annotations_filtered/gm0I_zdgs8o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 9.07], [10.0, 9.75], [10.0, 42.11], [44.0, 56.66], [58.0, 61.65], [65.0, 64.71], [67.0, 96.31], [103.0, 106.54], [111.0, 113.97], [116.0, 145.89]], "keep_status": [true, false, false, false, false, false, true, false, false, false], "silence_prob": [47.2, 0.0, 0.0, 87.92, 99.82, 0.0, 31.48, 46.26, 64.97, 52.98], "audiomae_on_audioset": [[["speech", 28.37], ["music", 15.36], ["buzz", 5.68]], null, null, null, null, null, [["music", 47.49], ["whale vocalization", 9.78], ["hum", 8.78]], [["mosquito", 58.02], ["fly, housefly", 14.72], ["throbbing", 4.8]], null, null], "duration": [6.07, -0.25, 32.11, 12.66, 3.65, -0.29, 29.31, 3.54, 2.97, 29.89]} \ No newline at end of file diff --git a/annotations_filtered/gm2PdV3UPfc_filtered.json b/annotations_filtered/gm2PdV3UPfc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9693721bf6393cf039e26ef582fde99118b9d864 --- /dev/null +++ b/annotations_filtered/gm2PdV3UPfc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.42], [11.0, 12.83], [16.0, 16.55], [18.0, 19.33], [21.0, 23.33], [25.0, 28.14], [33.0, 47.28], [49.0, 48.98], [51.0, 52.02], [55.0, 56.39], [58.0, 58.78], [61.0, 62.36], [66.0, 66.6], [71.0, 72.54], [79.0, 79.56]], "keep_status": [true, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [33.94, 0.0, 0.0, 0.0, 88.1, 91.81, 35.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["cowbell", 12.44], ["boing", 11.72], ["breaking", 11.09]], null, null, null, null, null, [["speech", 46.98], ["sidetone", 6.25], ["explosion", 5.27]], null, null, null, null, null, null, null, null], "duration": [2.42, 1.83, 0.55, 1.33, 2.33, 3.14, 14.28, -0.02, 1.02, 1.39, 0.78, 1.36, 0.6, 1.54, 0.56]} \ No newline at end of file diff --git a/annotations_filtered/gmElew2NIS8_filtered.json b/annotations_filtered/gmElew2NIS8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f34e075987c2f1494f34da60718ad9371da07ea3 --- /dev/null +++ b/annotations_filtered/gmElew2NIS8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.9], [7.0, 7.82], [14.0, 14.98], [16.0, 16.75], [18.0, 18.96], [20.0, 20.63], [27.0, 27.19], [30.0, 29.88], [47.0, 51.66], [52.0, 53.54], [56.0, 56.79], [58.0, 58.01], [58.0, 58.72], [60.0, 59.71], [60.0, 59.81], [60.0, 59.85], [60.0, 60.66], [63.0, 72.93], [73.0, 74.07], [75.0, 75.39], [77.0, 77.79], [79.0, 84.55], [90.0, 103.89], [105.0, 107.52], [110.0, 121.47], [125.0, 141.22]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.24, 0.0, 0.0, 0.0, 42.65, 36.8, 43.33, 34.31, 31.75], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["baby cry, infant cry", 17.26], ["moo", 14.65], ["cattle, bovinae", 14.35]], null, null, null, null, null, null, null, null, null, null, null, null, [["dog", 13.53], ["fart", 11.0], ["animal", 7.82]], [["speech", 29.72], ["fart", 5.87], ["explosion", 5.33]], [["fly, housefly", 15.48], ["insect", 12.95], ["speech", 11.24]], [["speech", 40.13], ["wail, moan", 8.15], ["groan", 3.52]], [["livestock, farm animals, working animals", 32.47], ["cattle, bovinae", 31.07], ["moo", 17.17]]], "duration": [1.9, 0.82, 0.98, 0.75, 0.96, 0.63, 0.19, -0.12, 4.66, 1.54, 0.79, 0.01, 0.72, -0.29, -0.19, -0.15, 0.66, 9.93, 1.07, 0.39, 0.79, 5.55, 13.89, 2.52, 11.47, 16.22]} \ No newline at end of file diff --git a/annotations_filtered/gmJtNjLjsNQ_filtered.json b/annotations_filtered/gmJtNjLjsNQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f26d9e514315f2f0516997787757a034e276aca8 --- /dev/null +++ b/annotations_filtered/gmJtNjLjsNQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[60.0, 71.91], [73.0, 76.28], [77.0, 80.23], [81.0, 83.05], [83.0, 84.55], [86.0, 86.71], [88.0, 91.12], [92.0, 99.99], [100.0, 107.03], [107.0, 124.78], [127.0, 127.18], [128.0, 134.28], [135.0, 141.22], [142.0, 157.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [91.81, 95.23, 92.15, 95.23, 0.0, 0.0, 97.43, 97.0, 80.46, 72.6, 0.0, 73.51, 78.21, 70.72], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [11.91, 3.28, 3.23, 2.05, 1.55, 0.71, 3.12, 7.99, 7.03, 17.78, 0.18, 6.28, 6.22, 15.76]} \ No newline at end of file diff --git a/annotations_filtered/gmSeaKdO9IQ_filtered.json b/annotations_filtered/gmSeaKdO9IQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ed58bd7e2a62e5c04e2b29dcb0e51c01f41260d --- /dev/null +++ b/annotations_filtered/gmSeaKdO9IQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 24.98], [27.0, 28.07], [29.0, 30.4], [35.0, 34.77], [36.0, 36.44], [41.0, 41.32], [43.0, 46.68], [48.0, 49.98], [51.0, 52.81], [54.0, 62.8], [64.0, 75.14], [77.0, 82.68], [84.0, 108.94], [110.0, 111.03], [114.0, 116.24], [117.0, 117.64]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, true, false, true, false], "silence_prob": [47.5, 0.0, 0.0, 0.0, 0.0, 0.0, 60.23, 0.0, 0.0, 33.62, 73.36, 54.63, 38.2, 0.0, 44.32, 0.0], "audiomae_on_audioset": [[["speech", 73.61], ["sidetone", 5.37], ["speech synthesizer", 3.8]], null, null, null, null, null, null, null, null, [["music", 44.91], ["gong", 5.54], ["fly, housefly", 5.13]], null, null, [["music", 14.99], ["effects unit", 14.09], ["singing bowl", 13.14]], null, [["music", 35.16], ["noise", 7.58], ["hum", 6.17]], null], "duration": [4.98, 1.07, 1.4, -0.23, 0.44, 0.32, 3.68, 1.98, 1.81, 8.8, 11.14, 5.68, 24.94, 1.03, 2.24, 0.64]} \ No newline at end of file diff --git a/annotations_filtered/gmYSTObayoY_filtered.json b/annotations_filtered/gmYSTObayoY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18193f1320a98d807e6cc4635b0aac28ddf215f2 --- /dev/null +++ b/annotations_filtered/gmYSTObayoY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.51], [6.0, 9.88], [13.0, 14.52], [17.0, 18.52], [19.0, 19.33], [20.0, 24.83], [37.0, 45.37], [48.0, 50.43], [52.0, 51.87], [52.0, 53.33], [54.0, 54.46], [56.0, 59.17], [61.0, 87.67], [88.0, 116.78], [123.0, 125.04], [129.0, 130.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [71.0, 66.39, 0.0, 0.0, 0.0, 42.96, 53.16, 40.55, 0.0, 0.0, 0.0, 60.32, 41.62, 35.15, 39.07, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 50.69], ["boing", 12.52], ["speech", 11.27]], null, [["music", 62.88], ["synthesizer", 4.82], ["musical instrument", 4.09]], null, null, null, null, [["music", 56.5], ["hum", 7.56], ["theremin", 7.0]], [["music", 73.61], ["didgeridoo", 8.11], ["hum", 2.85]], [["music", 36.38], ["speech", 13.35], ["hum", 8.1]], null], "duration": [2.51, 3.88, 1.52, 1.52, 0.33, 4.83, 8.37, 2.43, -0.13, 1.33, 0.46, 3.17, 26.67, 28.78, 2.04, 1.08]} \ No newline at end of file diff --git a/annotations_filtered/gmbInMp4ioU_filtered.json b/annotations_filtered/gmbInMp4ioU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..12a9f13e48f85754ac18fc8e898d748019474af6 --- /dev/null +++ b/annotations_filtered/gmbInMp4ioU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.18], [52.0, 52.05], [54.0, 60.76], [68.0, 68.94], [71.0, 71.02], [73.0, 78.54], [82.0, 85.95], [88.0, 96.15], [100.0, 99.6], [103.0, 103.18], [105.0, 106.14], [115.0, 115.52], [118.0, 118.44], [119.0, 119.99]], "keep_status": [false, false, true, false, false, true, false, true, false, false, false, false, false, false], "silence_prob": [98.66, 0.0, 31.94, 0.0, 0.0, 32.35, 65.09, 33.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 41.99], ["thunk", 12.55], ["boing", 11.75]], null, null, [["thunk", 41.31], ["speech", 10.12], ["breaking", 6.66]], null, [["speech", 44.58], ["cowbell", 7.65], ["animal", 7.48]], null, null, null, null, null, null], "duration": [2.18, 0.05, 6.76, 0.94, 0.02, 5.54, 3.95, 8.15, -0.4, 0.18, 1.14, 0.52, 0.44, 0.99]} \ No newline at end of file diff --git a/annotations_filtered/gmedATt5viM_filtered.json b/annotations_filtered/gmedATt5viM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5630560afe8e3ba08797c1a70ff861e31fb1859e --- /dev/null +++ b/annotations_filtered/gmedATt5viM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[40.0, 88.7], [89.0, 105.0], [106.0, 106.62], [108.0, 112.8], [113.0, 115.2], [118.0, 126.99], [128.0, 128.8]], "keep_status": [false, true, false, false, false, false, false], "silence_prob": [0.0, 37.22, 0.0, 80.29, 79.07, 78.55, 0.0], "audiomae_on_audioset": [null, [["grunt", 22.91], ["music", 21.63], ["speech", 10.31]], null, null, null, null, null], "duration": [48.7, 16.0, 0.62, 4.8, 2.2, 8.99, 0.8]} \ No newline at end of file diff --git a/annotations_filtered/gmnU4tK8GOo_filtered.json b/annotations_filtered/gmnU4tK8GOo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b863e4493786c06d708a5d926d0f8335ec9384c --- /dev/null +++ b/annotations_filtered/gmnU4tK8GOo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 38.28], [39.0, 66.21], [74.0, 75.84], [76.0, 119.82], [120.0, 121.17], [124.0, 128.12], [139.0, 141.32], [142.0, 144.58], [146.0, 146.62], [147.0, 147.82]], "keep_status": [true, true, false, false, false, true, false, false, false, false], "silence_prob": [39.74, 32.14, 0.0, 0.0, 0.0, 31.46, 62.07, 59.77, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 32.5], ["throbbing", 13.37], ["hum", 8.0]], [["breaking", 30.82], ["glass", 19.01], ["music", 13.27]], null, null, null, [["whack, thwack", 21.19], ["thunk", 15.31], ["speech", 9.09]], null, null, null, null], "duration": [2.28, 27.21, 1.84, 43.82, 1.17, 4.12, 2.32, 2.58, 0.62, 0.82]} \ No newline at end of file diff --git a/annotations_filtered/gmo_PhSftuc_filtered.json b/annotations_filtered/gmo_PhSftuc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed87b37aa5734819aa9381022469f6cdfa84db1d --- /dev/null +++ b/annotations_filtered/gmo_PhSftuc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 26.01], [27.0, 28.17], [29.0, 31.23], [33.0, 33.74], [34.0, 35.28], [41.0, 51.9], [53.0, 56.32], [58.0, 58.77], [63.0, 80.94], [82.0, 84.28], [85.0, 90.49], [91.0, 94.69], [99.0, 100.01], [102.0, 103.74], [106.0, 122.62]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [96.77, 0.0, 57.97, 0.0, 0.0, 37.58, 96.54, 0.0, 65.2, 63.1, 67.13, 80.46, 0.0, 0.0, 80.64], "audiomae_on_audioset": [null, null, null, null, null, [["fart", 20.12], ["speech", 7.38], ["creak", 6.77]], null, null, null, null, null, null, null, null, null], "duration": [2.01, 1.17, 2.23, 0.74, 1.28, 10.9, 3.32, 0.77, 17.94, 2.28, 5.49, 3.69, 1.01, 1.74, 16.62]} \ No newline at end of file diff --git a/annotations_filtered/gnI8phF08PE_filtered.json b/annotations_filtered/gnI8phF08PE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..71a67d07f6f6099ba436c903ec7d11dbe1c90551 --- /dev/null +++ b/annotations_filtered/gnI8phF08PE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.77], [5.0, 4.8], [7.0, 7.55], [11.0, 12.61], [13.0, 14.57], [17.0, 19.25], [20.0, 23.13], [26.0, 27.31], [33.0, 32.85], [36.0, 37.77], [39.0, 39.02], [40.0, 40.78]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [48.35, 0.0, 0.0, 0.0, 0.0, 30.67, 61.87, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 28.09], ["speech", 15.48], ["livestock, farm animals, working animals", 7.28]], null, null, null, null, [["speech", 42.89], ["music", 24.46], ["boing", 14.36]], null, null, null, null, null, null], "duration": [3.77, -0.2, 0.55, 1.61, 1.57, 2.25, 3.13, 1.31, -0.15, 1.77, 0.02, 0.78]} \ No newline at end of file diff --git a/annotations_filtered/gnWkYf8Peo8_filtered.json b/annotations_filtered/gnWkYf8Peo8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cea6ef870f3bd58e0058055fd2be921c66e4673a --- /dev/null +++ b/annotations_filtered/gnWkYf8Peo8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.64], [17.0, 17.17], [17.0, 17.98], [21.0, 32.12], [33.0, 38.42], [39.0, 40.24], [42.0, 42.47], [43.0, 45.28], [46.0, 47.9], [49.0, 49.32], [50.0, 51.56], [53.0, 68.64], [72.0, 113.12], [113.0, 117.0], [120.0, 158.03]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 35.56, 81.89, 0.0, 0.0, 82.43, 0.0, 0.0, 0.0, 40.38, 0.0, 30.39, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 42.21], ["hum", 9.96], ["breaking", 9.36]], null, null, null, null, null, null, null, [["music", 18.13], ["fart", 8.88], ["ambient music", 8.73]], null, [["whale vocalization", 15.09], ["music", 14.18], ["buzz", 9.16]], null], "duration": [1.64, 0.17, 0.98, 11.12, 5.42, 1.24, 0.47, 2.28, 1.9, 0.32, 1.56, 15.64, 41.12, 4.0, 38.03]} \ No newline at end of file diff --git a/annotations_filtered/gnY0vVF0j60_filtered.json b/annotations_filtered/gnY0vVF0j60_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c4b236d1a06309043abf1196a3350b6cde14e6fa --- /dev/null +++ b/annotations_filtered/gnY0vVF0j60_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.49], [8.0, 9.1], [10.0, 22.28], [23.0, 24.78], [26.0, 27.94], [28.0, 29.1], [35.0, 35.95], [37.0, 38.26], [40.0, 41.59], [42.0, 43.04], [44.0, 45.0], [46.0, 47.17], [52.0, 53.99], [55.0, 55.81], [60.0, 61.38], [64.0, 65.16], [76.0, 77.99], [85.0, 85.89], [87.0, 87.96], [89.0, 89.61], [90.0, 97.36], [99.0, 123.77], [128.0, 130.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 86.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.06, 31.93, 98.1], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 71.26], ["synthesizer", 6.12], ["throbbing", 3.19]], [["speech", 54.58], ["vehicle", 12.99], ["buzz", 10.38]], null], "duration": [0.49, 1.1, 12.28, 1.78, 1.94, 1.1, 0.95, 1.26, 1.59, 1.04, 1.0, 1.17, 1.99, 0.81, 1.38, 1.16, 1.99, 0.89, 0.96, 0.61, 7.36, 24.77, 2.25]} \ No newline at end of file diff --git a/annotations_filtered/gnaDj74UMqs_filtered.json b/annotations_filtered/gnaDj74UMqs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d466741e74d2225ba257c517438521d39c5c3c7e --- /dev/null +++ b/annotations_filtered/gnaDj74UMqs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.17], [7.0, 10.12], [11.0, 13.07], [24.0, 24.16], [25.0, 32.46], [35.0, 37.32], [38.0, 39.01], [43.0, 43.06], [45.0, 45.81], [49.0, 49.62], [50.0, 50.77], [53.0, 56.42], [58.0, 61.08], [61.0, 61.62], [64.0, 65.21], [68.0, 76.05], [78.0, 80.23], [82.0, 87.29], [87.0, 88.59], [94.0, 95.72], [97.0, 97.82], [100.0, 101.44], [102.0, 107.1], [112.0, 112.35], [112.0, 113.14], [124.0, 125.27], [129.0, 128.66], [130.0, 130.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.26, 98.44, 0.0, 56.25, 55.89, 0.0, 0.0, 0.0, 0.0, 0.0, 48.14, 39.52, 0.0, 0.0, 60.79, 99.76, 94.95, 0.0, 0.0, 0.0, 0.0, 98.27, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 31.18], ["speech", 23.2], ["didgeridoo", 8.24]], [["music", 34.94], ["musical instrument", 16.11], ["guitar", 5.49]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.17, 3.12, 2.07, 0.16, 7.46, 2.32, 1.01, 0.06, 0.81, 0.62, 0.77, 3.42, 3.08, 0.62, 1.21, 8.05, 2.23, 5.29, 1.59, 1.72, 0.82, 1.44, 5.1, 0.35, 1.14, 1.27, -0.34, 0.15]} \ No newline at end of file diff --git a/annotations_filtered/gnallHWgupY_filtered.json b/annotations_filtered/gnallHWgupY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d4abc0a73a098e3b2c6d08e8ffe99e5bea44e1c4 --- /dev/null +++ b/annotations_filtered/gnallHWgupY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.17], [4.0, 4.72], [6.0, 6.64], [8.0, 15.97], [17.0, 18.77], [22.0, 21.86], [26.0, 26.84], [28.0, 30.0], [30.0, 30.99], [33.0, 33.54], [43.0, 43.93], [47.0, 48.59], [52.0, 53.15], [57.0, 57.86], [63.0, 65.08], [69.0, 75.63], [80.0, 81.38], [83.0, 84.13], [86.0, 85.99], [88.0, 89.38], [93.0, 93.48], [95.0, 97.83], [99.0, 99.06], [103.0, 116.94], [119.0, 120.45], [121.0, 130.62], [131.0, 175.71], [179.0, 179.96], [181.0, 181.72], [184.0, 184.28], [186.0, 186.49], [188.0, 193.5], [195.0, 195.83], [198.0, 199.13], [202.0, 202.53], [204.0, 208.14], [208.0, 212.95], [213.0, 214.68], [216.0, 217.17]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, true, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 45.14, 0.0, 0.0, 0.0, 75.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.12, 33.06, 0.0, 0.0, 0.0, 0.0, 0.0, 31.03, 0.0, 30.81, 0.0, 30.63, 0.0, 0.0, 0.0, 0.0, 0.0, 53.1, 0.0, 0.0, 0.0, 37.15, 34.02, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 24.61], ["synthesizer", 14.57], ["whale vocalization", 5.99]], null, null, null, null, null, null, null, null, null, null, [["speech", 32.9], ["music", 14.16], ["vehicle", 7.28]], [["cattle, bovinae", 30.3], ["moo", 27.05], ["livestock, farm animals, working animals", 14.49]], null, null, null, null, null, [["music", 28.74], ["vehicle", 10.32], ["speech", 4.47]], null, [["music", 40.12], ["whale vocalization", 3.76], ["buzz", 3.15]], null, [["music", 51.47], ["speech", 6.16], ["whack, thwack", 4.68]], null, null, null, null, null, null, null, null, null, [["hum", 32.16], ["glass", 21.03], ["mains hum", 11.64]], [["music", 38.37], ["speech", 32.85], ["electronic music", 1.44]], null, null], "duration": [1.17, 0.72, 0.64, 7.97, 1.77, -0.14, 0.84, 2.0, 0.99, 0.54, 0.93, 1.59, 1.15, 0.86, 2.08, 6.63, 1.38, 1.13, -0.01, 1.38, 0.48, 2.83, 0.06, 13.94, 1.45, 9.62, 44.71, 0.96, 0.72, 0.28, 0.49, 5.5, 0.83, 1.13, 0.53, 4.14, 4.95, 1.68, 1.17]} \ No newline at end of file diff --git a/annotations_filtered/gnbjy2tWfd4_filtered.json b/annotations_filtered/gnbjy2tWfd4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..94d42bf6cbcc9aa45b54957d18d18a93497a9e79 --- /dev/null +++ b/annotations_filtered/gnbjy2tWfd4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.77], [50.0, 51.34], [86.0, 87.76]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [0.77, 1.34, 1.76]} \ No newline at end of file diff --git a/annotations_filtered/gnfp7yyQgH8_filtered.json b/annotations_filtered/gnfp7yyQgH8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dad5d13aaf9af920594ec3e3fe786bb42339da37 --- /dev/null +++ b/annotations_filtered/gnfp7yyQgH8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 30.91], [31.0, 34.72], [36.0, 38.18], [49.0, 60.08], [61.0, 64.22], [66.0, 66.65], [82.0, 82.41], [85.0, 90.31], [93.0, 101.12], [104.0, 120.36], [131.0, 131.35]], "keep_status": [false, false, true, false, true, false, false, false, false, false, false], "silence_prob": [47.39, 45.3, 49.09, 48.74, 34.3, 0.0, 0.0, 42.39, 33.77, 31.0, 0.0], "audiomae_on_audioset": [[["music", 86.54], ["speech", 1.75], ["electronic music", 1.07]], [["music", 71.41], ["hum", 7.14], ["musical instrument", 3.91]], [["music", 37.52], ["gong", 21.0], ["singing bowl", 9.54]], [["throbbing", 48.04], ["hum", 32.25], ["music", 6.26]], [["music", 27.37], ["synthesizer", 24.01], ["sonar", 12.25]], null, null, [["hum", 46.68], ["sidetone", 19.51], ["speech", 11.61]], [["music", 52.55], ["speech", 24.09], ["hum", 4.07]], [["hum", 52.52], ["mains hum", 23.73], ["throbbing", 6.89]], null], "duration": [12.91, 3.72, 2.18, 11.08, 3.22, 0.65, 0.41, 5.31, 8.12, 16.36, 0.35]} \ No newline at end of file diff --git a/annotations_filtered/gnlvKhPzx5A_filtered.json b/annotations_filtered/gnlvKhPzx5A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/gnlvKhPzx5A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/gnz7BQ7lxJQ_filtered.json b/annotations_filtered/gnz7BQ7lxJQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f88d9d0f071ef3f636af2f5a1c7d869e282a9c4 --- /dev/null +++ b/annotations_filtered/gnz7BQ7lxJQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[76.0, 111.67], [113.0, 114.18], [116.0, 121.1], [122.0, 121.74], [122.0, 124.23], [125.0, 125.44]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 79.59, 0.0, 84.25, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [35.67, 1.18, 5.1, -0.26, 2.23, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/go4K4rCFjMQ_filtered.json b/annotations_filtered/go4K4rCFjMQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97ca9fba01d9cc826a0764b19077352e1d5582a2 --- /dev/null +++ b/annotations_filtered/go4K4rCFjMQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 31.68], [35.0, 35.94], [37.0, 40.0], [50.0, 50.55], [53.0, 55.11], [60.0, 60.37], [64.0, 64.61], [69.0, 72.59], [76.0, 75.93], [80.0, 80.33], [82.0, 82.24], [84.0, 84.18], [95.0, 96.01], [97.0, 96.97], [98.0, 98.02], [101.0, 103.84], [112.0, 112.31], [113.0, 113.63], [115.0, 115.48], [117.0, 117.07], [119.0, 119.23], [119.0, 120.18], [120.0, 124.85], [126.0, 133.02], [134.0, 134.97], [137.0, 151.17], [174.0, 174.33], [190.0, 190.48], [197.0, 199.18], [203.0, 202.8], [207.0, 210.19], [214.0, 214.29], [223.0, 225.17], [226.0, 226.47]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 41.66, 0.0, 36.37, 0.0, 0.0, 33.32, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.11, 33.48, 0.0, 31.67, 0.0, 0.0, 31.79, 0.0, 32.83, 0.0, 35.15, 0.0], "audiomae_on_audioset": [null, null, [["music", 46.23], ["didgeridoo", 18.28], ["musical instrument", 5.53]], null, [["music", 62.25], ["musical instrument", 10.52], ["theremin", 9.78]], null, null, [["music", 26.65], ["didgeridoo", 23.55], ["effects unit", 6.22]], null, null, null, null, null, null, null, [["music", 48.0], ["musical instrument", 6.55], ["synthesizer", 6.11]], null, null, null, null, null, null, [["music", 32.19], ["hum", 13.52], ["synthesizer", 9.17]], [["theremin", 33.86], ["music", 31.86], ["quack", 5.29]], null, [["music", 72.38], ["musical instrument", 3.71], ["quack", 3.16]], null, null, [["music", 50.91], ["didgeridoo", 28.59], ["theremin", 5.06]], null, [["music", 35.42], ["gong", 20.91], ["musical instrument", 6.18]], null, [["theremin", 60.77], ["music", 20.91], ["ambient music", 5.21]], null], "duration": [-0.32, 0.94, 3.0, 0.55, 2.11, 0.37, 0.61, 3.59, -0.07, 0.33, 0.24, 0.18, 1.01, -0.03, 0.02, 2.84, 0.31, 0.63, 0.48, 0.07, 0.23, 1.18, 4.85, 7.02, 0.97, 14.17, 0.33, 0.48, 2.18, -0.2, 3.19, 0.29, 2.17, 0.47]} \ No newline at end of file diff --git a/annotations_filtered/goAo5dC8P1s_filtered.json b/annotations_filtered/goAo5dC8P1s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..55ac142fbac9ae381b2e1b765d4765bbfbeeb572 --- /dev/null +++ b/annotations_filtered/goAo5dC8P1s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.82], [20.0, 20.26], [41.0, 41.37], [49.0, 49.72], [52.0, 53.32], [70.0, 70.48], [74.0, 74.65], [78.0, 78.78], [86.0, 89.95], [100.0, 100.13], [114.0, 140.1], [143.0, 167.95], [168.0, 171.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.6, 0.0, 52.74, 54.97, 87.19], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 50.52], ["musical instrument", 13.3], ["clarinet", 8.32]], null, null, null, null], "duration": [1.82, 0.26, 0.37, 0.72, 1.32, 0.48, 0.65, 0.78, 3.95, 0.13, 26.1, 24.95, 3.63]} \ No newline at end of file diff --git a/annotations_filtered/goEiURelfsM_filtered.json b/annotations_filtered/goEiURelfsM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2e953a4e0c11d6eeb9401c1a2abe91ce6d3568c1 --- /dev/null +++ b/annotations_filtered/goEiURelfsM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.86], [8.0, 8.29], [11.0, 11.8], [13.0, 13.63], [15.0, 16.46], [18.0, 19.25], [21.0, 22.11], [28.0, 33.57], [35.0, 35.95], [38.0, 40.51], [41.0, 41.89], [42.0, 41.99], [42.0, 42.4], [47.0, 48.09], [53.0, 53.86], [58.0, 58.82], [63.0, 65.57], [67.0, 67.56], [70.0, 71.64], [77.0, 77.65], [78.0, 78.83], [82.0, 82.36], [85.0, 85.33], [86.0, 86.32], [87.0, 90.19], [97.0, 99.18], [99.0, 102.73], [105.0, 106.76], [109.0, 111.82], [115.0, 115.21], [117.0, 123.58], [125.0, 128.21], [130.0, 130.87], [134.0, 134.81], [137.0, 137.44], [142.0, 142.74], [149.0, 150.03], [153.0, 153.77]], "keep_status": [false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, true, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.14, 0.0, 32.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.38, 32.91, 31.32, 0.0, 30.83, 0.0, 31.04, 32.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 46.55], ["bleat", 6.54], ["speech", 6.34]], null, [["livestock, farm animals, working animals", 36.74], ["cattle, bovinae", 12.95], ["moo", 11.72]], null, null, null, null, null, null, [["moo", 24.12], ["cattle, bovinae", 21.08], ["music", 13.76]], null, null, null, null, null, null, null, [["speech", 39.17], ["music", 15.01], ["mosquito", 5.72]], [["music", 28.34], ["didgeridoo", 10.59], ["speech", 4.39]], [["speech", 44.65], ["music", 29.61], ["boing", 6.83]], null, [["music", 64.35], ["singing", 7.36], ["saxophone", 3.7]], null, [["music", 54.5], ["singing", 7.62], ["bleat", 6.85]], [["moo", 36.45], ["livestock, farm animals, working animals", 34.73], ["cattle, bovinae", 20.46]], null, null, null, null, null, null], "duration": [1.86, 0.29, 0.8, 0.63, 1.46, 1.25, 1.11, 5.57, 0.95, 2.51, 0.89, -0.01, 0.4, 1.09, 0.86, 0.82, 2.57, 0.56, 1.64, 0.65, 0.83, 0.36, 0.33, 0.32, 3.19, 2.18, 3.73, 1.76, 2.82, 0.21, 6.58, 3.21, 0.87, 0.81, 0.44, 0.74, 1.03, 0.77]} \ No newline at end of file diff --git a/annotations_filtered/goKRpR4XNg8_filtered.json b/annotations_filtered/goKRpR4XNg8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f4f7f56d9d8fbfc2f8c7b2e3f079a7fff76445b9 --- /dev/null +++ b/annotations_filtered/goKRpR4XNg8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.71], [6.0, 8.45], [10.0, 12.26], [22.0, 24.06], [29.0, 29.98], [42.0, 42.43], [47.0, 48.14], [49.0, 50.87], [58.0, 59.43], [78.0, 79.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 95.64, 99.91, 45.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 60.05], ["synthetic singing", 17.0], ["male singing", 4.52]], null, null, null, null, null, null], "duration": [0.71, 2.45, 2.26, 2.06, 0.98, 0.43, 1.14, 1.87, 1.43, 1.78]} \ No newline at end of file diff --git a/annotations_filtered/goOhv_1FYsE_filtered.json b/annotations_filtered/goOhv_1FYsE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b9a18027769f9e343233affa3f725acfc09abe59 --- /dev/null +++ b/annotations_filtered/goOhv_1FYsE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 90.24]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [57.24]} \ No newline at end of file diff --git a/annotations_filtered/goikm-zX9r8_filtered.json b/annotations_filtered/goikm-zX9r8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/goikm-zX9r8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/goyoOGbDjNM_filtered.json b/annotations_filtered/goyoOGbDjNM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b9a2c7ac50ca2d55409b1bce27981ea5e24415c5 --- /dev/null +++ b/annotations_filtered/goyoOGbDjNM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.1], [4.0, 6.12], [6.0, 21.44], [23.0, 23.92], [25.0, 25.25], [27.0, 37.35], [40.0, 59.1], [63.0, 77.94], [78.0, 88.26], [89.0, 98.74]], "keep_status": [false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 63.64, 39.17, 0.0, 0.0, 34.01, 34.15, 31.71, 38.43, 36.42], "audiomae_on_audioset": [null, null, [["speech", 49.23], ["music", 23.95], ["musical instrument", 4.51]], null, null, [["music", 56.88], ["synthesizer", 9.08], ["musical instrument", 6.4]], [["music", 50.7], ["whack, thwack", 8.19], ["throbbing", 6.49]], [["speech", 41.46], ["music", 19.71], ["boing", 11.21]], [["music", 56.47], ["synthesizer", 13.22], ["musical instrument", 4.23]], [["music", 55.93], ["throbbing", 7.28], ["musical instrument", 5.34]]], "duration": [1.1, 2.12, 15.44, 0.92, 0.25, 10.35, 19.1, 14.94, 10.26, 9.74]} \ No newline at end of file diff --git a/annotations_filtered/gozRrRCtj6E_filtered.json b/annotations_filtered/gozRrRCtj6E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..36cbac183b196454fa0b95d3370d1861dd9c81b0 --- /dev/null +++ b/annotations_filtered/gozRrRCtj6E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 47.38], [49.0, 57.28], [59.0, 74.41], [74.0, 74.49], [85.0, 103.6], [104.0, 114.64]], "keep_status": [false, false, true, false, false, false], "silence_prob": [35.96, 30.53, 30.56, 0.0, 29.72, 64.29], "audiomae_on_audioset": [[["speech", 37.97], ["music", 30.8], ["sidetone", 9.77]], [["music", 54.82], ["speech", 19.94], ["sidetone", 4.56]], [["music", 30.27], ["speech", 26.2], ["didgeridoo", 8.96]], null, [["music", 64.39], ["didgeridoo", 16.46], ["musical instrument", 4.47]], null], "duration": [13.38, 8.28, 15.41, 0.49, 18.6, 10.64]} \ No newline at end of file diff --git a/annotations_filtered/gp6FX1H99NA_filtered.json b/annotations_filtered/gp6FX1H99NA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/gp6FX1H99NA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/gp7K6ZwuDow_filtered.json b/annotations_filtered/gp7K6ZwuDow_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bfb6cf83cc5c38270acb42af53f0b3618754b693 --- /dev/null +++ b/annotations_filtered/gp7K6ZwuDow_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.24], [11.0, 12.95], [13.0, 14.88], [16.0, 22.77], [24.0, 24.76], [26.0, 28.88], [31.0, 31.8], [33.0, 33.45], [37.0, 39.93], [43.0, 43.04], [44.0, 44.24], [57.0, 57.54], [59.0, 59.1], [77.0, 78.11], [79.0, 79.76]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 43.1, 0.0, 46.75, 0.0, 0.0, 59.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 29.7], ["music", 14.43], ["rumble", 9.84]], null, [["speech", 69.94], ["thunk", 5.83], ["hum", 5.64]], null, null, null, null, null, null, null, null, null], "duration": [0.24, 1.95, 1.88, 6.77, 0.76, 2.88, 0.8, 0.45, 2.93, 0.04, 0.24, 0.54, 0.1, 1.11, 0.76]} \ No newline at end of file diff --git a/annotations_filtered/gp8OWUqg4r4_filtered.json b/annotations_filtered/gp8OWUqg4r4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..93046af204c39fe878b44ca73bacab34ad2f0d5c --- /dev/null +++ b/annotations_filtered/gp8OWUqg4r4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.41], [14.0, 14.45], [17.0, 17.32], [22.0, 21.64], [30.0, 31.67], [35.0, 39.82], [42.0, 42.08], [47.0, 51.92], [54.0, 58.94], [63.0, 69.55], [85.0, 85.97], [88.0, 88.03], [92.0, 94.49], [98.0, 99.08], [106.0, 106.84], [109.0, 110.12], [116.0, 115.89], [118.0, 118.56], [119.0, 120.36], [121.0, 121.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 98.01, 0.0, 98.73, 91.13, 94.52, 0.0, 0.0, 89.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.41, 0.45, 0.32, -0.36, 1.67, 4.82, 0.08, 4.92, 4.94, 6.55, 0.97, 0.03, 2.49, 1.08, 0.84, 1.12, -0.11, 0.56, 1.36, 0.88]} \ No newline at end of file diff --git a/annotations_filtered/gpCFk7jK810_filtered.json b/annotations_filtered/gpCFk7jK810_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..49baa76871f8733621f9df0488eab3879e1a905a --- /dev/null +++ b/annotations_filtered/gpCFk7jK810_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.78], [5.0, 6.03], [7.0, 9.59], [13.0, 15.63], [22.0, 23.52], [26.0, 27.51], [36.0, 56.61], [59.0, 62.67], [66.0, 67.53], [70.0, 122.45], [122.0, 122.49], [123.0, 122.52], [123.0, 122.55], [123.0, 123.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.97, 94.37, 0.0, 0.0, 99.73, 94.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.78, 1.03, 2.59, 2.63, 1.52, 1.51, 20.61, 3.67, 1.53, 52.45, 0.49, -0.48, -0.45, 0.38]} \ No newline at end of file diff --git a/annotations_filtered/gpW3ywIoyr0_filtered.json b/annotations_filtered/gpW3ywIoyr0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..78a302d48fc4228eebd8f296dda808e183bf2322 --- /dev/null +++ b/annotations_filtered/gpW3ywIoyr0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.62], [18.0, 20.87], [26.0, 28.27], [29.0, 29.56], [35.0, 37.42], [39.0, 38.94], [40.0, 43.61], [45.0, 47.61], [50.0, 52.02], [54.0, 55.38], [59.0, 60.76], [62.0, 63.09], [70.0, 70.23], [72.0, 74.75], [76.0, 77.08], [78.0, 80.03], [86.0, 86.29], [93.0, 94.53], [99.0, 100.77], [101.0, 101.88], [103.0, 103.06], [113.0, 114.51], [122.0, 123.47], [124.0, 124.23], [126.0, 126.52], [148.0, 148.09], [150.0, 151.56], [152.0, 154.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 85.35, 99.99, 0.0, 97.22, 0.0, 52.27, 61.97, 100.0, 0.0, 0.0, 0.0, 0.0, 84.25, 0.0, 48.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.69], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 43.9], ["foghorn", 8.94], ["gong", 6.52]], null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 29.05], ["beep, bleep", 15.65], ["moo", 12.41]]], "duration": [0.62, 2.87, 2.27, 0.56, 2.42, -0.06, 3.61, 2.61, 2.02, 1.38, 1.76, 1.09, 0.23, 2.75, 1.08, 2.03, 0.29, 1.53, 1.77, 0.88, 0.06, 1.51, 1.47, 0.23, 0.52, 0.09, 1.56, 2.41]} \ No newline at end of file diff --git a/annotations_filtered/gpgsfivrruk_filtered.json b/annotations_filtered/gpgsfivrruk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e53cf3a100eaaf809e628c93912a7f8a5c9d41e2 --- /dev/null +++ b/annotations_filtered/gpgsfivrruk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.9], [15.0, 15.06], [15.0, 18.4], [20.0, 22.67], [25.0, 26.23], [27.0, 29.88], [32.0, 37.56], [39.0, 42.58], [45.0, 57.65], [60.0, 106.91], [109.0, 109.48]], "keep_status": [true, false, true, true, false, true, true, true, true, false, false], "silence_prob": [28.45, 0.0, 33.75, 29.98, 0.0, 34.22, 30.99, 30.42, 30.48, 0.0, 0.0], "audiomae_on_audioset": [[["mains hum", 22.56], ["hum", 21.06], ["white noise", 17.0]], null, [["mains hum", 24.03], ["hum", 17.68], ["speech", 8.96]], [["eruption", 14.39], ["white noise", 14.13], ["static", 7.73]], null, [["speech", 35.33], ["white noise", 10.46], ["mains hum", 8.69]], [["mains hum", 27.25], ["hum", 18.16], ["eruption", 8.88]], [["eruption", 15.06], ["hum", 13.12], ["explosion", 10.01]], [["hum", 23.4], ["mains hum", 11.56], ["music", 7.28]], null, null], "duration": [2.9, 0.06, 3.4, 2.67, 1.23, 2.88, 5.56, 3.58, 12.65, 46.91, 0.48]} \ No newline at end of file diff --git a/annotations_filtered/gpjYU0C2yrY_filtered.json b/annotations_filtered/gpjYU0C2yrY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..164f7da682b854881d3db8e5c64197b561e3a536 --- /dev/null +++ b/annotations_filtered/gpjYU0C2yrY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 62.14], [64.0, 93.11], [94.0, 93.93], [94.0, 103.59], [105.0, 139.63], [142.0, 162.24]], "keep_status": [false, false, false, false, false, false], "silence_prob": [29.33, 29.14, 0.0, 33.56, 0.0, 70.02], "audiomae_on_audioset": [[["hum", 40.38], ["throbbing", 25.5], ["music", 14.62]], [["music", 44.15], ["hum", 20.26], ["throbbing", 7.66]], null, [["music", 71.12], ["electronic music", 6.65], ["hum", 4.53]], null, null], "duration": [26.14, 29.11, -0.07, 9.59, 34.63, 20.24]} \ No newline at end of file diff --git a/annotations_filtered/gpkncObsNqY_filtered.json b/annotations_filtered/gpkncObsNqY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9498ac7a66c4cca43e4cef56f799554ea58d7b22 --- /dev/null +++ b/annotations_filtered/gpkncObsNqY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.89], [35.0, 36.02], [42.0, 42.43], [42.0, 42.53], [45.0, 47.02], [50.0, 57.23], [61.0, 62.29], [69.0, 69.7], [79.0, 79.52], [80.0, 87.86], [90.0, 97.33], [110.0, 111.7], [121.0, 121.12], [131.0, 134.6], [143.0, 146.55], [149.0, 150.16], [158.0, 158.13], [162.0, 163.39], [173.0, 176.07], [179.0, 179.88], [181.0, 184.33], [192.0, 198.39], [202.0, 202.22], [203.0, 205.24], [206.0, 213.21]], "keep_status": [true, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [33.14, 0.0, 0.0, 0.0, 29.0, 31.24, 0.0, 0.0, 0.0, 32.64, 31.83, 0.0, 0.0, 32.42, 29.36, 0.0, 0.0, 0.0, 34.74, 0.0, 31.74, 33.94, 0.0, 42.3, 30.25], "audiomae_on_audioset": [[["music", 41.16], ["speech", 15.05], ["music of latin america", 9.93]], null, null, null, [["music", 13.89], ["fart", 12.26], ["sound effect", 6.93]], [["mosquito", 44.68], ["fly, housefly", 22.74], ["insect", 10.65]], null, null, null, [["fly, housefly", 31.34], ["music", 17.43], ["insect", 16.07]], [["speech", 41.32], ["music", 31.51], ["fart", 10.93]], null, null, [["speech", 33.36], ["whack, thwack", 30.01], ["boing", 18.97]], [["theremin", 33.77], ["music", 30.79], ["hum", 7.28]], null, null, null, [["music", 45.26], ["speech", 8.69], ["theremin", 5.25]], null, [["speech", 33.78], ["music", 26.41], ["boing", 14.09]], [["music", 65.62], ["musical instrument", 5.47], ["effects unit", 4.09]], null, [["boing", 57.75], ["speech", 22.08], ["music", 5.72]], [["fart", 57.29], ["speech", 21.42], ["music", 5.95]]], "duration": [2.89, 1.02, 0.43, 0.53, 2.02, 7.23, 1.29, 0.7, 0.52, 7.86, 7.33, 1.7, 0.12, 3.6, 3.55, 1.16, 0.13, 1.39, 3.07, 0.88, 3.33, 6.39, 0.22, 2.24, 7.21]} \ No newline at end of file diff --git a/annotations_filtered/gprLI38JwQ0_filtered.json b/annotations_filtered/gprLI38JwQ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb93e19a692a49442c07334f86f9c392a0f265e0 --- /dev/null +++ b/annotations_filtered/gprLI38JwQ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.5], [32.0, 36.39], [37.0, 38.47], [40.0, 51.76], [55.0, 55.63], [56.0, 56.4], [58.0, 62.88], [63.0, 65.28], [73.0, 73.9], [77.0, 79.62], [80.0, 80.97]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 37.18, 0.0, 96.54, 0.0, 0.0, 62.68, 60.79, 0.0, 86.09, 0.0], "audiomae_on_audioset": [null, [["music", 34.68], ["theremin", 14.8], ["synthesizer", 11.4]], null, null, null, null, null, null, null, null, null], "duration": [0.5, 4.39, 1.47, 11.76, 0.63, 0.4, 4.88, 2.28, 0.9, 2.62, 0.97]} \ No newline at end of file diff --git a/annotations_filtered/gpytphKy7a0_filtered.json b/annotations_filtered/gpytphKy7a0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41c62433b61b3356777e6bdbe1602566f7d16b2d --- /dev/null +++ b/annotations_filtered/gpytphKy7a0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 24.46], [27.0, 32.05], [53.0, 55.11], [82.0, 83.22], [85.0, 85.21], [86.0, 87.45], [95.0, 96.21], [98.0, 98.52], [101.0, 101.8], [112.0, 113.81], [121.0, 122.42]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [35.46, 39.15, 81.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 69.05], ["synthesizer", 7.41], ["theremin", 6.4]], [["speech", 33.89], ["hum", 14.23], ["mains hum", 9.36]], null, null, null, null, null, null, null, null, null], "duration": [14.46, 5.05, 2.11, 1.22, 0.21, 1.45, 1.21, 0.52, 0.8, 1.81, 1.42]} \ No newline at end of file diff --git a/annotations_filtered/gq1gSTF2oyA_filtered.json b/annotations_filtered/gq1gSTF2oyA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7c6e4c01b3b6317a70a044135625266ac90a1204 --- /dev/null +++ b/annotations_filtered/gq1gSTF2oyA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 28.17], [29.0, 31.55], [33.0, 39.02], [44.0, 46.75], [51.0, 53.28], [56.0, 57.5], [64.0, 66.66], [68.0, 68.62], [71.0, 72.54], [73.0, 79.78], [84.0, 85.45], [87.0, 97.29], [101.0, 102.3], [104.0, 104.55], [106.0, 107.4], [112.0, 113.64], [120.0, 119.97], [121.0, 122.54], [124.0, 124.39], [125.0, 127.52], [130.0, 131.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [81.17, 54.7, 67.51, 60.05, 94.52, 0.0, 55.67, 0.0, 0.0, 62.37, 0.0, 74.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.36, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.17, 2.55, 6.02, 2.75, 2.28, 1.5, 2.66, 0.62, 1.54, 6.78, 1.45, 10.29, 1.3, 0.55, 1.4, 1.64, -0.03, 1.54, 0.39, 2.52, 1.7]} \ No newline at end of file diff --git a/annotations_filtered/gq5WIcSz2ko_filtered.json b/annotations_filtered/gq5WIcSz2ko_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/gq5WIcSz2ko_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/gq6JKq3Q_uw_filtered.json b/annotations_filtered/gq6JKq3Q_uw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..638549fc6050d6d74869d1f6fba37df4ea856157 --- /dev/null +++ b/annotations_filtered/gq6JKq3Q_uw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 25.25], [45.0, 46.6], [62.0, 62.29], [67.0, 68.2], [85.0, 84.92], [88.0, 88.92]], "keep_status": [false, false, false, false, false, false], "silence_prob": [40.21, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 40.85], ["synthesizer", 33.32], ["keyboard (musical)", 5.13]], null, null, null, null, null], "duration": [11.25, 1.6, 0.29, 1.2, -0.08, 0.92]} \ No newline at end of file diff --git a/annotations_filtered/gqRIBKn09_M_filtered.json b/annotations_filtered/gqRIBKn09_M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a0cde6ffa7e4bff93c2011202034f6e8731cf9c --- /dev/null +++ b/annotations_filtered/gqRIBKn09_M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.87], [16.0, 18.22], [20.0, 21.25], [33.0, 33.44], [46.0, 47.29], [51.0, 50.99], [53.0, 53.82], [75.0, 76.59], [79.0, 79.54], [83.0, 84.69], [88.0, 88.52], [109.0, 113.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 38.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.14], "audiomae_on_audioset": [null, [["music", 53.38], ["boing", 15.11], ["sidetone", 5.26]], null, null, null, null, null, null, null, null, null, [["music", 73.26], ["reggae", 3.6], ["yodeling", 3.3]]], "duration": [-0.13, 2.22, 1.25, 0.44, 1.29, -0.01, 0.82, 1.59, 0.54, 1.69, 0.52, 4.02]} \ No newline at end of file diff --git a/annotations_filtered/gqe-oAUoEto_filtered.json b/annotations_filtered/gqe-oAUoEto_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..62acf0e2aa79ee0b12218197d1c2cb132670d51f --- /dev/null +++ b/annotations_filtered/gqe-oAUoEto_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.22], [15.0, 15.48], [17.0, 26.6], [27.0, 28.68], [29.0, 52.56], [55.0, 55.29], [63.0, 73.95], [77.0, 85.83], [98.0, 99.12], [101.0, 105.71], [113.0, 114.17], [114.0, 115.42], [119.0, 119.58], [122.0, 122.34], [138.0, 145.54], [148.0, 149.34], [154.0, 155.63], [157.0, 159.58], [160.0, 160.19], [161.0, 164.64]], "keep_status": [false, false, true, false, true, false, false, true, false, true, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 28.78, 0.0, 29.16, 0.0, 28.78, 31.44, 0.0, 37.49, 0.0, 0.0, 0.0, 0.0, 31.41, 0.0, 0.0, 49.64, 0.0, 73.21], "audiomae_on_audioset": [null, null, [["speech", 46.43], ["whale vocalization", 13.11], ["rumble", 5.84]], null, [["speech", 50.02], ["frog", 9.59], ["whale vocalization", 4.52]], null, [["speech", 65.85], ["music", 13.16], ["whale vocalization", 10.93]], [["music", 23.74], ["speech", 18.17], ["livestock, farm animals, working animals", 11.92]], null, [["speech", 28.32], ["animal", 8.48], ["sidetone", 7.15]], null, null, null, null, [["cattle, bovinae", 26.82], ["livestock, farm animals, working animals", 23.64], ["speech", 19.99]], null, null, [["cattle, bovinae", 26.52], ["speech", 17.38], ["moo", 13.28]], null, null], "duration": [1.22, 0.48, 9.6, 1.68, 23.56, 0.29, 10.95, 8.83, 1.12, 4.71, 1.17, 1.42, 0.58, 0.34, 7.54, 1.34, 1.63, 2.58, 0.19, 3.64]} \ No newline at end of file diff --git a/annotations_filtered/grEV7MeCTsg_filtered.json b/annotations_filtered/grEV7MeCTsg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2960f468039b0dc620f1a04be4cd42d685b2113e --- /dev/null +++ b/annotations_filtered/grEV7MeCTsg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.61], [8.0, 7.96], [24.0, 24.48], [25.0, 25.32], [39.0, 40.04], [65.0, 65.52], [73.0, 74.07], [74.0, 75.98], [80.0, 85.63], [88.0, 90.71], [96.0, 96.67], [102.0, 104.28], [107.0, 107.28], [128.0, 128.78], [129.0, 129.32], [131.0, 131.23], [132.0, 133.84], [137.0, 137.27], [142.0, 142.16], [143.0, 143.21], [144.0, 146.11], [147.0, 147.55], [148.0, 151.23], [153.0, 153.08], [155.0, 156.54], [157.0, 157.74], [164.0, 163.93], [167.0, 167.64], [168.0, 169.69], [171.0, 172.76], [177.0, 179.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [78.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.33, 69.88, 0.0, 54.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.92, 0.0, 70.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.17], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.61, -0.04, 0.48, 0.32, 1.04, 0.52, 1.07, 1.98, 5.63, 2.71, 0.67, 2.28, 0.28, 0.78, 0.32, 0.23, 1.84, 0.27, 0.16, 0.21, 2.11, 0.55, 3.23, 0.08, 1.54, 0.74, -0.07, 0.64, 1.69, 1.76, 2.46]} \ No newline at end of file diff --git a/annotations_filtered/grdxSWSHJaY_filtered.json b/annotations_filtered/grdxSWSHJaY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8442dfd72ff44acab5f8305a963ca72a6ccf4fc8 --- /dev/null +++ b/annotations_filtered/grdxSWSHJaY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.9], [23.0, 51.51], [52.0, 54.9], [58.0, 60.44], [61.0, 62.6], [69.0, 68.81], [69.0, 68.98], [69.0, 69.36], [70.0, 70.09], [72.0, 72.59], [73.0, 72.96], [77.0, 77.21], [80.0, 80.0], [87.0, 89.77], [90.0, 91.56], [94.0, 96.23], [96.0, 103.03], [104.0, 104.5], [105.0, 106.19], [107.0, 109.56], [110.0, 110.2], [111.0, 114.59], [115.0, 116.83], [120.0, 120.83], [121.0, 124.5], [130.0, 130.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 97.54, 99.99, 99.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.38, 0.0, 32.96, 32.28, 0.0, 0.0, 79.41, 0.0, 99.97, 0.0, 0.0, 43.9, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["canidae, dogs, wolves", 17.38], ["animal", 16.82], ["music", 10.77]], null, [["vehicle", 27.54], ["speech", 18.55], ["car", 11.35]], [["music", 25.18], ["effects unit", 6.2], ["echo", 6.05]], null, null, null, null, null, null, null, [["speech", 50.89], ["inside, small room", 7.16], ["whimper", 5.8]], null], "duration": [0.9, 28.51, 2.9, 2.44, 1.6, -0.19, -0.02, 0.36, 0.09, 0.59, -0.04, 0.21, 0.0, 2.77, 1.56, 2.23, 7.03, 0.5, 1.19, 2.56, 0.2, 3.59, 1.83, 0.83, 3.5, 0.59]} \ No newline at end of file diff --git a/annotations_filtered/grlDMsiQ2Yc_filtered.json b/annotations_filtered/grlDMsiQ2Yc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a343657f768f17b119cae83da7aa7bef1b504ae7 --- /dev/null +++ b/annotations_filtered/grlDMsiQ2Yc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.87], [11.0, 49.08], [51.0, 61.05], [63.0, 65.47]], "keep_status": [true, false, false, false], "silence_prob": [31.26, 0.0, 69.61, 99.65], "audiomae_on_audioset": [[["music", 44.03], ["musical instrument", 9.49], ["wind instrument, woodwind instrument", 6.69]], null, null, null], "duration": [2.87, 38.08, 10.05, 2.47]} \ No newline at end of file diff --git a/annotations_filtered/grn62a_8fZ4_filtered.json b/annotations_filtered/grn62a_8fZ4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6277981f0b3da31659ca2cbc4792312e4b8efce2 --- /dev/null +++ b/annotations_filtered/grn62a_8fZ4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 17.9], [20.0, 20.46], [23.0, 23.7], [25.0, 25.03], [26.0, 26.69], [28.0, 28.63], [29.0, 29.76], [31.0, 30.77], [46.0, 45.82], [49.0, 48.93], [50.0, 51.29], [53.0, 55.21], [57.0, 62.4], [63.0, 63.81], [65.0, 65.67], [67.0, 67.54], [87.0, 87.27], [96.0, 96.53], [98.0, 98.51], [99.0, 99.84], [108.0, 108.68], [110.0, 111.33], [112.0, 112.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [96.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.52, 38.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 55.57], ["hum", 7.01], ["throbbing", 3.77]], [["music", 65.58], ["boing", 4.08], ["hum", 3.92]], null, null, null, null, null, null, null, null, null, null], "duration": [2.9, 0.46, 0.7, 0.03, 0.69, 0.63, 0.76, -0.23, -0.18, -0.07, 1.29, 2.21, 5.4, 0.81, 0.67, 0.54, 0.27, 0.53, 0.51, 0.84, 0.68, 1.33, 0.28]} \ No newline at end of file diff --git a/annotations_filtered/grpGRWYL6mQ_filtered.json b/annotations_filtered/grpGRWYL6mQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..34d0e0d3e44c8af229ee840d5408c721d6f104b4 --- /dev/null +++ b/annotations_filtered/grpGRWYL6mQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 41.71], [42.0, 43.7], [45.0, 60.17], [62.0, 63.1], [63.0, 64.84], [66.0, 66.36], [71.0, 71.52], [72.0, 72.87], [76.0, 78.02], [79.0, 80.06], [81.0, 81.24], [82.0, 86.16], [88.0, 88.75], [92.0, 92.67], [94.0, 94.71], [99.0, 98.88], [105.0, 105.41], [106.0, 108.5], [112.0, 120.7], [124.0, 125.12], [126.0, 126.59], [132.0, 131.77], [137.0, 137.84], [139.0, 139.04], [143.0, 150.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 32.56, 0.0, 0.0, 0.0, 0.0, 0.0, 88.64, 0.0, 0.0, 67.51, 0.0, 0.0, 0.0, 0.0, 0.0, 61.37, 42.39, 0.0, 0.0, 0.0, 0.0, 0.0, 36.11], "audiomae_on_audioset": [null, null, [["music", 68.93], ["speech", 19.75], ["sound effect", 1.53]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 64.69], ["didgeridoo", 19.81], ["musical instrument", 1.88]], null, null, null, null, null, [["theremin", 50.26], ["speech", 19.64], ["music", 13.94]]], "duration": [38.71, 1.7, 15.17, 1.1, 1.84, 0.36, 0.52, 0.87, 2.02, 1.06, 0.24, 4.16, 0.75, 0.67, 0.71, -0.12, 0.41, 2.5, 8.7, 1.12, 0.59, -0.23, 0.84, 0.04, 7.82]} \ No newline at end of file diff --git a/annotations_filtered/grwlYBNyMk4_filtered.json b/annotations_filtered/grwlYBNyMk4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0114a5f1a3a7d1d0cce2f1a92f93f995a23a7ebc --- /dev/null +++ b/annotations_filtered/grwlYBNyMk4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.1], [19.0, 19.95], [23.0, 27.65], [31.0, 31.01], [38.0, 40.42], [44.0, 44.69], [51.0, 51.12], [53.0, 55.9], [59.0, 59.48], [60.0, 60.34], [61.0, 62.88], [65.0, 66.85], [72.0, 76.33], [80.0, 81.65], [83.0, 85.9], [90.0, 89.94], [90.0, 94.29], [95.0, 96.06], [97.0, 97.56], [125.0, 151.65], [155.0, 157.99], [160.0, 162.03], [168.0, 168.25], [173.0, 178.7], [185.0, 189.48], [192.0, 192.4]], "keep_status": [false, false, true, false, true, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, true, true, false], "silence_prob": [0.0, 0.0, 31.06, 0.0, 30.34, 0.0, 0.0, 29.55, 0.0, 0.0, 0.0, 0.0, 32.18, 0.0, 29.59, 0.0, 30.74, 0.0, 0.0, 30.2, 28.58, 53.59, 0.0, 33.17, 32.98, 0.0], "audiomae_on_audioset": [null, null, [["whip", 16.37], ["hum", 15.8], ["speech", 15.47]], null, [["whale vocalization", 16.87], ["fly, housefly", 16.13], ["hum", 6.19]], null, null, [["sound effect", 21.01], ["whale vocalization", 17.2], ["boing", 10.29]], null, null, null, null, [["music", 64.84], ["speech", 9.67], ["mosquito", 6.74]], null, [["whack, thwack", 25.54], ["speech", 15.46], ["sound effect", 8.93]], null, [["music", 49.12], ["speech", 26.23], ["thunk", 4.86]], null, null, [["speech", 46.06], ["music", 18.57], ["whack, thwack", 8.39]], [["speech", 57.17], ["boing", 4.31], ["music", 3.57]], null, null, [["music", 29.28], ["speech", 21.62], ["synthesizer", 10.98]], [["speech", 31.23], ["sidetone", 13.6], ["music", 13.19]], null], "duration": [1.1, 0.95, 4.65, 0.01, 2.42, 0.69, 0.12, 2.9, 0.48, 0.34, 1.88, 1.85, 4.33, 1.65, 2.9, -0.06, 4.29, 1.06, 0.56, 26.65, 2.99, 2.03, 0.25, 5.7, 4.48, 0.4]} \ No newline at end of file diff --git a/annotations_filtered/gs0WQmW1icQ_filtered.json b/annotations_filtered/gs0WQmW1icQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..be39a29d924014b43ae565151788aca962c5b0ca --- /dev/null +++ b/annotations_filtered/gs0WQmW1icQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 6.56], [8.0, 10.17], [11.0, 37.74], [38.0, 84.0]], "keep_status": [false, true, true, false], "silence_prob": [47.2, 47.82, 42.26, 0.0], "audiomae_on_audioset": [[["gong", 43.8], ["music", 23.07], ["sonar", 13.32]], [["chirp tone", 27.34], ["sine wave", 24.64], ["ambient music", 9.54]], [["music", 45.41], ["sonar", 6.41], ["glass", 5.29]], null], "duration": [5.56, 2.17, 26.74, 46.0]} \ No newline at end of file diff --git a/annotations_filtered/gs3GHB24IaM_filtered.json b/annotations_filtered/gs3GHB24IaM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c899f790e8c50640e87008761451a2706c7e5fe --- /dev/null +++ b/annotations_filtered/gs3GHB24IaM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 11.2], [12.0, 20.76], [28.0, 29.51], [53.0, 53.1], [54.0, 54.57], [61.0, 66.19], [68.0, 74.02], [81.0, 88.94], [95.0, 95.76], [99.0, 99.52], [104.0, 104.73], [113.0, 114.32], [121.0, 121.56]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [29.56, 30.54, 0.0, 0.0, 0.0, 32.13, 29.62, 29.85, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 60.32], ["speech", 9.21], ["throbbing", 3.92]], [["music", 44.92], ["hum", 19.02], ["mains hum", 12.78]], null, null, null, [["music", 80.03], ["groan", 3.78], ["hum", 2.47]], [["music", 73.84], ["throbbing", 5.49], ["cacophony", 3.49]], [["music", 47.0], ["sonar", 9.73], ["hum", 7.37]], null, null, null, null, null], "duration": [4.2, 8.76, 1.51, 0.1, 0.57, 5.19, 6.02, 7.94, 0.76, 0.52, 0.73, 1.32, 0.56]} \ No newline at end of file diff --git a/annotations_filtered/gsG8sEK2md8_filtered.json b/annotations_filtered/gsG8sEK2md8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca82d90a4656905713159054e15db0810a21856f --- /dev/null +++ b/annotations_filtered/gsG8sEK2md8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 30.11], [32.0, 34.84], [35.0, 35.43], [36.0, 40.39], [41.0, 41.57], [42.0, 42.72], [45.0, 55.61], [56.0, 63.48], [64.0, 63.95], [64.0, 64.07], [64.0, 64.94], [67.0, 69.43], [70.0, 71.29], [73.0, 77.87], [85.0, 95.28], [97.0, 128.71], [130.0, 130.33], [131.0, 131.94], [132.0, 152.96], [153.0, 154.06], [155.0, 169.2], [170.0, 186.58], [187.0, 189.4]], "keep_status": [false, true, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 33.16, 0.0, 30.99, 0.0, 0.0, 31.03, 34.25, 0.0, 0.0, 0.0, 59.68, 0.0, 50.51, 29.27, 0.0, 0.0, 0.0, 29.74, 0.0, 29.32, 29.01, 33.09], "audiomae_on_audioset": [null, [["music", 46.79], ["didgeridoo", 9.71], ["whale vocalization", 3.95]], null, [["didgeridoo", 36.58], ["music", 18.96], ["theremin", 18.57]], null, null, [["music", 20.54], ["didgeridoo", 11.88], ["hum", 10.32]], [["music", 62.95], ["didgeridoo", 10.0], ["speech", 6.79]], null, null, null, null, null, null, [["hum", 33.71], ["throbbing", 15.01], ["music", 11.69]], null, null, null, [["speech", 64.17], ["music", 20.48], ["breaking", 2.39]], null, [["hum", 23.2], ["music", 21.35], ["throbbing", 16.27]], [["music", 69.38], ["didgeridoo", 5.24], ["animal", 3.28]], [["speech", 18.26], ["electric shaver, electric razor", 11.3], ["mains hum", 7.21]]], "duration": [0.11, 2.84, 0.43, 4.39, 0.57, 0.72, 10.61, 7.48, -0.05, 0.07, 0.94, 2.43, 1.29, 4.87, 10.28, 31.71, 0.33, 0.94, 20.96, 1.06, 14.2, 16.58, 2.4]} \ No newline at end of file diff --git a/annotations_filtered/gsGm2Ohl7x8_filtered.json b/annotations_filtered/gsGm2Ohl7x8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9a82285b6ed2ad7d7f7bf11d5214c6d01468ca4 --- /dev/null +++ b/annotations_filtered/gsGm2Ohl7x8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 23.3], [25.0, 32.1], [37.0, 45.39], [50.0, 51.11], [60.0, 59.95], [70.0, 71.09], [72.0, 96.55]], "keep_status": [false, false, true, false, false, false, false], "silence_prob": [94.22, 79.41, 48.78, 0.0, 0.0, 0.0, 30.09], "audiomae_on_audioset": [null, null, [["hum", 36.9], ["speech", 17.06], ["throbbing", 11.37]], null, null, null, [["speech", 80.25], ["whack, thwack", 2.52], ["music", 1.86]]], "duration": [4.3, 7.1, 8.39, 1.11, -0.05, 1.09, 24.55]} \ No newline at end of file diff --git a/annotations_filtered/gsWHt9OIofc_filtered.json b/annotations_filtered/gsWHt9OIofc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d50c08279a7292dfa7398c444272a38ddf01585 --- /dev/null +++ b/annotations_filtered/gsWHt9OIofc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.94], [12.0, 12.11], [15.0, 15.67], [22.0, 23.03], [26.0, 27.41], [28.0, 29.15], [31.0, 31.63], [35.0, 35.5], [38.0, 38.62], [56.0, 58.09], [63.0, 63.12], [68.0, 69.84], [73.0, 74.56], [79.0, 79.78], [83.0, 84.84], [86.0, 86.43], [93.0, 93.12], [97.0, 97.24], [99.0, 99.86], [102.0, 102.07], [104.0, 104.13], [105.0, 106.89], [111.0, 113.53], [115.0, 115.11], [118.0, 118.93], [121.0, 122.39], [124.0, 125.15], [130.0, 130.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.46, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.94, 0.11, 0.67, 1.03, 1.41, 1.15, 0.63, 0.5, 0.62, 2.09, 0.12, 1.84, 1.56, 0.78, 1.84, 0.43, 0.12, 0.24, 0.86, 0.07, 0.13, 1.89, 2.53, 0.11, 0.93, 1.39, 1.15, 0.91]} \ No newline at end of file diff --git a/annotations_filtered/gsYcnpq1HBc_filtered.json b/annotations_filtered/gsYcnpq1HBc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dab166f273974023e40dbe1006a7a6b4be20f1ec --- /dev/null +++ b/annotations_filtered/gsYcnpq1HBc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.73], [12.0, 12.28], [14.0, 14.47], [16.0, 16.39], [17.0, 19.08], [30.0, 30.48], [33.0, 33.13], [53.0, 54.33], [59.0, 60.32], [93.0, 94.31], [101.0, 100.92], [113.0, 123.82], [130.0, 131.23], [137.0, 139.13], [152.0, 152.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 52.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.28, 0.0, 29.73, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 89.89], ["didgeridoo", 1.46], ["singing", 1.13]], null, [["fly, housefly", 26.75], ["mosquito", 11.23], ["music", 9.41]], null], "duration": [0.73, 0.28, 0.47, 0.39, 2.08, 0.48, 0.13, 1.33, 1.32, 1.31, -0.08, 10.82, 1.23, 2.13, 0.0]} \ No newline at end of file diff --git a/annotations_filtered/gt6_2qd75F8_filtered.json b/annotations_filtered/gt6_2qd75F8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58493056258ac0024b1b554eb8d5bdfd455d784c --- /dev/null +++ b/annotations_filtered/gt6_2qd75F8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.21], [6.0, 14.01], [17.0, 17.85], [24.0, 56.34], [63.0, 105.07], [107.0, 121.58], [122.0, 124.17], [127.0, 129.66], [130.0, 133.34], [136.0, 162.95]], "keep_status": [false, false, false, false, false, false, true, true, true, false], "silence_prob": [0.0, 29.89, 0.0, 0.0, 0.0, 51.5, 40.57, 30.93, 34.98, 30.23], "audiomae_on_audioset": [null, [["music", 43.15], ["didgeridoo", 41.07], ["noise", 1.54]], null, null, null, null, [["speech", 35.31], ["hum", 12.76], ["whale vocalization", 9.07]], [["music", 23.94], ["speech", 16.86], ["eruption", 5.02]], [["speech", 35.26], ["frog", 18.04], ["noise", 6.16]], [["music", 65.67], ["hum", 4.89], ["throbbing", 3.31]]], "duration": [0.21, 8.01, 0.85, 32.34, 42.07, 14.58, 2.17, 2.66, 3.34, 26.95]} \ No newline at end of file diff --git a/annotations_filtered/gtHhlD6p8BY_filtered.json b/annotations_filtered/gtHhlD6p8BY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb500dc1c3f37d839e14b9dc909a64e03d3a958c --- /dev/null +++ b/annotations_filtered/gtHhlD6p8BY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[78.0, 79.64], [81.0, 81.67], [83.0, 83.39], [87.0, 89.01], [93.0, 94.1], [95.0, 95.69], [101.0, 119.35], [120.0, 131.19], [135.0, 134.89], [136.0, 155.83], [157.0, 163.92], [165.0, 172.56], [177.0, 196.94], [200.0, 200.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 92.31, 0.0, 0.0, 30.51, 31.55, 0.0, 31.85, 31.97, 30.87, 33.83, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["hum", 36.48], ["music", 31.22], ["throbbing", 15.45]], [["fart", 39.6], ["speech", 31.22], ["music", 6.13]], null, [["speech", 55.43], ["music", 14.71], ["outside, rural or natural", 4.02]], [["speech", 61.48], ["music", 7.51], ["fart", 3.55]], [["cattle, bovinae", 36.54], ["livestock, farm animals, working animals", 30.71], ["moo", 27.53]], [["cattle, bovinae", 37.69], ["moo", 35.08], ["livestock, farm animals, working animals", 11.96]], null], "duration": [1.64, 0.67, 0.39, 2.01, 1.1, 0.69, 18.35, 11.19, -0.11, 19.83, 6.92, 7.56, 19.94, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/gtKp8oxOzAU_filtered.json b/annotations_filtered/gtKp8oxOzAU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..083027ea277068f32fc3c8812dba857f8df6d978 --- /dev/null +++ b/annotations_filtered/gtKp8oxOzAU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.89], [6.0, 12.01], [13.0, 14.25], [15.0, 16.33], [17.0, 18.45], [19.0, 19.84], [21.0, 21.86], [24.0, 28.0], [29.0, 34.3], [34.0, 34.99], [36.0, 42.72], [43.0, 48.44], [49.0, 49.92], [53.0, 54.95], [56.0, 57.18], [59.0, 59.61], [61.0, 61.28], [64.0, 67.22], [69.0, 69.7], [70.0, 75.47], [77.0, 80.81], [81.0, 80.86], [81.0, 82.05], [83.0, 90.61], [91.0, 92.18], [94.0, 96.69], [97.0, 111.79], [113.0, 114.76], [119.0, 118.99], [120.0, 120.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 42.93, 0.0, 0.0, 0.0, 0.0, 0.0, 99.73, 94.81, 0.0, 96.54, 94.66, 0.0, 0.0, 0.0, 0.0, 0.0, 56.48, 0.0, 72.6, 62.68, 0.0, 0.0, 63.74, 0.0, 69.88, 51.99, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 72.4], ["music", 7.32], ["sidetone", 2.82]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.89, 6.01, 1.25, 1.33, 1.45, 0.84, 0.86, 4.0, 5.3, 0.99, 6.72, 5.44, 0.92, 1.95, 1.18, 0.61, 0.28, 3.22, 0.7, 5.47, 3.81, -0.14, 1.05, 7.61, 1.18, 2.69, 14.79, 1.76, -0.01, 0.33]} \ No newline at end of file diff --git a/annotations_filtered/gtngV41jpcw_filtered.json b/annotations_filtered/gtngV41jpcw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec772b7f1dcbe86c41d4e6f3dc84bd395d83cd45 --- /dev/null +++ b/annotations_filtered/gtngV41jpcw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 13.58], [15.0, 16.55], [20.0, 28.44], [29.0, 30.21], [33.0, 34.62], [36.0, 39.38], [44.0, 45.45], [47.0, 47.55], [50.0, 50.65], [56.0, 55.83], [60.0, 61.2], [63.0, 64.74], [66.0, 67.85], [69.0, 68.76], [71.0, 72.22]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [49.92, 0.0, 58.47, 0.0, 0.0, 32.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 84.17], ["synthesizer", 1.78], ["noise", 1.26]], null, null, null, null, [["fart", 38.93], ["sound effect", 13.56], ["explosion", 11.28]], null, null, null, null, null, null, null, null, null], "duration": [9.58, 1.55, 8.44, 1.21, 1.62, 3.38, 1.45, 0.55, 0.65, -0.17, 1.2, 1.74, 1.85, -0.24, 1.22]} \ No newline at end of file diff --git a/annotations_filtered/guK3fiVFU98_filtered.json b/annotations_filtered/guK3fiVFU98_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..607c7effdec9df84060cea64cbb010d4a2cd4db0 --- /dev/null +++ b/annotations_filtered/guK3fiVFU98_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.96], [6.0, 6.35], [7.0, 7.72], [9.0, 9.95], [10.0, 10.96], [14.0, 14.4], [15.0, 16.06], [18.0, 20.93], [23.0, 23.45], [24.0, 26.69], [28.0, 28.73], [29.0, 29.89], [34.0, 34.52], [37.0, 39.19], [41.0, 42.53], [43.0, 43.8], [46.0, 48.25], [50.0, 50.19], [52.0, 53.16], [54.0, 54.62], [56.0, 56.67], [57.0, 63.09], [65.0, 66.95], [69.0, 68.89], [70.0, 80.67], [82.0, 82.14], [84.0, 85.04], [87.0, 88.59], [92.0, 92.16], [92.0, 92.53], [95.0, 95.55], [99.0, 99.08], [100.0, 100.16], [101.0, 101.43], [104.0, 104.03], [105.0, 109.02], [109.0, 110.29], [111.0, 113.44], [115.0, 118.08], [119.0, 119.62], [121.0, 124.61], [127.0, 128.02], [131.0, 131.77], [132.0, 132.54], [134.0, 134.67], [135.0, 135.28], [136.0, 136.26], [137.0, 138.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.37, 0.0, 98.73, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 68.15, 0.0, 0.0, 95.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 99.21, 81.89, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.96, 0.35, 0.72, 0.95, 0.96, 0.4, 1.06, 2.93, 0.45, 2.69, 0.73, 0.89, 0.52, 2.19, 1.53, 0.8, 2.25, 0.19, 1.16, 0.62, 0.67, 6.09, 1.95, -0.11, 10.67, 0.14, 1.04, 1.59, 0.16, 0.53, 0.55, 0.08, 0.16, 0.43, 0.03, 4.02, 1.29, 2.44, 3.08, 0.62, 3.61, 1.02, 0.77, 0.54, 0.67, 0.28, 0.26, 1.05]} \ No newline at end of file diff --git a/annotations_filtered/guMVb47aD-k_filtered.json b/annotations_filtered/guMVb47aD-k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d56bd67f6c518fb39a07959cf13882846d518175 --- /dev/null +++ b/annotations_filtered/guMVb47aD-k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.76], [11.0, 13.53], [14.0, 15.25], [20.0, 20.78], [24.0, 24.56], [33.0, 34.21], [38.0, 39.95], [41.0, 43.56], [46.0, 46.31], [48.0, 51.0], [55.0, 54.87], [57.0, 58.85], [61.0, 66.5], [68.0, 69.48]], "keep_status": [true, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [45.24, 75.88, 0.0, 0.0, 0.0, 0.0, 0.0, 39.11, 0.0, 44.26, 0.0, 0.0, 79.24, 0.0], "audiomae_on_audioset": [[["noise", 28.06], ["hum", 14.83], ["mains hum", 11.06]], null, null, null, null, null, null, [["frog", 26.26], ["domestic animals, pets", 5.12], ["croak", 4.77]], null, [["speech", 34.31], ["sidetone", 26.79], ["hum", 9.14]], null, null, null, null], "duration": [3.76, 2.53, 1.25, 0.78, 0.56, 1.21, 1.95, 2.56, 0.31, 3.0, -0.13, 1.85, 5.5, 1.48]} \ No newline at end of file diff --git a/annotations_filtered/guQnnPJgtUo_filtered.json b/annotations_filtered/guQnnPJgtUo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f6a776d1114125ef77414d67a5e57b27e5b10cd --- /dev/null +++ b/annotations_filtered/guQnnPJgtUo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.8], [11.0, 12.19], [14.0, 15.23], [16.0, 22.23], [23.0, 28.59], [33.0, 41.35]], "keep_status": [false, false, false, false, false, true], "silence_prob": [56.78, 0.0, 0.0, 56.7, 76.86, 33.9], "audiomae_on_audioset": [null, null, null, null, null, [["noise", 15.03], ["electric shaver, electric razor", 12.28], ["speech", 8.27]]], "duration": [2.8, 1.19, 1.23, 6.23, 5.59, 8.35]} \ No newline at end of file diff --git a/annotations_filtered/guWGxRXZbis_filtered.json b/annotations_filtered/guWGxRXZbis_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7df4cfb9d00d77374665f40f498cedb3f145c2c0 --- /dev/null +++ b/annotations_filtered/guWGxRXZbis_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.67], [3.0, 4.31], [5.0, 6.4], [7.0, 7.8], [9.0, 12.01], [14.0, 15.75], [17.0, 19.01], [20.0, 25.41], [26.0, 32.16], [33.0, 32.83], [34.0, 34.5], [36.0, 36.58], [42.0, 43.04], [44.0, 44.91], [47.0, 48.12], [49.0, 49.76], [53.0, 53.18], [55.0, 55.76], [57.0, 58.55], [59.0, 60.12], [62.0, 64.84], [69.0, 69.99], [71.0, 71.22], [72.0, 73.53], [75.0, 75.17], [75.0, 76.13], [78.0, 79.37], [80.0, 80.52], [82.0, 84.99], [86.0, 87.29], [89.0, 89.87], [93.0, 94.81], [99.0, 100.25], [103.0, 102.9], [103.0, 105.07], [105.0, 106.93], [108.0, 108.46], [109.0, 110.66], [112.0, 113.04], [115.0, 115.18], [116.0, 120.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 77.7, 0.0, 81.17, 77.03, 50.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.27, 0.0, 0.0, 0.0, 0.0, 0.0, 96.66, 0.0, 0.0, 0.0, 0.0, 0.0, 71.29], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.67, 1.31, 1.4, 0.8, 3.01, 1.75, 2.01, 5.41, 6.16, -0.17, 0.5, 0.58, 1.04, 0.91, 1.12, 0.76, 0.18, 0.76, 1.55, 1.12, 2.84, 0.99, 0.22, 1.53, 0.17, 1.13, 1.37, 0.52, 2.99, 1.29, 0.87, 1.81, 1.25, -0.1, 2.07, 1.93, 0.46, 1.66, 1.04, 0.18, 4.43]} \ No newline at end of file diff --git a/annotations_filtered/gu_ckpTcrBI_filtered.json b/annotations_filtered/gu_ckpTcrBI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b7af3d5efabec422ae98d832b5dba2d7bad7cc5 --- /dev/null +++ b/annotations_filtered/gu_ckpTcrBI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.82], [6.0, 11.82], [14.0, 14.01], [16.0, 16.56], [17.0, 18.74], [21.0, 21.36], [24.0, 26.15], [28.0, 29.44], [32.0, 33.66], [35.0, 36.9], [38.0, 42.9], [44.0, 45.08], [48.0, 49.01], [50.0, 51.58], [52.0, 53.11], [53.0, 54.45], [55.0, 55.29], [56.0, 56.88], [57.0, 63.36], [64.0, 65.74], [66.0, 67.41], [69.0, 68.89], [71.0, 72.66], [74.0, 74.97], [78.0, 78.49], [79.0, 107.84], [110.0, 110.1], [112.0, 112.8], [115.0, 118.35], [120.0, 120.19], [127.0, 127.38], [128.0, 130.84], [132.0, 131.94], [133.0, 133.15], [135.0, 136.75], [145.0, 146.75], [149.0, 150.75], [152.0, 154.36], [155.0, 154.68], [157.0, 157.11], [158.0, 174.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 47.31, 0.0, 0.0, 0.0, 0.0, 78.38, 0.0, 0.0, 0.0, 84.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.29, 0.0, 0.0, 93.45, 0.0, 0.0, 47.08, 0.0, 0.0, 0.0, 0.0, 0.0, 71.29, 0.0, 0.0, 53.72], "audiomae_on_audioset": [null, [["speech", 35.58], ["livestock, farm animals, working animals", 17.53], ["animal", 17.16]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 21.76], ["speech", 7.38], ["hum", 6.42]], null, null, null, null, null, null, [["music", 79.08], ["soundtrack music", 3.57], ["theremin", 2.77]], null, null, null, null, null, [["music", 32.39], ["didgeridoo", 23.59], ["bass guitar", 2.96]], null, null, null, null, null, null, null, null, null], "duration": [0.82, 5.82, 0.01, 0.56, 1.74, 0.36, 2.15, 1.44, 1.66, 1.9, 4.9, 1.08, 1.01, 1.58, 1.11, 1.45, 0.29, 0.88, 6.36, 1.74, 1.41, -0.11, 1.66, 0.97, 0.49, 28.84, 0.1, 0.8, 3.35, 0.19, 0.38, 2.84, -0.06, 0.15, 1.75, 1.75, 1.75, 2.36, -0.32, 0.11, 16.28]} \ No newline at end of file diff --git a/annotations_filtered/gv1nYk_OJjs_filtered.json b/annotations_filtered/gv1nYk_OJjs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad0ee6fb33ed9943107f2e3f75da8aadac9fc0e5 --- /dev/null +++ b/annotations_filtered/gv1nYk_OJjs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.65], [2.0, 2.66], [6.0, 12.23], [13.0, 15.52], [16.0, 16.01], [17.0, 27.04], [30.0, 38.1], [40.0, 40.42], [46.0, 47.75], [49.0, 52.35], [55.0, 55.46], [56.0, 60.08], [61.0, 70.66], [72.0, 77.94], [79.0, 79.69], [81.0, 81.75], [85.0, 86.48], [91.0, 91.25], [97.0, 102.51], [103.0, 112.43], [116.0, 116.85], [119.0, 119.4], [121.0, 120.87]], "keep_status": [false, false, true, false, false, true, true, false, false, true, false, false, true, true, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 36.9, 43.08, 0.0, 33.6, 34.89, 0.0, 0.0, 47.2, 0.0, 55.04, 39.19, 35.59, 0.0, 0.0, 0.0, 0.0, 34.65, 37.67, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 24.51], ["sonar", 10.49], ["music", 6.88]], [["whale vocalization", 61.55], ["theremin", 7.33], ["music", 6.34]], null, [["electric shaver, electric razor", 31.79], ["music", 28.13], ["didgeridoo", 3.02]], [["speech", 36.39], ["music", 13.89], ["hum", 10.17]], null, null, [["speech", 22.35], ["howl", 6.38], ["animal", 6.11]], null, null, [["animal", 51.19], ["sheep", 10.32], ["goat", 4.0]], [["speech", 24.99], ["music", 6.24], ["mosquito", 5.65]], null, null, null, null, [["hum", 46.71], ["mains hum", 20.59], ["throbbing", 13.41]], [["speech", 26.44], ["music", 17.43], ["synthesizer", 6.45]], null, null, null], "duration": [-0.35, 0.66, 6.23, 2.52, 0.01, 10.04, 8.1, 0.42, 1.75, 3.35, 0.46, 4.08, 9.66, 5.94, 0.69, 0.75, 1.48, 0.25, 5.51, 9.43, 0.85, 0.4, -0.13]} \ No newline at end of file diff --git a/annotations_filtered/gvBe38KoiVc_filtered.json b/annotations_filtered/gvBe38KoiVc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a734d087dc31da98f13e51bd221f5d1aa66a8e9c --- /dev/null +++ b/annotations_filtered/gvBe38KoiVc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.37], [6.0, 13.49], [17.0, 24.95], [35.0, 36.32], [37.0, 41.47], [45.0, 67.42]], "keep_status": [false, true, true, false, true, false], "silence_prob": [0.0, 29.36, 29.39, 0.0, 29.76, 29.77], "audiomae_on_audioset": [null, [["music", 37.32], ["singing", 4.39], ["smash, crash", 4.0]], [["music", 23.54], ["boom", 17.64], ["hum", 5.38]], null, [["cattle, bovinae", 31.29], ["moo", 18.43], ["livestock, farm animals, working animals", 15.18]], [["livestock, farm animals, working animals", 39.69], ["cattle, bovinae", 25.35], ["moo", 12.7]]], "duration": [1.37, 7.49, 7.95, 1.32, 4.47, 22.42]} \ No newline at end of file diff --git a/annotations_filtered/gvGNWLszAQA_filtered.json b/annotations_filtered/gvGNWLszAQA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f31b9a6d2ee3673dd46f38d1e49ea73622afbe3d --- /dev/null +++ b/annotations_filtered/gvGNWLszAQA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.38], [17.0, 18.18], [19.0, 19.57], [21.0, 21.3], [24.0, 24.53], [25.0, 39.95], [43.0, 44.1], [47.0, 52.19], [52.0, 53.4], [58.0, 59.49], [62.0, 66.5], [68.0, 68.89], [71.0, 73.4], [76.0, 76.18], [78.0, 77.92], [79.0, 84.55], [85.0, 86.04], [90.0, 96.43], [97.0, 98.51], [101.0, 101.56]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 33.77, 0.0, 34.24, 0.0, 0.0, 43.2, 0.0, 36.37, 0.0, 0.0, 34.97, 0.0, 35.47, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 44.04], ["keyboard (musical)", 15.51], ["piano", 15.37]], null, [["music", 49.66], ["synthesizer", 13.82], ["musical instrument", 4.53]], null, null, [["hum", 43.16], ["throbbing", 16.77], ["mains hum", 15.29]], null, [["white noise", 5.5], ["sound effect", 5.34], ["cacophony", 5.3]], null, null, [["music", 53.23], ["synthesizer", 6.89], ["musical instrument", 3.57]], null, [["music", 47.43], ["synthesizer", 9.33], ["throbbing", 6.02]], null, null], "duration": [0.38, 1.18, 0.57, 0.3, 0.53, 14.95, 1.1, 5.19, 1.4, 1.49, 4.5, 0.89, 2.4, 0.18, -0.08, 5.55, 1.04, 6.43, 1.51, 0.56]} \ No newline at end of file diff --git a/annotations_filtered/gvJLNa16cdo_filtered.json b/annotations_filtered/gvJLNa16cdo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..147474c4cf1ad4f70b868bdc3ea662a773d27bef --- /dev/null +++ b/annotations_filtered/gvJLNa16cdo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.74], [15.0, 15.04], [16.0, 18.57], [20.0, 20.49], [31.0, 33.84], [35.0, 36.17], [39.0, 47.55], [48.0, 52.83], [61.0, 62.53], [63.0, 64.27], [67.0, 67.47], [68.0, 69.55], [73.0, 74.49], [76.0, 77.16], [87.0, 87.84], [88.0, 89.11], [94.0, 94.86], [95.0, 95.96], [101.0, 102.3], [104.0, 105.85], [107.0, 108.53], [109.0, 109.53], [110.0, 111.47], [112.0, 113.12], [116.0, 117.12], [120.0, 120.06], [122.0, 123.36], [124.0, 125.2], [126.0, 128.48], [129.0, 129.71], [130.0, 132.43]], "keep_status": [true, false, true, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [38.8, 0.0, 43.43, 0.0, 49.22, 0.0, 41.83, 30.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.85, 0.0, 48.35], "audiomae_on_audioset": [[["speech", 40.9], ["hum", 12.0], ["throbbing", 6.21]], null, [["music", 50.02], ["hum", 7.77], ["musical instrument", 5.78]], null, [["music", 63.69], ["synthesizer", 3.88], ["ambient music", 3.61]], null, [["hum", 33.95], ["music", 19.57], ["throbbing", 11.42]], [["gong", 17.43], ["breaking", 14.81], ["music", 14.53]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 46.2], ["foghorn", 8.47], ["didgeridoo", 4.11]]], "duration": [2.74, 0.04, 2.57, 0.49, 2.84, 1.17, 8.55, 4.83, 1.53, 1.27, 0.47, 1.55, 1.49, 1.16, 0.84, 1.11, 0.86, 0.96, 1.3, 1.85, 1.53, 0.53, 1.47, 1.12, 1.12, 0.06, 1.36, 1.2, 2.48, 0.71, 2.43]} \ No newline at end of file diff --git a/annotations_filtered/gvKBHCBBdf0_filtered.json b/annotations_filtered/gvKBHCBBdf0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..06f5de0b9047ac04df4b01d6e738349125c23399 --- /dev/null +++ b/annotations_filtered/gvKBHCBBdf0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.52], [10.0, 10.23], [12.0, 12.24], [28.0, 29.51], [33.0, 36.36], [45.0, 47.19], [48.0, 48.47], [52.0, 57.4], [59.0, 60.0], [67.0, 84.55], [86.0, 91.17], [93.0, 92.97], [98.0, 98.54], [104.0, 104.45], [110.0, 110.29], [118.0, 119.06], [119.0, 120.16], [125.0, 125.44], [128.0, 129.44], [131.0, 131.18], [135.0, 135.73], [137.0, 136.86], [138.0, 139.45], [143.0, 143.34], [144.0, 144.64], [145.0, 146.16], [147.0, 148.04], [149.0, 149.54], [150.0, 151.38], [152.0, 153.87], [155.0, 155.65], [156.0, 157.3], [158.0, 174.78], [179.0, 188.6], [191.0, 192.62], [198.0, 200.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 85.72, 99.98, 0.0, 95.23, 0.0, 96.54, 99.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.03, 95.91, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.52, 0.23, 0.24, 1.51, 3.36, 2.19, 0.47, 5.4, 1.0, 17.55, 5.17, -0.03, 0.54, 0.45, 0.29, 1.06, 1.16, 0.44, 1.44, 0.18, 0.73, -0.14, 1.45, 0.34, 0.64, 1.16, 1.04, 0.54, 1.38, 1.87, 0.65, 1.3, 16.78, 9.6, 1.62, 2.62]} \ No newline at end of file diff --git a/annotations_filtered/gvTCSxLPy0Q_filtered.json b/annotations_filtered/gvTCSxLPy0Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c250e61cf39d206a60cc143aa7b1db87d000454f --- /dev/null +++ b/annotations_filtered/gvTCSxLPy0Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.15], [5.0, 6.35], [7.0, 7.47], [8.0, 9.17], [15.0, 15.04], [16.0, 17.47], [20.0, 21.2], [22.0, 22.45], [27.0, 28.05], [32.0, 35.38], [37.0, 38.13], [41.0, 52.32], [53.0, 68.79]], "keep_status": [true, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [43.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.04, 0.0, 34.08, 30.28], "audiomae_on_audioset": [[["cattle, bovinae", 10.56], ["moo", 8.92], ["livestock, farm animals, working animals", 8.25]], null, null, null, null, null, null, null, null, [["music", 47.65], ["hum", 15.07], ["throbbing", 7.06]], null, [["music", 65.05], ["echo", 6.76], ["synthesizer", 6.4]], [["music", 59.49], ["speech", 9.82], ["thump, thud", 3.4]]], "duration": [2.15, 1.35, 0.47, 1.17, 0.04, 1.47, 1.2, 0.45, 1.05, 3.38, 1.13, 11.32, 15.79]} \ No newline at end of file diff --git a/annotations_filtered/gvbI2bHohQ4_filtered.json b/annotations_filtered/gvbI2bHohQ4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e8d5616a85fc839a5a5dab155783b79756d6e12b --- /dev/null +++ b/annotations_filtered/gvbI2bHohQ4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 23.19], [25.0, 26.1], [27.0, 27.13], [28.0, 28.58], [30.0, 31.5], [35.0, 42.3], [44.0, 54.7], [56.0, 77.38]], "keep_status": [false, false, false, false, false, false, true, true], "silence_prob": [35.01, 0.0, 0.0, 0.0, 0.0, 34.55, 32.28, 30.67], "audiomae_on_audioset": [[["hum", 38.75], ["music", 26.49], ["mains hum", 11.34]], null, null, null, null, [["music", 66.72], ["throbbing", 4.56], ["musical instrument", 4.54]], [["music", 42.75], ["hum", 18.1], ["theremin", 7.82]], [["music", 41.95], ["gong", 8.75], ["didgeridoo", 6.87]]], "duration": [18.19, 1.1, 0.13, 0.58, 1.5, 7.3, 10.7, 21.38]} \ No newline at end of file diff --git a/annotations_filtered/gvuZShYhzX8_filtered.json b/annotations_filtered/gvuZShYhzX8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f057894ed237090734a956e20fd8a01354e2793a --- /dev/null +++ b/annotations_filtered/gvuZShYhzX8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 57.94], [63.0, 66.88], [69.0, 70.41], [72.0, 83.17], [84.0, 83.83], [84.0, 89.9], [97.0, 97.71], [101.0, 102.07], [105.0, 106.57], [111.0, 114.86], [116.0, 115.87], [117.0, 117.34], [119.0, 119.94], [124.0, 124.61], [131.0, 133.89], [141.0, 140.76], [148.0, 149.08], [150.0, 150.3], [154.0, 154.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 29.86, 0.0, 28.21, 0.0, 30.81, 0.0, 0.0, 0.0, 83.16, 0.0, 0.0, 0.0, 0.0, 45.52, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 74.07], ["didgeridoo", 5.64], ["whale vocalization", 4.34]], null, [["music", 63.29], ["synthesizer", 4.32], ["throbbing", 3.82]], null, [["music", 54.92], ["electronic music", 11.11], ["throbbing", 5.2]], null, null, null, null, null, null, null, null, [["music", 20.82], ["hum", 15.55], ["noise", 6.93]], null, null, null, null], "duration": [32.94, 3.88, 1.41, 11.17, -0.17, 5.9, 0.71, 1.07, 1.57, 3.86, -0.13, 0.34, 0.94, 0.61, 2.89, -0.24, 1.08, 0.3, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/gw4Sj4hJy4s_filtered.json b/annotations_filtered/gw4Sj4hJy4s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..19bf437dff117dfc85efb4b419f3f6ac30a7dbfb --- /dev/null +++ b/annotations_filtered/gw4Sj4hJy4s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.84], [4.0, 8.95], [9.0, 9.09]], "keep_status": [false, false, false], "silence_prob": [0.0, 86.45, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [-0.16, 4.95, 0.09]} \ No newline at end of file diff --git a/annotations_filtered/gwEeqSGSL3g_filtered.json b/annotations_filtered/gwEeqSGSL3g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd1a76c64950a5a51395813525d612baf1e66a67 --- /dev/null +++ b/annotations_filtered/gwEeqSGSL3g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[49.0, 60.52], [62.0, 70.66], [79.0, 79.96], [81.0, 82.41], [82.0, 93.77], [94.0, 99.2], [103.0, 107.18], [108.0, 114.79]], "keep_status": [false, false, false, false, false, true, false, false], "silence_prob": [29.96, 29.81, 0.0, 0.0, 30.08, 30.26, 43.13, 61.97], "audiomae_on_audioset": [[["music", 76.74], ["electronic music", 2.31], ["heart murmur", 2.21]], [["music", 80.41], ["electronic music", 5.56], ["throbbing", 3.89]], null, null, [["music", 62.47], ["didgeridoo", 8.32], ["speech", 4.64]], [["music", 31.67], ["musical instrument", 6.61], ["whip", 5.53]], [["music", 60.76], ["effects unit", 10.79], ["musical instrument", 4.32]], null], "duration": [11.52, 8.66, 0.96, 1.41, 11.77, 5.2, 4.18, 6.79]} \ No newline at end of file diff --git a/annotations_filtered/gwEoo0r_8EY_filtered.json b/annotations_filtered/gwEoo0r_8EY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e1f9716f1c77e07b9d81842975c1f4692e883f2f --- /dev/null +++ b/annotations_filtered/gwEoo0r_8EY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 14.76], [16.0, 18.13], [20.0, 21.51], [23.0, 23.4], [25.0, 25.71], [26.0, 28.07], [29.0, 29.79], [31.0, 32.91], [33.0, 33.64], [34.0, 55.04], [62.0, 81.26], [86.0, 91.99], [96.0, 98.74], [102.0, 102.44], [105.0, 117.69], [119.0, 120.46], [122.0, 122.18], [123.0, 127.13], [128.0, 129.1], [141.0, 142.1], [151.0, 151.28], [159.0, 160.52]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, true, false, false, true, false, false, false, false, false, false, false], "silence_prob": [55.81, 65.44, 0.0, 0.0, 0.0, 49.22, 0.0, 0.0, 0.0, 35.37, 30.7, 31.5, 35.39, 0.0, 32.56, 0.0, 0.0, 56.25, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 39.15], ["singing bowl", 23.81], ["music", 7.73]], null, null, null, [["music", 40.09], ["rumble", 11.13], ["hum", 11.12]], [["speech", 58.98], ["music", 5.9], ["groan", 5.15]], [["whack, thwack", 36.28], ["music", 24.36], ["speech", 6.57]], [["rumble", 36.46], ["music", 19.25], ["speech", 17.22]], null, [["speech", 23.29], ["music", 18.87], ["hum", 7.91]], null, null, null, null, null, null, null], "duration": [6.76, 2.13, 1.51, 0.4, 0.71, 2.07, 0.79, 1.91, 0.64, 21.04, 19.26, 5.99, 2.74, 0.44, 12.69, 1.46, 0.18, 4.13, 1.1, 1.1, 0.28, 1.52]} \ No newline at end of file diff --git a/annotations_filtered/gwTTsc0zMco_filtered.json b/annotations_filtered/gwTTsc0zMco_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e588a25f55f10e9965617efc1ad71ffb6c7967b --- /dev/null +++ b/annotations_filtered/gwTTsc0zMco_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.77], [10.0, 10.93], [12.0, 13.85], [18.0, 19.26], [22.0, 22.25], [23.0, 25.88], [27.0, 28.81], [32.0, 33.57], [34.0, 38.87], [39.0, 44.98], [46.0, 48.83], [49.0, 57.82], [60.0, 62.33], [63.0, 79.62], [81.0, 82.31], [83.0, 83.73], [84.0, 94.17], [97.0, 107.89], [110.0, 112.29], [117.0, 121.47]], "keep_status": [true, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, true, true, false], "silence_prob": [49.78, 0.0, 0.0, 0.0, 0.0, 99.93, 0.0, 0.0, 45.95, 41.89, 36.21, 30.98, 31.57, 31.28, 0.0, 0.0, 31.65, 30.82, 36.15, 54.36], "audiomae_on_audioset": [[["sine wave", 18.61], ["chirp tone", 14.53], ["dial tone", 7.22]], null, null, null, null, null, null, null, [["music", 37.05], ["hum", 18.9], ["throbbing", 11.48]], [["music", 46.08], ["speech", 29.72], ["hum", 7.09]], [["music", 62.42], ["sine wave", 8.16], ["chirp tone", 6.72]], [["speech", 29.6], ["music", 19.39], ["whack, thwack", 7.94]], [["fly, housefly", 48.59], ["insect", 33.06], ["mosquito", 12.01]], [["mains hum", 38.53], ["hum", 27.53], ["throbbing", 10.97]], null, null, [["speech", 53.06], ["music", 16.71], ["hum", 6.28]], [["music", 29.46], ["speech", 23.86], ["buzz", 13.58]], [["throbbing", 34.52], ["music", 24.99], ["hum", 9.11]], null], "duration": [3.77, 0.93, 1.85, 1.26, 0.25, 2.88, 1.81, 1.57, 4.87, 5.98, 2.83, 8.82, 2.33, 16.62, 1.31, 0.73, 10.17, 10.89, 2.29, 4.47]} \ No newline at end of file diff --git a/annotations_filtered/gwY85_MC_AY_filtered.json b/annotations_filtered/gwY85_MC_AY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d3b555663016a7d6ba14e7eeb66e3a1588f3493 --- /dev/null +++ b/annotations_filtered/gwY85_MC_AY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.07], [11.0, 11.69], [13.0, 18.82], [20.0, 20.41], [24.0, 26.65], [27.0, 31.02], [32.0, 33.1], [34.0, 39.29], [40.0, 42.23], [45.0, 46.11], [49.0, 48.84], [54.0, 55.11], [56.0, 58.26], [59.0, 62.53], [76.0, 93.95], [95.0, 96.79], [103.0, 115.92], [117.0, 117.98], [121.0, 122.62], [123.0, 127.06], [128.0, 129.02], [135.0, 136.05], [137.0, 156.46], [164.0, 164.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 100.0, 0.0, 100.0, 92.15, 0.0, 100.0, 99.4, 0.0, 0.0, 0.0, 100.0, 99.98, 100.0, 0.0, 99.91, 0.0, 0.0, 97.43, 0.0, 0.0, 81.71, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.07, 0.69, 5.82, 0.41, 2.65, 4.02, 1.1, 5.29, 2.23, 1.11, -0.16, 1.11, 2.26, 3.53, 17.95, 1.79, 12.92, 0.98, 1.62, 4.06, 1.02, 1.05, 19.46, 0.32]} \ No newline at end of file diff --git a/annotations_filtered/gw_zwDaiuJs_filtered.json b/annotations_filtered/gw_zwDaiuJs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bfc194125802e5012078bc848516d8525f7c2020 --- /dev/null +++ b/annotations_filtered/gw_zwDaiuJs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.65], [6.0, 7.55], [10.0, 11.06], [13.0, 14.98], [15.0, 16.23], [18.0, 17.66], [18.0, 20.21], [21.0, 22.25], [24.0, 25.19], [27.0, 27.9], [28.0, 28.46], [31.0, 32.22], [34.0, 33.99], [35.0, 35.38], [36.0, 36.95], [37.0, 38.58], [41.0, 42.01], [44.0, 47.93], [49.0, 51.07], [53.0, 54.24], [55.0, 60.54], [62.0, 65.26], [66.0, 67.59], [68.0, 73.26], [75.0, 86.63], [90.0, 96.03], [99.0, 103.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.05, 99.05, 0.0, 85.72, 71.87, 0.0, 77.03, 56.63, 38.32, 62.27], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["theremin", 62.38], ["music", 29.27], ["musical instrument", 1.97]], null], "duration": [0.65, 1.55, 1.06, 1.98, 1.23, -0.34, 2.21, 1.25, 1.19, 0.9, 0.46, 1.22, -0.01, 0.38, 0.95, 1.58, 1.01, 3.93, 2.07, 1.24, 5.54, 3.26, 1.59, 5.26, 11.63, 6.03, 4.06]} \ No newline at end of file diff --git a/annotations_filtered/gwjAFSu_VKM_filtered.json b/annotations_filtered/gwjAFSu_VKM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d478b816591b85df0cd052a834002b5d4fa49a3 --- /dev/null +++ b/annotations_filtered/gwjAFSu_VKM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.23], [8.0, 11.87], [13.0, 35.41], [49.0, 51.73], [58.0, 65.94], [67.0, 69.08], [70.0, 73.55], [74.0, 74.71], [76.0, 77.26], [84.0, 86.75], [87.0, 86.95], [87.0, 99.0], [109.0, 109.31], [112.0, 111.89], [113.0, 113.7], [114.0, 114.34], [114.0, 114.45], [115.0, 115.48], [116.0, 116.24], [119.0, 120.38], [122.0, 122.71], [128.0, 128.88], [130.0, 129.86], [135.0, 135.58], [140.0, 140.21], [141.0, 141.78], [144.0, 145.32], [148.0, 149.08], [150.0, 152.12], [154.0, 156.9], [159.0, 158.99], [163.0, 163.92], [164.0, 164.62], [165.0, 165.89], [167.0, 168.2], [170.0, 174.06]], "keep_status": [false, true, false, true, true, true, true, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 49.13, 45.75, 46.54, 38.49, 39.01, 39.11, 0.0, 0.0, 41.98, 0.0, 37.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, [["music", 48.02], ["synthesizer", 6.84], ["musical instrument", 5.0]], [["music", 74.05], ["synthesizer", 9.41], ["musical instrument", 3.69]], [["music", 23.37], ["musical instrument", 11.75], ["synthesizer", 9.18]], [["music", 50.53], ["hum", 4.35], ["throbbing", 4.32]], [["music", 48.28], ["synthesizer", 6.05], ["musical instrument", 5.23]], [["music", 46.35], ["musical instrument", 5.79], ["sampler", 2.73]], null, null, [["music", 26.66], ["speech", 19.22], ["synthesizer", 6.26]], null, [["music", 59.54], ["sound effect", 2.67], ["musical instrument", 2.59]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.23, 3.87, 22.41, 2.73, 7.94, 2.08, 3.55, 0.71, 1.26, 2.75, -0.05, 12.0, 0.31, -0.11, 0.7, 0.34, 0.45, 0.48, 0.24, 1.38, 0.71, 0.88, -0.14, 0.58, 0.21, 0.78, 1.32, 1.08, 2.12, 2.9, -0.01, 0.92, 0.62, 0.89, 1.2, 4.06]} \ No newline at end of file diff --git a/annotations_filtered/gx-03rUq-1Q_filtered.json b/annotations_filtered/gx-03rUq-1Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8670847ca0589d7e40f5ea1f80879365e553b1e7 --- /dev/null +++ b/annotations_filtered/gx-03rUq-1Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.46], [10.0, 11.79], [29.0, 30.15], [32.0, 32.07], [39.0, 39.28], [43.0, 45.1], [48.0, 48.79], [60.0, 60.34], [63.0, 63.04], [65.0, 65.25], [68.0, 68.44], [69.0, 69.38], [72.0, 72.15], [74.0, 74.58], [77.0, 77.21], [78.0, 79.15], [81.0, 82.93], [84.0, 88.72], [98.0, 98.44], [105.0, 109.43], [111.0, 111.67], [112.0, 120.12], [125.0, 126.18], [127.0, 128.75], [130.0, 130.59], [146.0, 146.26], [149.0, 149.96], [151.0, 152.05], [154.0, 154.6], [160.0, 160.62], [163.0, 164.81], [170.0, 170.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.61, 0.0, 44.81, 0.0, 66.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 82.55], ["noise", 2.6], ["effects unit", 0.9]], null, [["thunk", 16.11], ["cattle, bovinae", 10.03], ["moo", 9.61]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.46, 1.79, 1.15, 0.07, 0.28, 2.1, 0.79, 0.34, 0.04, 0.25, 0.44, 0.38, 0.15, 0.58, 0.21, 1.15, 1.93, 4.72, 0.44, 4.43, 0.67, 8.12, 1.18, 1.75, 0.59, 0.26, 0.96, 1.05, 0.6, 0.62, 1.81, 0.16]} \ No newline at end of file diff --git a/annotations_filtered/gx9O6q0pDAU_filtered.json b/annotations_filtered/gx9O6q0pDAU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac7716ecc871fefa69420c08ff8a1cf7bbf34f72 --- /dev/null +++ b/annotations_filtered/gx9O6q0pDAU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.68], [15.0, 16.06], [20.0, 21.95], [43.0, 47.55], [49.0, 50.04], [51.0, 51.83], [53.0, 54.38], [55.0, 66.43], [67.0, 67.37], [68.0, 71.39], [75.0, 75.2], [76.0, 77.26], [78.0, 101.02], [102.0, 103.13], [104.0, 112.51], [114.0, 114.13], [116.0, 116.43], [121.0, 121.83], [125.0, 125.58], [127.0, 126.79]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.62, 0.0, 0.0, 0.0, 31.31, 0.0, 32.32, 0.0, 0.0, 31.26, 0.0, 30.91, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 45.17], ["synthesizer", 6.31], ["musical instrument", 5.7]], null, null, null, [["music", 63.07], ["synthesizer", 21.64], ["musical instrument", 4.0]], null, [["music", 39.04], ["speech", 18.68], ["theremin", 14.76]], null, null, [["music", 42.24], ["theremin", 19.2], ["bell", 6.1]], null, [["music", 27.82], ["speech", 12.57], ["didgeridoo", 8.77]], null, null, null, null, null], "duration": [0.68, 1.06, 1.95, 4.55, 1.04, 0.83, 1.38, 11.43, 0.37, 3.39, 0.2, 1.26, 23.02, 1.13, 8.51, 0.13, 0.43, 0.83, 0.58, -0.21]} \ No newline at end of file diff --git a/annotations_filtered/gxAaVqdz_Vk_filtered.json b/annotations_filtered/gxAaVqdz_Vk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f7bff65218e296cfdbab9af696185790742be4b3 --- /dev/null +++ b/annotations_filtered/gxAaVqdz_Vk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[39.0, 47.46], [49.0, 60.3], [62.0, 91.13], [92.0, 92.92], [95.0, 97.7], [98.0, 112.56], [117.0, 121.59], [125.0, 125.24], [128.0, 128.04], [129.0, 130.1]], "keep_status": [true, false, false, false, false, false, false, false, false, false], "silence_prob": [39.61, 33.46, 32.75, 0.0, 69.74, 35.25, 31.73, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 35.42], ["gong", 9.55], ["hum", 7.24]], [["music", 49.26], ["theremin", 35.49], ["musical instrument", 4.59]], [["theremin", 63.59], ["music", 25.74], ["synthesizer", 2.64]], null, null, [["music", 66.83], ["musical instrument", 6.1], ["synthesizer", 3.48]], [["music", 60.58], ["theremin", 8.18], ["synthesizer", 7.56]], null, null, null], "duration": [8.46, 11.3, 29.13, 0.92, 2.7, 14.56, 4.59, 0.24, 0.04, 1.1]} \ No newline at end of file diff --git a/annotations_filtered/gxacglqQMqE_filtered.json b/annotations_filtered/gxacglqQMqE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa245fb381388f25fb5a3a3cf5a5693a444c712a --- /dev/null +++ b/annotations_filtered/gxacglqQMqE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 22.15], [25.0, 33.99], [34.0, 34.03], [34.0, 34.06], [34.0, 34.13], [34.0, 34.21], [34.0, 34.26], [34.0, 34.32], [34.0, 35.4], [36.0, 38.57], [40.0, 47.21], [52.0, 54.14], [71.0, 87.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [35.88, 54.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.86, 41.58, 51.88, 30.86], "audiomae_on_audioset": [[["mains hum", 35.91], ["hum", 32.23], ["music", 11.13]], null, null, null, null, null, null, null, null, null, [["music", 41.29], ["hum", 18.07], ["throbbing", 13.99]], null, [["buzz", 25.27], ["hum", 14.96], ["music", 11.44]]], "duration": [13.15, 8.99, 0.03, 0.06, 0.13, 0.21, 0.26, 0.32, 1.4, 2.57, 7.21, 2.14, 16.4]} \ No newline at end of file diff --git a/annotations_filtered/gxeIvClLpKI_filtered.json b/annotations_filtered/gxeIvClLpKI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..abbd851f10d1aa79974c7d4556c324f220a4f664 --- /dev/null +++ b/annotations_filtered/gxeIvClLpKI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.83], [12.0, 18.96], [19.0, 22.23], [25.0, 69.3], [70.0, 99.3], [100.0, 101.58], [106.0, 120.33], [123.0, 128.26]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 40.9, 46.26, 0.0, 76.7, 0.0, 98.66, 99.4], "audiomae_on_audioset": [null, [["speech", 64.62], ["music", 15.61], ["electronic music", 1.96]], [["speech", 43.82], ["music", 26.0], ["electronic music", 2.99]], null, null, null, null, null], "duration": [1.83, 6.96, 3.23, 44.3, 29.3, 1.58, 14.33, 5.26]} \ No newline at end of file diff --git a/annotations_filtered/gxhMfM0QlwM_filtered.json b/annotations_filtered/gxhMfM0QlwM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1de28eb0534a28666d169c64e51be0d75eb0dce6 --- /dev/null +++ b/annotations_filtered/gxhMfM0QlwM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.75], [40.0, 40.51], [45.0, 44.93], [45.0, 45.03], [45.0, 45.27], [49.0, 49.38], [52.0, 56.42], [57.0, 56.69], [72.0, 72.45], [78.0, 80.23], [81.0, 86.56], [87.0, 86.7], [88.0, 102.07], [108.0, 109.11], [114.0, 114.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.15, 0.0, 0.0, 48.19, 40.09, 0.0, 41.62, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 48.51], ["didgeridoo", 31.84], ["speech", 5.91]], null, null, [["didgeridoo", 63.14], ["music", 20.0], ["synthesizer", 2.15]], [["music", 33.69], ["didgeridoo", 16.63], ["fly, housefly", 4.32]], null, [["music", 62.77], ["didgeridoo", 15.18], ["throbbing", 3.67]], null, null], "duration": [1.75, 0.51, -0.07, 0.03, 0.27, 0.38, 4.42, -0.31, 0.45, 2.23, 5.56, -0.3, 14.07, 1.11, 0.29]} \ No newline at end of file diff --git a/annotations_filtered/gxqt6x5ThcU_filtered.json b/annotations_filtered/gxqt6x5ThcU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/gxqt6x5ThcU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/gxsDfmzU-Lo_filtered.json b/annotations_filtered/gxsDfmzU-Lo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c349b715ed2022f7716be4490abf7b22b34ef16b --- /dev/null +++ b/annotations_filtered/gxsDfmzU-Lo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 57.87], [60.0, 66.48], [68.0, 78.76], [87.0, 102.14], [104.0, 116.46], [119.0, 120.26], [121.0, 121.39], [125.0, 126.28]], "keep_status": [false, true, false, false, false, false, false, false], "silence_prob": [0.0, 32.93, 28.54, 29.08, 30.44, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 31.74], ["theremin", 21.49], ["musical instrument", 5.03]], [["music", 51.42], ["speech", 17.9], ["explosion", 9.78]], [["music", 40.9], ["hum", 23.42], ["throbbing", 17.31]], [["music", 42.49], ["hum", 19.72], ["throbbing", 16.28]], null, null, null], "duration": [50.87, 6.48, 10.76, 15.14, 12.46, 1.26, 0.39, 1.28]} \ No newline at end of file diff --git a/annotations_filtered/gxuEGIzZrGc_filtered.json b/annotations_filtered/gxuEGIzZrGc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3162807b79214f508459d154ced4c8c725f1cce --- /dev/null +++ b/annotations_filtered/gxuEGIzZrGc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 12.6], [21.0, 26.1], [34.0, 40.73], [43.0, 46.36], [48.0, 54.82], [56.0, 60.59], [62.0, 66.61], [71.0, 76.17], [78.0, 163.34]], "keep_status": [false, true, false, false, false, true, true, false, false], "silence_prob": [63.85, 45.78, 73.51, 69.07, 39.89, 32.49, 44.18, 32.83, 0.0], "audiomae_on_audioset": [null, [["music", 43.29], ["speech", 12.28], ["fly, housefly", 8.17]], null, null, [["music", 45.56], ["effects unit", 16.87], ["musical instrument", 13.39]], [["crack", 32.36], ["breaking", 16.23], ["crushing", 12.39]], [["grunt", 44.66], ["music", 4.1], ["fart", 3.15]], [["music", 34.25], ["speech", 33.01], ["breaking", 16.24]], null], "duration": [5.6, 5.1, 6.73, 3.36, 6.82, 4.59, 4.61, 5.17, 85.34]} \ No newline at end of file diff --git a/annotations_filtered/gzPiBOc_Nfs_filtered.json b/annotations_filtered/gzPiBOc_Nfs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f74218857608756809d71843e31c839eb67a7df --- /dev/null +++ b/annotations_filtered/gzPiBOc_Nfs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 14.18], [15.0, 25.07], [28.0, 35.13], [37.0, 48.14], [50.0, 82.53], [85.0, 88.92], [89.0, 91.59], [92.0, 93.73], [98.0, 104.26], [107.0, 156.88], [159.0, 162.95], [167.0, 166.89], [167.0, 168.94], [171.0, 170.95]], "keep_status": [true, true, false, true, false, true, true, false, true, false, false, false, false, false], "silence_prob": [30.47, 39.17, 99.62, 31.73, 0.0, 30.33, 32.81, 0.0, 29.41, 0.0, 53.91, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 37.45], ["mains hum", 16.8], ["hum", 11.62]], [["music", 28.24], ["hum", 23.13], ["mains hum", 14.45]], null, [["music", 24.02], ["speech", 9.73], ["foghorn", 8.25]], null, [["music", 45.5], ["speech", 14.47], ["didgeridoo", 5.09]], [["foghorn", 48.34], ["speech", 15.63], ["music", 3.49]], null, [["music", 25.56], ["noise", 21.98], ["hum", 10.12]], null, null, null, null, null], "duration": [2.18, 10.07, 7.13, 11.14, 32.53, 3.92, 2.59, 1.73, 6.26, 49.88, 3.95, -0.11, 1.94, -0.05]} \ No newline at end of file diff --git a/annotations_filtered/gzRy-pvwdL0_filtered.json b/annotations_filtered/gzRy-pvwdL0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..969a2868132a263b6e27c141013e92663a8aabf7 --- /dev/null +++ b/annotations_filtered/gzRy-pvwdL0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.77], [13.0, 13.42], [17.0, 17.39], [18.0, 19.04], [21.0, 21.9], [24.0, 26.72], [28.0, 28.78], [31.0, 31.14], [34.0, 34.06], [38.0, 39.36], [44.0, 47.38], [50.0, 50.28], [53.0, 53.1], [56.0, 61.33], [62.0, 65.25], [67.0, 68.93], [70.0, 71.12], [74.0, 77.5], [79.0, 80.03], [81.0, 83.71], [84.0, 86.46], [87.0, 88.21], [90.0, 90.71], [93.0, 95.37], [96.0, 98.12], [99.0, 99.5], [101.0, 102.41], [104.0, 104.11], [106.0, 108.89], [109.0, 109.98], [111.0, 112.14], [115.0, 118.64], [122.0, 122.54], [125.0, 125.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [71.29, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 99.1, 0.0, 100.0, 95.23, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.77, 0.42, 0.39, 1.04, 0.9, 2.72, 0.78, 0.14, 0.06, 1.36, 3.38, 0.28, 0.1, 5.33, 3.25, 1.93, 1.12, 3.5, 1.03, 2.71, 2.46, 1.21, 0.71, 2.37, 2.12, 0.5, 1.41, 0.11, 2.89, 0.98, 1.14, 3.64, 0.54, 0.42]} \ No newline at end of file diff --git a/annotations_filtered/gz_dPVrciwM_filtered.json b/annotations_filtered/gz_dPVrciwM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c14910dc2652483f40aaa6b6c290c341e6e98c83 --- /dev/null +++ b/annotations_filtered/gz_dPVrciwM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.34], [11.0, 12.41], [14.0, 31.55], [32.0, 33.57], [36.0, 49.91], [57.0, 56.88], [59.0, 59.26], [60.0, 60.45], [61.0, 69.26], [76.0, 76.38], [77.0, 81.4], [82.0, 97.9], [99.0, 114.86], [115.0, 118.57], [119.0, 128.02], [133.0, 133.02], [135.0, 137.49], [138.0, 141.13], [144.0, 154.43], [155.0, 155.51], [156.0, 156.61]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 53.4, 0.0, 38.11, 0.0, 0.0, 0.0, 32.42, 0.0, 82.97, 31.29, 31.19, 30.43, 30.88, 0.0, 99.8, 55.89, 60.51, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["hum", 34.9], ["music", 21.94], ["mains hum", 18.75]], null, null, null, [["sidetone", 24.45], ["music", 19.43], ["speech", 18.66]], null, null, [["music", 58.64], ["speech", 10.22], ["hum", 6.82]], [["music", 55.21], ["speech", 10.91], ["throbbing", 8.59]], [["sidetone", 58.65], ["music", 9.88], ["speech", 8.15]], [["music", 74.19], ["electronic music", 3.97], ["speech", 2.01]], null, null, null, null, null, null], "duration": [1.34, 1.41, 17.55, 1.57, 13.91, -0.12, 0.26, 0.45, 8.26, 0.38, 4.4, 15.9, 15.86, 3.57, 9.02, 0.02, 2.49, 3.13, 10.43, 0.51, 0.61]} \ No newline at end of file diff --git a/annotations_filtered/gzbYTUXZkSI_filtered.json b/annotations_filtered/gzbYTUXZkSI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..83e9281c6e2d9f44dc5fb0d21e6575033db6c44a --- /dev/null +++ b/annotations_filtered/gzbYTUXZkSI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.24], [2.0, 1.85], [7.0, 11.37], [13.0, 14.93], [16.0, 30.97], [33.0, 33.37], [44.0, 45.47], [47.0, 59.61], [63.0, 81.51], [83.0, 121.22], [122.0, 135.65], [137.0, 146.87], [150.0, 150.5], [154.0, 155.56], [159.0, 206.71]], "keep_status": [false, false, false, false, true, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 51.44, 0.0, 30.65, 0.0, 0.0, 31.04, 31.77, 0.0, 32.54, 30.69, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 36.52], ["speech", 26.49], ["sound effect", 3.43]], null, null, [["music", 34.71], ["didgeridoo", 16.46], ["hum", 13.85]], [["fly, housefly", 45.69], ["mosquito", 23.24], ["insect", 22.45]], null, [["music", 77.97], ["throbbing", 5.06], ["electronic music", 4.38]], [["music", 83.24], ["speech", 3.38], ["didgeridoo", 1.55]], null, null, null], "duration": [0.24, -0.15, 4.37, 1.93, 14.97, 0.37, 1.47, 12.61, 18.51, 38.22, 13.65, 9.87, 0.5, 1.56, 47.71]} \ No newline at end of file