diff --git a/annotations_filtered/b-2p52a82UM_filtered.json b/annotations_filtered/b-2p52a82UM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a745dfc30361c8519977384e3f41fc9e7c292355 --- /dev/null +++ b/annotations_filtered/b-2p52a82UM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 17.81], [18.0, 18.28], [19.0, 19.9], [30.0, 30.75], [31.0, 31.4], [31.0, 37.13], [49.0, 50.77], [52.0, 53.96], [56.0, 62.34], [63.0, 79.57], [83.0, 83.4], [87.0, 87.79], [125.0, 127.9], [129.0, 130.1], [138.0, 138.96], [141.0, 141.17], [145.0, 146.79], [150.0, 151.83], [154.0, 156.59], [158.0, 163.19]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [31.0, 0.0, 0.0, 0.0, 0.0, 29.45, 0.0, 0.0, 62.37, 48.91, 0.0, 0.0, 91.47, 0.0, 0.0, 0.0, 0.0, 0.0, 55.53, 45.05], "audiomae_on_audioset": [[["music", 77.25], ["speech", 4.17], ["thunk", 1.69]], null, null, null, null, [["music", 23.79], ["sidetone", 12.86], ["speech", 10.59]], null, null, null, [["hum", 42.64], ["mains hum", 27.66], ["music", 9.86]], null, null, null, null, null, null, null, null, null, [["speech", 36.16], ["music", 13.68], ["animal", 5.74]]], "duration": [16.81, 0.28, 0.9, 0.75, 0.4, 6.13, 1.77, 1.96, 6.34, 16.57, 0.4, 0.79, 2.9, 1.1, 0.96, 0.17, 1.79, 1.83, 2.59, 5.19]} \ No newline at end of file diff --git a/annotations_filtered/b-QlCUByMcE_filtered.json b/annotations_filtered/b-QlCUByMcE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3a05069666897135fb10e472e97fc2c7cd5f12b5 --- /dev/null +++ b/annotations_filtered/b-QlCUByMcE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 12.6], [15.0, 14.94], [17.0, 18.32], [21.0, 22.72], [29.0, 30.59], [32.0, 32.36], [33.0, 34.16], [42.0, 43.87], [47.0, 48.25], [49.0, 51.8], [56.0, 56.78], [60.0, 62.97], [68.0, 70.38], [70.0, 70.92], [76.0, 76.64], [81.0, 81.65], [87.0, 87.84], [94.0, 96.2], [98.0, 99.69], [100.0, 101.82], [102.0, 103.81], [108.0, 110.46], [111.0, 110.69], [114.0, 119.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 78.55, 62.27, 0.0, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 99.76, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.6, -0.06, 1.32, 1.72, 1.59, 0.36, 1.16, 1.87, 1.25, 2.8, 0.78, 2.97, 2.38, 0.92, 0.64, 0.65, 0.84, 2.2, 1.69, 1.82, 1.81, 2.46, -0.31, 5.18]} \ No newline at end of file diff --git a/annotations_filtered/b-_C0lWgga0_filtered.json b/annotations_filtered/b-_C0lWgga0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a9b6260a312085e0a3f5789d10c79cb27e90193 --- /dev/null +++ b/annotations_filtered/b-_C0lWgga0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 47.11], [51.0, 52.44], [56.0, 58.04]], "keep_status": [false, false, true], "silence_prob": [0.0, 0.0, 30.43], "audiomae_on_audioset": [null, null, [["music", 61.13], ["musical instrument", 3.04], ["bass guitar", 2.72]]], "duration": [42.11, 1.44, 2.04]} \ No newline at end of file diff --git a/annotations_filtered/b-f5iMDXvcA_filtered.json b/annotations_filtered/b-f5iMDXvcA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..483ab222d4832727e8d1c51fa1ed42ad1dc0bd4a --- /dev/null +++ b/annotations_filtered/b-f5iMDXvcA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 74.28]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [66.28]} \ No newline at end of file diff --git a/annotations_filtered/b-w1bY8qhnc_filtered.json b/annotations_filtered/b-w1bY8qhnc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17ee709dded09c65f8d4d1e7153d8b9c4e1ca08f --- /dev/null +++ b/annotations_filtered/b-w1bY8qhnc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 28.49], [29.0, 28.54], [32.0, 33.79], [35.0, 37.3], [40.0, 42.57], [44.0, 45.32], [47.0, 50.06], [54.0, 56.08], [58.0, 57.67], [58.0, 60.93], [62.0, 64.15], [66.0, 69.67], [71.0, 71.09], [71.0, 71.79], [79.0, 80.27], [81.0, 82.44], [84.0, 84.69], [85.0, 87.24], [87.0, 87.27], [88.0, 89.77], [90.0, 90.56], [99.0, 98.63], [100.0, 100.48], [106.0, 112.01], [114.0, 114.15], [125.0, 129.78], [138.0, 141.4], [141.0, 149.82], [151.0, 157.05], [158.0, 159.9], [161.0, 162.35], [162.0, 167.86], [168.0, 170.24], [171.0, 173.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, true, true, false], "silence_prob": [55.04, 0.0, 0.0, 91.47, 82.07, 0.0, 88.64, 84.8, 0.0, 52.74, 44.69, 53.22, 0.0, 0.0, 0.0, 0.0, 0.0, 65.67, 0.0, 0.0, 0.0, 0.0, 0.0, 32.46, 0.0, 33.19, 46.9, 39.5, 36.11, 0.0, 0.0, 42.44, 41.5, 58.3], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 41.12], ["speech", 12.58], ["hum", 7.46]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 54.63], ["music", 31.33], ["synthetic singing", 1.27]], null, [["speech", 42.12], ["music", 21.83], ["sidetone", 5.78]], [["music", 17.62], ["speech", 8.85], ["animal", 4.75]], [["music", 30.68], ["singing bowl", 10.17], ["synthesizer", 8.13]], [["speech", 58.06], ["music", 22.48], ["synthesizer", 3.44]], null, null, [["music", 36.11], ["speech", 22.14], ["mains hum", 4.69]], [["speech", 40.2], ["music", 23.74], ["musical instrument", 5.86]], null], "duration": [13.49, -0.46, 1.79, 2.3, 2.57, 1.32, 3.06, 2.08, -0.33, 2.93, 2.15, 3.67, 0.09, 0.79, 1.27, 1.44, 0.69, 2.24, 0.27, 1.77, 0.56, -0.37, 0.48, 6.01, 0.15, 4.78, 3.4, 8.82, 6.05, 1.9, 1.35, 5.86, 2.24, 2.33]} \ No newline at end of file diff --git a/annotations_filtered/b02H0dW2xf8_filtered.json b/annotations_filtered/b02H0dW2xf8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d144957efabc04e2dd067ab769503d408122003 --- /dev/null +++ b/annotations_filtered/b02H0dW2xf8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.57], [25.0, 25.57]], "keep_status": [true, false], "silence_prob": [31.25, 0.0], "audiomae_on_audioset": [[["speech", 31.63], ["fart", 20.99], ["music", 5.61]], null], "duration": [3.57, 0.57]} \ No newline at end of file diff --git a/annotations_filtered/b0KSEziycmw_filtered.json b/annotations_filtered/b0KSEziycmw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e213df6382e65dbfdfc31d9ae902dfbf6a2bf986 --- /dev/null +++ b/annotations_filtered/b0KSEziycmw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.1], [10.0, 10.59], [18.0, 18.87], [22.0, 23.43], [27.0, 27.18], [28.0, 28.34], [35.0, 36.56], [38.0, 38.38], [40.0, 40.56], [42.0, 42.94], [49.0, 49.81], [51.0, 52.08], [53.0, 53.87], [55.0, 55.73], [57.0, 58.18], [59.0, 59.8], [67.0, 67.71], [69.0, 70.7], [71.0, 71.98], [74.0, 75.24], [76.0, 77.31], [78.0, 78.31], [80.0, 80.27], [82.0, 82.76], [84.0, 84.45], [86.0, 86.17], [87.0, 87.32], [92.0, 93.26], [95.0, 101.76], [102.0, 104.45], [112.0, 113.27], [116.0, 117.98], [122.0, 123.84], [126.0, 128.36], [129.0, 131.55], [134.0, 135.55], [139.0, 140.71], [142.0, 144.46], [145.0, 152.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.32, 42.96, 0.0, 0.0, 0.0, 38.02, 41.2, 0.0, 0.0, 55.53, 29.72], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 22.54], ["speech", 18.4], ["fart", 14.78]], [["speech", 36.55], ["music", 28.91], ["echo", 3.09]], null, null, null, [["sine wave", 43.99], ["speech", 12.33], ["chirp tone", 9.39]], [["insect", 20.62], ["fly, housefly", 19.44], ["speech", 10.63]], null, null, null, [["music", 61.0], ["speech", 22.54], ["explosion", 2.26]]], "duration": [1.1, 0.59, 0.87, 1.43, 0.18, 0.34, 1.56, 0.38, 0.56, 0.94, 0.81, 1.08, 0.87, 0.73, 1.18, 0.8, 0.71, 1.7, 0.98, 1.24, 1.31, 0.31, 0.27, 0.76, 0.45, 0.17, 0.32, 1.26, 6.76, 2.45, 1.27, 1.98, 1.84, 2.36, 2.55, 1.55, 1.71, 2.46, 7.59]} \ No newline at end of file diff --git a/annotations_filtered/b0SfZ4LMV98_filtered.json b/annotations_filtered/b0SfZ4LMV98_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..03406b8786363143000c621a3efcfe5aa175bbe1 --- /dev/null +++ b/annotations_filtered/b0SfZ4LMV98_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.74], [13.0, 13.61], [15.0, 20.76], [23.0, 23.33], [25.0, 25.79], [27.0, 26.86], [48.0, 48.56], [59.0, 60.22], [61.0, 61.74], [63.0, 64.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [1.74, 0.61, 5.76, 0.33, 0.79, -0.14, 0.56, 1.22, 0.74, 1.05]} \ No newline at end of file diff --git a/annotations_filtered/b0p7_jQ8HiE_filtered.json b/annotations_filtered/b0p7_jQ8HiE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9680985cdf9cd1d8a62e04efb4ff888367c122e --- /dev/null +++ b/annotations_filtered/b0p7_jQ8HiE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 7.89], [17.0, 19.16], [24.0, 24.39], [27.0, 29.66], [38.0, 38.97], [43.0, 44.25], [49.0, 49.35], [52.0, 61.84], [63.0, 64.34], [67.0, 68.03], [70.0, 71.66], [74.0, 75.73], [79.0, 84.45], [85.0, 90.36]], "keep_status": [true, true, false, true, false, false, false, false, false, false, false, false, true, false], "silence_prob": [43.18, 41.1, 0.0, 35.82, 0.0, 0.0, 0.0, 32.84, 0.0, 0.0, 0.0, 0.0, 37.01, 33.97], "audiomae_on_audioset": [[["music", 46.53], ["musical instrument", 7.08], ["echo", 4.34]], [["gong", 16.8], ["music", 16.11], ["singing bowl", 11.65]], null, [["music", 46.7], ["didgeridoo", 7.44], ["mantra", 6.44]], null, null, null, [["music", 60.66], ["theremin", 8.51], ["synthesizer", 7.73]], null, null, null, null, [["music", 59.51], ["effects unit", 6.27], ["didgeridoo", 4.15]], [["music", 63.54], ["didgeridoo", 12.0], ["musical instrument", 3.78]]], "duration": [5.89, 2.16, 0.39, 2.66, 0.97, 1.25, 0.35, 9.84, 1.34, 1.03, 1.66, 1.73, 5.45, 5.36]} \ No newline at end of file diff --git a/annotations_filtered/b0xYU8jHaH4_filtered.json b/annotations_filtered/b0xYU8jHaH4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..309ad12f640c60b1517d86243dbf7ce2d05d38f2 --- /dev/null +++ b/annotations_filtered/b0xYU8jHaH4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.41], [5.0, 5.71], [7.0, 7.74], [8.0, 9.05], [11.0, 13.37], [16.0, 17.68], [23.0, 23.14], [24.0, 25.03], [28.0, 28.29], [30.0, 31.02], [37.0, 38.15], [41.0, 43.92], [47.0, 47.55], [50.0, 50.25], [57.0, 56.86], [57.0, 57.2], [57.0, 57.3], [57.0, 57.48], [58.0, 58.7], [70.0, 71.05], [74.0, 74.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 78.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 41.87], ["music", 7.53], ["synthesizer", 4.96]], null, null, null, null, null, null, null, null, null], "duration": [0.41, 0.71, 0.74, 1.05, 2.37, 1.68, 0.14, 1.03, 0.29, 1.02, 1.15, 2.92, 0.55, 0.25, -0.14, 0.2, 0.3, 0.48, 0.7, 1.05, 0.48]} \ No newline at end of file diff --git a/annotations_filtered/b10LyOeq5Hs_filtered.json b/annotations_filtered/b10LyOeq5Hs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa24ba4f937ff52dd7afdd3cba7c218128a214c4 --- /dev/null +++ b/annotations_filtered/b10LyOeq5Hs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.14], [5.0, 6.25], [9.0, 12.34], [14.0, 15.48], [21.0, 23.25], [26.0, 31.04], [33.0, 40.24], [42.0, 49.72], [51.0, 51.71], [53.0, 54.45], [55.0, 57.94], [60.0, 61.18], [62.0, 64.25], [65.0, 66.7], [68.0, 70.07], [77.0, 78.58], [81.0, 84.91], [86.0, 92.87], [94.0, 95.81], [98.0, 98.68], [103.0, 104.21], [105.0, 107.81], [109.0, 110.84], [113.0, 114.83], [118.0, 135.35], [136.0, 145.32], [146.0, 152.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.97, 0.0, 99.93, 0.0, 98.36, 100.0, 100.0, 100.0, 0.0, 0.0, 62.89, 0.0, 67.13, 0.0, 99.52, 0.0, 99.99, 98.8, 0.0, 0.0, 0.0, 87.19, 0.0, 0.0, 96.54, 98.73, 97.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.14, 1.25, 3.34, 1.48, 2.25, 5.04, 7.24, 7.72, 0.71, 1.45, 2.94, 1.18, 2.25, 1.7, 2.07, 1.58, 3.91, 6.87, 1.81, 0.68, 1.21, 2.81, 1.84, 1.83, 17.35, 9.32, 6.83]} \ No newline at end of file diff --git a/annotations_filtered/b1MxW8nf_lU_filtered.json b/annotations_filtered/b1MxW8nf_lU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c4f27426bd63416ead985666fc81b220c22bd495 --- /dev/null +++ b/annotations_filtered/b1MxW8nf_lU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 41.5], [42.0, 50.4], [55.0, 73.16], [76.0, 76.92], [78.0, 78.97], [84.0, 84.48]], "keep_status": [true, true, true, false, false, false], "silence_prob": [32.28, 32.08, 33.73, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 60.41], ["crowd", 4.75], ["throbbing", 4.61]], [["music", 47.17], ["throbbing", 10.45], ["speech", 4.94]], [["speech", 35.09], ["livestock, farm animals, working animals", 13.32], ["cattle, bovinae", 10.74]], null, null, null], "duration": [17.5, 8.4, 18.16, 0.92, 0.97, 0.48]} \ No newline at end of file diff --git a/annotations_filtered/b1Qxbu777zo_filtered.json b/annotations_filtered/b1Qxbu777zo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..36ee7a5ac2c839fdf69604e579a288f9ea23475c --- /dev/null +++ b/annotations_filtered/b1Qxbu777zo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.29], [8.0, 8.45], [11.0, 12.72], [19.0, 19.48], [20.0, 20.56], [23.0, 23.48], [31.0, 32.34], [36.0, 37.05], [38.0, 39.24], [40.0, 41.57], [43.0, 42.9], [48.0, 50.6], [51.0, 51.07], [52.0, 53.08], [54.0, 54.3], [57.0, 59.83], [61.0, 62.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.52, 0.0, 0.0, 0.0, 39.49, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 19.48], ["sidetone", 19.03], ["rumble", 12.31]], null, null, null, [["music", 33.64], ["speech", 21.25], ["hum", 6.69]], null], "duration": [0.29, 0.45, 1.72, 0.48, 0.56, 0.48, 1.34, 1.05, 1.24, 1.57, -0.1, 2.6, 0.07, 1.08, 0.3, 2.83, 1.94]} \ No newline at end of file diff --git a/annotations_filtered/b1eMAFWXZ4Q_filtered.json b/annotations_filtered/b1eMAFWXZ4Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8f37bd4cbad69ab54238b029244dd730d297262e --- /dev/null +++ b/annotations_filtered/b1eMAFWXZ4Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 23.62], [32.0, 34.08], [38.0, 37.76], [42.0, 44.25], [56.0, 56.62], [58.0, 65.15], [66.0, 66.02], [69.0, 69.58], [74.0, 73.9], [80.0, 80.57], [96.0, 96.99], [104.0, 104.13], [106.0, 109.32], [113.0, 114.57], [116.0, 117.91]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [28.77, 45.08, 0.0, 34.45, 0.0, 54.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.29, 0.0, 0.0], "audiomae_on_audioset": [[["music", 33.4], ["throbbing", 20.38], ["didgeridoo", 20.31]], [["music", 20.99], ["hum", 13.28], ["throbbing", 9.11]], null, [["creak", 35.86], ["mains hum", 12.46], ["hum", 12.26]], null, null, null, null, null, null, null, null, null, null, null], "duration": [8.62, 2.08, -0.24, 2.25, 0.62, 7.15, 0.02, 0.58, -0.1, 0.57, 0.99, 0.13, 3.32, 1.57, 1.91]} \ No newline at end of file diff --git a/annotations_filtered/b1jqSRnqLMw_filtered.json b/annotations_filtered/b1jqSRnqLMw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17ec43b25fe8f6ea8156b04e215b46157139323f --- /dev/null +++ b/annotations_filtered/b1jqSRnqLMw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 45.6], [47.0, 101.44], [104.0, 104.18], [106.0, 105.71], [112.0, 112.72], [119.0, 121.42], [122.0, 123.43], [130.0, 131.6], [137.0, 149.84]], "keep_status": [false, false, false, false, false, false, false, false, true], "silence_prob": [98.51, 0.0, 0.0, 0.0, 0.0, 45.21, 0.0, 0.0, 43.3], "audiomae_on_audioset": [null, null, null, null, null, [["music", 57.61], ["carnatic music", 17.95], ["musical instrument", 11.06]], null, null, [["music", 39.38], ["hum", 13.41], ["synthesizer", 9.73]]], "duration": [24.6, 54.44, 0.18, -0.29, 0.72, 2.42, 1.43, 1.6, 12.84]} \ No newline at end of file diff --git a/annotations_filtered/b1vFQilhgrY_filtered.json b/annotations_filtered/b1vFQilhgrY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b5017eb269c5b88e5162f779b06ac31c4208466a --- /dev/null +++ b/annotations_filtered/b1vFQilhgrY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.9], [1.0, 0.94], [1.0, 6.22], [8.0, 8.46], [13.0, 13.93], [16.0, 16.46], [28.0, 28.48], [29.0, 30.15], [34.0, 34.52], [35.0, 39.83], [42.0, 42.62]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 32.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.72, 0.0], "audiomae_on_audioset": [null, null, [["speech", 40.1], ["sidetone", 13.42], ["dishes, pots, and pans", 12.51]], null, null, null, null, null, null, [["speech", 70.8], ["radio", 3.09], ["mains hum", 3.02]], null], "duration": [-0.1, -0.06, 5.22, 0.46, 0.93, 0.46, 0.48, 1.15, 0.52, 4.83, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/b2MEP246DxY_filtered.json b/annotations_filtered/b2MEP246DxY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e1c971b680aaa32be9bdfad52b34d60585b0c8cd --- /dev/null +++ b/annotations_filtered/b2MEP246DxY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 24.16], [27.0, 70.68], [79.0, 79.07], [80.0, 94.64], [98.0, 113.95]], "keep_status": [false, false, false, false, false], "silence_prob": [28.63, 0.0, 0.0, 30.4, 29.34], "audiomae_on_audioset": [[["speech", 44.9], ["music", 26.54], ["outside, rural or natural", 4.2]], null, null, [["speech", 48.08], ["brass instrument", 13.46], ["trombone", 11.75]], [["music", 45.46], ["speech", 20.87], ["electronic music", 7.7]]], "duration": [10.16, 43.68, 0.07, 14.64, 15.95]} \ No newline at end of file diff --git a/annotations_filtered/b2P-oU216V4_filtered.json b/annotations_filtered/b2P-oU216V4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f3410f2d9f627d4d1d3601b69b8cdb3f6f52e42 --- /dev/null +++ b/annotations_filtered/b2P-oU216V4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.79], [16.0, 26.43], [27.0, 29.71], [35.0, 42.36], [45.0, 45.33], [47.0, 55.53], [65.0, 67.96], [73.0, 78.12], [81.0, 88.72], [110.0, 111.72]], "keep_status": [false, true, false, false, false, false, true, false, false, false], "silence_prob": [32.09, 34.04, 54.83, 33.39, 0.0, 32.77, 34.57, 31.79, 32.01, 0.0], "audiomae_on_audioset": [[["speech", 43.85], ["music", 25.81], ["sidetone", 2.33]], [["music", 52.1], ["speech", 11.51], ["whack, thwack", 5.09]], null, [["music", 44.01], ["speech", 22.52], ["throbbing", 5.12]], null, [["cattle, bovinae", 37.54], ["livestock, farm animals, working animals", 35.4], ["moo", 23.38]], [["music", 43.32], ["speech", 18.38], ["moo", 6.35]], [["music", 82.11], ["theremin", 4.17], ["synthesizer", 3.43]], [["music", 72.52], ["throbbing", 4.7], ["musical instrument", 3.23]], null], "duration": [3.79, 10.43, 2.71, 7.36, 0.33, 8.53, 2.96, 5.12, 7.72, 1.72]} \ No newline at end of file diff --git a/annotations_filtered/b2WuWXRVdfk_filtered.json b/annotations_filtered/b2WuWXRVdfk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..781c89c68fd995568f41ad988044966013b7be07 --- /dev/null +++ b/annotations_filtered/b2WuWXRVdfk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.26], [16.0, 48.46], [51.0, 52.56], [57.0, 98.56]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [0.26, 32.46, 1.56, 41.56]} \ No newline at end of file diff --git a/annotations_filtered/b2f2Kqt_KcE_filtered.json b/annotations_filtered/b2f2Kqt_KcE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd3802586adc8867aa00b8bafbd14b504da18c42 --- /dev/null +++ b/annotations_filtered/b2f2Kqt_KcE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.09], [13.0, 13.54], [15.0, 15.23], [15.0, 16.48], [17.0, 18.03], [22.0, 24.97], [33.0, 34.8], [37.0, 37.02], [38.0, 40.73], [44.0, 46.58], [50.0, 51.27], [52.0, 54.16], [56.0, 57.6], [58.0, 60.74], [61.0, 62.41], [67.0, 66.95], [71.0, 71.73], [73.0, 82.0], [84.0, 83.81], [92.0, 92.8], [104.0, 105.27], [107.0, 108.8], [111.0, 112.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 99.1, 100.0, 0.0, 98.73, 0.0, 97.83, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.09, 0.54, 0.23, 1.48, 1.03, 2.97, 1.8, 0.02, 2.73, 2.58, 1.27, 2.16, 1.6, 2.74, 1.41, -0.05, 0.73, 9.0, -0.19, 0.8, 1.27, 1.8, 1.04]} \ No newline at end of file diff --git a/annotations_filtered/b2gz0vSh0J4_filtered.json b/annotations_filtered/b2gz0vSh0J4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..427bdeb8049060e28631afd29543bd101b2b3ba2 --- /dev/null +++ b/annotations_filtered/b2gz0vSh0J4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 8.88], [11.0, 25.54], [26.0, 25.93], [26.0, 28.0], [30.0, 31.83], [32.0, 33.29], [34.0, 35.55], [37.0, 39.36], [40.0, 42.38], [43.0, 49.87], [52.0, 58.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.98, 99.99, 0.0, 99.99, 0.0, 0.0, 0.0, 99.98, 99.94, 99.99, 66.88], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [6.88, 14.54, -0.07, 2.0, 1.83, 1.29, 1.55, 2.36, 2.38, 6.87, 6.67]} \ No newline at end of file diff --git a/annotations_filtered/b2hhdMiOTOE_filtered.json b/annotations_filtered/b2hhdMiOTOE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..46d8205f3a9e000ef6ec075c2bd9d7121043dc91 --- /dev/null +++ b/annotations_filtered/b2hhdMiOTOE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[59.0, 58.6], [59.0, 96.97], [100.0, 126.98], [128.0, 138.67]], "keep_status": [false, false, true, true], "silence_prob": [0.0, 0.0, 31.65, 34.72], "audiomae_on_audioset": [null, null, [["music", 18.87], ["hum", 6.79], ["noise", 6.63]], [["music", 38.42], ["effects unit", 14.55], ["guitar", 7.35]]], "duration": [-0.4, 37.97, 26.98, 10.67]} \ No newline at end of file diff --git a/annotations_filtered/b2zQmmYEDY4_filtered.json b/annotations_filtered/b2zQmmYEDY4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f83ed4758a99329235849818c97ac04e34fe6cc --- /dev/null +++ b/annotations_filtered/b2zQmmYEDY4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.43], [10.0, 12.63], [15.0, 16.02], [17.0, 17.9], [21.0, 21.07], [39.0, 39.34], [48.0, 54.73], [57.0, 64.94], [67.0, 67.22], [71.0, 101.29], [104.0, 116.33], [119.0, 120.78]], "keep_status": [false, true, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 35.61, 0.0, 0.0, 0.0, 0.0, 30.95, 31.38, 0.0, 0.0, 30.32, 0.0], "audiomae_on_audioset": [null, [["music", 45.32], ["theremin", 9.4], ["didgeridoo", 3.36]], null, null, null, null, [["music", 36.56], ["speech", 32.39], ["theremin", 5.76]], [["music", 59.35], ["didgeridoo", 7.97], ["musical instrument", 2.27]], null, null, [["music", 47.92], ["hum", 13.69], ["speech", 9.75]], null], "duration": [1.43, 2.63, 1.02, 0.9, 0.07, 0.34, 6.73, 7.94, 0.22, 30.29, 12.33, 1.78]} \ No newline at end of file diff --git a/annotations_filtered/b3Aq5Vc0Ics_filtered.json b/annotations_filtered/b3Aq5Vc0Ics_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eb9394550c2f4de58aaf409e97f5be4916373da9 --- /dev/null +++ b/annotations_filtered/b3Aq5Vc0Ics_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.22], [9.0, 11.45], [12.0, 15.8], [26.0, 33.74], [35.0, 37.99], [41.0, 43.38], [48.0, 49.76], [50.0, 51.81], [55.0, 58.18], [59.0, 60.86], [62.0, 63.53], [73.0, 73.85], [76.0, 80.74], [82.0, 83.22], [85.0, 87.18], [89.0, 91.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 96.29, 77.2, 99.94, 99.97, 92.15, 0.0, 0.0, 99.95, 0.0, 0.0, 0.0, 99.8, 0.0, 100.0, 67.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.22, 2.45, 3.8, 7.74, 2.99, 2.38, 1.76, 1.81, 3.18, 1.86, 1.53, 0.85, 4.74, 1.22, 2.18, 2.93]} \ No newline at end of file diff --git a/annotations_filtered/b3EWsHg08x4_filtered.json b/annotations_filtered/b3EWsHg08x4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..508318142721168450a4078041bd535f944e98ba --- /dev/null +++ b/annotations_filtered/b3EWsHg08x4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.17], [6.0, 8.68], [9.0, 9.86], [18.0, 18.1], [20.0, 21.19], [29.0, 29.37], [37.0, 37.59], [40.0, 41.05], [42.0, 42.18], [47.0, 47.63], [56.0, 56.34], [58.0, 58.46], [60.0, 60.4], [61.0, 61.8], [62.0, 63.41], [66.0, 68.05], [68.0, 68.49], [70.0, 70.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.47, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 68.57], ["music", 8.62], ["fireworks", 1.44]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.17, 2.68, 0.86, 0.1, 1.19, 0.37, 0.59, 1.05, 0.18, 0.63, 0.34, 0.46, 0.4, 0.8, 1.41, 2.05, 0.49, 0.82]} \ No newline at end of file diff --git a/annotations_filtered/b3OlGLDk4pY_filtered.json b/annotations_filtered/b3OlGLDk4pY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e2233310c6f808c25888d1fedcfdbeaf8f2d921 --- /dev/null +++ b/annotations_filtered/b3OlGLDk4pY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 57.25], [60.0, 76.69], [79.0, 85.46], [87.0, 104.58], [107.0, 115.26], [119.0, 128.36], [131.0, 131.23], [133.0, 150.36], [154.0, 158.19], [159.0, 167.24], [172.0, 173.15], [175.0, 175.86], [177.0, 234.86]], "keep_status": [false, true, true, true, true, true, false, true, true, false, false, false, false], "silence_prob": [0.0, 29.7, 29.0, 28.73, 29.4, 29.54, 0.0, 28.7, 29.4, 28.83, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 22.08], ["hum", 10.79], ["mains hum", 10.28]], [["music", 26.03], ["static", 6.54], ["hum", 5.97]], [["music", 23.84], ["speech", 8.63], ["vehicle", 8.05]], [["music", 17.62], ["fly, housefly", 13.73], ["mosquito", 12.18]], [["music", 59.03], ["sound effect", 5.28], ["buzz", 3.97]], null, [["livestock, farm animals, working animals", 25.77], ["cattle, bovinae", 21.67], ["moo", 12.71]], [["music", 26.81], ["hum", 13.23], ["explosion", 12.48]], [["hum", 29.1], ["music", 25.12], ["mains hum", 16.37]], null, null, null], "duration": [52.25, 16.69, 6.46, 17.58, 8.26, 9.36, 0.23, 17.36, 4.19, 8.24, 1.15, 0.86, 57.86]} \ No newline at end of file diff --git a/annotations_filtered/b3lLWO2d7b0_filtered.json b/annotations_filtered/b3lLWO2d7b0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a82821be1a5ceebccb47165208117144e455aab0 --- /dev/null +++ b/annotations_filtered/b3lLWO2d7b0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[129.0, 133.14], [136.0, 168.4], [169.0, 170.67], [171.0, 171.42], [173.0, 195.22], [195.0, 195.25], [196.0, 200.18], [209.0, 212.14], [213.0, 212.94]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [38.82, 0.0, 0.0, 0.0, 32.47, 0.0, 33.23, 44.6, 0.0], "audiomae_on_audioset": [[["fly, housefly", 40.41], ["insect", 34.7], ["mosquito", 6.91]], null, null, null, [["music", 58.9], ["speech", 11.35], ["electronic music", 9.52]], null, [["throbbing", 26.42], ["music", 24.87], ["hum", 21.78]], [["music", 48.08], ["throbbing", 16.9], ["hum", 8.34]], null], "duration": [4.14, 32.4, 1.67, 0.42, 22.22, 0.25, 4.18, 3.14, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/b3lOpSXhT0c_filtered.json b/annotations_filtered/b3lOpSXhT0c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..00186de47ca921c422c09616e5d5d01562eb9522 --- /dev/null +++ b/annotations_filtered/b3lOpSXhT0c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[70.0, 103.67], [104.0, 104.14], [105.0, 108.63], [109.0, 111.2], [112.0, 113.29], [114.0, 137.71], [138.0, 138.38]], "keep_status": [false, false, true, true, false, true, false], "silence_prob": [0.0, 0.0, 41.2, 40.92, 0.0, 31.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 30.38], ["hum", 10.08], ["throbbing", 5.84]], [["hum", 36.11], ["throbbing", 19.8], ["mains hum", 13.37]], null, [["whack, thwack", 19.5], ["music", 11.83], ["smash, crash", 9.09]], null], "duration": [33.67, 0.14, 3.63, 2.2, 1.29, 23.71, 0.38]} \ No newline at end of file diff --git a/annotations_filtered/b4kKWa_hjCk_filtered.json b/annotations_filtered/b4kKWa_hjCk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0dafebdfebada2127ca1e13db87bf29d723e5da7 --- /dev/null +++ b/annotations_filtered/b4kKWa_hjCk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.13], [9.0, 9.24], [10.0, 10.35], [11.0, 13.93], [16.0, 17.71], [18.0, 18.86], [19.0, 22.99], [26.0, 26.67], [38.0, 37.89], [54.0, 56.34], [58.0, 60.4], [63.0, 64.13], [87.0, 87.54], [95.0, 95.76], [111.0, 111.92], [117.0, 118.18], [120.0, 120.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.95, 0.0, 0.0, 33.63, 0.0, 0.0, 58.47, 40.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["moo", 42.83], ["cattle, bovinae", 27.71], ["livestock, farm animals, working animals", 18.63]], null, null, null, [["music", 53.95], ["foghorn", 5.7], ["theremin", 4.12]], null, null, null, null, null, null], "duration": [1.13, 0.24, 0.35, 2.93, 1.71, 0.86, 3.99, 0.67, -0.11, 2.34, 2.4, 1.13, 0.54, 0.76, 0.92, 1.18, 0.66]} \ No newline at end of file diff --git a/annotations_filtered/b4kRHpvisxE_filtered.json b/annotations_filtered/b4kRHpvisxE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9928d1b7c0c3d2b183e9276cebfc679a9ebd3a4a --- /dev/null +++ b/annotations_filtered/b4kRHpvisxE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.89], [10.0, 11.72], [13.0, 14.28], [18.0, 18.0], [18.0, 20.31], [25.0, 26.64], [31.0, 34.47], [35.0, 37.39], [39.0, 41.57], [43.0, 45.81], [50.0, 52.47], [54.0, 57.32], [60.0, 62.94], [64.0, 66.82], [69.0, 72.5], [75.0, 76.27], [79.0, 81.11], [84.0, 86.12], [88.0, 90.54], [92.0, 95.01], [96.0, 97.78], [101.0, 101.51], [103.0, 104.21], [107.0, 107.08], [112.0, 113.0], [117.0, 122.0], [129.0, 130.28], [131.0, 135.89], [137.0, 140.34], [143.0, 145.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 98.44, 0.0, 99.92, 56.86, 100.0, 100.0, 100.0, 73.97, 99.98, 99.1, 98.86, 0.0, 100.0, 98.99, 99.05, 94.52, 0.0, 0.0, 0.0, 0.0, 0.0, 60.32, 0.0, 71.29, 82.25, 76.37], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.11, 1.72, 1.28, 0.0, 2.31, 1.64, 3.47, 2.39, 2.57, 2.81, 2.47, 3.32, 2.94, 2.82, 3.5, 1.27, 2.11, 2.12, 2.54, 3.01, 1.78, 0.51, 1.21, 0.08, 1.0, 5.0, 1.28, 4.89, 3.34, 2.27]} \ No newline at end of file diff --git a/annotations_filtered/b4vpGhO2LwA_filtered.json b/annotations_filtered/b4vpGhO2LwA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a09b4f793ce7b4480e14dcbe6e4cc18074e0ed17 --- /dev/null +++ b/annotations_filtered/b4vpGhO2LwA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.38], [18.0, 18.18], [19.0, 19.62], [41.0, 41.35], [47.0, 47.82], [50.0, 51.02], [52.0, 54.04], [55.0, 56.54], [61.0, 61.11], [67.0, 67.1], [73.0, 72.82], [73.0, 76.0], [77.0, 77.48], [84.0, 84.08], [85.0, 86.07], [96.0, 96.9]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.58, 0.0, 0.0, 0.0, 0.0, 34.56, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 12.97], ["honk", 11.75], ["goose", 10.95]], null, null, null, null, [["speech", 35.66], ["hum", 9.83], ["sidetone", 6.71]], null, null, null, null], "duration": [0.38, 0.18, 0.62, 0.35, 0.82, 1.02, 2.04, 1.54, 0.11, 0.1, -0.18, 3.0, 0.48, 0.08, 1.07, 0.9]} \ No newline at end of file diff --git a/annotations_filtered/b56RExAdg7s_filtered.json b/annotations_filtered/b56RExAdg7s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18cda8e3b49b3c9d7627af4887e94e8f1d9042f5 --- /dev/null +++ b/annotations_filtered/b56RExAdg7s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.12], [14.0, 35.45], [36.0, 37.54], [39.0, 42.25], [42.0, 44.59], [46.0, 50.68]], "keep_status": [false, false, false, false, false, true], "silence_prob": [0.0, 55.67, 0.0, 61.67, 57.32, 44.52], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 34.88], ["mains hum", 22.01], ["music", 8.14]]], "duration": [1.12, 21.45, 1.54, 3.25, 2.59, 4.68]} \ No newline at end of file diff --git a/annotations_filtered/b5I94bT23cQ_filtered.json b/annotations_filtered/b5I94bT23cQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c55adea442a1f856167d722235658e1abf9125e6 --- /dev/null +++ b/annotations_filtered/b5I94bT23cQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.79], [19.0, 19.79], [23.0, 25.08], [26.0, 26.43], [32.0, 33.74], [34.0, 35.7], [36.0, 37.4], [39.0, 39.9], [41.0, 41.28], [43.0, 43.09], [43.0, 48.32], [51.0, 50.67], [51.0, 52.74], [58.0, 58.16], [62.0, 64.81], [65.0, 72.05], [74.0, 74.36], [80.0, 80.97], [83.0, 84.13], [85.0, 85.87], [87.0, 87.3], [101.0, 101.36], [112.0, 112.62], [116.0, 118.37], [121.0, 121.54], [122.0, 123.52], [124.0, 126.03], [137.0, 139.16], [148.0, 155.73], [159.0, 160.64], [169.0, 171.73], [173.0, 174.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 84.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.55, 0.0, 0.0, 0.0, 68.8, 37.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.31, 0.0, 0.0, 36.18, 49.13, 84.25, 0.0, 86.45, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 64.42], ["fly, housefly", 5.84], ["throbbing", 3.26]], null, null, null, null, [["speech", 26.42], ["insect", 15.41], ["bee, wasp, etc.", 12.9]], null, null, null, null, null, null, null, null, null, null, [["speech", 19.41], ["boing", 11.47], ["hum", 8.13]], [["hum", 17.73], ["throbbing", 6.3], ["noise", 4.26]], null, null, null, null], "duration": [-0.21, 0.79, 2.08, 0.43, 1.74, 1.7, 1.4, 0.9, 0.28, 0.09, 5.32, -0.33, 1.74, 0.16, 2.81, 7.05, 0.36, 0.97, 1.13, 0.87, 0.3, 0.36, 0.62, 2.37, 0.54, 1.52, 2.03, 2.16, 7.73, 1.64, 2.73, 1.7]} \ No newline at end of file diff --git a/annotations_filtered/b5Q6A_1YyHg_filtered.json b/annotations_filtered/b5Q6A_1YyHg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52dd70b365704288feac7098c9c0d1aeb6f54cc0 --- /dev/null +++ b/annotations_filtered/b5Q6A_1YyHg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 27.01], [28.0, 32.68], [36.0, 40.76], [48.0, 68.15], [71.0, 80.57], [91.0, 102.69], [103.0, 103.79], [106.0, 106.89], [117.0, 124.38]], "keep_status": [false, false, false, false, false, true, false, false, true], "silence_prob": [31.13, 29.7, 30.1, 29.47, 29.78, 29.92, 0.0, 0.0, 32.68], "audiomae_on_audioset": [[["speech", 41.65], ["music", 33.4], ["theremin", 3.25]], [["music", 82.12], ["mosquito", 2.19], ["theremin", 2.05]], [["speech", 50.87], ["music", 33.41], ["boing", 2.7]], [["music", 57.71], ["speech", 10.03], ["fart", 3.61]], [["music", 54.8], ["speech", 27.43], ["electronic music", 1.92]], [["whack, thwack", 37.8], ["speech", 12.4], ["fart", 11.62]], null, null, [["speech", 45.09], ["whack, thwack", 16.11], ["thunk", 8.59]]], "duration": [5.01, 4.68, 4.76, 20.15, 9.57, 11.69, 0.79, 0.89, 7.38]} \ No newline at end of file diff --git a/annotations_filtered/b60DLSEemEY_filtered.json b/annotations_filtered/b60DLSEemEY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..398143e0973652773a7d74824d2c282744768aa0 --- /dev/null +++ b/annotations_filtered/b60DLSEemEY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.53], [6.0, 12.38], [13.0, 13.22], [14.0, 18.71], [19.0, 23.41], [24.0, 24.34], [25.0, 27.08], [27.0, 50.84], [52.0, 54.01], [54.0, 55.43], [60.0, 60.13], [62.0, 64.07], [66.0, 65.97], [66.0, 68.23], [69.0, 70.02], [79.0, 79.42], [83.0, 83.34], [85.0, 84.94], [92.0, 92.91], [98.0, 98.17], [103.0, 104.75], [106.0, 119.11], [125.0, 129.98], [130.0, 131.38]], "keep_status": [true, false, false, false, false, false, true, false, true, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false], "silence_prob": [41.72, 63.1, 0.0, 53.84, 37.34, 0.0, 30.69, 30.7, 32.14, 0.0, 0.0, 43.69, 0.0, 40.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.52, 96.89, 0.0], "audiomae_on_audioset": [[["hum", 17.11], ["mains hum", 16.89], ["music", 12.81]], null, null, null, [["sidetone", 62.83], ["hum", 12.77], ["speech", 9.22]], null, [["hum", 17.6], ["throbbing", 16.32], ["mains hum", 13.33]], [["music", 46.06], ["hum", 17.2], ["throbbing", 11.46]], [["speech", 34.67], ["music", 11.77], ["hum", 6.01]], null, null, [["speech", 75.45], ["sidetone", 6.15], ["music", 2.94]], null, [["music", 26.08], ["speech", 18.32], ["mains hum", 7.25]], null, null, null, null, null, null, null, [["crow", 40.8], ["caw", 20.29], ["hum", 7.68]], null, null], "duration": [3.53, 6.38, 0.22, 4.71, 4.41, 0.34, 2.08, 23.84, 2.01, 1.43, 0.13, 2.07, -0.03, 2.23, 1.02, 0.42, 0.34, -0.06, 0.91, 0.17, 1.75, 13.11, 4.98, 1.38]} \ No newline at end of file diff --git a/annotations_filtered/b65C_muXajk_filtered.json b/annotations_filtered/b65C_muXajk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..22f6adb319647e32deb720a4f8296bf94a3ad4cc --- /dev/null +++ b/annotations_filtered/b65C_muXajk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 26.25], [28.0, 28.26], [29.0, 29.57], [38.0, 38.64], [41.0, 41.2], [42.0, 48.39], [51.0, 50.94], [52.0, 52.32], [53.0, 53.65], [55.0, 56.98], [85.0, 85.33], [86.0, 87.84], [92.0, 94.54], [97.0, 98.49], [100.0, 100.52], [102.0, 102.46], [110.0, 110.54], [114.0, 114.76], [118.0, 122.01], [123.0, 125.9], [126.0, 126.74], [128.0, 130.76], [132.0, 135.4], [136.0, 137.98], [143.0, 144.58], [146.0, 147.26], [149.0, 151.24], [152.0, 153.94], [155.0, 157.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 100.0, 99.92, 0.0, 0.0, 0.0, 35.46, 0.0, 31.9], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 21.33], ["sound effect", 6.28], ["cacophony", 6.08]], null, [["hum", 24.13], ["mains hum", 24.11], ["boat, water vehicle", 5.58]]], "duration": [0.25, 0.26, 0.57, 0.64, 0.2, 6.39, -0.06, 0.32, 0.65, 1.98, 0.33, 1.84, 2.54, 1.49, 0.52, 0.46, 0.54, 0.76, 4.01, 2.9, 0.74, 2.76, 3.4, 1.98, 1.58, 1.26, 2.24, 1.94, 2.67]} \ No newline at end of file diff --git a/annotations_filtered/b6X5bVMoCJc_filtered.json b/annotations_filtered/b6X5bVMoCJc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7efb9634ac82d0ffca6493dff3c89a36a437b671 --- /dev/null +++ b/annotations_filtered/b6X5bVMoCJc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.47], [6.0, 7.08], [13.0, 13.61], [18.0, 19.09], [23.0, 24.51], [27.0, 28.0], [30.0, 31.7], [33.0, 39.92], [42.0, 42.48], [43.0, 45.79], [47.0, 51.0], [53.0, 59.88], [61.0, 63.26], [68.0, 73.99], [77.0, 79.47], [81.0, 81.7], [84.0, 84.5], [87.0, 92.8], [98.0, 99.0], [105.0, 112.99], [115.0, 117.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.43, 0.0, 46.36, 45.36, 31.77, 41.44, 34.67, 32.08, 0.0, 0.0, 32.94, 0.0, 33.62, 56.7], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 36.82], ["speech", 25.38], ["throbbing", 13.1]], [["speech", 75.11], ["music", 9.51], ["sidetone", 1.09]], [["music", 50.88], ["boing", 16.25], ["speech", 7.89]], [["music", 40.1], ["throbbing", 12.3], ["hum", 4.48]], [["music", 27.09], ["speech", 22.91], ["throbbing", 17.71]], [["music", 40.44], ["speech", 39.39], ["sidetone", 2.98]], null, null, [["music", 41.38], ["breaking", 23.23], ["whack, thwack", 6.37]], null, [["music", 41.32], ["speech", 27.92], ["throbbing", 9.01]], null], "duration": [0.47, 1.08, 0.61, 1.09, 1.51, 1.0, 1.7, 6.92, 0.48, 2.79, 4.0, 6.88, 2.26, 5.99, 2.47, 0.7, 0.5, 5.8, 1.0, 7.99, 2.63]} \ No newline at end of file diff --git a/annotations_filtered/b6vOp7_rI6Q_filtered.json b/annotations_filtered/b6vOp7_rI6Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d352b2ad069e2da3660c9009dac04f2c8efdcc6 --- /dev/null +++ b/annotations_filtered/b6vOp7_rI6Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 23.87], [24.0, 27.84], [28.0, 31.43], [32.0, 34.05], [38.0, 40.98], [42.0, 44.93], [45.0, 50.7], [52.0, 60.93], [63.0, 64.57], [66.0, 66.73], [73.0, 76.17], [77.0, 77.38], [78.0, 81.13], [104.0, 104.53], [112.0, 112.75], [118.0, 119.03], [127.0, 128.28], [131.0, 132.51], [135.0, 135.85], [138.0, 138.0], [142.0, 142.91], [144.0, 145.0], [147.0, 147.31], [152.0, 153.59], [156.0, 156.32], [162.0, 162.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [97.83, 93.13, 80.64, 99.48, 100.0, 100.0, 83.7, 99.99, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.87, 3.84, 3.43, 2.05, 2.98, 2.93, 5.7, 8.93, 1.57, 0.73, 3.17, 0.38, 3.13, 0.53, 0.75, 1.03, 1.28, 1.51, 0.85, 0.0, 0.91, 1.0, 0.31, 1.59, 0.32, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/b6xbga06ApQ_filtered.json b/annotations_filtered/b6xbga06ApQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..880af5198c5307874972be40076a43d7011217ed --- /dev/null +++ b/annotations_filtered/b6xbga06ApQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.68], [9.0, 13.59], [18.0, 19.26], [20.0, 22.92], [25.0, 26.18], [34.0, 34.33], [36.0, 36.85], [40.0, 40.46], [42.0, 42.16], [45.0, 45.2], [48.0, 48.14], [49.0, 51.46], [56.0, 56.13], [59.0, 59.61], [67.0, 70.82], [80.0, 81.36], [94.0, 94.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 100.0, 0.0, 99.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.76, 0.0, 0.0, 99.62, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.68, 4.59, 1.26, 2.92, 1.18, 0.33, 0.85, 0.46, 0.16, 0.2, 0.14, 2.46, 0.13, 0.61, 3.82, 1.36, 0.39]} \ No newline at end of file diff --git a/annotations_filtered/b74611maYgQ_filtered.json b/annotations_filtered/b74611maYgQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..24a45da85759cfdf102186810d3328a3d6dca39a --- /dev/null +++ b/annotations_filtered/b74611maYgQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 24.58], [25.0, 28.58], [31.0, 39.23], [42.0, 50.16], [52.0, 55.05], [55.0, 55.14], [60.0, 60.78], [63.0, 69.77], [70.0, 70.88], [74.0, 74.56], [77.0, 87.86], [93.0, 96.03], [97.0, 103.33]], "keep_status": [false, true, true, true, true, false, false, false, false, false, false, false, true], "silence_prob": [31.54, 39.74, 40.28, 29.36, 32.42, 0.0, 0.0, 33.27, 0.0, 0.0, 32.87, 31.06, 30.4], "audiomae_on_audioset": [[["speech", 55.79], ["music", 14.47], ["explosion", 4.99]], [["speech", 23.46], ["hum", 20.26], ["mains hum", 10.18]], [["speech", 43.18], ["music", 12.54], ["mains hum", 6.29]], [["electric shaver, electric razor", 15.19], ["buzz", 13.88], ["speech", 13.19]], [["music", 37.65], ["hum", 13.47], ["throbbing", 8.88]], null, null, [["music", 59.23], ["speech", 21.2], ["electronic music", 2.7]], null, null, [["music", 43.08], ["speech", 23.8], ["hum", 14.51]], [["whale vocalization", 55.31], ["speech", 7.79], ["wild animals", 7.25]], [["whale vocalization", 28.49], ["music", 12.85], ["buzz", 10.51]]], "duration": [2.58, 3.58, 8.23, 8.16, 3.05, 0.14, 0.78, 6.77, 0.88, 0.56, 10.86, 3.03, 6.33]} \ No newline at end of file diff --git a/annotations_filtered/b7AjNXAF-7Y_filtered.json b/annotations_filtered/b7AjNXAF-7Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/b7AjNXAF-7Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/b7C69HqnV8s_filtered.json b/annotations_filtered/b7C69HqnV8s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..47ce03f5e8d2d42962a465d1a6285cbd1b3dfcd1 --- /dev/null +++ b/annotations_filtered/b7C69HqnV8s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 17.49], [18.0, 21.1], [22.0, 24.27], [25.0, 25.46], [28.0, 29.08], [32.0, 34.84], [35.0, 37.23], [39.0, 39.95], [40.0, 43.43], [46.0, 47.14], [49.0, 51.51], [53.0, 64.79], [68.0, 69.04], [71.0, 72.45], [73.0, 76.98], [81.0, 81.97], [84.0, 85.11], [87.0, 87.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [67.76, 80.11, 79.76, 0.0, 0.0, 59.59, 72.16, 0.0, 90.08, 0.0, 98.19, 36.72, 0.0, 0.0, 37.14, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 82.78], ["funk", 2.09], ["synthesizer", 1.44]], null, null, [["music", 82.77], ["didgeridoo", 1.67], ["sampler", 1.49]], null, null, null], "duration": [4.49, 3.1, 2.27, 0.46, 1.08, 2.84, 2.23, 0.95, 3.43, 1.14, 2.51, 11.79, 1.04, 1.45, 3.98, 0.97, 1.11, 0.35]} \ No newline at end of file diff --git a/annotations_filtered/b7Dxy34dFyY_filtered.json b/annotations_filtered/b7Dxy34dFyY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..11a56b1e88f31378ac958f3edf723cca29c0414e --- /dev/null +++ b/annotations_filtered/b7Dxy34dFyY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.49], [5.0, 6.59], [10.0, 10.69], [12.0, 12.78], [13.0, 14.55], [25.0, 26.0], [30.0, 31.43], [32.0, 35.97], [38.0, 39.9], [45.0, 45.96], [47.0, 48.24], [53.0, 54.53], [57.0, 58.01], [60.0, 60.05], [64.0, 64.5], [66.0, 67.04], [72.0, 72.32], [73.0, 73.45], [78.0, 78.22], [80.0, 81.84], [85.0, 85.46], [90.0, 96.42], [98.0, 98.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.49, 1.59, 0.69, 0.78, 1.55, 1.0, 1.43, 3.97, 1.9, 0.96, 1.24, 1.53, 1.01, 0.05, 0.5, 1.04, 0.32, 0.45, 0.22, 1.84, 0.46, 6.42, 0.76]} \ No newline at end of file diff --git a/annotations_filtered/b7lV6-iKiwQ_filtered.json b/annotations_filtered/b7lV6-iKiwQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b32253ed0d944185f6ca3a187fc9aca2d04669c2 --- /dev/null +++ b/annotations_filtered/b7lV6-iKiwQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[70.0, 81.94], [83.0, 87.13], [88.0, 90.44], [91.0, 93.92], [97.0, 98.66], [100.0, 101.78], [104.0, 108.9], [111.0, 111.92], [112.0, 113.8], [116.0, 116.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.66, 99.99, 100.0, 77.36, 0.0, 0.0, 99.36, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [11.94, 4.13, 2.44, 2.92, 1.66, 1.78, 4.9, 0.92, 1.8, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/b7wurDomuVs_filtered.json b/annotations_filtered/b7wurDomuVs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f49d6f18c5b2477f07ca7e3146d4a4883eaf0948 --- /dev/null +++ b/annotations_filtered/b7wurDomuVs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.99], [8.0, 10.1], [13.0, 26.99], [27.0, 48.52], [49.0, 50.58], [52.0, 52.95], [53.0, 54.7], [57.0, 60.29], [62.0, 71.19], [74.0, 75.69], [78.0, 98.64], [106.0, 106.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 98.51, 96.04, 87.19, 0.0, 0.0, 0.0, 99.44, 99.56, 0.0, 58.64, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.99, 2.1, 13.99, 21.52, 1.58, 0.95, 1.7, 3.29, 9.19, 1.69, 20.64, 0.98]} \ No newline at end of file diff --git a/annotations_filtered/b8Dv782UIb4_filtered.json b/annotations_filtered/b8Dv782UIb4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..89f3d256de567514377801c0fca86b047acfab18 --- /dev/null +++ b/annotations_filtered/b8Dv782UIb4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.14], [6.0, 9.78], [10.0, 10.69], [13.0, 15.25], [16.0, 17.1], [19.0, 19.77], [22.0, 22.62], [24.0, 25.93], [27.0, 27.13], [30.0, 30.42], [31.0, 37.34], [39.0, 41.86], [43.0, 44.24], [45.0, 46.63], [47.0, 58.26], [68.0, 69.79], [72.0, 72.84], [74.0, 76.71], [78.0, 78.85], [81.0, 82.68], [85.0, 85.99], [95.0, 95.05], [96.0, 96.7], [98.0, 99.93], [101.0, 103.08], [105.0, 106.19], [108.0, 108.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 92.48, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.48, 52.33, 0.0, 0.0, 29.41, 0.0, 0.0, 40.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.37, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["animal", 29.09], ["grunt", 15.37], ["roaring cats (lions, tigers)", 13.47]], null, null, [["cattle, bovinae", 20.15], ["livestock, farm animals, working animals", 15.91], ["speech", 14.13]], null, null, null, null, null, null, null, null, null], "duration": [1.14, 3.78, 0.69, 2.25, 1.1, 0.77, 0.62, 1.93, 0.13, 0.42, 6.34, 2.86, 1.24, 1.63, 11.26, 1.79, 0.84, 2.71, 0.85, 1.68, 0.99, 0.05, 0.7, 1.93, 2.08, 1.19, 0.9]} \ No newline at end of file diff --git a/annotations_filtered/b8U1na74Bcc_filtered.json b/annotations_filtered/b8U1na74Bcc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..31683f288d1837e994e7497764b281d40ed92faa --- /dev/null +++ b/annotations_filtered/b8U1na74Bcc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 55.9], [59.0, 73.67], [74.0, 75.47], [76.0, 76.64], [77.0, 77.67], [82.0, 82.39], [86.0, 86.49], [87.0, 87.83], [91.0, 95.17], [96.0, 98.93], [99.0, 99.99], [104.0, 107.06], [109.0, 110.08], [112.0, 113.22], [114.0, 116.21], [117.0, 117.32], [118.0, 118.29], [119.0, 119.69], [121.0, 127.38], [132.0, 134.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 36.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.31, 84.8, 0.0, 95.91, 0.0, 0.0, 92.64, 0.0, 0.0, 0.0, 32.85, 34.02], "audiomae_on_audioset": [null, [["telephone bell ringing", 68.72], ["music", 17.45], ["telephone", 7.14]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.45], ["synthesizer", 16.91], ["sine wave", 10.65]], [["music", 34.1], ["speech", 18.57], ["foghorn", 9.94]]], "duration": [45.9, 14.67, 1.47, 0.64, 0.67, 0.39, 0.49, 0.83, 4.17, 2.93, 0.99, 3.06, 1.08, 1.22, 2.21, 0.32, 0.29, 0.69, 6.38, 2.2]} \ No newline at end of file diff --git a/annotations_filtered/b8oFKKPfgi0_filtered.json b/annotations_filtered/b8oFKKPfgi0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..687bf1d13404868f5448eb2181d888603d427da1 --- /dev/null +++ b/annotations_filtered/b8oFKKPfgi0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.1], [2.0, 4.36], [6.0, 6.0], [6.0, 8.33], [9.0, 10.71], [12.0, 12.66], [13.0, 14.37], [15.0, 16.26], [17.0, 18.79], [20.0, 21.88], [22.0, 25.83], [30.0, 30.74], [31.0, 80.59], [81.0, 82.07], [84.0, 91.71], [92.0, 93.46], [95.0, 96.72], [98.0, 103.45], [103.0, 103.49], [104.0, 103.54], [104.0, 104.92], [108.0, 109.51], [111.0, 112.46], [113.0, 114.88], [116.0, 118.35], [118.0, 118.42], [120.0, 126.55], [129.0, 129.96], [131.0, 136.12]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 43.82, 0.0, 38.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.84, 0.0, 0.0, 0.0, 33.71, 0.0, 0.0, 31.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.94, 0.0, 32.33, 0.0, 61.97], "audiomae_on_audioset": [null, [["music", 51.88], ["speech", 13.2], ["techno", 2.47]], null, [["music", 39.01], ["frog", 14.98], ["croak", 8.25]], null, null, null, null, null, null, [["speech", 71.04], ["radio", 5.41], ["busy signal", 3.1]], null, null, null, [["music", 61.14], ["speech", 10.94], ["didgeridoo", 2.87]], null, null, [["music", 78.91], ["electronic music", 1.5], ["house music", 1.49]], null, null, null, null, null, null, [["music", 45.76], ["throbbing", 6.7], ["sampler", 4.22]], null, [["music", 60.05], ["speech", 10.28], ["drum machine", 6.81]], null, null], "duration": [1.1, 2.36, 0.0, 2.33, 1.71, 0.66, 1.37, 1.26, 1.79, 1.88, 3.83, 0.74, 49.59, 1.07, 7.71, 1.46, 1.72, 5.45, 0.49, -0.46, 0.92, 1.51, 1.46, 1.88, 2.35, 0.42, 6.55, 0.96, 5.12]} \ No newline at end of file diff --git a/annotations_filtered/b8t5kX7k0vQ_filtered.json b/annotations_filtered/b8t5kX7k0vQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b4605401fba692878e7b18bad852a7e5141f070 --- /dev/null +++ b/annotations_filtered/b8t5kX7k0vQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.16], [5.0, 5.8]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [0.16, 0.8]} \ No newline at end of file diff --git a/annotations_filtered/b95SzqTrjRo_filtered.json b/annotations_filtered/b95SzqTrjRo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ae6d9ac9f995572cfd251a7459cc3a6ec803e8d --- /dev/null +++ b/annotations_filtered/b95SzqTrjRo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.29], [5.0, 5.63], [8.0, 8.13], [9.0, 9.32], [12.0, 12.46], [13.0, 13.39], [16.0, 16.97], [22.0, 26.1], [29.0, 30.91], [31.0, 35.34], [42.0, 42.96], [44.0, 46.4], [49.0, 53.0]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, true, false], "silence_prob": [63.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.36, 0.0, 52.1, 0.0, 49.97, 53.47], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 38.84], ["whale vocalization", 9.15], ["livestock, farm animals, working animals", 8.26]], null, null, null, [["glass", 16.08], ["mains hum", 15.22], ["hum", 13.34]], null], "duration": [3.29, 0.63, 0.13, 0.32, 0.46, 0.39, 0.97, 4.1, 1.91, 4.34, 0.96, 2.4, 4.0]} \ No newline at end of file diff --git a/annotations_filtered/b9EAfTyu5_I_filtered.json b/annotations_filtered/b9EAfTyu5_I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2055f3c64bdebf65ec020d1029e165ab44dac697 --- /dev/null +++ b/annotations_filtered/b9EAfTyu5_I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 11.28], [12.0, 13.42], [15.0, 15.69], [16.0, 17.25], [19.0, 22.67], [23.0, 24.09], [25.0, 30.7], [32.0, 33.44], [34.0, 35.65], [36.0, 36.63], [38.0, 38.25], [40.0, 39.97], [41.0, 41.74], [43.0, 44.98], [46.0, 47.11], [48.0, 49.3], [50.0, 51.26], [52.0, 53.77], [55.0, 56.12], [60.0, 60.37], [62.0, 63.27], [64.0, 64.93], [66.0, 66.58], [68.0, 68.07], [69.0, 70.93], [71.0, 71.59], [73.0, 74.04], [75.0, 75.15], [76.0, 77.23], [79.0, 82.54], [83.0, 88.4], [90.0, 90.64], [92.0, 92.58], [94.0, 94.88], [95.0, 96.6], [97.0, 98.27], [99.0, 102.59], [103.0, 110.4], [113.0, 126.67], [128.0, 129.37]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [30.6, 0.0, 0.0, 0.0, 59.42, 0.0, 56.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.49, 49.09, 0.0, 0.0, 0.0, 0.0, 0.0, 74.44, 36.67, 35.06, 0.0], "audiomae_on_audioset": [[["animal", 17.6], ["whale vocalization", 8.11], ["noise", 7.78]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 29.96], ["foghorn", 12.58], ["speech", 6.39]], [["music", 21.91], ["hum", 17.99], ["mains hum", 17.45]], null, null, null, null, null, null, [["music", 70.45], ["theremin", 14.46], ["speech", 1.31]], [["music", 75.02], ["ambient music", 3.39], ["keyboard (musical)", 2.82]], null], "duration": [11.28, 1.42, 0.69, 1.25, 3.67, 1.09, 5.7, 1.44, 1.65, 0.63, 0.25, -0.03, 0.74, 1.98, 1.11, 1.3, 1.26, 1.77, 1.12, 0.37, 1.27, 0.93, 0.58, 0.07, 1.93, 0.59, 1.04, 0.15, 1.23, 3.54, 5.4, 0.64, 0.58, 0.88, 1.6, 1.27, 3.59, 7.4, 13.67, 1.37]} \ No newline at end of file diff --git a/annotations_filtered/b9KCMBBn0EI_filtered.json b/annotations_filtered/b9KCMBBn0EI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73603dc2d6dc57162f0703894083a568dc020c26 --- /dev/null +++ b/annotations_filtered/b9KCMBBn0EI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[82.0, 83.17], [86.0, 128.44]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [1.17, 42.44]} \ No newline at end of file diff --git a/annotations_filtered/b9WFVLRPOJI_filtered.json b/annotations_filtered/b9WFVLRPOJI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b67cd11e2ac5bda18b0f7aeb0a3afe2247f8ed0b --- /dev/null +++ b/annotations_filtered/b9WFVLRPOJI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 26.13], [32.0, 36.15], [37.0, 37.18], [39.0, 40.71]], "keep_status": [true, true, false, false], "silence_prob": [28.81, 30.46, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 41.57], ["vehicle", 16.67], ["car", 8.26]], [["speech", 50.58], ["music", 12.84], ["breaking", 3.5]], null, null], "duration": [4.13, 4.15, 0.18, 1.71]} \ No newline at end of file diff --git a/annotations_filtered/b9abCIgGxT4_filtered.json b/annotations_filtered/b9abCIgGxT4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..237c78ec63ca9bd3ad4afbea1a60a371818f5f77 --- /dev/null +++ b/annotations_filtered/b9abCIgGxT4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.2], [12.0, 18.23], [22.0, 49.55], [51.0, 74.09]], "keep_status": [true, false, false, false], "silence_prob": [49.4, 32.67, 35.65, 44.37], "audiomae_on_audioset": [[["speech", 34.78], ["water", 14.71], ["radio", 4.75]], [["speech", 69.92], ["burping, eructation", 9.09], ["noise", 2.78]], [["speech", 74.23], ["burping, eructation", 5.85], ["hum", 5.45]], [["mains hum", 37.57], ["hum", 35.96], ["gong", 5.74]]], "duration": [3.2, 6.23, 27.55, 23.09]} \ No newline at end of file diff --git a/annotations_filtered/b9pr0K7SuYk_filtered.json b/annotations_filtered/b9pr0K7SuYk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b6e9fd562c558a77348be8df048df64ed0c68334 --- /dev/null +++ b/annotations_filtered/b9pr0K7SuYk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.12], [6.0, 6.96], [8.0, 10.49], [11.0, 12.26], [13.0, 30.0], [33.0, 39.93], [42.0, 43.8], [46.0, 47.07], [56.0, 56.02], [57.0, 57.81], [58.0, 58.92], [67.0, 67.04], [68.0, 69.25], [70.0, 70.34], [71.0, 71.93], [85.0, 84.92], [86.0, 87.0], [88.0, 88.4], [90.0, 90.32], [94.0, 101.01], [101.0, 102.39], [104.0, 104.33], [106.0, 107.47], [108.0, 108.89], [110.0, 112.08], [115.0, 138.27]], "keep_status": [true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [32.25, 0.0, 64.07, 0.0, 31.85, 32.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.83, 0.0, 0.0, 0.0, 0.0, 34.7, 34.03], "audiomae_on_audioset": [[["music", 38.02], ["throbbing", 21.61], ["hum", 8.07]], null, null, null, [["music", 73.63], ["electronic music", 5.35], ["hum", 2.91]], [["music", 54.31], ["speech", 7.15], ["electronic music", 6.71]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 65.36], ["hum", 8.48], ["throbbing", 3.73]], null, null, null, null, [["music", 31.02], ["didgeridoo", 10.38], ["boing", 7.6]], [["music", 25.71], ["whack, thwack", 23.99], ["groan", 11.07]]], "duration": [3.12, 0.96, 2.49, 1.26, 17.0, 6.93, 1.8, 1.07, 0.02, 0.81, 0.92, 0.04, 1.25, 0.34, 0.93, -0.08, 1.0, 0.4, 0.32, 7.01, 1.39, 0.33, 1.47, 0.89, 2.08, 23.27]} \ No newline at end of file diff --git a/annotations_filtered/b9qMqGTi1uc_filtered.json b/annotations_filtered/b9qMqGTi1uc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e2a769c84217335893e16000e6abbeeb286599b --- /dev/null +++ b/annotations_filtered/b9qMqGTi1uc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.41], [6.0, 6.4], [7.0, 7.33], [11.0, 11.38], [16.0, 17.2], [23.0, 22.99], [25.0, 25.71], [26.0, 27.23], [28.0, 28.49], [30.0, 30.43], [31.0, 41.62], [44.0, 52.14], [52.0, 58.24], [61.0, 97.01], [98.0, 113.8], [115.0, 116.65], [117.0, 117.51], [119.0, 121.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.27, 39.83, 29.74, 0.0, 60.6, 0.0, 0.0, 68.54], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["vehicle", 10.59], ["explosion", 6.99], ["smash, crash", 5.84]], [["speech", 45.92], ["music", 16.93], ["hum", 8.37]], [["music", 55.53], ["speech", 13.55], ["reverberation", 3.14]], null, null, null, null, null], "duration": [0.41, 0.4, 0.33, 0.38, 1.2, -0.01, 0.71, 1.23, 0.49, 0.43, 10.62, 8.14, 6.24, 36.01, 15.8, 1.65, 0.51, 2.61]} \ No newline at end of file diff --git a/annotations_filtered/bAI6N5Uo7SQ_filtered.json b/annotations_filtered/bAI6N5Uo7SQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f6fd87c4723ff1055a4ab5bb13cea210388b3a67 --- /dev/null +++ b/annotations_filtered/bAI6N5Uo7SQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 15.09], [15.0, 15.74], [45.0, 46.2], [54.0, 56.24], [57.0, 59.14], [66.0, 70.8], [78.0, 78.88], [81.0, 84.0], [87.0, 87.08], [94.0, 94.2], [105.0, 106.35], [107.0, 107.86], [115.0, 115.97], [117.0, 117.59], [119.0, 125.29], [128.0, 129.74]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [51.99, 0.0, 0.0, 36.27, 34.65, 36.39, 0.0, 34.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.17, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 66.51], ["musical instrument", 4.2], ["singing", 2.67]], [["music", 58.86], ["piano", 9.56], ["keyboard (musical)", 6.57]], [["music", 74.56], ["musical instrument", 2.14], ["acoustic guitar", 1.93]], null, [["music", 59.84], ["synthesizer", 4.59], ["musical instrument", 3.46]], null, null, null, null, null, null, null, null], "duration": [6.09, 0.74, 1.2, 2.24, 2.14, 4.8, 0.88, 3.0, 0.08, 0.2, 1.35, 0.86, 0.97, 0.59, 6.29, 1.74]} \ No newline at end of file diff --git a/annotations_filtered/bANgFADltvw_filtered.json b/annotations_filtered/bANgFADltvw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f9d7086cf4936082c859f31608cd33508999e89 --- /dev/null +++ b/annotations_filtered/bANgFADltvw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.27], [12.0, 14.89], [16.0, 17.05], [18.0, 19.5], [21.0, 21.83], [26.0, 29.29], [31.0, 49.18], [51.0, 51.51], [54.0, 54.63], [59.0, 59.48], [61.0, 61.47], [63.0, 63.98], [65.0, 65.74], [66.0, 67.58], [69.0, 70.23], [75.0, 76.0], [77.0, 77.21], [81.0, 81.78], [85.0, 85.87], [87.0, 87.39], [90.0, 91.02], [92.0, 93.09], [94.0, 94.69], [97.0, 97.53], [98.0, 114.99], [116.0, 119.43], [121.0, 122.77], [126.0, 126.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.56, 0.0, 0.0, 0.0, 93.6, 84.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.89, 58.38, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 74.92], ["grunt", 2.72], ["screaming", 2.6]], null, null, null], "duration": [1.27, 2.89, 1.05, 1.5, 0.83, 3.29, 18.18, 0.51, 0.63, 0.48, 0.47, 0.98, 0.74, 1.58, 1.23, 1.0, 0.21, 0.78, 0.87, 0.39, 1.02, 1.09, 0.69, 0.53, 16.99, 3.43, 1.77, 0.57]} \ No newline at end of file diff --git a/annotations_filtered/bAyb9cEDh2E_filtered.json b/annotations_filtered/bAyb9cEDh2E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba9a36a34884f63ea97fbcfc7c06beb06efcd815 --- /dev/null +++ b/annotations_filtered/bAyb9cEDh2E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 20.01], [31.0, 31.94], [34.0, 34.8], [36.0, 36.91], [37.0, 37.59], [38.0, 38.53], [42.0, 46.35], [47.0, 48.17], [53.0, 53.11], [55.0, 55.07], [56.0, 61.77], [63.0, 64.61], [68.0, 68.94], [71.0, 75.14], [76.0, 78.12], [80.0, 79.76], [85.0, 86.51], [90.0, 91.57], [93.0, 94.19], [95.0, 102.19], [103.0, 103.62], [106.0, 106.86], [109.0, 112.73], [113.0, 118.64], [119.0, 122.93], [123.0, 125.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [88.64, 0.0, 0.0, 0.0, 0.0, 0.0, 96.04, 0.0, 0.0, 0.0, 99.95, 0.0, 0.0, 98.1, 98.8, 0.0, 0.0, 0.0, 0.0, 99.91, 0.0, 0.0, 99.88, 97.73, 56.03, 88.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [14.01, 0.94, 0.8, 0.91, 0.59, 0.53, 4.35, 1.17, 0.11, 0.07, 5.77, 1.61, 0.94, 4.14, 2.12, -0.24, 1.51, 1.57, 1.19, 7.19, 0.62, 0.86, 3.73, 5.64, 3.93, 2.02]} \ No newline at end of file diff --git a/annotations_filtered/bBHFfXCAPLc_filtered.json b/annotations_filtered/bBHFfXCAPLc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d00dd9ba90441d7a1ff5514ea8166970767ad551 --- /dev/null +++ b/annotations_filtered/bBHFfXCAPLc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.87], [6.0, 16.55], [22.0, 38.1], [40.0, 43.36], [44.0, 43.82], [44.0, 44.15], [44.0, 54.77], [58.0, 61.74], [65.0, 65.2], [75.0, 75.68], [77.0, 77.5], [81.0, 82.02], [84.0, 84.18], [85.0, 85.8], [92.0, 94.9], [96.0, 100.67], [103.0, 103.42], [124.0, 124.75], [126.0, 127.79], [131.0, 131.7]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.97, 33.96, 45.78, 0.0, 0.0, 45.59, 35.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.76, 33.63, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 53.21], ["throbbing", 21.63], ["mains hum", 16.77]], [["music", 80.53], ["cacophony", 6.08], ["vehicle", 1.24]], [["hum", 35.62], ["throbbing", 30.44], ["mains hum", 5.65]], null, null, [["sidetone", 29.65], ["speech", 24.86], ["music", 14.04]], [["hum", 18.51], ["speech", 14.58], ["music", 11.48]], null, null, null, null, null, null, null, [["music", 57.79], ["hum", 9.31], ["mains hum", 4.39]], null, null, null, null], "duration": [0.87, 10.55, 16.1, 3.36, -0.18, 0.15, 10.77, 3.74, 0.2, 0.68, 0.5, 1.02, 0.18, 0.8, 2.9, 4.67, 0.42, 0.75, 1.79, 0.7]} \ No newline at end of file diff --git a/annotations_filtered/bBLKvPSgQ2A_filtered.json b/annotations_filtered/bBLKvPSgQ2A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..daf6856629b76432c3e1824fc3d808dc11aadf66 --- /dev/null +++ b/annotations_filtered/bBLKvPSgQ2A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.45], [12.0, 11.94], [16.0, 16.34], [20.0, 20.71], [24.0, 25.69], [28.0, 29.83], [30.0, 33.02], [34.0, 35.92], [37.0, 38.67], [40.0, 40.95], [44.0, 44.96], [47.0, 47.53], [49.0, 50.18], [52.0, 54.63], [55.0, 56.57], [57.0, 57.11], [60.0, 61.15], [63.0, 63.98], [69.0, 70.8], [72.0, 73.16], [75.0, 75.66], [78.0, 80.5], [87.0, 93.33], [95.0, 114.4], [117.0, 122.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.41, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.72, 84.98, 89.01, 93.45], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.45, -0.06, 0.34, 0.71, 1.69, 1.83, 3.02, 1.92, 1.67, 0.95, 0.96, 0.53, 1.18, 2.63, 1.57, 0.11, 1.15, 0.98, 1.8, 1.16, 0.66, 2.5, 6.33, 19.4, 5.1]} \ No newline at end of file diff --git a/annotations_filtered/bBbLZ6m_9MA_filtered.json b/annotations_filtered/bBbLZ6m_9MA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..22109d19b7a1d64ba273a19ab5dd399433b2989c --- /dev/null +++ b/annotations_filtered/bBbLZ6m_9MA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.17], [13.0, 13.15], [15.0, 47.39], [51.0, 65.08], [69.0, 86.26]], "keep_status": [true, false, false, false, false], "silence_prob": [49.13, 0.0, 0.0, 41.54, 38.4], "audiomae_on_audioset": [[["speech", 27.0], ["music", 25.72], ["didgeridoo", 4.55]], null, null, [["music", 50.29], ["speech", 17.88], ["didgeridoo", 10.19]], [["music", 37.95], ["speech", 28.86], ["didgeridoo", 9.32]]], "duration": [3.17, 0.15, 32.39, 14.08, 17.26]} \ No newline at end of file diff --git a/annotations_filtered/bBeHRwjwKk8_filtered.json b/annotations_filtered/bBeHRwjwKk8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/bBeHRwjwKk8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/bBil15ORYI0_filtered.json b/annotations_filtered/bBil15ORYI0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..50e7a93f2bd67dd1d78093fa008de26a91391c12 --- /dev/null +++ b/annotations_filtered/bBil15ORYI0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.43], [14.0, 14.4], [16.0, 17.68], [18.0, 22.71], [29.0, 30.11], [39.0, 39.14], [45.0, 45.79], [53.0, 53.43], [66.0, 69.87], [70.0, 70.92], [73.0, 72.79], [78.0, 81.26], [88.0, 88.77], [94.0, 94.95], [99.0, 100.99], [102.0, 104.9], [110.0, 110.37], [117.0, 118.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 39.41, 0.0, 0.0, 0.0, 0.0, 58.13, 0.0, 0.0, 67.63, 0.0, 0.0, 0.0, 53.1, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 67.09], ["sidetone", 7.49], ["hum", 3.82]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.43, 0.4, 1.68, 4.71, 1.11, 0.14, 0.79, 0.43, 3.87, 0.92, -0.21, 3.26, 0.77, 0.95, 1.99, 2.9, 0.37, 1.03]} \ No newline at end of file diff --git a/annotations_filtered/bBjLUZgx4WA_filtered.json b/annotations_filtered/bBjLUZgx4WA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4ebf28905ff90b0739fda7677d16d1cd86dafbb0 --- /dev/null +++ b/annotations_filtered/bBjLUZgx4WA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.43], [6.0, 8.31], [10.0, 10.98], [13.0, 13.04], [18.0, 19.31], [20.0, 20.43], [21.0, 21.93], [24.0, 29.86], [32.0, 33.74], [35.0, 36.48], [37.0, 38.38], [41.0, 41.03], [43.0, 42.85], [45.0, 45.01], [47.0, 47.28], [50.0, 50.06], [55.0, 55.71], [57.0, 58.18], [60.0, 63.49], [70.0, 70.7], [74.0, 74.48], [75.0, 75.0], [76.0, 77.13], [78.0, 79.42], [81.0, 86.43], [90.0, 90.85], [94.0, 94.95], [98.0, 100.41], [102.0, 108.5], [111.0, 117.53], [119.0, 124.11], [125.0, 130.55], [132.0, 134.77], [139.0, 140.76], [142.0, 143.04], [144.0, 149.13], [150.0, 152.12], [154.0, 157.1], [158.0, 161.38], [164.0, 166.41], [167.0, 168.56]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, true, true, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 41.24, 0.0, 0.0, 0.0, 0.0, 0.0, 45.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.02, 0.0, 0.0, 0.0, 0.0, 0.0, 45.3, 0.0, 0.0, 46.9, 46.79, 45.75, 47.74, 43.98, 44.49, 0.0, 0.0, 44.43, 47.82, 45.65, 45.02, 45.21, 0.0], "audiomae_on_audioset": [null, [["speech", 48.42], ["singing bowl", 13.36], ["music", 6.48]], null, null, null, null, null, [["singing bowl", 35.16], ["music", 32.75], ["ambient music", 7.45]], null, null, null, null, null, null, null, null, null, null, [["music", 75.32], ["ambient music", 4.09], ["scary music", 1.95]], null, null, null, null, null, [["music", 47.26], ["hum", 14.24], ["electronic music", 5.01]], null, null, [["music", 38.21], ["gong", 22.28], ["electronic music", 7.89]], [["music", 54.66], ["singing bowl", 7.55], ["hiccup", 4.31]], [["music", 46.28], ["ambient music", 12.67], ["singing bowl", 8.01]], [["music", 68.59], ["scary music", 4.02], ["foghorn", 2.74]], [["music", 56.49], ["ambient music", 20.03], ["scary music", 10.82]], [["music", 70.13], ["ambient music", 13.39], ["electronic music", 3.57]], null, null, [["music", 61.37], ["ambient music", 18.28], ["synthesizer", 3.26]], [["music", 33.88], ["ambient music", 23.76], ["electronic music", 12.75]], [["music", 50.49], ["singing bowl", 14.5], ["ambient music", 5.85]], [["music", 23.33], ["speech", 18.57], ["singing bowl", 17.09]], [["music", 60.36], ["ambient music", 10.57], ["singing bowl", 6.89]], null], "duration": [0.43, 2.31, 0.98, 0.04, 1.31, 0.43, 0.93, 5.86, 1.74, 1.48, 1.38, 0.03, -0.15, 0.01, 0.28, 0.06, 0.71, 1.18, 3.49, 0.7, 0.48, 0.0, 1.13, 1.42, 5.43, 0.85, 0.95, 2.41, 6.5, 6.53, 5.11, 5.55, 2.77, 1.76, 1.04, 5.13, 2.12, 3.1, 3.38, 2.41, 1.56]} \ No newline at end of file diff --git a/annotations_filtered/bBzNPO001NU_filtered.json b/annotations_filtered/bBzNPO001NU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4a81ada63b6d2c036942ead3cafd167615f0924a --- /dev/null +++ b/annotations_filtered/bBzNPO001NU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.11], [10.0, 10.03], [11.0, 11.53], [14.0, 14.42], [19.0, 19.31], [20.0, 20.58], [22.0, 22.54], [23.0, 24.88], [29.0, 29.4], [34.0, 34.06], [43.0, 43.92], [45.0, 45.23], [49.0, 53.37], [55.0, 55.92], [57.0, 57.15], [59.0, 59.58], [64.0, 64.57], [68.0, 70.53], [71.0, 72.84], [88.0, 90.15], [93.0, 93.43], [95.0, 95.37], [97.0, 97.58], [99.0, 99.82], [101.0, 101.26], [103.0, 103.54], [113.0, 115.74], [117.0, 118.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.44, 0.0, 0.0, 0.0, 0.0, 94.95, 0.0, 99.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.46, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.11, 0.03, 0.53, 0.42, 0.31, 0.58, 0.54, 1.88, 0.4, 0.06, 0.92, 0.23, 4.37, 0.92, 0.15, 0.58, 0.57, 2.53, 1.84, 2.15, 0.43, 0.37, 0.58, 0.82, 0.26, 0.54, 2.74, 1.44]} \ No newline at end of file diff --git a/annotations_filtered/bC0vGFJbMjo_filtered.json b/annotations_filtered/bC0vGFJbMjo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a456da7edb215ea88628f9d841b19b4e23efb68e --- /dev/null +++ b/annotations_filtered/bC0vGFJbMjo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 25.14], [37.0, 38.23], [44.0, 44.76], [65.0, 68.01], [75.0, 87.99], [93.0, 99.81], [103.0, 103.33], [104.0, 111.1], [117.0, 129.74], [132.0, 144.0], [145.0, 145.47], [149.0, 149.52], [150.0, 150.21], [151.0, 184.62], [185.0, 185.26]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 84.43, 30.1, 30.26, 0.0, 30.17, 30.14, 75.39, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 56.57], ["hum", 7.87], ["throbbing", 4.03]], [["music", 68.49], ["smash, crash", 8.39], ["boom", 2.67]], null, [["music", 69.74], ["electronic music", 2.51], ["throbbing", 1.44]], [["music", 72.41], ["electronic music", 4.15], ["throbbing", 3.52]], null, null, null, null, null, null], "duration": [0.14, 1.23, 0.76, 3.01, 12.99, 6.81, 0.33, 7.1, 12.74, 12.0, 0.47, 0.52, 0.21, 33.62, 0.26]} \ No newline at end of file diff --git a/annotations_filtered/bCIXKzeaAAs_filtered.json b/annotations_filtered/bCIXKzeaAAs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c303175c291131273c0bbd9a42ce38cb50d6751c --- /dev/null +++ b/annotations_filtered/bCIXKzeaAAs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 10.13], [11.0, 13.24], [14.0, 16.14], [16.0, 17.83], [18.0, 18.33], [25.0, 26.35], [30.0, 32.24], [33.0, 35.34], [36.0, 36.83], [39.0, 39.53], [41.0, 40.68], [42.0, 46.13], [49.0, 49.13], [49.0, 49.99], [50.0, 52.35], [55.0, 56.49], [57.0, 57.05], [74.0, 73.99], [76.0, 80.23], [81.0, 83.0], [84.0, 86.68], [89.0, 91.05], [92.0, 93.07], [96.0, 96.55], [98.0, 98.63], [103.0, 105.53], [109.0, 110.64], [112.0, 116.09], [117.0, 120.21], [122.0, 126.4]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [50.61, 69.74, 64.41, 0.0, 0.0, 0.0, 48.35, 58.47, 0.0, 0.0, 0.0, 67.13, 0.0, 0.0, 35.91, 0.0, 0.0, 0.0, 58.3, 53.84, 53.59, 56.86, 0.0, 0.0, 0.0, 71.57, 0.0, 71.72, 63.85, 65.09], "audiomae_on_audioset": [null, null, null, null, null, null, [["hum", 43.16], ["throbbing", 11.1], ["mains hum", 11.04]], null, null, null, null, null, null, null, [["speech", 33.64], ["hum", 20.73], ["music", 13.08]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.13, 2.24, 2.14, 1.83, 0.33, 1.35, 2.24, 2.34, 0.83, 0.53, -0.32, 4.13, 0.13, 0.99, 2.35, 1.49, 0.05, -0.01, 4.23, 2.0, 2.68, 2.05, 1.07, 0.55, 0.63, 2.53, 1.64, 4.09, 3.21, 4.4]} \ No newline at end of file diff --git a/annotations_filtered/bCKgFFmf_iI_filtered.json b/annotations_filtered/bCKgFFmf_iI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..63aa6c2c5def4565bc85e1b9b5c6f0437d59dae6 --- /dev/null +++ b/annotations_filtered/bCKgFFmf_iI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[77.0, 78.46], [82.0, 82.63], [83.0, 102.03], [107.0, 120.97]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 30.43, 30.6], "audiomae_on_audioset": [null, null, [["music", 70.92], ["electronic music", 4.56], ["techno", 2.02]], [["music", 48.99], ["sidetone", 15.1], ["speech", 10.71]]], "duration": [1.46, 0.63, 19.03, 13.97]} \ No newline at end of file diff --git a/annotations_filtered/bCLTAaa3qMM_filtered.json b/annotations_filtered/bCLTAaa3qMM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0756a68c0bfa0ad800bb41b011d857803715d449 --- /dev/null +++ b/annotations_filtered/bCLTAaa3qMM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.83], [13.0, 21.03], [21.0, 23.77], [27.0, 27.3], [28.0, 28.24], [31.0, 31.9], [34.0, 34.48], [43.0, 45.23], [47.0, 47.01], [48.0, 47.97], [49.0, 94.51], [95.0, 115.5], [118.0, 122.55], [125.0, 127.62], [129.0, 142.59], [146.0, 152.07], [160.0, 174.11], [177.0, 179.0], [180.0, 180.94]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, true, true, false, false, true, true, false, false], "silence_prob": [0.0, 38.56, 50.16, 0.0, 0.0, 0.0, 0.0, 61.47, 0.0, 0.0, 0.0, 30.48, 30.33, 30.36, 32.26, 29.3, 29.59, 37.38, 0.0], "audiomae_on_audioset": [null, [["music", 50.9], ["hum", 10.71], ["mains hum", 5.17]], null, null, null, null, null, null, null, null, null, [["music", 51.92], ["theremin", 11.6], ["synthesizer", 3.89]], [["music", 28.24], ["speech", 28.17], ["throbbing", 5.72]], [["music", 39.65], ["speech", 29.96], ["didgeridoo", 3.05]], [["music", 34.65], ["speech", 26.44], ["hum", 8.94]], [["music", 54.49], ["breaking", 6.69], ["whack, thwack", 5.84]], [["music", 33.04], ["fly, housefly", 15.0], ["hum", 7.55]], [["theremin", 60.15], ["music", 8.42], ["civil defense siren", 4.11]], null], "duration": [1.83, 8.03, 2.77, 0.3, 0.24, 0.9, 0.48, 2.23, 0.01, -0.03, 45.51, 20.5, 4.55, 2.62, 13.59, 6.07, 14.11, 2.0, 0.94]} \ No newline at end of file diff --git a/annotations_filtered/bCOc7VCSox4_filtered.json b/annotations_filtered/bCOc7VCSox4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b3fb56b1aa8ca5330794a2e94631e28f49b21fa5 --- /dev/null +++ b/annotations_filtered/bCOc7VCSox4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.29], [5.0, 5.27], [7.0, 7.21], [8.0, 13.41], [21.0, 26.55], [34.0, 39.73], [41.0, 41.79], [45.0, 45.44], [47.0, 47.38], [49.0, 50.3], [52.0, 55.97], [57.0, 59.81], [67.0, 85.83], [87.0, 98.22], [108.0, 111.32], [123.0, 128.76], [134.0, 136.53], [137.0, 143.94], [145.0, 145.22], [146.0, 146.53], [149.0, 149.89], [153.0, 153.84]], "keep_status": [true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false], "silence_prob": [45.11, 0.0, 0.0, 41.48, 35.57, 43.08, 0.0, 0.0, 0.0, 0.0, 33.17, 31.82, 32.32, 89.9, 85.54, 39.91, 43.66, 45.62, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 27.24], ["music", 14.07], ["whale vocalization", 9.76]], null, null, [["music", 53.84], ["theremin", 8.07], ["thunk", 7.25]], [["music", 67.36], ["theremin", 10.95], ["carnatic music", 4.05]], [["music", 69.63], ["carnatic music", 6.34], ["theremin", 4.57]], null, null, null, null, [["music", 50.9], ["boing", 21.64], ["theremin", 7.72]], [["music", 60.65], ["theremin", 14.13], ["foghorn", 8.21]], [["music", 83.11], ["didgeridoo", 3.94], ["musical instrument", 2.13]], null, null, [["whimper", 22.97], ["groan", 14.83], ["male singing", 12.84]], [["a capella", 23.22], ["male singing", 15.1], ["music", 8.88]], [["humming", 32.11], ["howl", 9.48], ["frog", 7.58]], null, null, null, null], "duration": [2.29, 0.27, 0.21, 5.41, 5.55, 5.73, 0.79, 0.44, 0.38, 1.3, 3.97, 2.81, 18.83, 11.22, 3.32, 5.76, 2.53, 6.94, 0.22, 0.53, 0.89, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/bCYs8v0Xji4_filtered.json b/annotations_filtered/bCYs8v0Xji4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..376cf794380600852c702b0b0e78c1febac98246 --- /dev/null +++ b/annotations_filtered/bCYs8v0Xji4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.75], [6.0, 6.86], [9.0, 11.1], [15.0, 19.23], [20.0, 21.17], [26.0, 26.42], [27.0, 31.83], [34.0, 33.91], [35.0, 35.83], [40.0, 40.95], [44.0, 46.03], [52.0, 52.44], [56.0, 56.84], [59.0, 58.99], [60.0, 60.76], [62.0, 62.95], [64.0, 64.47], [65.0, 65.38], [69.0, 72.54], [75.0, 75.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 94.95, 70.44, 0.0, 0.0, 51.77, 0.0, 0.0, 0.0, 39.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.74, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["sine wave", 49.94], ["speech", 25.88], ["chirp tone", 6.31]], null, null, null, null, null, null, null, [["whack, thwack", 16.44], ["speech", 12.67], ["tuning fork", 9.3]], null], "duration": [0.75, 0.86, 2.1, 4.23, 1.17, 0.42, 4.83, -0.09, 0.83, 0.95, 2.03, 0.44, 0.84, -0.01, 0.76, 0.95, 0.47, 0.38, 3.54, 0.14]} \ No newline at end of file diff --git a/annotations_filtered/bCZRAcsuRgY_filtered.json b/annotations_filtered/bCZRAcsuRgY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7102a6478a2e60fbb7b3c6ecd7c205852c6bc795 --- /dev/null +++ b/annotations_filtered/bCZRAcsuRgY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.01], [22.0, 23.84], [35.0, 34.75], [35.0, 38.45], [42.0, 51.14], [54.0, 58.92], [66.0, 70.04], [80.0, 82.27], [91.0, 95.39], [106.0, 106.34], [109.0, 109.53], [113.0, 113.97], [122.0, 125.61], [129.0, 129.95], [132.0, 131.65], [132.0, 131.68], [132.0, 138.5], [145.0, 149.25], [155.0, 154.87], [157.0, 159.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.85, 34.83, 33.8, 37.3, 38.45, 33.78, 0.0, 0.0, 0.0, 37.83, 0.0, 0.0, 0.0, 33.88, 36.14, 0.0, 36.01], "audiomae_on_audioset": [null, null, null, [["music", 65.3], ["reggae", 7.19], ["yodeling", 1.99]], [["music", 84.2], ["reggae", 2.38], ["singing", 0.99]], [["music", 74.52], ["reggae", 8.97], ["singing", 1.74]], [["music", 74.59], ["synthesizer", 3.97], ["electronic music", 3.55]], [["music", 55.23], ["throbbing", 18.07], ["synthesizer", 5.45]], [["music", 73.28], ["song", 1.53], ["singing", 1.42]], null, null, null, [["music", 72.41], ["throbbing", 4.0], ["electronic music", 2.38]], null, null, null, [["music", 77.71], ["reggae", 6.99], ["singing", 1.31]], [["music", 54.17], ["musical instrument", 3.16], ["cello", 2.79]], null, [["music", 69.07], ["didgeridoo", 3.55], ["musical instrument", 2.81]]], "duration": [0.01, 1.84, -0.25, 3.45, 9.14, 4.92, 4.04, 2.27, 4.39, 0.34, 0.53, 0.97, 3.61, 0.95, -0.35, -0.32, 6.5, 4.25, -0.13, 2.63]} \ No newline at end of file diff --git a/annotations_filtered/bCaHwP04KK0_filtered.json b/annotations_filtered/bCaHwP04KK0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eae680d47ec18e0b67a9e3735e112a4a87b0c09d --- /dev/null +++ b/annotations_filtered/bCaHwP04KK0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 13.27], [14.0, 18.39], [19.0, 19.87], [21.0, 22.27], [23.0, 35.68]], "keep_status": [true, false, false, false, false], "silence_prob": [44.63, 42.46, 0.0, 0.0, 44.49], "audiomae_on_audioset": [[["music", 45.87], ["raindrop", 9.39], ["rain on surface", 5.07]], [["hum", 38.15], ["mains hum", 19.54], ["music", 15.0]], null, null, [["music", 39.62], ["whale vocalization", 31.95], ["speech", 8.17]]], "duration": [8.27, 4.39, 0.87, 1.27, 12.68]} \ No newline at end of file diff --git a/annotations_filtered/bCk9vtlnr34_filtered.json b/annotations_filtered/bCk9vtlnr34_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5dc4d3cb09cf2bd469e984e3a22e9d095d1fa68d --- /dev/null +++ b/annotations_filtered/bCk9vtlnr34_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.04], [9.0, 9.83], [11.0, 11.69], [19.0, 26.91], [28.0, 29.17], [29.0, 31.06], [32.0, 42.77], [44.0, 88.52]], "keep_status": [false, false, false, true, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 33.68, 0.0, 33.13, 32.12, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 49.92], ["musical instrument", 7.8], ["brass instrument", 7.53]], null, [["music", 32.83], ["moo", 16.52], ["cattle, bovinae", 13.79]], [["music", 49.93], ["brass instrument", 10.06], ["musical instrument", 8.9]], null], "duration": [1.04, 0.83, 0.69, 7.91, 1.17, 2.06, 10.77, 44.52]} \ No newline at end of file diff --git a/annotations_filtered/bD8bl3omDIU_filtered.json b/annotations_filtered/bD8bl3omDIU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4cff21cf33898854bac77a00139f318039e89183 --- /dev/null +++ b/annotations_filtered/bD8bl3omDIU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 49.47], [53.0, 54.82], [58.0, 60.62], [65.0, 66.85], [70.0, 73.11], [77.0, 79.15], [85.0, 85.56], [91.0, 91.84], [97.0, 97.87], [103.0, 104.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 74.6, 0.0, 42.0, 30.58, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 71.63], ["theremin", 7.81], ["humming", 1.83]], [["music", 82.4], ["carnatic music", 3.55], ["musical instrument", 2.17]], null, null, null, null], "duration": [47.47, 1.82, 2.62, 1.85, 3.11, 2.15, 0.56, 0.84, 0.87, 1.72]} \ No newline at end of file diff --git a/annotations_filtered/bD8jQGwyuBU_filtered.json b/annotations_filtered/bD8jQGwyuBU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d9a4f235017ab46dcf2bfcc67d4d509f632ad7f --- /dev/null +++ b/annotations_filtered/bD8jQGwyuBU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.13], [8.0, 8.88], [9.0, 12.66], [15.0, 15.42], [17.0, 18.13], [20.0, 20.41], [24.0, 28.31], [33.0, 39.92], [42.0, 43.02], [44.0, 47.21], [50.0, 52.15], [81.0, 83.93], [87.0, 88.6], [90.0, 93.29], [96.0, 96.94], [98.0, 99.12], [101.0, 102.29], [103.0, 108.45], [112.0, 115.1], [116.0, 135.48], [139.0, 143.07], [145.0, 147.33], [152.0, 154.41], [156.0, 156.57], [158.0, 158.65], [161.0, 161.22], [167.0, 167.59], [169.0, 168.76]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, true, false, true, false, false, false, false, true, true, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 55.53, 0.0, 0.0, 0.0, 32.49, 31.2, 0.0, 48.27, 93.29, 49.87, 0.0, 36.78, 0.0, 0.0, 0.0, 36.7, 45.72, 34.48, 35.52, 43.05, 52.1, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["laughter", 18.1], ["snicker", 14.39], ["speech", 13.05]], [["boing", 46.9], ["speech", 11.06], ["echo", 8.17]], null, [["throbbing", 43.7], ["music", 21.81], ["hum", 5.39]], null, [["hum", 32.7], ["throbbing", 17.84], ["knock", 10.18]], null, [["music", 27.55], ["throbbing", 11.12], ["hum", 6.07]], null, null, null, [["speech", 45.43], ["sidetone", 35.83], ["radio", 2.94]], [["speech", 14.02], ["animal", 4.63], ["dog", 4.01]], [["music", 41.27], ["effects unit", 6.38], ["musical instrument", 5.51]], [["speech", 13.63], ["cattle, bovinae", 12.36], ["moo", 10.25]], [["cattle, bovinae", 41.69], ["moo", 39.65], ["livestock, farm animals, working animals", 12.25]], null, null, null, null, null, null], "duration": [0.13, 0.88, 3.66, 0.42, 1.13, 0.41, 4.31, 6.92, 1.02, 3.21, 2.15, 2.93, 1.6, 3.29, 0.94, 1.12, 1.29, 5.45, 3.1, 19.48, 4.07, 2.33, 2.41, 0.57, 0.65, 0.22, 0.59, -0.24]} \ No newline at end of file diff --git a/annotations_filtered/bDW3OVitFE8_filtered.json b/annotations_filtered/bDW3OVitFE8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e9e54f99d9c49aca7229816299c1799ac1316113 --- /dev/null +++ b/annotations_filtered/bDW3OVitFE8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.94], [5.0, 5.53], [6.0, 7.33], [18.0, 18.42], [19.0, 19.75], [22.0, 21.69], [23.0, 24.06], [26.0, 26.65], [29.0, 29.64], [31.0, 32.22], [33.0, 34.08], [35.0, 35.09], [42.0, 42.42], [46.0, 46.45], [47.0, 48.05], [49.0, 49.67], [52.0, 53.08], [55.0, 55.41], [56.0, 58.58], [62.0, 62.67], [67.0, 67.98], [68.0, 74.41], [75.0, 76.03], [78.0, 78.31], [80.0, 82.86], [83.0, 83.96], [85.0, 88.13], [89.0, 92.92], [94.0, 94.54], [97.0, 105.65], [106.0, 111.96], [115.0, 124.5], [125.0, 129.47], [130.0, 132.49], [133.0, 133.64], [134.0, 135.4], [136.0, 139.46], [142.0, 142.47], [146.0, 147.46], [149.0, 149.13], [150.0, 151.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.68, 0.0, 0.0, 63.53, 0.0, 0.0, 54.3, 0.0, 100.0, 99.8, 0.0, 99.21, 68.41, 73.97, 83.88, 99.26, 0.0, 0.0, 87.92, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.94, 0.53, 1.33, 0.42, 0.75, -0.31, 1.06, 0.65, 0.64, 1.22, 1.08, 0.09, 0.42, 0.45, 1.05, 0.67, 1.08, 0.41, 2.58, 0.67, 0.98, 6.41, 1.03, 0.31, 2.86, 0.96, 3.13, 3.92, 0.54, 8.65, 5.96, 9.5, 4.47, 2.49, 0.64, 1.4, 3.46, 0.47, 1.46, 0.13, 1.55]} \ No newline at end of file diff --git a/annotations_filtered/bD_rWCvgDy8_filtered.json b/annotations_filtered/bD_rWCvgDy8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..22f688c075382b79922f98c143b7cd0c8ff8419e --- /dev/null +++ b/annotations_filtered/bD_rWCvgDy8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 29.27], [59.0, 58.67]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [1.27, -0.33]} \ No newline at end of file diff --git a/annotations_filtered/bDcFILIfHU4_filtered.json b/annotations_filtered/bDcFILIfHU4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6dcc594e5db269a6686915a8fdb90df78663195c --- /dev/null +++ b/annotations_filtered/bDcFILIfHU4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 19.38], [24.0, 24.48], [25.0, 26.4], [36.0, 36.73], [37.0, 38.65], [43.0, 45.17], [45.0, 46.33], [49.0, 48.91], [49.0, 49.65], [55.0, 55.98], [61.0, 61.21], [62.0, 64.34], [65.0, 67.85], [78.0, 79.39], [80.0, 80.74], [82.0, 82.48], [86.0, 88.84], [90.0, 90.41], [91.0, 91.17], [96.0, 96.65], [97.0, 99.03], [100.0, 100.9], [104.0, 106.49], [107.0, 110.19], [111.0, 118.93], [119.0, 122.55], [123.0, 124.92], [128.0, 129.66], [131.0, 133.34], [134.0, 136.09], [137.0, 139.19], [140.0, 141.4], [149.0, 149.57], [156.0, 159.75], [160.0, 160.47], [161.0, 163.07], [164.0, 168.03]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [45.14, 0.0, 0.0, 0.0, 0.0, 52.62, 0.0, 0.0, 0.0, 0.0, 0.0, 36.01, 89.54, 0.0, 0.0, 0.0, 65.32, 0.0, 0.0, 0.0, 44.15, 0.0, 85.17, 68.41, 80.46, 57.89, 0.0, 0.0, 54.76, 72.46, 59.86, 0.0, 0.0, 37.5, 0.0, 64.41, 60.89], "audiomae_on_audioset": [[["speech", 32.14], ["music", 12.75], ["livestock, farm animals, working animals", 11.07]], null, null, null, null, null, null, null, null, null, null, [["speech", 45.62], ["sine wave", 16.63], ["busy signal", 12.34]], null, null, null, null, null, null, null, null, [["music", 28.45], ["speech", 16.27], ["sonar", 11.58]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 39.03], ["fly, housefly", 12.58], ["insect", 9.96]], null, null, null], "duration": [5.38, 0.48, 1.4, 0.73, 1.65, 2.17, 1.33, -0.09, 0.65, 0.98, 0.21, 2.34, 2.85, 1.39, 0.74, 0.48, 2.84, 0.41, 0.17, 0.65, 2.03, 0.9, 2.49, 3.19, 7.93, 3.55, 1.92, 1.66, 2.34, 2.09, 2.19, 1.4, 0.57, 3.75, 0.47, 2.07, 4.03]} \ No newline at end of file diff --git a/annotations_filtered/bDm5fnJ1Hg0_filtered.json b/annotations_filtered/bDm5fnJ1Hg0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0dfd7a1c194a8efd4887a9d3ce347562ad2edd3d --- /dev/null +++ b/annotations_filtered/bDm5fnJ1Hg0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[42.0, 43.78], [46.0, 49.52], [51.0, 51.38], [54.0, 57.03], [61.0, 61.33], [63.0, 63.9], [64.0, 64.98], [68.0, 73.47], [74.0, 75.34], [78.0, 81.67], [83.0, 84.62], [91.0, 90.75], [92.0, 103.42], [104.0, 111.7], [112.0, 113.41], [114.0, 121.37], [123.0, 128.07], [130.0, 130.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 82.79, 0.0, 98.99, 0.0, 0.0, 0.0, 91.98, 0.0, 87.0, 0.0, 0.0, 67.13, 52.05, 0.0, 56.03, 45.88, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 51.17], ["wood", 5.71], ["splinter", 5.62]], null], "duration": [1.78, 3.52, 0.38, 3.03, 0.33, 0.9, 0.98, 5.47, 1.34, 3.67, 1.62, -0.25, 11.42, 7.7, 1.41, 7.37, 5.07, 0.94]} \ No newline at end of file diff --git a/annotations_filtered/bEA-o4IJAic_filtered.json b/annotations_filtered/bEA-o4IJAic_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45c236a0cf368eae19e5c21cfa2b316f059b0c68 --- /dev/null +++ b/annotations_filtered/bEA-o4IJAic_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.8], [7.0, 9.46], [10.0, 11.1], [12.0, 15.26], [18.0, 18.74], [21.0, 24.66], [28.0, 28.85], [42.0, 41.96], [49.0, 54.87], [56.0, 56.71], [58.0, 64.13], [65.0, 67.61], [69.0, 74.6], [78.0, 78.65], [81.0, 81.55], [90.0, 92.35], [94.0, 96.89], [99.0, 102.3], [105.0, 105.54], [107.0, 108.65], [111.0, 114.1], [116.0, 116.36], [118.0, 120.88]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 92.64, 0.0, 45.08, 0.0, 86.82, 0.0, 0.0, 99.87, 0.0, 97.54, 99.56, 89.36, 0.0, 0.0, 60.79, 94.81, 99.21, 0.0, 0.0, 64.52, 0.0, 51.12], "audiomae_on_audioset": [null, null, null, [["speech", 35.24], ["bee, wasp, etc.", 12.67], ["hum", 9.28]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.8, 2.46, 1.1, 3.26, 0.74, 3.66, 0.85, -0.04, 5.87, 0.71, 6.13, 2.61, 5.6, 0.65, 0.55, 2.35, 2.89, 3.3, 0.54, 1.65, 3.1, 0.36, 2.88]} \ No newline at end of file diff --git a/annotations_filtered/bEBQWhgGM1g_filtered.json b/annotations_filtered/bEBQWhgGM1g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3066291316a614474469bf3a2a8bc2931c642b64 --- /dev/null +++ b/annotations_filtered/bEBQWhgGM1g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[88.0, 97.88], [98.0, 97.97], [98.0, 117.27]], "keep_status": [false, false, true], "silence_prob": [95.78, 0.0, 49.64], "audiomae_on_audioset": [null, null, [["hum", 21.26], ["whale vocalization", 16.98], ["rumble", 14.6]]], "duration": [9.88, -0.03, 19.27]} \ No newline at end of file diff --git a/annotations_filtered/bEpL6Mt_jrk_filtered.json b/annotations_filtered/bEpL6Mt_jrk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e0cbbbc2ee9e71e60d3bc8c737237d1053c49881 --- /dev/null +++ b/annotations_filtered/bEpL6Mt_jrk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.6], [5.0, 4.92], [14.0, 14.74], [20.0, 32.0], [35.0, 38.03], [39.0, 40.71], [44.0, 44.83], [47.0, 47.44], [48.0, 49.74], [56.0, 58.35], [60.0, 61.97], [65.0, 65.26], [69.0, 69.55], [76.0, 77.67], [80.0, 81.87], [94.0, 95.27], [96.0, 98.02], [100.0, 108.89], [110.0, 116.87], [118.0, 118.89], [120.0, 127.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.95, 99.95, 0.0, 0.0, 0.0, 0.0, 99.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.92, 97.54, 99.84, 0.0, 99.9], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.6, -0.08, 0.74, 12.0, 3.03, 1.71, 0.83, 0.44, 1.74, 2.35, 1.97, 0.26, 0.55, 1.67, 1.87, 1.27, 2.02, 8.89, 6.87, 0.89, 7.72]} \ No newline at end of file diff --git a/annotations_filtered/bFfnDQ3bDfA_filtered.json b/annotations_filtered/bFfnDQ3bDfA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea6c5a6da264a42949f257af065cfa9afc393935 --- /dev/null +++ b/annotations_filtered/bFfnDQ3bDfA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.48], [7.0, 7.32], [9.0, 9.76], [10.0, 11.6], [13.0, 12.6], [13.0, 13.93], [18.0, 18.49], [25.0, 26.42], [31.0, 31.21], [37.0, 38.47], [42.0, 42.2], [45.0, 45.49], [48.0, 47.7], [49.0, 49.52], [52.0, 53.35], [56.0, 56.57], [59.0, 60.0], [60.0, 61.43], [63.0, 63.26], [64.0, 64.88], [72.0, 71.78], [76.0, 76.2], [85.0, 85.02], [87.0, 87.86], [91.0, 91.64], [97.0, 97.92], [98.0, 99.3], [105.0, 104.77], [105.0, 105.58], [109.0, 109.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.48, 0.32, 0.76, 1.6, -0.4, 0.93, 0.49, 1.42, 0.21, 1.47, 0.2, 0.49, -0.3, 0.52, 1.35, 0.57, 1.0, 1.43, 0.26, 0.88, -0.22, 0.2, 0.02, 0.86, 0.64, 0.92, 1.3, -0.23, 0.58, 0.51]} \ No newline at end of file diff --git a/annotations_filtered/bFsgLhx9dxg_filtered.json b/annotations_filtered/bFsgLhx9dxg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60018f928a9b96c647c698680136f1f7456f4d6e --- /dev/null +++ b/annotations_filtered/bFsgLhx9dxg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 26.99], [29.0, 30.97], [32.0, 32.68], [38.0, 45.33], [47.0, 67.81], [71.0, 71.04], [72.0, 73.82], [76.0, 77.31], [83.0, 84.52], [88.0, 91.79], [93.0, 95.15], [100.0, 102.91], [106.0, 108.09], [110.0, 111.37], [113.0, 119.74], [120.0, 121.31], [123.0, 126.74], [128.0, 129.24], [133.0, 135.51], [137.0, 150.42], [150.0, 156.59], [158.0, 176.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.29, 31.15, 0.0, 0.0, 0.0, 0.0, 98.01, 95.23, 98.44, 91.13, 0.0, 95.91, 0.0, 91.98, 0.0, 56.55, 94.66, 63.1, 71.14], "audiomae_on_audioset": [null, null, null, [["music", 76.51], ["theremin", 8.73], ["ambient music", 1.97]], [["music", 41.7], ["theremin", 37.99], ["musical instrument", 3.16]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.99, 1.97, 0.68, 7.33, 20.81, 0.04, 1.82, 1.31, 1.52, 3.79, 2.15, 2.91, 2.09, 1.37, 6.74, 1.31, 3.74, 1.24, 2.51, 13.42, 6.59, 18.37]} \ No newline at end of file diff --git a/annotations_filtered/bGQ9QznPQ_M_filtered.json b/annotations_filtered/bGQ9QznPQ_M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d0d2a5d8a979e00c986ebd140c6b333dedae31c --- /dev/null +++ b/annotations_filtered/bGQ9QznPQ_M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.08], [7.0, 17.81], [20.0, 22.3], [27.0, 26.97], [30.0, 44.02], [47.0, 53.22], [54.0, 54.45], [57.0, 57.05], [61.0, 70.55], [71.0, 82.44], [84.0, 89.43], [93.0, 92.91], [93.0, 95.54], [97.0, 97.61], [99.0, 98.98], [101.0, 101.53], [104.0, 105.31], [106.0, 108.21], [109.0, 109.53], [114.0, 114.52], [116.0, 116.53], [123.0, 126.87], [133.0, 132.66], [134.0, 135.53]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 30.74, 36.49, 0.0, 30.76, 30.06, 0.0, 0.0, 37.32, 30.81, 30.74, 0.0, 29.81, 0.0, 0.0, 0.0, 0.0, 65.55, 0.0, 0.0, 0.0, 82.07, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 67.38], ["sidetone", 9.6], ["throbbing", 6.2]], [["music", 75.01], ["electronic music", 5.91], ["drum machine", 2.89]], null, [["sidetone", 69.65], ["music", 20.46], ["drum machine", 2.66]], [["music", 40.48], ["speech", 24.72], ["electronic music", 5.45]], null, null, [["music", 30.35], ["speech", 9.76], ["moo", 8.84]], [["music", 34.71], ["throbbing", 22.83], ["hum", 15.45]], [["music", 68.85], ["throbbing", 7.98], ["speech", 4.8]], null, [["music", 42.62], ["speech", 10.49], ["electronic music", 4.15]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.08, 10.81, 2.3, -0.03, 14.02, 6.22, 0.45, 0.05, 9.55, 11.44, 5.43, -0.09, 2.54, 0.61, -0.02, 0.53, 1.31, 2.21, 0.53, 0.52, 0.53, 3.87, -0.34, 1.53]} \ No newline at end of file diff --git a/annotations_filtered/bGWyL-vJAn4_filtered.json b/annotations_filtered/bGWyL-vJAn4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eb1dd560eaa41ae59268f9afe279e849600ca652 --- /dev/null +++ b/annotations_filtered/bGWyL-vJAn4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 20.09], [24.0, 24.58], [27.0, 38.74], [39.0, 52.57], [55.0, 55.92], [59.0, 58.99], [78.0, 78.61], [84.0, 84.94]], "keep_status": [false, false, false, true, false, false, false, false], "silence_prob": [35.73, 0.0, 32.29, 39.18, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 55.7], ["throbbing", 14.0], ["cattle, bovinae", 4.73]], null, [["music", 71.63], ["synthesizer", 6.75], ["whale vocalization", 2.24]], [["animal", 28.27], ["whale vocalization", 15.2], ["noise", 7.21]], null, null, null, null], "duration": [5.09, 0.58, 11.74, 13.57, 0.92, -0.01, 0.61, 0.94]} \ No newline at end of file diff --git a/annotations_filtered/bGXeYGkiQDo_filtered.json b/annotations_filtered/bGXeYGkiQDo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c239cb13234d0e820eba8d48858b07d78fb85d9 --- /dev/null +++ b/annotations_filtered/bGXeYGkiQDo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.25], [21.0, 23.13], [24.0, 25.27], [26.0, 30.67], [31.0, 31.87], [32.0, 33.86], [36.0, 38.74], [40.0, 40.54], [42.0, 41.99], [43.0, 43.9], [46.0, 46.6], [47.0, 48.07], [50.0, 50.35], [51.0, 51.63], [61.0, 61.42], [67.0, 68.2], [73.0, 73.35], [75.0, 75.2], [76.0, 77.79], [79.0, 79.79], [86.0, 85.97], [89.0, 89.33], [94.0, 94.61], [95.0, 95.91], [99.0, 99.27], [102.0, 102.39], [106.0, 106.14], [108.0, 108.09], [110.0, 110.37], [113.0, 115.38], [117.0, 117.51], [122.0, 121.98], [124.0, 125.85], [127.0, 127.38], [129.0, 129.46], [131.0, 131.21], [133.0, 133.3], [137.0, 137.25], [142.0, 142.06], [154.0, 154.75], [160.0, 161.4], [162.0, 161.91], [164.0, 163.97], [174.0, 173.97]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 37.9, 0.0, 88.28, 0.0, 0.0, 71.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 49.07], ["hum", 10.39], ["sine wave", 7.24]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 42.11], ["sidetone", 13.16], ["throbbing", 10.39]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.25, 2.13, 1.27, 4.67, 0.87, 1.86, 2.74, 0.54, -0.01, 0.9, 0.6, 1.07, 0.35, 0.63, 0.42, 1.2, 0.35, 0.2, 1.79, 0.79, -0.03, 0.33, 0.61, 0.91, 0.27, 0.39, 0.14, 0.09, 0.37, 2.38, 0.51, -0.02, 1.85, 0.38, 0.46, 0.21, 0.3, 0.25, 0.06, 0.75, 1.4, -0.09, -0.03, -0.03]} \ No newline at end of file diff --git a/annotations_filtered/bH5GtRBsss0_filtered.json b/annotations_filtered/bH5GtRBsss0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8f94d00f497a5a6024b8bd45eb2a351ca56fd2cc --- /dev/null +++ b/annotations_filtered/bH5GtRBsss0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.1], [4.0, 5.44], [6.0, 9.0], [21.0, 24.73], [25.0, 32.05], [32.0, 40.47], [42.0, 47.38], [49.0, 49.33], [51.0, 51.6], [55.0, 59.66], [60.0, 61.45], [64.0, 65.01], [66.0, 66.58], [69.0, 69.3], [73.0, 73.11], [75.0, 74.97], [77.0, 77.63], [80.0, 83.35], [84.0, 85.77], [90.0, 93.83], [97.0, 97.82], [98.0, 100.08], [102.0, 104.18], [105.0, 105.29], [107.0, 108.48], [112.0, 111.97], [115.0, 119.01], [124.0, 125.66], [126.0, 127.16], [129.0, 128.87]], "keep_status": [true, false, false, true, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [41.46, 0.0, 50.46, 37.37, 37.38, 43.13, 45.52, 0.0, 0.0, 69.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.17, 0.0, 77.87, 0.0, 60.89, 74.76, 0.0, 0.0, 0.0, 79.59, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 17.81], ["gong", 14.5], ["speech", 13.06]], null, null, [["speech", 29.76], ["music", 23.23], ["theremin", 14.56]], [["speech", 33.45], ["hum", 22.81], ["mains hum", 14.82]], [["mains hum", 27.63], ["hum", 19.25], ["electric shaver, electric razor", 17.63]], [["livestock, farm animals, working animals", 24.11], ["animal", 9.92], ["cattle, bovinae", 9.67]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.1, 1.44, 3.0, 3.73, 7.05, 8.47, 5.38, 0.33, 0.6, 4.66, 1.45, 1.01, 0.58, 0.3, 0.11, -0.03, 0.63, 3.35, 1.77, 3.83, 0.82, 2.08, 2.18, 0.29, 1.48, -0.03, 4.01, 1.66, 1.16, -0.13]} \ No newline at end of file diff --git a/annotations_filtered/bHTWme5Ks9g_filtered.json b/annotations_filtered/bHTWme5Ks9g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7bd2f715f905c73248c35cff275e756adcc9b16a --- /dev/null +++ b/annotations_filtered/bHTWme5Ks9g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 29.29], [34.0, 36.8], [38.0, 40.24], [43.0, 48.93], [50.0, 59.16], [60.0, 64.52], [66.0, 67.44], [68.0, 71.81], [72.0, 85.06]], "keep_status": [false, false, false, false, false, false, false, false, true], "silence_prob": [64.41, 100.0, 100.0, 100.0, 98.44, 99.26, 0.0, 36.63, 38.23], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 54.2], ["trombone", 13.22], ["brass instrument", 11.01]], [["music", 40.1], ["didgeridoo", 15.88], ["trombone", 9.54]]], "duration": [11.29, 2.8, 2.24, 5.93, 9.16, 4.52, 1.44, 3.81, 13.06]} \ No newline at end of file diff --git a/annotations_filtered/bHW5h5O-e5I_filtered.json b/annotations_filtered/bHW5h5O-e5I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4fbabd1f0b6e36808a8911a2493ef234bca41e90 --- /dev/null +++ b/annotations_filtered/bHW5h5O-e5I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.88], [8.0, 8.26], [9.0, 9.09], [12.0, 15.18], [19.0, 19.16], [21.0, 22.05], [28.0, 28.65], [30.0, 30.37], [31.0, 31.38], [36.0, 37.94], [39.0, 39.73], [41.0, 42.47], [44.0, 46.62], [49.0, 49.84], [54.0, 57.6], [60.0, 60.51], [64.0, 66.21], [69.0, 69.75], [71.0, 71.71], [72.0, 72.99], [76.0, 76.28], [78.0, 78.61], [82.0, 82.46], [88.0, 88.33], [89.0, 89.9], [94.0, 94.44], [103.0, 102.96], [104.0, 103.99], [105.0, 105.34], [107.0, 107.15], [108.0, 110.67], [114.0, 114.22], [116.0, 116.06], [121.0, 121.8], [122.0, 122.66], [125.0, 124.97], [127.0, 127.2], [128.0, 129.74], [134.0, 134.96], [140.0, 140.53], [142.0, 145.69], [147.0, 148.69], [150.0, 151.85], [156.0, 156.57], [157.0, 157.35], [159.0, 159.19], [162.0, 161.97], [164.0, 164.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 87.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.25, 0.0, 99.98, 0.0, 76.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.88, 0.26, 0.09, 3.18, 0.16, 1.05, 0.65, 0.37, 0.38, 1.94, 0.73, 1.47, 2.62, 0.84, 3.6, 0.51, 2.21, 0.75, 0.71, 0.99, 0.28, 0.61, 0.46, 0.33, 0.9, 0.44, -0.04, -0.01, 0.34, 0.15, 2.67, 0.22, 0.06, 0.8, 0.66, -0.03, 0.2, 1.74, 0.96, 0.53, 3.69, 1.69, 1.85, 0.57, 0.35, 0.19, -0.03, 0.78]} \ No newline at end of file diff --git a/annotations_filtered/bHjHDiu2UR8_filtered.json b/annotations_filtered/bHjHDiu2UR8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0b9cca4603fe6fcfb393d8d8f48f2aa6c4eafea9 --- /dev/null +++ b/annotations_filtered/bHjHDiu2UR8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 22.87], [25.0, 27.04], [32.0, 33.44], [34.0, 68.3], [69.0, 70.04]], "keep_status": [false, false, false, false, false], "silence_prob": [60.05, 43.38, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 67.19], ["musical instrument", 3.59], ["synthesizer", 3.32]], null, null, null], "duration": [4.87, 2.04, 1.44, 34.3, 1.04]} \ No newline at end of file diff --git a/annotations_filtered/bHwiXFc9MOw_filtered.json b/annotations_filtered/bHwiXFc9MOw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fbb0dec5a6d6ae0dd8a296ef24a0c47c5e459f9c --- /dev/null +++ b/annotations_filtered/bHwiXFc9MOw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.07], [8.0, 9.19], [9.0, 9.39], [9.0, 53.65], [56.0, 86.04]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [1.07, 1.19, 0.39, 44.65, 30.04]} \ No newline at end of file diff --git a/annotations_filtered/bI9CAfqY3hk_filtered.json b/annotations_filtered/bI9CAfqY3hk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..68290b27d99325f2ce6e6bc2c40419d044f364a7 --- /dev/null +++ b/annotations_filtered/bI9CAfqY3hk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 62.85], [65.0, 68.54], [72.0, 105.71], [111.0, 113.0]], "keep_status": [false, true, false, true], "silence_prob": [0.0, 42.15, 0.0, 37.04], "audiomae_on_audioset": [null, [["cacophony", 19.11], ["music", 9.07], ["noise", 7.57]], null, [["hum", 23.34], ["music", 12.58], ["mains hum", 11.97]]], "duration": [39.85, 3.54, 33.71, 2.0]} \ No newline at end of file diff --git a/annotations_filtered/bICHpdNbsmU_filtered.json b/annotations_filtered/bICHpdNbsmU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ac589aab51791a83cd611c662e2080b25ddb49e --- /dev/null +++ b/annotations_filtered/bICHpdNbsmU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.28], [9.0, 11.08], [15.0, 18.66], [20.0, 38.37], [40.0, 40.61], [43.0, 49.0], [52.0, 64.81], [66.0, 66.83]], "keep_status": [false, false, false, false, false, true, true, false], "silence_prob": [0.0, 92.97, 99.73, 92.8, 0.0, 32.79, 31.08, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 23.21], ["music", 19.57], ["coin (dropping)", 9.18]], [["music", 28.32], ["clang", 10.04], ["throbbing", 7.84]], null], "duration": [1.28, 2.08, 3.66, 18.37, 0.61, 6.0, 12.81, 0.83]} \ No newline at end of file diff --git a/annotations_filtered/bIHeoOh2F7o_filtered.json b/annotations_filtered/bIHeoOh2F7o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..33964f8a26f77956cd6fda3f392cb38f1380b5e6 --- /dev/null +++ b/annotations_filtered/bIHeoOh2F7o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 16.77], [17.0, 16.8], [17.0, 18.64], [20.0, 24.98], [28.0, 29.37], [30.0, 30.54], [34.0, 34.35], [35.0, 36.49], [38.0, 38.82], [39.0, 40.74], [50.0, 49.96], [62.0, 63.19], [64.0, 64.17], [69.0, 72.33], [74.0, 75.51], [76.0, 77.19], [91.0, 91.67], [93.0, 94.51], [96.0, 96.85], [99.0, 99.42], [103.0, 104.28], [108.0, 108.78], [114.0, 114.66], [118.0, 122.12]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [43.79, 0.0, 0.0, 85.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.89], "audiomae_on_audioset": [[["speech", 37.3], ["cattle, bovinae", 14.86], ["livestock, farm animals, working animals", 11.89]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 35.51], ["speech", 15.79], ["boing", 9.01]]], "duration": [8.77, -0.2, 1.64, 4.98, 1.37, 0.54, 0.35, 1.49, 0.82, 1.74, -0.04, 1.19, 0.17, 3.33, 1.51, 1.19, 0.67, 1.51, 0.85, 0.42, 1.28, 0.78, 0.66, 4.12]} \ No newline at end of file diff --git a/annotations_filtered/bIbxR_KN2TM_filtered.json b/annotations_filtered/bIbxR_KN2TM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f9c20d1cf10a4c43891943a5c9af7f26b56b6d58 --- /dev/null +++ b/annotations_filtered/bIbxR_KN2TM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.6], [21.0, 22.28], [23.0, 33.81], [39.0, 39.01], [43.0, 49.82], [58.0, 57.81], [69.0, 69.55], [71.0, 73.63], [80.0, 81.14], [84.0, 92.01], [92.0, 98.2], [101.0, 100.75], [104.0, 105.58], [108.0, 109.41], [112.0, 114.17], [122.0, 122.84]], "keep_status": [false, false, true, false, true, false, false, false, false, true, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 35.89, 0.0, 32.77, 0.0, 0.0, 51.39, 0.0, 46.02, 33.66, 0.0, 0.0, 0.0, 45.88, 0.0], "audiomae_on_audioset": [null, null, [["buzz", 15.07], ["electric shaver, electric razor", 13.5], ["fly, housefly", 10.71]], null, [["speech", 55.62], ["boing", 3.81], ["fart", 2.24]], null, null, null, null, [["speech", 17.29], ["cattle, bovinae", 13.7], ["livestock, farm animals, working animals", 10.47]], [["speech", 80.88], ["clip-clop", 2.39], ["animal", 2.39]], null, null, null, [["speech", 49.6], ["music", 4.93], ["crowd", 2.91]], null], "duration": [0.6, 1.28, 10.81, 0.01, 6.82, -0.19, 0.55, 2.63, 1.14, 8.01, 6.2, -0.25, 1.58, 1.41, 2.17, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/bIfMAhK7Boo_filtered.json b/annotations_filtered/bIfMAhK7Boo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de63469bdafd97215c86c35652e0e4bc76435086 --- /dev/null +++ b/annotations_filtered/bIfMAhK7Boo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.7], [15.0, 19.43], [22.0, 24.53], [25.0, 26.18], [28.0, 29.24], [35.0, 36.21], [40.0, 41.52], [43.0, 44.47], [47.0, 48.61], [51.0, 56.49], [58.0, 58.55], [60.0, 61.52], [63.0, 64.2], [67.0, 73.89], [76.0, 78.6], [81.0, 86.78], [92.0, 95.94], [97.0, 111.03], [114.0, 115.55], [117.0, 117.76], [120.0, 120.99], [122.0, 127.18], [128.0, 139.06], [140.0, 170.31], [173.0, 173.23], [180.0, 180.32], [183.0, 186.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 63.42, 64.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.3, 0.0, 0.0, 0.0, 62.78, 48.61, 31.78, 31.11, 33.04, 0.0, 0.0, 0.0, 38.31, 71.57, 0.0, 0.0, 0.0, 74.29], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 44.49], ["music", 8.85], ["hum", 6.44]], [["fly, housefly", 40.37], ["mosquito", 25.05], ["insect", 24.55]], [["fly, housefly", 36.61], ["mosquito", 29.16], ["insect", 20.48]], [["music", 39.61], ["speech", 35.28], ["breaking", 4.56]], null, null, null, [["breaking", 50.63], ["music", 21.42], ["speech", 10.16]], null, null, null, null, null], "duration": [0.7, 4.43, 2.53, 1.18, 1.24, 1.21, 1.52, 1.47, 1.61, 5.49, 0.55, 1.52, 1.2, 6.89, 2.6, 5.78, 3.94, 14.03, 1.55, 0.76, 0.99, 5.18, 11.06, 30.31, 0.23, 0.32, 3.63]} \ No newline at end of file diff --git a/annotations_filtered/bIpQoVucszI_filtered.json b/annotations_filtered/bIpQoVucszI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f2d69c5bc808bc7ddd60b89688d7b1fdd830abf5 --- /dev/null +++ b/annotations_filtered/bIpQoVucszI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.0], [3.0, 3.18], [5.0, 5.29], [11.0, 11.91], [14.0, 14.94], [16.0, 16.55], [17.0, 22.32], [24.0, 28.26], [35.0, 36.04], [37.0, 37.76], [40.0, 40.59], [42.0, 41.82], [43.0, 44.39], [47.0, 46.94], [47.0, 47.34], [47.0, 47.46], [48.0, 48.41], [51.0, 57.28], [60.0, 61.38], [62.0, 70.46], [71.0, 79.25], [86.0, 86.7], [88.0, 88.45], [91.0, 95.0], [103.0, 104.5], [106.0, 106.78], [107.0, 112.5], [117.0, 116.7], [118.0, 118.3], [119.0, 120.56], [123.0, 123.38], [124.0, 129.57], [131.0, 131.73], [136.0, 143.95], [146.0, 146.42], [148.0, 152.05], [154.0, 154.89], [155.0, 157.35]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, true, false, true, true, false, false, true, false, false, false, false, false, false, false, true, false, true, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.14, 32.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.21, 0.0, 38.43, 34.92, 0.0, 0.0, 39.25, 0.0, 0.0, 30.37, 0.0, 0.0, 0.0, 0.0, 33.08, 0.0, 35.09, 0.0, 31.56, 0.0, 33.16], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 20.95], ["moo", 18.16], ["music", 17.06]], [["fly, housefly", 26.07], ["mosquito", 21.59], ["insect", 16.15]], null, null, null, null, null, null, null, null, null, [["music", 28.66], ["speech", 15.1], ["throbbing", 13.97]], null, [["music", 16.27], ["moo", 10.23], ["speech", 10.03]], [["music", 16.18], ["speech", 15.22], ["livestock, farm animals, working animals", 14.52]], null, null, [["speech", 17.94], ["music", 10.23], ["fly, housefly", 8.58]], null, null, [["speech", 35.84], ["music", 28.9], ["sheep", 6.61]], null, null, null, null, [["cattle, bovinae", 22.46], ["moo", 17.92], ["livestock, farm animals, working animals", 16.0]], null, [["music", 58.62], ["speech", 5.03], ["throbbing", 5.0]], null, [["music", 29.55], ["speech", 27.85], ["crowd", 2.51]], null, [["music", 28.5], ["didgeridoo", 15.26], ["speech", 11.37]]], "duration": [1.0, 0.18, 0.29, 0.91, 0.94, 0.55, 5.32, 4.26, 1.04, 0.76, 0.59, -0.18, 1.39, -0.06, 0.34, 0.46, 0.41, 6.28, 1.38, 8.46, 8.25, 0.7, 0.45, 4.0, 1.5, 0.78, 5.5, -0.3, 0.3, 1.56, 0.38, 5.57, 0.73, 7.95, 0.42, 4.05, 0.89, 2.35]} \ No newline at end of file diff --git a/annotations_filtered/bJNpX5bfXcw_filtered.json b/annotations_filtered/bJNpX5bfXcw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/bJNpX5bfXcw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/bJSDrRcwwKQ_filtered.json b/annotations_filtered/bJSDrRcwwKQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..98985787402640b1f76950182bc0643dcb16abbd --- /dev/null +++ b/annotations_filtered/bJSDrRcwwKQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 27.6], [29.0, 29.91], [33.0, 34.21], [35.0, 37.72], [45.0, 47.34], [51.0, 53.2], [55.0, 57.2], [59.0, 62.55], [64.0, 64.84], [77.0, 82.66], [83.0, 88.47], [93.0, 94.44], [102.0, 107.72], [110.0, 110.44], [111.0, 111.86], [113.0, 123.53], [124.0, 126.03], [127.0, 129.86], [136.0, 136.97], [137.0, 138.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, true, false, false], "silence_prob": [55.6, 0.0, 0.0, 53.84, 87.92, 48.02, 78.04, 81.17, 0.0, 88.28, 51.28, 0.0, 35.12, 0.0, 0.0, 36.55, 39.46, 45.18, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 30.41], ["music", 28.14], ["singing bowl", 19.12]], null, null, null, null, null, null, [["breaking", 40.87], ["music", 12.86], ["glass", 11.46]], null, null, [["music", 21.42], ["livestock, farm animals, working animals", 13.73], ["insect", 13.35]], [["frog", 57.51], ["croak", 11.63], ["whale vocalization", 10.43]], [["music", 36.71], ["speech", 14.57], ["singing bowl", 8.65]], null, null], "duration": [2.6, 0.91, 1.21, 2.72, 2.34, 2.2, 2.2, 3.55, 0.84, 5.66, 5.47, 1.44, 5.72, 0.44, 0.86, 10.53, 2.03, 2.86, 0.97, 1.21]} \ No newline at end of file diff --git a/annotations_filtered/bJgem6Xc3TM_filtered.json b/annotations_filtered/bJgem6Xc3TM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0dac53297631c8c4a177686f9e29d940844776e4 --- /dev/null +++ b/annotations_filtered/bJgem6Xc3TM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.69], [17.0, 17.27], [17.0, 17.47], [18.0, 17.71], [20.0, 20.98], [23.0, 23.31], [30.0, 30.99], [36.0, 37.18], [40.0, 40.91], [45.0, 51.22], [54.0, 54.57], [62.0, 63.02]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.46, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 23.53], ["speech", 20.93], ["hum", 19.86]], null, null], "duration": [0.69, 0.27, 0.47, -0.29, 0.98, 0.31, 0.99, 1.18, 0.91, 6.22, 0.57, 1.02]} \ No newline at end of file diff --git a/annotations_filtered/bJuDofIoW34_filtered.json b/annotations_filtered/bJuDofIoW34_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..102593f46bc77c23f654a4f7f24281c1262592bf --- /dev/null +++ b/annotations_filtered/bJuDofIoW34_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.78], [13.0, 13.91], [19.0, 27.55], [28.0, 29.57], [31.0, 31.85], [33.0, 33.74], [35.0, 35.56], [38.0, 39.63], [41.0, 41.94], [44.0, 44.83], [47.0, 52.0], [52.0, 55.11], [58.0, 60.96], [62.0, 62.68], [65.0, 65.75], [68.0, 68.77], [72.0, 73.25], [76.0, 76.74], [82.0, 83.3], [84.0, 91.93], [95.0, 104.94], [105.0, 108.08], [108.0, 109.29], [114.0, 114.74], [116.0, 116.48], [123.0, 123.47], [128.0, 128.66], [138.0, 148.68], [149.0, 149.93], [151.0, 155.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 38.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.43, 94.22, 32.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.77, 38.23, 40.61, 0.0, 0.0, 0.0, 0.0, 0.0, 28.98, 0.0, 42.02], "audiomae_on_audioset": [null, null, [["speech", 85.85], ["fireworks", 2.26], ["noise", 1.33]], null, null, null, null, null, null, null, null, null, [["fart", 23.35], ["speech", 18.07], ["explosion", 7.56]], null, null, null, null, null, null, null, [["music", 32.16], ["throbbing", 26.8], ["hum", 20.75]], [["music", 74.14], ["thunk", 2.56], ["electronic music", 2.39]], null, null, null, null, null, [["speech", 42.08], ["explosion", 35.7], ["eruption", 7.66]], null, [["animal", 16.1], ["speech", 12.88], ["bow-wow", 8.05]]], "duration": [0.78, 0.91, 8.55, 1.57, 0.85, 0.74, 0.56, 1.63, 0.94, 0.83, 5.0, 3.11, 2.96, 0.68, 0.75, 0.77, 1.25, 0.74, 1.3, 7.93, 9.94, 3.08, 1.29, 0.74, 0.48, 0.47, 0.66, 10.68, 0.93, 4.66]} \ No newline at end of file diff --git a/annotations_filtered/bKLQBuSPVwQ_filtered.json b/annotations_filtered/bKLQBuSPVwQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bf6d1bb419605075118e28ef8babf176db08f0b7 --- /dev/null +++ b/annotations_filtered/bKLQBuSPVwQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.63], [18.0, 19.31], [22.0, 22.22], [25.0, 28.38], [36.0, 37.37], [39.0, 62.67], [64.0, 66.73], [67.0, 75.29], [76.0, 79.39], [82.0, 84.16], [92.0, 93.8], [94.0, 99.15], [101.0, 101.8], [103.0, 113.49], [116.0, 116.9], [120.0, 119.94], [124.0, 130.86], [132.0, 134.35], [138.0, 139.9], [141.0, 146.67], [148.0, 153.62], [155.0, 157.2]], "keep_status": [false, false, false, true, false, true, true, true, true, false, false, true, false, false, false, false, false, true, false, false, true, true], "silence_prob": [40.02, 0.0, 0.0, 45.46, 0.0, 47.54, 43.61, 37.14, 45.08, 43.23, 0.0, 43.13, 0.0, 41.01, 0.0, 0.0, 32.0, 39.25, 0.0, 51.5, 47.74, 44.4], "audiomae_on_audioset": [[["sidetone", 52.87], ["telephone", 17.02], ["speech", 13.84]], null, null, [["hum", 31.55], ["sidetone", 18.29], ["mains hum", 11.28]], null, [["music", 40.17], ["noise", 12.54], ["synthesizer", 4.97]], [["music", 37.35], ["synthesizer", 18.25], ["theremin", 9.32]], [["music", 36.85], ["hum", 16.83], ["mains hum", 13.8]], [["music", 33.84], ["synthesizer", 9.05], ["musical instrument", 7.13]], [["music", 57.67], ["didgeridoo", 9.04], ["musical instrument", 4.7]], null, [["music", 41.8], ["synthesizer", 7.88], ["effects unit", 5.76]], null, [["singing bowl", 36.02], ["music", 30.33], ["marimba, xylophone", 4.17]], null, null, [["music", 32.08], ["speech", 25.72], ["sidetone", 21.68]], [["music", 38.17], ["speech", 12.09], ["didgeridoo", 8.68]], null, null, [["music", 36.79], ["speech", 10.81], ["musical instrument", 6.77]], [["music", 44.88], ["musical instrument", 6.9], ["hum", 3.72]]], "duration": [2.63, 1.31, 0.22, 3.38, 1.37, 23.67, 2.73, 8.29, 3.39, 2.16, 1.8, 5.15, 0.8, 10.49, 0.9, -0.06, 6.86, 2.35, 1.9, 5.67, 5.62, 2.2]} \ No newline at end of file diff --git a/annotations_filtered/bKOW66PVjvA_filtered.json b/annotations_filtered/bKOW66PVjvA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..850bfb5b986189b98821582d25b1bb62a0095fb8 --- /dev/null +++ b/annotations_filtered/bKOW66PVjvA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 18.69]], "keep_status": [false], "silence_prob": [69.34], "audiomae_on_audioset": [null], "duration": [3.69]} \ No newline at end of file diff --git a/annotations_filtered/bKbZTFrWing_filtered.json b/annotations_filtered/bKbZTFrWing_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..280c9c3f2effccc5cfa70de13a7534ca07576f1b --- /dev/null +++ b/annotations_filtered/bKbZTFrWing_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.04], [7.0, 8.63], [9.0, 10.99], [11.0, 12.88], [14.0, 18.89], [21.0, 23.23], [24.0, 26.23], [29.0, 29.47], [31.0, 32.24], [34.0, 34.91], [36.0, 41.94], [44.0, 45.27], [47.0, 48.63], [49.0, 50.43], [51.0, 51.88], [53.0, 52.91], [53.0, 54.58], [55.0, 56.1], [57.0, 57.74], [59.0, 60.71], [66.0, 67.1], [70.0, 71.17], [72.0, 72.49], [74.0, 74.6], [80.0, 81.01], [90.0, 101.33], [102.0, 103.45], [104.0, 105.29], [106.0, 109.76], [115.0, 125.24], [126.0, 126.42], [127.0, 128.14], [129.0, 130.15], [131.0, 133.44], [136.0, 143.72], [146.0, 151.36], [153.0, 162.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, true, true], "silence_prob": [99.98, 0.0, 0.0, 0.0, 92.8, 95.78, 99.76, 0.0, 0.0, 0.0, 88.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.26, 0.0, 0.0, 95.09, 92.8, 0.0, 0.0, 0.0, 90.25, 39.01, 40.06, 35.35], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 59.29], ["theremin", 4.5], ["vehicle", 2.25]], null, null, null, null, null, null, null, null, [["heart sounds, heartbeat", 19.62], ["speech", 18.1], ["sneeze", 13.04]], [["music", 52.97], ["speech", 6.72], ["grunt", 4.34]], [["speech", 22.78], ["music", 21.39], ["fly, housefly", 4.96]]], "duration": [3.04, 1.63, 1.99, 1.88, 4.89, 2.23, 2.23, 0.47, 1.24, 0.91, 5.94, 1.27, 1.63, 1.43, 0.88, -0.09, 1.58, 1.1, 0.74, 1.71, 1.1, 1.17, 0.49, 0.6, 1.01, 11.33, 1.45, 1.29, 3.76, 10.24, 0.42, 1.14, 1.15, 2.44, 7.72, 5.36, 9.51]} \ No newline at end of file diff --git a/annotations_filtered/bKkJKMjnYf4_filtered.json b/annotations_filtered/bKkJKMjnYf4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c827923d6fb5de42a2be795300c09b0d37620ab2 --- /dev/null +++ b/annotations_filtered/bKkJKMjnYf4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.26], [10.0, 11.45], [13.0, 13.53], [15.0, 15.6], [17.0, 18.23], [20.0, 22.18], [23.0, 39.33], [40.0, 52.89], [61.0, 61.43], [66.0, 65.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.94, 99.36, 89.9, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.26, 1.45, 0.53, 0.6, 1.23, 2.18, 16.33, 12.89, 0.43, -0.09]} \ No newline at end of file diff --git a/annotations_filtered/bKy6BtAbTU8_filtered.json b/annotations_filtered/bKy6BtAbTU8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..71730566d188e7bdf36f958b19e0899c5c2a3864 --- /dev/null +++ b/annotations_filtered/bKy6BtAbTU8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.26], [3.0, 3.92], [6.0, 14.23], [46.0, 46.47], [55.0, 56.17], [59.0, 60.56], [65.0, 66.33], [71.0, 71.98], [73.0, 73.8], [75.0, 77.85], [79.0, 79.78], [82.0, 85.77], [91.0, 93.12], [94.0, 95.76], [100.0, 102.25], [112.0, 112.41], [113.0, 115.7], [117.0, 119.28], [126.0, 126.54], [130.0, 131.11], [152.0, 153.12], [162.0, 161.76], [167.0, 167.81]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 96.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.86, 0.0, 100.0, 100.0, 0.0, 100.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.26, 0.92, 8.23, 0.47, 1.17, 1.56, 1.33, 0.98, 0.8, 2.85, 0.78, 3.77, 2.12, 1.76, 2.25, 0.41, 2.7, 2.28, 0.54, 1.11, 1.12, -0.24, 0.81]} \ No newline at end of file diff --git a/annotations_filtered/bLD14JwSiYs_filtered.json b/annotations_filtered/bLD14JwSiYs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3bae1b55e7828874810b165ecaa45c94cfb8a8da --- /dev/null +++ b/annotations_filtered/bLD14JwSiYs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 26.91], [43.0, 47.39], [48.0, 50.09], [51.0, 53.59], [63.0, 63.66], [65.0, 66.45], [67.0, 68.54], [70.0, 70.71], [72.0, 81.13], [84.0, 84.38], [90.0, 92.7], [94.0, 95.15], [96.0, 112.16]], "keep_status": [false, true, true, false, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 29.62, 33.32, 29.45, 0.0, 0.0, 0.0, 0.0, 38.64, 0.0, 70.58, 0.0, 32.08], "audiomae_on_audioset": [null, [["music", 51.25], ["civil defense siren", 10.01], ["animal", 8.02]], [["music", 45.21], ["sidetone", 8.41], ["electronic music", 6.64]], [["cattle, bovinae", 42.81], ["moo", 24.0], ["livestock, farm animals, working animals", 17.52]], null, null, null, null, [["music", 27.61], ["didgeridoo", 26.4], ["buzz", 9.87]], null, null, null, [["music", 31.29], ["electric shaver, electric razor", 13.75], ["musical instrument", 5.67]]], "duration": [0.91, 4.39, 2.09, 2.59, 0.66, 1.45, 1.54, 0.71, 9.13, 0.38, 2.7, 1.15, 16.16]} \ No newline at end of file diff --git a/annotations_filtered/bLPMGLsf1c0_filtered.json b/annotations_filtered/bLPMGLsf1c0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..440ef17e22fbca9370a88731b724287d951ccfba --- /dev/null +++ b/annotations_filtered/bLPMGLsf1c0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[49.0, 54.16], [55.0, 55.36], [57.0, 56.98], [59.0, 62.13], [63.0, 64.37], [66.0, 68.66], [69.0, 70.68], [72.0, 76.86], [78.0, 118.12], [120.0, 125.78], [129.0, 129.93], [131.0, 131.36], [132.0, 133.34]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [43.61, 0.0, 0.0, 59.51, 0.0, 41.32, 0.0, 34.51, 0.0, 32.18, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 38.87], ["mains hum", 35.88], ["music", 12.3]], null, null, null, null, [["noise", 16.55], ["hum", 15.79], ["mains hum", 14.64]], null, [["mains hum", 41.33], ["hum", 30.1], ["music", 14.53]], null, [["music", 38.48], ["buzz", 10.38], ["mains hum", 8.82]], null, null, null], "duration": [5.16, 0.36, -0.02, 3.13, 1.37, 2.66, 1.68, 4.86, 40.12, 5.78, 0.93, 0.36, 1.34]} \ No newline at end of file diff --git a/annotations_filtered/bLX_zt_MhW0_filtered.json b/annotations_filtered/bLX_zt_MhW0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17034cb9cf0f1a79fa066fc381464b57815b69c2 --- /dev/null +++ b/annotations_filtered/bLX_zt_MhW0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 42.52], [45.0, 70.44], [71.0, 130.82], [134.0, 139.82], [143.0, 142.55], [143.0, 143.63], [144.0, 148.39], [151.0, 152.95], [157.0, 180.99], [185.0, 185.33]], "keep_status": [true, true, false, false, false, false, false, false, false, false], "silence_prob": [44.99, 36.7, 0.0, 40.9, 0.0, 0.0, 53.72, 0.0, 39.72, 0.0], "audiomae_on_audioset": [[["music", 31.53], ["whale vocalization", 21.33], ["livestock, farm animals, working animals", 6.22]], [["music", 27.46], ["whale vocalization", 17.08], ["buzz", 10.69]], null, [["radio", 39.89], ["speech", 27.73], ["noise", 17.33]], null, null, null, null, [["speech", 64.83], ["music", 13.78], ["radio", 10.02]], null], "duration": [21.52, 25.44, 59.82, 5.82, -0.45, 0.63, 4.39, 1.95, 23.99, 0.33]} \ No newline at end of file diff --git a/annotations_filtered/bLbLsjRVm9Y_filtered.json b/annotations_filtered/bLbLsjRVm9Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70fee6ddb6a755af508b9be7a3664ddd8f2bce18 --- /dev/null +++ b/annotations_filtered/bLbLsjRVm9Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.46], [9.0, 13.2], [14.0, 18.37], [19.0, 30.16], [32.0, 35.65], [36.0, 40.85], [42.0, 42.57], [43.0, 44.09], [44.0, 44.64], [45.0, 45.74], [47.0, 48.25], [49.0, 51.16], [52.0, 53.43], [54.0, 55.05], [57.0, 65.45], [68.0, 71.49], [72.0, 74.8], [77.0, 78.19], [79.0, 80.47], [81.0, 84.1], [85.0, 86.31], [87.0, 87.45], [88.0, 89.26], [90.0, 91.07], [92.0, 93.93], [95.0, 97.75], [98.0, 99.33], [99.0, 101.43], [103.0, 102.63], [103.0, 103.81], [104.0, 107.99], [109.0, 115.37], [116.0, 116.41], [119.0, 120.58], [122.0, 122.15], [122.0, 122.61], [124.0, 132.27], [135.0, 135.23], [137.0, 138.45], [139.0, 140.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 100.0, 100.0, 100.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 100.0, 100.0, 0.0, 0.0, 99.96, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 99.99, 0.0, 0.0, 100.0, 99.95, 0.0, 0.0, 0.0, 0.0, 99.95, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.46, 4.2, 4.37, 11.16, 3.65, 4.85, 0.57, 1.09, 0.64, 0.74, 1.25, 2.16, 1.43, 1.05, 8.45, 3.49, 2.8, 1.19, 1.47, 3.1, 1.31, 0.45, 1.26, 1.07, 1.93, 2.75, 1.33, 2.43, -0.37, 0.81, 3.99, 6.37, 0.41, 1.58, 0.15, 0.61, 8.27, 0.23, 1.45, 1.22]} \ No newline at end of file diff --git a/annotations_filtered/bLi52djkRTs_filtered.json b/annotations_filtered/bLi52djkRTs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..403ddd92abb83c0750f07ffc40e30c5229d77d5a --- /dev/null +++ b/annotations_filtered/bLi52djkRTs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.27], [19.0, 34.99], [36.0, 36.66], [40.0, 43.14], [44.0, 51.26], [53.0, 58.65], [59.0, 75.57], [76.0, 80.4], [82.0, 88.16], [91.0, 92.53], [96.0, 98.2], [99.0, 110.79], [112.0, 113.81], [115.0, 115.05], [116.0, 117.46]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.96, 34.26, 0.0, 46.29, 98.19, 99.52, 51.23, 92.15, 96.29, 0.0, 99.88, 90.95, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 35.81], ["music", 13.61], ["harmonica", 7.96]], null, [["speech", 38.58], ["sidetone", 10.16], ["fly, housefly", 6.83]], null, null, null, null, null, null, null, null, null, null, null], "duration": [3.27, 15.99, 0.66, 3.14, 7.26, 5.65, 16.57, 4.4, 6.16, 1.53, 2.2, 11.79, 1.81, 0.05, 1.46]} \ No newline at end of file diff --git a/annotations_filtered/bLjFBMuBc68_filtered.json b/annotations_filtered/bLjFBMuBc68_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..22d11579d9a1af2953926f7297fea1ec04718781 --- /dev/null +++ b/annotations_filtered/bLjFBMuBc68_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.83], [7.0, 9.12], [11.0, 12.95], [13.0, 19.89], [21.0, 22.03], [24.0, 25.81], [28.0, 28.26], [29.0, 30.21], [31.0, 33.0], [34.0, 35.68], [37.0, 37.99], [41.0, 46.63], [48.0, 48.71], [49.0, 50.41], [52.0, 54.99], [59.0, 59.8], [61.0, 63.0], [64.0, 66.06], [67.0, 68.55], [70.0, 71.05], [73.0, 73.58], [76.0, 76.47], [77.0, 78.27]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 49.36, 0.0, 62.17, 0.0, 0.0, 0.0, 0.0, 82.43, 0.0, 0.0, 61.18, 0.0, 0.0, 84.25, 0.0, 60.6, 53.47, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 43.97], ["speech", 11.05], ["didgeridoo", 4.04]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.83, 2.12, 1.95, 6.89, 1.03, 1.81, 0.26, 1.21, 2.0, 1.68, 0.99, 5.63, 0.71, 1.41, 2.99, 0.8, 2.0, 2.06, 1.55, 1.05, 0.58, 0.47, 1.27]} \ No newline at end of file diff --git a/annotations_filtered/bLmYWtqC8pc_filtered.json b/annotations_filtered/bLmYWtqC8pc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6e4d2fd2b893983e926745dd7d7b7360ae68a1d4 --- /dev/null +++ b/annotations_filtered/bLmYWtqC8pc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.76], [12.0, 12.45], [15.0, 15.38], [17.0, 17.31], [22.0, 22.08], [23.0, 23.5], [27.0, 28.26], [37.0, 38.25], [40.0, 50.18], [52.0, 53.13], [55.0, 55.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.79, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [0.76, 0.45, 0.38, 0.31, 0.08, 0.5, 1.26, 1.25, 10.18, 1.13, 0.24]} \ No newline at end of file diff --git a/annotations_filtered/bLqJo78X3OI_filtered.json b/annotations_filtered/bLqJo78X3OI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4ec81f03f64fb6722d8f6819bdc0e0e232fadcc2 --- /dev/null +++ b/annotations_filtered/bLqJo78X3OI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 85.65], [88.0, 90.81], [92.0, 140.97], [143.0, 151.82]], "keep_status": [false, true, false, false], "silence_prob": [0.0, 32.97, 0.0, 30.95], "audiomae_on_audioset": [null, [["music", 42.97], ["trombone", 14.5], ["brass instrument", 11.24]], null, [["music", 34.88], ["whip", 31.41], ["foghorn", 10.0]]], "duration": [77.65, 2.81, 48.97, 8.82]} \ No newline at end of file diff --git a/annotations_filtered/bLqwpb4eDeA_filtered.json b/annotations_filtered/bLqwpb4eDeA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dba0551bc2f6760e64cfbcc36b66197c2c345f70 --- /dev/null +++ b/annotations_filtered/bLqwpb4eDeA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.84], [14.0, 15.08], [16.0, 20.8], [22.0, 22.96], [25.0, 27.09], [30.0, 30.33], [31.0, 31.77], [33.0, 33.03], [34.0, 54.35], [56.0, 59.32]], "keep_status": [false, false, false, false, false, false, false, false, false, true], "silence_prob": [63.64, 0.0, 53.22, 0.0, 39.12, 0.0, 0.0, 0.0, 51.55, 47.46], "audiomae_on_audioset": [null, null, null, null, [["music", 54.86], ["effects unit", 9.29], ["guitar", 6.44]], null, null, null, null, [["music", 45.18], ["theremin", 7.42], ["singing bowl", 6.64]]], "duration": [2.84, 1.08, 4.8, 0.96, 2.09, 0.33, 0.77, 0.03, 20.35, 3.32]} \ No newline at end of file diff --git a/annotations_filtered/bLsM1z8lX_A_filtered.json b/annotations_filtered/bLsM1z8lX_A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3ed38aeaeed12357b184b4b0a2a3b0a276b7d16f --- /dev/null +++ b/annotations_filtered/bLsM1z8lX_A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.92], [7.0, 8.26], [17.0, 19.13], [23.0, 23.08], [26.0, 27.63], [34.0, 34.91], [39.0, 39.55], [42.0, 42.43]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.62, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [1.92, 1.26, 2.13, 0.08, 1.63, 0.91, 0.55, 0.43]} \ No newline at end of file diff --git a/annotations_filtered/bLsnl_fdBoI_filtered.json b/annotations_filtered/bLsnl_fdBoI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dc48db416d59bf4af90af8df70979bd11970f77a --- /dev/null +++ b/annotations_filtered/bLsnl_fdBoI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.22], [4.0, 10.22], [12.0, 13.42], [16.0, 17.05], [20.0, 21.25], [22.0, 22.17], [22.0, 22.5], [23.0, 23.35], [25.0, 31.51], [32.0, 32.54], [34.0, 37.5], [41.0, 50.03], [53.0, 85.02], [87.0, 99.3], [100.0, 106.46], [114.0, 124.17], [125.0, 145.61]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false], "silence_prob": [0.0, 44.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.01, 0.0, 29.25, 29.39, 0.0, 29.62, 28.81, 29.4, 30.6], "audiomae_on_audioset": [null, [["music", 51.44], ["speech", 7.84], ["synthesizer", 4.75]], null, null, null, null, null, null, [["music", 33.94], ["speech", 21.56], ["throbbing", 20.94]], null, [["music", 62.1], ["speech", 6.68], ["groan", 3.96]], [["groan", 38.49], ["speech", 23.88], ["music", 7.61]], null, [["speech", 58.53], ["music", 15.19], ["whack, thwack", 2.1]], [["speech", 59.23], ["music", 6.64], ["sidetone", 5.03]], [["music", 43.68], ["boing", 6.39], ["explosion", 5.87]], [["boing", 50.35], ["music", 36.5], ["ding", 0.94]]], "duration": [0.22, 6.22, 1.42, 1.05, 1.25, 0.17, 0.5, 0.35, 6.51, 0.54, 3.5, 9.03, 32.02, 12.3, 6.46, 10.17, 20.61]} \ No newline at end of file diff --git a/annotations_filtered/bMDdjhWe9NQ_filtered.json b/annotations_filtered/bMDdjhWe9NQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..80ddf7444dc955d026bc4b3c687d87ab803d0401 --- /dev/null +++ b/annotations_filtered/bMDdjhWe9NQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.42], [7.0, 10.54], [11.0, 10.71], [11.0, 10.83], [11.0, 12.02], [12.0, 25.91], [26.0, 28.65], [36.0, 37.13], [38.0, 38.67], [46.0, 45.87], [48.0, 48.47], [51.0, 69.55], [72.0, 84.72], [88.0, 106.08], [108.0, 109.86], [111.0, 112.56], [113.0, 114.25], [116.0, 118.37], [120.0, 123.28], [124.0, 125.07]], "keep_status": [false, true, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, true, false, false], "silence_prob": [61.97, 36.44, 0.0, 0.0, 0.0, 46.22, 42.3, 0.0, 0.0, 0.0, 0.0, 36.37, 41.1, 38.37, 0.0, 0.0, 0.0, 46.09, 72.46, 0.0], "audiomae_on_audioset": [null, [["speech", 22.2], ["sine wave", 15.33], ["fart", 5.93]], null, null, null, [["sidetone", 26.89], ["speech", 23.3], ["hum", 20.63]], [["speech", 30.74], ["hum", 21.49], ["fart", 9.95]], null, null, null, null, [["stomach rumble", 45.41], ["speech", 16.22], ["burping, eructation", 16.0]], [["speech", 40.17], ["frog", 5.26], ["mosquito", 4.42]], [["speech", 62.11], ["noise", 11.14], ["sidetone", 3.4]], null, null, null, [["speech", 21.19], ["effects unit", 11.76], ["music", 11.31]], null, null], "duration": [4.42, 3.54, -0.29, -0.17, 1.02, 13.91, 2.65, 1.13, 0.67, -0.13, 0.47, 18.55, 12.72, 18.08, 1.86, 1.56, 1.25, 2.37, 3.28, 1.07]} \ No newline at end of file diff --git a/annotations_filtered/bMVWECam8EA_filtered.json b/annotations_filtered/bMVWECam8EA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d8554b3d4442a8135efdb1a0a0b31d76d5afb4e --- /dev/null +++ b/annotations_filtered/bMVWECam8EA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.76], [9.0, 9.42], [10.0, 11.37], [12.0, 12.78], [13.0, 14.15], [15.0, 15.13], [23.0, 24.17], [27.0, 27.04], [29.0, 40.39], [43.0, 46.68], [47.0, 48.71], [51.0, 52.91], [57.0, 57.82], [64.0, 65.69], [67.0, 67.66], [79.0, 80.11], [94.0, 98.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [93.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.55, 76.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.66], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 44.67], ["whack, thwack", 16.57], ["fart", 7.34]]], "duration": [2.76, 0.42, 1.37, 0.78, 1.15, 0.13, 1.17, 0.04, 11.39, 3.68, 1.71, 1.91, 0.82, 1.69, 0.66, 1.11, 4.05]} \ No newline at end of file diff --git a/annotations_filtered/bMjYOV8VnYk_filtered.json b/annotations_filtered/bMjYOV8VnYk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41534e460d29ecd41939aa34a9c35ad7d2def605 --- /dev/null +++ b/annotations_filtered/bMjYOV8VnYk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 26.23], [28.0, 104.67], [111.0, 124.61], [125.0, 125.96], [128.0, 128.6]], "keep_status": [true, false, true, false, false], "silence_prob": [30.09, 0.0, 30.21, 0.0, 0.0], "audiomae_on_audioset": [[["didgeridoo", 27.31], ["music", 20.13], ["speech", 16.34]], null, [["music", 27.87], ["hum", 14.72], ["throbbing", 13.37]], null, null], "duration": [2.23, 76.67, 13.61, 0.96, 0.6]} \ No newline at end of file diff --git a/annotations_filtered/bMtdrKIdDgE_filtered.json b/annotations_filtered/bMtdrKIdDgE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..32178dd6c0c2103c8d4df43639ce2c8281443d1e --- /dev/null +++ b/annotations_filtered/bMtdrKIdDgE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 28.88], [31.0, 30.86], [33.0, 33.84], [35.0, 35.7], [37.0, 37.4], [38.0, 39.95], [42.0, 42.67], [49.0, 51.46], [54.0, 55.97], [60.0, 61.05], [64.0, 65.04], [69.0, 70.88], [76.0, 81.51], [84.0, 86.1], [89.0, 89.65], [94.0, 94.93], [98.0, 98.2], [104.0, 104.92], [109.0, 111.82], [117.0, 120.73], [122.0, 124.78], [126.0, 128.33], [130.0, 130.33], [133.0, 134.52], [135.0, 135.21], [136.0, 137.08], [142.0, 143.21]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false], "silence_prob": [85.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.56, 0.0, 0.0, 0.0, 0.0, 63.96, 59.68, 0.0, 0.0, 0.0, 0.0, 76.53, 37.25, 40.31, 46.68, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 27.82], ["hum", 14.57], ["buzz", 7.08]], null, null, null, null, null, null, null, null, null, null, null, [["crushing", 12.95], ["walk, footsteps", 9.36], ["heart sounds, heartbeat", 7.79]], [["hum", 18.75], ["sine wave", 13.3], ["speech", 12.05]], [["speech", 28.18], ["hum", 11.87], ["sidetone", 5.51]], null, null, null, null, null], "duration": [2.88, -0.14, 0.84, 0.7, 0.4, 1.95, 0.67, 2.46, 1.97, 1.05, 1.04, 1.88, 5.51, 2.1, 0.65, 0.93, 0.2, 0.92, 2.82, 3.73, 2.78, 2.33, 0.33, 1.52, 0.21, 1.08, 1.21]} \ No newline at end of file diff --git a/annotations_filtered/bN1E4vf9FlM_filtered.json b/annotations_filtered/bN1E4vf9FlM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9469f5c2d3fd7bd0ee28911cbbf2c2f6dae360d9 --- /dev/null +++ b/annotations_filtered/bN1E4vf9FlM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 155.51]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [146.51]} \ No newline at end of file diff --git a/annotations_filtered/bN3U1IwMvhI_filtered.json b/annotations_filtered/bN3U1IwMvhI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6e8090985784e5ae8ee0b9b3deca79e17fe36ea2 --- /dev/null +++ b/annotations_filtered/bN3U1IwMvhI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.73], [8.0, 8.56], [15.0, 15.5], [16.0, 15.99], [16.0, 17.66], [18.0, 18.71], [24.0, 24.04], [24.0, 27.6], [30.0, 30.72], [35.0, 35.7], [39.0, 39.45], [45.0, 45.74], [66.0, 71.63], [76.0, 81.57], [84.0, 86.95], [90.0, 90.95], [100.0, 99.96], [110.0, 112.78], [113.0, 113.16], [113.0, 113.53]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.21, 0.0, 0.0, 0.0, 0.0, 35.0, 32.61, 32.01, 0.0, 0.0, 30.29, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 38.87], ["music", 18.48], ["sidetone", 6.09]], null, null, null, null, [["music", 58.1], ["dial tone", 12.68], ["sine wave", 8.09]], [["music", 80.69], ["sampler", 1.76], ["hum", 1.14]], [["music", 63.23], ["singing", 2.43], ["salsa music", 1.68]], null, null, [["music", 61.2], ["carnatic music", 10.13], ["yodeling", 3.54]], null, null], "duration": [0.73, 0.56, 0.5, -0.01, 1.66, 0.71, 0.04, 3.6, 0.72, 0.7, 0.45, 0.74, 5.63, 5.57, 2.95, 0.95, -0.04, 2.78, 0.16, 0.53]} \ No newline at end of file diff --git a/annotations_filtered/bNFWITNVAKU_filtered.json b/annotations_filtered/bNFWITNVAKU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bca93a8b0822ab4cda56c754f0c30102094fda44 --- /dev/null +++ b/annotations_filtered/bNFWITNVAKU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.03], [11.0, 28.32], [28.0, 31.19], [32.0, 106.88], [109.0, 110.17], [113.0, 128.02]], "keep_status": [false, false, true, false, false, true], "silence_prob": [0.0, 31.15, 31.88, 0.0, 0.0, 31.25], "audiomae_on_audioset": [null, [["music", 36.98], ["hum", 36.43], ["mains hum", 6.64]], [["whale vocalization", 33.72], ["insect", 9.11], ["fly, housefly", 5.31]], null, null, [["speech", 25.39], ["music", 18.0], ["hum", 15.07]]], "duration": [1.03, 17.32, 3.19, 74.88, 1.17, 15.02]} \ No newline at end of file diff --git a/annotations_filtered/bNbi_KLd_Uk_filtered.json b/annotations_filtered/bNbi_KLd_Uk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e08dd9f4b0469474f7cadc005165452db632d3b1 --- /dev/null +++ b/annotations_filtered/bNbi_KLd_Uk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.75], [8.0, 11.31], [15.0, 16.88], [19.0, 32.68], [36.0, 37.05], [39.0, 40.26], [44.0, 44.24], [51.0, 52.44], [67.0, 68.94], [78.0, 82.88], [88.0, 99.0], [102.0, 103.15], [114.0, 116.02], [123.0, 124.29], [130.0, 129.88]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.83, 34.69, 0.0, 34.71, 0.0, 0.0, 0.0, 0.0, 0.0, 32.11, 35.03, 0.0, 84.8, 0.0, 0.0], "audiomae_on_audioset": [[["music", 47.08], ["buzz", 3.32], ["speech", 3.25]], [["speech", 31.67], ["hum", 15.68], ["mains hum", 6.77]], null, [["music", 82.21], ["synthesizer", 1.78], ["bleat", 1.75]], null, null, null, null, null, [["mosquito", 47.55], ["fly, housefly", 18.96], ["insect", 7.79]], [["music", 64.31], ["quack", 6.22], ["groan", 4.73]], null, null, null, null], "duration": [2.75, 3.31, 1.88, 13.68, 1.05, 1.26, 0.24, 1.44, 1.94, 4.88, 11.0, 1.15, 2.02, 1.29, -0.12]} \ No newline at end of file diff --git a/annotations_filtered/bNdddrIe6dQ_filtered.json b/annotations_filtered/bNdddrIe6dQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e3d0c608344bb9411025bb420ddc422a083d9091 --- /dev/null +++ b/annotations_filtered/bNdddrIe6dQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.63], [6.0, 5.91], [7.0, 8.13], [10.0, 13.51], [16.0, 17.95], [19.0, 26.97], [28.0, 29.02], [31.0, 32.98], [35.0, 36.09], [39.0, 39.51], [41.0, 42.35], [44.0, 71.17], [73.0, 74.44], [76.0, 80.89], [82.0, 87.93], [89.0, 91.69], [96.0, 97.29], [100.0, 100.89], [104.0, 106.12], [109.0, 109.97], [112.0, 113.71], [116.0, 119.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [86.64, 0.0, 0.0, 83.16, 0.0, 56.25, 0.0, 0.0, 0.0, 0.0, 0.0, 47.74, 0.0, 50.41, 39.37, 99.56, 0.0, 0.0, 77.87, 0.0, 0.0, 39.58], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 51.79], ["theremin", 33.65], ["cello", 2.15]], null, null, [["music", 54.92], ["theremin", 20.71], ["musical instrument", 3.6]], null, null, null, null, null, null, [["music", 35.56], ["theremin", 22.92], ["didgeridoo", 5.46]]], "duration": [2.63, -0.09, 1.13, 3.51, 1.95, 7.97, 1.02, 1.98, 1.09, 0.51, 1.35, 27.17, 1.44, 4.89, 5.93, 2.69, 1.29, 0.89, 2.12, 0.97, 1.71, 3.08]} \ No newline at end of file diff --git a/annotations_filtered/bNg1XX5ofhw_filtered.json b/annotations_filtered/bNg1XX5ofhw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45fced819bc4f3787a99a1eacbb4016d0990cae7 --- /dev/null +++ b/annotations_filtered/bNg1XX5ofhw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.41], [14.0, 35.95], [38.0, 97.36], [98.0, 101.04], [105.0, 106.96], [108.0, 109.8], [111.0, 112.26], [113.0, 114.1], [115.0, 117.04], [120.0, 124.58], [126.0, 126.57], [128.0, 127.82], [128.0, 130.45], [131.0, 132.0], [136.0, 137.07], [138.0, 138.3], [140.0, 140.49], [144.0, 144.21], [149.0, 151.82], [153.0, 153.94], [155.0, 155.39], [159.0, 159.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 65.44, 0.0, 99.36, 0.0, 0.0, 0.0, 0.0, 100.0, 99.99, 0.0, 0.0, 99.05, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.41, 21.95, 59.36, 3.04, 1.96, 1.8, 1.26, 1.1, 2.04, 4.58, 0.57, -0.18, 2.45, 1.0, 1.07, 0.3, 0.49, 0.21, 2.82, 0.94, 0.39, 0.46]} \ No newline at end of file diff --git a/annotations_filtered/bNiztacMAJ0_filtered.json b/annotations_filtered/bNiztacMAJ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4156c3be1c70197970d59bb77d33a85ef0e97c11 --- /dev/null +++ b/annotations_filtered/bNiztacMAJ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 28.19], [31.0, 31.67], [32.0, 32.98], [37.0, 38.8], [40.0, 41.45], [43.0, 43.04], [48.0, 51.0], [59.0, 59.76], [61.0, 61.48], [62.0, 64.13], [68.0, 74.16], [75.0, 79.34], [84.0, 95.57], [97.0, 98.71], [101.0, 104.87], [105.0, 107.87], [110.0, 110.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.9, 0.0, 0.0, 0.0, 0.0, 0.0, 80.11, 0.0, 0.0, 85.72, 96.17, 99.91, 99.73, 0.0, 93.13, 65.44, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.19, 0.67, 0.98, 1.8, 1.45, 0.04, 3.0, 0.76, 0.48, 2.13, 6.16, 4.34, 11.57, 1.71, 3.87, 2.87, 0.35]} \ No newline at end of file diff --git a/annotations_filtered/bNkeBqdWGzE_filtered.json b/annotations_filtered/bNkeBqdWGzE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..422cef972572ea1b76df96acee4f635d161ee8d1 --- /dev/null +++ b/annotations_filtered/bNkeBqdWGzE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.94], [6.0, 12.75], [13.0, 15.08], [16.0, 19.26], [20.0, 20.82], [21.0, 21.07], [21.0, 28.46], [32.0, 35.77], [36.0, 37.15]], "keep_status": [false, false, false, false, false, false, true, false, false], "silence_prob": [68.54, 57.56, 50.31, 54.97, 0.0, 0.0, 29.12, 99.94, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 45.85], ["music", 15.08], ["explosion", 6.59]], null, null], "duration": [2.94, 6.75, 2.08, 3.26, 0.82, 0.07, 7.46, 3.77, 1.15]} \ No newline at end of file diff --git a/annotations_filtered/bO7iMQGQjhY_filtered.json b/annotations_filtered/bO7iMQGQjhY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c8cb9d9682535a1cab6e87d337e710a4632969e --- /dev/null +++ b/annotations_filtered/bO7iMQGQjhY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 46.28], [48.0, 74.8], [77.0, 79.02], [80.0, 80.43], [81.0, 81.5], [82.0, 82.9], [84.0, 84.79], [87.0, 88.72], [90.0, 90.14], [99.0, 100.41], [108.0, 108.3], [110.0, 110.69], [120.0, 122.32], [123.0, 123.63], [126.0, 126.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 42.35, 98.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.76, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 44.21], ["musical instrument", 15.68], ["guitar", 11.24]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [36.28, 26.8, 2.02, 0.43, 0.5, 0.9, 0.79, 1.72, 0.14, 1.41, 0.3, 0.69, 2.32, 0.63, 0.94]} \ No newline at end of file diff --git a/annotations_filtered/bOEcxxyOC-s_filtered.json b/annotations_filtered/bOEcxxyOC-s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1edd6301511797bef38003352d77f9ade1fe46af --- /dev/null +++ b/annotations_filtered/bOEcxxyOC-s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[66.0, 68.99], [70.0, 70.55], [74.0, 74.28], [79.0, 79.76], [82.0, 82.44], [88.0, 89.56], [91.0, 92.3], [94.0, 95.13], [96.0, 97.06], [99.0, 101.49], [104.0, 115.33], [123.0, 128.34], [129.0, 129.96], [134.0, 135.19], [137.0, 138.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [68.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.77, 95.23, 91.81, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.99, 0.55, 0.28, 0.76, 0.44, 1.56, 1.3, 1.13, 1.06, 2.49, 11.33, 5.34, 0.96, 1.19, 1.06]} \ No newline at end of file diff --git a/annotations_filtered/bOKID-aX3z8_filtered.json b/annotations_filtered/bOKID-aX3z8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..775440150d0c988080bf0c2e28cc02a0f8d53f16 --- /dev/null +++ b/annotations_filtered/bOKID-aX3z8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 22.44], [23.0, 27.51], [31.0, 31.21], [48.0, 49.5], [50.0, 51.78], [59.0, 59.58], [74.0, 75.15], [76.0, 76.27], [80.0, 79.96], [85.0, 85.48], [88.0, 89.01], [90.0, 89.97], [92.0, 92.06], [94.0, 94.42], [97.0, 107.0], [110.0, 111.45], [115.0, 116.83], [122.0, 122.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [50.71, 95.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.7, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.44, 4.51, 0.21, 1.5, 1.78, 0.58, 1.15, 0.27, -0.04, 0.48, 1.01, -0.03, 0.06, 0.42, 10.0, 1.45, 1.83, 0.88]} \ No newline at end of file diff --git a/annotations_filtered/bOP-THNe4m8_filtered.json b/annotations_filtered/bOP-THNe4m8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3ac06c36e8aa7088e88e8ec2293e711fc56e50e3 --- /dev/null +++ b/annotations_filtered/bOP-THNe4m8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 8.87], [10.0, 9.85], [10.0, 36.56], [39.0, 73.53], [76.0, 78.49], [79.0, 81.92], [83.0, 86.12], [87.0, 88.2], [90.0, 160.34]], "keep_status": [false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 29.64, 0.0, 33.0, 30.99, 31.3, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["hum", 45.38], ["mains hum", 20.71], ["buzz", 9.53]], null, [["hum", 31.54], ["mains hum", 29.11], ["throbbing", 18.14]], [["mains hum", 22.51], ["hum", 20.76], ["music", 14.06]], [["mains hum", 46.2], ["hum", 18.75], ["music", 8.67]], null, null], "duration": [-0.13, -0.15, 26.56, 34.53, 2.49, 2.92, 3.12, 1.2, 70.34]} \ No newline at end of file diff --git a/annotations_filtered/bOR38552MJA_filtered.json b/annotations_filtered/bOR38552MJA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a30dd260fb7130906411064242fce1dec9050e35 --- /dev/null +++ b/annotations_filtered/bOR38552MJA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 23.45], [26.0, 30.79], [46.0, 52.49], [70.0, 74.76], [79.0, 83.02]], "keep_status": [false, true, false, false, true], "silence_prob": [31.16, 32.0, 32.33, 31.55, 31.68], "audiomae_on_audioset": [[["music", 78.18], ["singing", 2.41], ["trombone", 1.13]], [["music", 54.83], ["trombone", 4.56], ["speech", 3.65]], [["music", 68.37], ["singing", 6.28], ["yodeling", 2.76]], [["music", 64.25], ["trombone", 7.35], ["musical instrument", 2.42]], [["music", 49.64], ["speech", 6.11], ["singing", 4.35]]], "duration": [2.45, 4.79, 6.49, 4.76, 4.02]} \ No newline at end of file diff --git a/annotations_filtered/bObjXY24Ei4_filtered.json b/annotations_filtered/bObjXY24Ei4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca2d004bc3338def2175e5537acfc7312dc8543f --- /dev/null +++ b/annotations_filtered/bObjXY24Ei4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.27], [12.0, 13.44], [22.0, 22.3], [26.0, 26.49], [29.0, 29.07], [30.0, 32.12], [44.0, 45.62], [50.0, 50.46], [56.0, 56.3], [56.0, 56.79], [62.0, 62.06], [66.0, 67.64], [69.0, 69.55], [81.0, 81.5], [83.0, 83.62], [84.0, 86.27]], "keep_status": [true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [33.14, 0.0, 0.0, 0.0, 0.0, 36.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.47], "audiomae_on_audioset": [[["speech", 32.71], ["fly, housefly", 17.23], ["music", 6.73]], null, null, null, null, [["cattle, bovinae", 32.53], ["moo", 19.89], ["livestock, farm animals, working animals", 17.02]], null, null, null, null, null, null, null, null, null, [["speech", 37.63], ["music", 35.5], ["musical instrument", 3.41]]], "duration": [3.27, 1.44, 0.3, 0.49, 0.07, 2.12, 1.62, 0.46, 0.3, 0.79, 0.06, 1.64, 0.55, 0.5, 0.62, 2.27]} \ No newline at end of file diff --git a/annotations_filtered/bPH152eXEfU_filtered.json b/annotations_filtered/bPH152eXEfU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e0b0d430ebfd9628de60defbc020f341d211083c --- /dev/null +++ b/annotations_filtered/bPH152eXEfU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.85], [7.0, 15.94], [18.0, 18.5], [19.0, 21.63], [24.0, 27.01], [28.0, 29.78], [35.0, 39.26], [41.0, 41.81], [43.0, 45.15], [46.0, 47.8], [50.0, 53.25], [55.0, 56.42], [60.0, 61.03], [64.0, 66.01], [66.0, 67.42], [70.0, 70.34], [76.0, 77.53], [79.0, 81.67], [84.0, 90.34], [91.0, 94.24], [95.0, 95.96], [96.0, 96.5], [97.0, 97.82], [98.0, 105.21], [107.0, 108.62], [111.0, 111.72], [113.0, 113.27], [113.0, 113.44], [114.0, 122.13], [124.0, 125.86], [127.0, 128.19], [129.0, 130.62], [132.0, 137.59], [138.0, 142.38]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [62.47, 94.52, 0.0, 99.68, 66.27, 0.0, 90.95, 0.0, 46.47, 0.0, 75.23, 0.0, 0.0, 99.96, 0.0, 0.0, 0.0, 99.98, 85.72, 79.07, 0.0, 0.0, 0.0, 99.21, 0.0, 0.0, 0.0, 0.0, 53.47, 0.0, 0.0, 0.0, 64.86, 96.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["busy signal", 20.85], ["frog", 11.79], ["sine wave", 7.09]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.85, 8.94, 0.5, 2.63, 3.01, 1.78, 4.26, 0.81, 2.15, 1.8, 3.25, 1.42, 1.03, 2.01, 1.42, 0.34, 1.53, 2.67, 6.34, 3.24, 0.96, 0.5, 0.82, 7.21, 1.62, 0.72, 0.27, 0.44, 8.13, 1.86, 1.19, 1.62, 5.59, 4.38]} \ No newline at end of file diff --git a/annotations_filtered/bPNkEztLgeo_filtered.json b/annotations_filtered/bPNkEztLgeo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c0257e242448bee54adc6921960d7d76b7c083e --- /dev/null +++ b/annotations_filtered/bPNkEztLgeo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.24], [8.0, 8.75], [12.0, 12.53], [18.0, 19.13], [22.0, 22.79], [24.0, 24.58], [41.0, 45.94], [51.0, 52.1], [53.0, 53.87], [59.0, 66.9], [68.0, 75.32], [77.0, 77.6], [78.0, 103.17], [104.0, 105.75], [106.0, 109.14], [110.0, 111.05], [112.0, 112.89], [114.0, 116.9], [117.0, 118.17], [119.0, 119.72], [126.0, 126.69], [128.0, 128.39], [130.0, 133.1], [134.0, 135.5], [136.0, 137.27], [138.0, 139.01], [140.0, 140.56], [141.0, 142.28], [143.0, 143.65], [144.0, 145.17], [149.0, 150.33], [151.0, 153.25], [155.0, 154.77], [157.0, 164.64], [166.0, 166.36], [167.0, 167.26], [168.0, 168.98]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [37.66, 0.0, 0.0, 0.0, 0.0, 0.0, 38.72, 0.0, 0.0, 34.31, 34.56, 0.0, 36.37, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 97.73, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 59.06], ["boing", 13.59], ["musical instrument", 2.68]], null, null, null, null, null, [["music", 53.22], ["speech", 7.89], ["didgeridoo", 7.28]], null, null, [["music", 84.04], ["funny music", 2.02], ["funk", 1.43]], [["music", 85.14], ["quack", 2.63], ["funny music", 1.45]], null, [["music", 75.66], ["swing music", 5.01], ["funk", 3.69]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.24, 0.75, 0.53, 1.13, 0.79, 0.58, 4.94, 1.1, 0.87, 7.9, 7.32, 0.6, 25.17, 1.75, 3.14, 1.05, 0.89, 2.9, 1.17, 0.72, 0.69, 0.39, 3.1, 1.5, 1.27, 1.01, 0.56, 1.28, 0.65, 1.17, 1.33, 2.25, -0.23, 7.64, 0.36, 0.26, 0.98]} \ No newline at end of file diff --git a/annotations_filtered/bPavpV1D-g8_filtered.json b/annotations_filtered/bPavpV1D-g8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e0e2c0441b92b95541a8eab962c26fcfa95c337 --- /dev/null +++ b/annotations_filtered/bPavpV1D-g8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.43], [10.0, 11.45], [12.0, 13.19], [14.0, 15.08], [19.0, 25.98]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 79.76], "audiomae_on_audioset": [null, null, null, null, null], "duration": [0.43, 1.45, 1.19, 1.08, 6.98]} \ No newline at end of file diff --git a/annotations_filtered/bPiv1wP8q7g_filtered.json b/annotations_filtered/bPiv1wP8q7g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e234ceb4634532565bb8fd92aeddbeb7319af182 --- /dev/null +++ b/annotations_filtered/bPiv1wP8q7g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.0], [4.0, 4.89], [7.0, 7.75], [10.0, 10.57], [13.0, 20.8], [23.0, 23.41], [24.0, 25.34], [28.0, 31.35], [32.0, 32.85], [34.0, 39.53], [41.0, 40.95], [42.0, 47.78], [48.0, 57.87], [59.0, 63.51], [64.0, 66.56], [68.0, 68.84], [72.0, 72.13], [75.0, 75.68], [76.0, 76.91], [77.0, 78.12], [80.0, 81.73], [83.0, 86.16], [87.0, 91.32], [92.0, 92.45], [92.0, 92.84], [94.0, 99.94], [102.0, 101.93], [104.0, 114.27], [132.0, 164.67]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 37.63, 0.0, 0.0, 36.68, 0.0, 38.37, 0.0, 36.72, 37.45, 41.24, 39.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.96, 44.18, 0.0, 0.0, 38.28, 0.0, 38.67, 0.0], "audiomae_on_audioset": [null, null, null, null, [["hum", 12.31], ["whack, thwack", 12.3], ["breaking", 11.57]], null, null, [["breaking", 63.61], ["music", 6.1], ["glass", 4.73]], null, [["rumble", 43.95], ["mains hum", 13.04], ["hum", 7.13]], null, [["breaking", 69.33], ["music", 10.8], ["glass", 6.63]], [["hum", 40.5], ["mains hum", 25.37], ["speech", 15.5]], [["rumble", 65.77], ["hum", 7.32], ["noise", 4.45]], [["sidetone", 62.04], ["speech", 17.04], ["rumble", 4.38]], null, null, null, null, null, null, [["hum", 29.28], ["mains hum", 17.0], ["rumble", 15.33]], [["hum", 38.97], ["throbbing", 34.13], ["heart sounds, heartbeat", 9.14]], null, null, [["speech", 43.77], ["whale vocalization", 10.66], ["rumble", 10.53]], null, [["mains hum", 36.63], ["hum", 32.8], ["rumble", 15.15]], null], "duration": [1.0, 0.89, 0.75, 0.57, 7.8, 0.41, 1.34, 3.35, 0.85, 5.53, -0.05, 5.78, 9.87, 4.51, 2.56, 0.84, 0.13, 0.68, 0.91, 1.12, 1.73, 3.16, 4.32, 0.45, 0.84, 5.94, -0.07, 10.27, 32.67]} \ No newline at end of file diff --git a/annotations_filtered/bQInfO7fE-s_filtered.json b/annotations_filtered/bQInfO7fE-s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..475385a7c591a19bd969638898c2af40c1832315 --- /dev/null +++ b/annotations_filtered/bQInfO7fE-s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 42.09]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [37.09]} \ No newline at end of file diff --git a/annotations_filtered/bQObeZ5R0mc_filtered.json b/annotations_filtered/bQObeZ5R0mc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..31a7255223a7e48c246aabe46bcde648e2374e42 --- /dev/null +++ b/annotations_filtered/bQObeZ5R0mc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.31], [5.0, 13.86], [15.0, 17.66], [18.0, 17.86], [18.0, 18.93], [21.0, 26.11], [31.0, 33.88], [45.0, 46.53], [48.0, 48.32], [51.0, 50.72], [57.0, 62.61], [63.0, 73.13], [74.0, 79.73], [81.0, 82.09]], "keep_status": [false, false, false, false, false, true, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 67.51, 100.0, 0.0, 0.0, 32.61, 76.37, 0.0, 0.0, 0.0, 40.68, 49.54, 49.18, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["livestock, farm animals, working animals", 25.41], ["cattle, bovinae", 19.9], ["moo", 18.24]], null, null, null, null, [["livestock, farm animals, working animals", 15.14], ["animal", 14.22], ["cattle, bovinae", 9.07]], [["fly, housefly", 28.77], ["insect", 16.87], ["frog", 14.18]], [["fly, housefly", 58.23], ["insect", 21.75], ["mosquito", 9.75]], null], "duration": [0.31, 8.86, 2.66, -0.14, 0.93, 5.11, 2.88, 1.53, 0.32, -0.28, 5.61, 10.13, 5.73, 1.09]} \ No newline at end of file diff --git a/annotations_filtered/bQWaXlsdyko_filtered.json b/annotations_filtered/bQWaXlsdyko_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..274fdeb583cecfdd4c4245e6a77d782ed009c8c2 --- /dev/null +++ b/annotations_filtered/bQWaXlsdyko_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.29], [4.0, 5.73], [7.0, 7.48], [10.0, 10.49], [13.0, 13.46], [18.0, 19.03], [21.0, 21.78], [24.0, 29.89], [31.0, 31.13], [32.0, 35.55], [43.0, 49.72], [50.0, 83.89], [95.0, 95.57], [101.0, 101.76], [103.0, 102.98], [108.0, 107.76], [109.0, 112.56], [113.0, 113.43], [114.0, 130.4], [131.0, 131.95], [132.0, 147.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.39, 0.0, 30.3, 31.49, 0.0, 0.0, 0.0, 0.0, 0.0, 51.23, 0.0, 31.54, 0.0, 34.82], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 51.77], ["drum", 11.17], ["musical instrument", 9.26]], null, [["music", 83.46], ["didgeridoo", 6.18], ["musical instrument", 5.26]], [["music", 59.09], ["didgeridoo", 15.38], ["musical instrument", 6.19]], null, null, null, null, null, null, null, [["speech", 68.42], ["fart", 11.25], ["whale vocalization", 4.48]], null, [["fart", 44.27], ["animal", 15.99], ["hum", 4.48]]], "duration": [0.29, 1.73, 0.48, 0.49, 0.46, 1.03, 0.78, 5.89, 0.13, 3.55, 6.72, 33.89, 0.57, 0.76, -0.02, -0.24, 3.56, 0.43, 16.4, 0.95, 15.21]} \ No newline at end of file diff --git a/annotations_filtered/bQXJoR6tLao_filtered.json b/annotations_filtered/bQXJoR6tLao_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ae6f0df5901c0fe2b4b77686974fe9726c80d51 --- /dev/null +++ b/annotations_filtered/bQXJoR6tLao_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.08], [10.0, 10.22], [14.0, 14.74], [17.0, 17.95], [19.0, 19.79], [24.0, 24.92], [27.0, 28.31], [33.0, 42.25], [45.0, 45.2], [50.0, 50.85], [51.0, 52.14], [53.0, 56.07], [67.0, 72.44], [75.0, 83.47], [98.0, 98.12], [105.0, 105.49], [106.0, 105.56], [106.0, 105.83], [107.0, 107.45], [111.0, 115.48], [120.0, 120.39], [121.0, 125.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.16, 0.0, 0.0, 0.0, 58.47, 31.74, 46.47, 0.0, 0.0, 0.0, 0.0, 0.0, 33.39, 0.0, 29.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["moo", 29.05], ["cattle, bovinae", 28.46], ["livestock, farm animals, working animals", 12.58]], [["speech", 30.03], ["creak", 11.71], ["whack, thwack", 10.33]], null, null, null, null, null, [["music", 44.6], ["drum", 7.5], ["musical instrument", 6.63]], null, [["boing", 30.15], ["music", 21.93], ["speech", 5.4]]], "duration": [1.08, 0.22, 0.74, 0.95, 0.79, 0.92, 1.31, 9.25, 0.2, 0.85, 1.14, 3.07, 5.44, 8.47, 0.12, 0.49, -0.44, -0.17, 0.45, 4.48, 0.39, 4.44]} \ No newline at end of file diff --git a/annotations_filtered/bQbH32KcjG0_filtered.json b/annotations_filtered/bQbH32KcjG0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a92362398dec10e1c79bfa2b04b88437b7946d30 --- /dev/null +++ b/annotations_filtered/bQbH32KcjG0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.65], [6.0, 9.32], [11.0, 13.02], [14.0, 18.5], [25.0, 25.59], [26.0, 26.96], [28.0, 29.29], [33.0, 35.06], [36.0, 40.54], [45.0, 47.02], [54.0, 54.68], [57.0, 59.09], [62.0, 64.3], [69.0, 76.33], [92.0, 98.39], [100.0, 104.13], [105.0, 105.87]], "keep_status": [false, false, true, false, false, false, false, true, true, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 57.32, 48.95, 44.66, 0.0, 0.0, 0.0, 37.5, 39.52, 50.51, 0.0, 32.13, 34.62, 35.76, 68.02, 59.24, 0.0], "audiomae_on_audioset": [null, null, [["music", 38.19], ["singing bowl", 19.11], ["pulse", 5.5]], [["theremin", 47.18], ["music", 34.96], ["musical instrument", 2.24]], null, null, null, [["livestock, farm animals, working animals", 13.97], ["moo", 12.67], ["cattle, bovinae", 10.71]], [["music", 38.6], ["guitar", 12.14], ["effects unit", 10.92]], null, null, [["music", 53.74], ["speech", 9.56], ["trombone", 1.69]], [["speech", 23.21], ["music", 13.72], ["cello", 8.19]], [["music", 34.74], ["theremin", 28.71], ["cello", 6.88]], null, null, null], "duration": [0.65, 3.32, 2.02, 4.5, 0.59, 0.96, 1.29, 2.06, 4.54, 2.02, 0.68, 2.09, 2.3, 7.33, 6.39, 4.13, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/bQme3XqjpCk_filtered.json b/annotations_filtered/bQme3XqjpCk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..77a6c42a813003a4e9a4edd61ca4250459cca8de --- /dev/null +++ b/annotations_filtered/bQme3XqjpCk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.72], [5.0, 5.39], [6.0, 13.22], [14.0, 16.6], [18.0, 20.9], [21.0, 27.63], [28.0, 28.73], [29.0, 31.7]], "keep_status": [false, false, true, true, false, false, false, true], "silence_prob": [0.0, 0.0, 40.77, 36.94, 35.32, 36.36, 0.0, 29.25], "audiomae_on_audioset": [null, null, [["music", 34.98], ["hum", 7.75], ["singing bowl", 5.49]], [["music", 46.15], ["ambient music", 9.67], ["theremin", 6.82]], [["music", 64.97], ["synthesizer", 5.73], ["ambient music", 5.13]], [["music", 72.36], ["ambient music", 6.69], ["musical instrument", 3.16]], null, [["music", 56.78], ["theremin", 6.85], ["percussion", 4.79]]], "duration": [0.72, 0.39, 7.22, 2.6, 2.9, 6.63, 0.73, 2.7]} \ No newline at end of file diff --git a/annotations_filtered/bQqcnMHjxvQ_filtered.json b/annotations_filtered/bQqcnMHjxvQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa0f8854820f303e37cd1b8edde66b7b0c9fa683 --- /dev/null +++ b/annotations_filtered/bQqcnMHjxvQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 29.64], [33.0, 33.81], [40.0, 40.42], [49.0, 50.6], [52.0, 52.32], [57.0, 58.53], [61.0, 61.28], [68.0, 73.87], [78.0, 79.42], [85.0, 85.75], [87.0, 87.49], [98.0, 100.03], [106.0, 108.95], [111.0, 111.79], [112.0, 114.47], [115.0, 115.72], [117.0, 117.44], [120.0, 121.31], [123.0, 122.84], [124.0, 123.99], [126.0, 127.18]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, true, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.26, 0.0, 0.0, 0.0, 36.98, 37.25, 0.0, 37.06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 33.49], ["didgeridoo", 14.48], ["speech", 10.37]], null, null, null, [["speech", 38.08], ["buzz", 5.07], ["music", 4.79]], [["music", 77.97], ["didgeridoo", 5.82], ["musical instrument", 2.1]], null, [["music", 30.89], ["speech", 19.31], ["throbbing", 6.56]], null, null, null, null, null, null], "duration": [1.64, 0.81, 0.42, 1.6, 0.32, 1.53, 0.28, 5.87, 1.42, 0.75, 0.49, 2.03, 2.95, 0.79, 2.47, 0.72, 0.44, 1.31, -0.16, -0.01, 1.18]} \ No newline at end of file diff --git a/annotations_filtered/bQzBPo2qRuk_filtered.json b/annotations_filtered/bQzBPo2qRuk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b096205a2d261200ee58e0f8a240a24996940118 --- /dev/null +++ b/annotations_filtered/bQzBPo2qRuk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.65], [14.0, 14.32], [17.0, 19.53], [20.0, 20.71], [22.0, 23.84], [24.0, 25.22], [26.0, 27.19], [28.0, 29.76], [30.0, 40.83]], "keep_status": [false, false, true, false, false, false, false, false, true], "silence_prob": [31.95, 0.0, 33.6, 0.0, 0.0, 0.0, 0.0, 0.0, 43.23], "audiomae_on_audioset": [[["speech", 85.88], ["inside, small room", 1.3], ["music", 1.26]], null, [["speech", 52.57], ["inside, small room", 4.24], ["theremin", 4.22]], null, null, null, null, null, [["livestock, farm animals, working animals", 44.07], ["cattle, bovinae", 8.86], ["speech", 7.64]]], "duration": [2.65, 0.32, 2.53, 0.71, 1.84, 1.22, 1.19, 1.76, 10.83]} \ No newline at end of file diff --git a/annotations_filtered/bQzh5ugYzPg_filtered.json b/annotations_filtered/bQzh5ugYzPg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb5762e876ad0af6853240a071fbb104abc38429 --- /dev/null +++ b/annotations_filtered/bQzh5ugYzPg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.04], [5.0, 5.51], [12.0, 15.4], [28.0, 30.28], [31.0, 31.94], [45.0, 45.15], [45.0, 45.33], [60.0, 60.18], [65.0, 67.9], [74.0, 74.82], [106.0, 105.6], [106.0, 109.16]], "keep_status": [false, false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 36.2, 35.26, 0.0, 0.0, 0.0, 0.0, 33.12, 0.0, 0.0, 35.24], "audiomae_on_audioset": [null, null, [["music", 42.32], ["throbbing", 12.76], ["synthesizer", 6.85]], [["music", 43.38], ["throbbing", 17.08], ["musical instrument", 5.75]], null, null, null, null, [["music", 43.9], ["didgeridoo", 23.78], ["musical instrument", 5.59]], null, null, [["music", 63.41], ["didgeridoo", 5.83], ["speech", 5.08]]], "duration": [0.04, 0.51, 3.4, 2.28, 0.94, 0.15, 0.33, 0.18, 2.9, 0.82, -0.4, 3.16]} \ No newline at end of file diff --git a/annotations_filtered/bR2Uon5BWC0_filtered.json b/annotations_filtered/bR2Uon5BWC0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..74d3c7e7029a950f26cb030664a9865872c76628 --- /dev/null +++ b/annotations_filtered/bR2Uon5BWC0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.66], [3.0, 6.51], [8.0, 13.9], [16.0, 40.98], [42.0, 42.18], [43.0, 43.51], [55.0, 55.56], [57.0, 61.72], [67.0, 67.8], [69.0, 71.22], [77.0, 77.21], [78.0, 79.88], [85.0, 85.13], [88.0, 89.5], [92.0, 92.67], [94.0, 95.44], [96.0, 97.34], [99.0, 105.83], [106.0, 109.49], [110.0, 112.56], [114.0, 114.29], [116.0, 117.46], [120.0, 121.24], [123.0, 124.33], [126.0, 127.23], [128.0, 129.07], [129.0, 129.51]], "keep_status": [false, true, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.62, 31.7, 33.2, 0.0, 0.0, 0.0, 36.98, 0.0, 43.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.13, 42.02, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["thunk", 48.69], ["throbbing", 7.48], ["heart sounds, heartbeat", 6.46]], [["speech", 54.64], ["music", 33.99], ["radio", 1.14]], [["speech", 32.74], ["music", 26.49], ["fly, housefly", 5.32]], null, null, null, [["fly, housefly", 36.37], ["insect", 29.13], ["mosquito", 10.71]], null, [["music", 43.34], ["hum", 11.31], ["throbbing", 10.2]], null, null, null, null, null, null, null, null, [["speech", 37.81], ["sidetone", 22.29], ["radio", 10.19]], null, null, null, null, null, null, null, null], "duration": [-0.34, 3.51, 5.9, 24.98, 0.18, 0.51, 0.56, 4.72, 0.8, 2.22, 0.21, 1.88, 0.13, 1.5, 0.67, 1.44, 1.34, 6.83, 3.49, 2.56, 0.29, 1.46, 1.24, 1.33, 1.23, 1.07, 0.51]} \ No newline at end of file diff --git a/annotations_filtered/bRehxlYZ_CE_filtered.json b/annotations_filtered/bRehxlYZ_CE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95a395255e5dfa5d3eda1ddb7a786908c47a8e01 --- /dev/null +++ b/annotations_filtered/bRehxlYZ_CE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 65.4], [66.0, 68.25]], "keep_status": [false, true], "silence_prob": [0.0, 30.64], "audiomae_on_audioset": [null, [["cattle, bovinae", 13.56], ["moo", 13.15], ["livestock, farm animals, working animals", 10.94]]], "duration": [50.4, 2.25]} \ No newline at end of file diff --git a/annotations_filtered/bRilciIycJQ_filtered.json b/annotations_filtered/bRilciIycJQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..04b7223953410c43eab11a99c7be25977192c44f --- /dev/null +++ b/annotations_filtered/bRilciIycJQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[59.0, 77.09], [80.0, 81.48], [82.0, 85.83], [86.0, 86.54], [87.0, 92.21]], "keep_status": [false, false, false, false, true], "silence_prob": [30.18, 0.0, 31.07, 0.0, 32.4], "audiomae_on_audioset": [[["music", 79.11], ["throbbing", 8.49], ["electronic music", 2.45]], null, [["speech", 62.8], ["explosion", 12.6], ["burst, pop", 3.71]], null, [["whack, thwack", 25.06], ["music", 16.09], ["throbbing", 6.76]]], "duration": [18.09, 1.48, 3.83, 0.54, 5.21]} \ No newline at end of file diff --git a/annotations_filtered/bRzQBGwfMkM_filtered.json b/annotations_filtered/bRzQBGwfMkM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..00148871f69d568419274a4591a55fcdc91a7d4f --- /dev/null +++ b/annotations_filtered/bRzQBGwfMkM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.28], [6.0, 6.29], [12.0, 14.08], [17.0, 17.34], [18.0, 18.55], [19.0, 27.51], [30.0, 31.46], [32.0, 38.06], [39.0, 44.39], [46.0, 46.8], [47.0, 47.01], [47.0, 47.16], [47.0, 51.87], [52.0, 65.43], [66.0, 67.86], [69.0, 70.06]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 96.54, 0.0, 0.0, 37.14, 0.0, 42.81, 94.81, 0.0, 0.0, 0.0, 70.02, 41.09, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["glass", 25.51], ["liquid", 18.92], ["speech", 13.18]], null, [["speech", 59.56], ["tuning fork", 11.33], ["dial tone", 5.84]], null, null, null, null, null, [["speech", 70.33], ["electric shaver, electric razor", 11.82], ["burping, eructation", 5.01]], null, null], "duration": [0.28, 0.29, 2.08, 0.34, 0.55, 8.51, 1.46, 6.06, 5.39, 0.8, 0.01, 0.16, 4.87, 13.43, 1.86, 1.06]} \ No newline at end of file diff --git a/annotations_filtered/bS9N8dEdZCQ_filtered.json b/annotations_filtered/bS9N8dEdZCQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d695d2964a9aa8841167baa352c07ea498ce30a --- /dev/null +++ b/annotations_filtered/bS9N8dEdZCQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.0], [10.0, 10.81], [13.0, 13.12], [16.0, 16.31], [19.0, 22.54], [23.0, 23.36], [27.0, 27.77], [32.0, 32.27], [33.0, 33.4], [34.0, 34.69], [36.0, 47.92], [50.0, 52.12], [54.0, 57.65], [62.0, 62.19], [66.0, 69.15], [71.0, 72.69], [73.0, 78.0], [80.0, 80.38], [82.0, 82.78], [83.0, 84.28], [87.0, 88.28], [89.0, 102.74], [103.0, 110.2], [111.0, 120.31], [121.0, 138.77], [142.0, 148.05], [149.0, 149.45], [151.0, 167.75], [170.0, 169.77], [174.0, 198.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, true, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 97.22, 0.0, 0.0, 0.0, 0.0, 0.0, 81.71, 50.66, 100.0, 0.0, 100.0, 0.0, 74.13, 0.0, 0.0, 0.0, 0.0, 30.24, 31.33, 30.76, 31.94, 32.72, 0.0, 31.13, 0.0, 30.47], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 51.64], ["whack, thwack", 6.79], ["noise", 6.27]], [["music", 25.84], ["speech", 21.27], ["livestock, farm animals, working animals", 10.26]], [["noise", 26.09], ["music", 25.6], ["hum", 3.06]], [["buzz", 28.54], ["fly, housefly", 22.18], ["music", 9.9]], [["music", 58.89], ["hum", 7.0], ["didgeridoo", 5.93]], null, [["speech", 40.18], ["fart", 12.37], ["music", 12.32]], null, [["livestock, farm animals, working animals", 28.81], ["cattle, bovinae", 22.94], ["moo", 14.2]]], "duration": [0.0, 0.81, 0.12, 0.31, 3.54, 0.36, 0.77, 0.27, 0.4, 0.69, 11.92, 2.12, 3.65, 0.19, 3.15, 1.69, 5.0, 0.38, 0.78, 1.28, 1.28, 13.74, 7.2, 9.31, 17.77, 6.05, 0.45, 16.75, -0.23, 24.75]} \ No newline at end of file diff --git a/annotations_filtered/bSDqN3UTrPI_filtered.json b/annotations_filtered/bSDqN3UTrPI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70a97ca1d394d6f67ff9d31648327ed1abb5aa28 --- /dev/null +++ b/annotations_filtered/bSDqN3UTrPI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.98], [7.0, 19.4], [25.0, 55.04], [65.0, 65.5], [66.0, 70.95], [73.0, 83.46], [85.0, 85.92]], "keep_status": [false, false, false, false, false, true, false], "silence_prob": [0.0, 31.59, 0.0, 0.0, 36.85, 30.07, 0.0], "audiomae_on_audioset": [null, [["music", 59.75], ["didgeridoo", 8.62], ["throbbing", 8.1]], null, null, [["music", 52.69], ["didgeridoo", 29.19], ["speech", 4.78]], [["livestock, farm animals, working animals", 28.74], ["music", 19.27], ["moo", 9.05]], null], "duration": [0.98, 12.4, 30.04, 0.5, 4.95, 10.46, 0.92]} \ No newline at end of file diff --git a/annotations_filtered/bSE3gq6Sf6Y_filtered.json b/annotations_filtered/bSE3gq6Sf6Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0247616bf61dad9a9ea4f8866bed108107994e18 --- /dev/null +++ b/annotations_filtered/bSE3gq6Sf6Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 11.01], [11.0, 13.41], [14.0, 17.91], [19.0, 21.27], [23.0, 26.4], [27.0, 46.48], [59.0, 59.37], [62.0, 62.29], [66.0, 65.99], [68.0, 88.08], [90.0, 92.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.71, 96.54, 99.44, 94.66, 96.66, 84.07, 0.0, 0.0, 0.0, 98.99, 99.73], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [10.01, 2.41, 3.91, 2.27, 3.4, 19.48, 0.37, 0.29, -0.01, 20.08, 2.94]} \ No newline at end of file diff --git a/annotations_filtered/bSW_sW_A8pg_filtered.json b/annotations_filtered/bSW_sW_A8pg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea9f4b3f38da17b181549de25ac3545909d4f0bf --- /dev/null +++ b/annotations_filtered/bSW_sW_A8pg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.12], [7.0, 7.96], [9.0, 12.45], [14.0, 16.6], [21.0, 21.22], [27.0, 27.82], [29.0, 31.38], [32.0, 33.29], [34.0, 36.56], [39.0, 39.51], [43.0, 44.78], [45.0, 46.45], [50.0, 50.38], [52.0, 52.25], [54.0, 54.09], [56.0, 55.76], [57.0, 58.31], [60.0, 61.7], [64.0, 65.03], [67.0, 72.49], [75.0, 79.71], [80.0, 82.17], [84.0, 84.92], [85.0, 88.05], [90.0, 93.78], [95.0, 97.36], [99.0, 103.38], [105.0, 105.02], [110.0, 110.74], [112.0, 111.87], [112.0, 119.31], [120.0, 120.95], [123.0, 123.06], [125.0, 124.95], [126.0, 126.35], [127.0, 127.7], [129.0, 134.92], [137.0, 138.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 99.99, 0.0, 0.0, 100.0, 0.0, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.59, 100.0, 0.0, 99.85, 100.0, 100.0, 100.0, 0.0, 0.0, 0.0, 99.78, 0.0, 0.0, 0.0, 0.0, 0.0, 92.48, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.12, 0.96, 3.45, 2.6, 0.22, 0.82, 2.38, 1.29, 2.56, 0.51, 1.78, 1.45, 0.38, 0.25, 0.09, -0.24, 1.31, 1.7, 1.03, 5.49, 4.71, 2.17, 0.92, 3.05, 3.78, 2.36, 4.38, 0.02, 0.74, -0.13, 7.31, 0.95, 0.06, -0.05, 0.35, 0.7, 5.92, 1.15]} \ No newline at end of file diff --git a/annotations_filtered/bSdm_eA1Css_filtered.json b/annotations_filtered/bSdm_eA1Css_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c1626865a154bad63df6d166c65dbe8beda5a2c5 --- /dev/null +++ b/annotations_filtered/bSdm_eA1Css_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 10.64], [15.0, 16.46], [26.0, 26.64], [30.0, 31.01], [39.0, 44.66], [46.0, 46.74], [50.0, 51.09], [58.0, 58.95], [62.0, 65.38], [66.0, 68.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 65.67, 0.0, 0.0, 0.0, 71.57, 90.08], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [-0.36, 1.46, 0.64, 1.01, 5.66, 0.74, 1.09, 0.95, 3.38, 2.08]} \ No newline at end of file diff --git a/annotations_filtered/bSm3d9ftiJA_filtered.json b/annotations_filtered/bSm3d9ftiJA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a0f021fb652408e719cfeaa9b29b70a4ec4adaa --- /dev/null +++ b/annotations_filtered/bSm3d9ftiJA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.04], [10.0, 11.31], [13.0, 12.95], [14.0, 14.88], [17.0, 17.58], [18.0, 18.86], [23.0, 23.72], [30.0, 29.84], [30.0, 31.04], [33.0, 33.96], [35.0, 35.29], [40.0, 41.07], [41.0, 43.43], [49.0, 48.95], [50.0, 51.7], [55.0, 55.65], [57.0, 57.91], [65.0, 66.43], [75.0, 75.76], [80.0, 80.54], [84.0, 84.67], [86.0, 87.32], [88.0, 90.61], [92.0, 93.21], [101.0, 101.34], [103.0, 102.78], [107.0, 106.76], [110.0, 110.39], [112.0, 115.16], [119.0, 139.19], [139.0, 139.35], [139.0, 140.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [67.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.41, 0.0, 0.0, 0.0, 0.0, 0.0, 46.75, 30.36, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 11.63], ["boing", 8.75], ["hum", 8.33]], [["music", 59.96], ["moo", 3.99], ["livestock, farm animals, working animals", 3.95]], null, null], "duration": [2.04, 1.31, -0.05, 0.88, 0.58, 0.86, 0.72, -0.16, 1.04, 0.96, 0.29, 1.07, 2.43, -0.05, 1.7, 0.65, 0.91, 1.43, 0.76, 0.54, 0.67, 1.32, 2.61, 1.21, 0.34, -0.22, -0.24, 0.39, 3.16, 20.19, 0.35, 1.34]} \ No newline at end of file diff --git a/annotations_filtered/bSxuXQCEC7M_filtered.json b/annotations_filtered/bSxuXQCEC7M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ef6fe8e4552bf85b339f96bf4589c98954837a9 --- /dev/null +++ b/annotations_filtered/bSxuXQCEC7M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.46], [19.0, 21.34], [22.0, 22.79], [26.0, 26.15], [27.0, 28.32], [30.0, 30.33], [39.0, 40.78], [41.0, 41.69]], "keep_status": [false, true, false, false, false, false, false, false], "silence_prob": [34.78, 32.41, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 62.55], ["sidetone", 6.4], ["walk, footsteps", 4.66]], [["whack, thwack", 31.68], ["radio", 10.06], ["burst, pop", 6.04]], null, null, null, null, null, null], "duration": [2.46, 2.34, 0.79, 0.15, 1.32, 0.33, 1.78, 0.69]} \ No newline at end of file diff --git a/annotations_filtered/bT6NizTtXug_filtered.json b/annotations_filtered/bT6NizTtXug_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45ed3119c3d101e8c2aea612b753259d3ab31705 --- /dev/null +++ b/annotations_filtered/bT6NizTtXug_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 15.38], [16.0, 39.53], [41.0, 133.93], [136.0, 217.02], [218.0, 220.56], [222.0, 223.74]], "keep_status": [true, true, false, false, false, false], "silence_prob": [42.02, 49.68, 0.0, 0.0, 60.89, 0.0], "audiomae_on_audioset": [[["cattle, bovinae", 14.33], ["livestock, farm animals, working animals", 12.36], ["moo", 12.36]], [["music", 30.0], ["didgeridoo", 24.75], ["hum", 11.37]], null, null, null, null], "duration": [3.38, 23.53, 92.93, 81.02, 2.56, 1.74]} \ No newline at end of file diff --git a/annotations_filtered/bTE69etu_fg_filtered.json b/annotations_filtered/bTE69etu_fg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0fa9eb5b333fd870de33e631762f1368b91097a1 --- /dev/null +++ b/annotations_filtered/bTE69etu_fg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.81], [5.0, 5.0], [6.0, 6.83], [10.0, 11.23], [14.0, 15.04], [17.0, 21.3], [23.0, 23.46], [25.0, 28.73], [30.0, 30.03], [32.0, 32.31], [34.0, 37.72], [38.0, 44.95], [46.0, 46.77], [50.0, 58.73], [61.0, 62.67], [64.0, 65.57], [69.0, 70.87], [73.0, 75.12], [80.0, 80.87], [84.0, 84.75], [87.0, 89.6], [95.0, 95.57], [98.0, 98.66], [102.0, 102.41], [103.0, 104.03], [105.0, 106.95], [108.0, 111.5], [112.0, 114.08], [115.0, 117.31], [120.0, 125.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 93.29, 0.0, 59.96, 0.0, 0.0, 53.28, 51.55, 0.0, 41.56, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 42.88, 0.0, 0.0, 0.0, 0.0, 0.0, 90.78, 89.01, 99.85, 99.95], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 39.31], ["guitar", 9.63], ["musical instrument", 8.11]], null, null, null, null, null, null, [["speech", 31.17], ["sidetone", 10.89], ["busy signal", 5.88]], null, null, null, null, null, null, null, null, null], "duration": [0.81, 0.0, 0.83, 1.23, 1.04, 4.3, 0.46, 3.73, 0.03, 0.31, 3.72, 6.95, 0.77, 8.73, 1.67, 1.57, 1.87, 2.12, 0.87, 0.75, 2.6, 0.57, 0.66, 0.41, 1.03, 1.95, 3.5, 2.08, 2.31, 5.34]} \ No newline at end of file diff --git a/annotations_filtered/bTJAIONGv0Y_filtered.json b/annotations_filtered/bTJAIONGv0Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..35217b743117215697740f6cd76528494c3f8c94 --- /dev/null +++ b/annotations_filtered/bTJAIONGv0Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 8.95], [10.0, 11.5], [17.0, 18.17], [20.0, 21.1], [23.0, 23.73], [34.0, 37.49], [38.0, 39.31], [44.0, 44.49], [46.0, 48.81], [63.0, 65.16], [72.0, 74.65], [80.0, 81.43], [93.0, 95.12], [99.0, 100.36], [111.0, 111.48], [114.0, 114.61], [115.0, 117.1], [118.0, 119.47], [123.0, 122.99], [123.0, 123.55], [126.0, 126.54], [128.0, 129.15], [138.0, 137.94], [138.0, 139.4], [141.0, 142.55], [151.0, 153.71], [156.0, 157.94], [161.0, 163.48], [169.0, 171.85], [174.0, 180.0], [181.0, 185.25], [186.0, 189.41], [190.0, 194.02], [195.0, 196.03]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 31.2, 0.0, 0.0, 29.46, 29.78, 30.59, 0.0, 29.93, 0.0, 0.0, 0.0, 30.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.02, 0.0, 46.15, 62.07, 49.59, 63.21, 53.78, 61.27, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["insect", 49.65], ["fly, housefly", 39.51], ["bee, wasp, etc.", 8.25]], null, null, [["livestock, farm animals, working animals", 33.98], ["cattle, bovinae", 27.08], ["moo", 22.56]], [["livestock, farm animals, working animals", 23.3], ["cattle, bovinae", 15.92], ["insect", 11.84]], [["speech", 22.69], ["music", 18.91], ["didgeridoo", 10.32]], null, [["crackle", 13.93], ["roar", 8.06], ["sidetone", 7.54]], null, null, null, [["insect", 43.66], ["fly, housefly", 38.11], ["bee, wasp, etc.", 9.93]], null, null, null, null, null, null, null, null, null, null, [["speech", 31.75], ["radio", 15.41], ["frying (food)", 5.54]], null, [["mains hum", 26.21], ["hum", 24.69], ["fly, housefly", 5.84]], null, null, null, null], "duration": [-0.05, 1.5, 1.17, 1.1, 0.73, 3.49, 1.31, 0.49, 2.81, 2.16, 2.65, 1.43, 2.12, 1.36, 0.48, 0.61, 2.1, 1.47, -0.01, 0.55, 0.54, 1.15, -0.06, 1.4, 1.55, 2.71, 1.94, 2.48, 2.85, 6.0, 4.25, 3.41, 4.02, 1.03]} \ No newline at end of file diff --git a/annotations_filtered/bTPrlCglvFo_filtered.json b/annotations_filtered/bTPrlCglvFo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d7f1331f2002258241df96f0eec947ca9dd1c0f --- /dev/null +++ b/annotations_filtered/bTPrlCglvFo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.19], [28.0, 28.43], [33.0, 34.21], [35.0, 34.77], [36.0, 40.93], [42.0, 43.06], [52.0, 52.64], [55.0, 58.38], [63.0, 63.61], [79.0, 79.25], [82.0, 82.43], [88.0, 88.45], [92.0, 91.74], [93.0, 93.5], [94.0, 95.55], [116.0, 116.56], [119.0, 124.21], [135.0, 135.73], [144.0, 144.83], [150.0, 150.03], [152.0, 152.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.84, 0.0, 0.0, 39.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.88, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 46.0], ["speech", 20.11], ["stomach rumble", 6.02]], null, null, [["music", 51.74], ["boing", 28.28], ["speech", 6.16]], null, null, null, null, null, null, null, null, [["music", 82.5], ["boing", 3.32], ["speech", 2.86]], null, null, null, null], "duration": [1.19, 0.43, 1.21, -0.23, 4.93, 1.06, 0.64, 3.38, 0.61, 0.25, 0.43, 0.45, -0.26, 0.5, 1.55, 0.56, 5.21, 0.73, 0.83, 0.03, 0.49]} \ No newline at end of file diff --git a/annotations_filtered/bTUrWYv2vtU_filtered.json b/annotations_filtered/bTUrWYv2vtU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ad8498da2b923fdf2a559903f1a4f7374e687fa --- /dev/null +++ b/annotations_filtered/bTUrWYv2vtU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.66], [14.0, 16.14], [19.0, 33.29], [35.0, 36.75], [38.0, 38.65], [41.0, 42.04], [47.0, 48.76], [52.0, 52.84], [53.0, 54.85], [55.0, 57.81], [59.0, 59.76], [62.0, 62.56], [70.0, 73.06], [78.0, 79.25], [81.0, 81.89], [86.0, 87.13], [89.0, 89.77], [94.0, 95.4], [98.0, 101.66], [106.0, 107.45], [109.0, 109.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [87.55, 94.07, 83.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.95, 0.0, 0.0, 89.72, 0.0, 0.0, 0.0, 0.0, 0.0, 72.01, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["sidetone", 39.37], ["speech", 37.45], ["hum", 2.82]], null, null, null, null, null, null, null, null, null, null, null], "duration": [2.66, 2.14, 14.29, 1.75, 0.65, 1.04, 1.76, 0.84, 1.85, 2.81, 0.76, 0.56, 3.06, 1.25, 0.89, 1.13, 0.77, 1.4, 3.66, 1.45, 0.71]} \ No newline at end of file diff --git a/annotations_filtered/bTdvsBKjlbE_filtered.json b/annotations_filtered/bTdvsBKjlbE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e51b3fd2688a05b092353aa90044e2ca3ba2aa01 --- /dev/null +++ b/annotations_filtered/bTdvsBKjlbE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.65], [6.0, 7.94], [10.0, 10.66], [19.0, 27.09], [29.0, 30.99], [33.0, 35.21], [37.0, 39.51], [41.0, 44.12], [47.0, 59.93], [61.0, 63.98], [65.0, 68.3], [74.0, 75.27], [76.0, 84.37], [89.0, 92.03], [94.0, 98.93], [101.0, 101.07], [102.0, 105.71], [108.0, 109.38]], "keep_status": [true, false, false, false, false, true, true, false, false, true, false, false, false, true, false, false, false, false], "silence_prob": [43.4, 0.0, 0.0, 38.2, 0.0, 37.31, 38.7, 76.2, 56.25, 49.09, 44.4, 0.0, 47.35, 39.35, 50.11, 0.0, 53.04, 0.0], "audiomae_on_audioset": [[["animal", 29.54], ["hum", 16.37], ["mains hum", 10.44]], null, null, [["noise", 38.74], ["hum", 21.11], ["mains hum", 13.2]], null, [["speech", 40.38], ["hum", 12.83], ["mains hum", 8.13]], [["frog", 45.73], ["buzz", 6.93], ["croak", 3.97]], null, null, [["hum", 15.86], ["buzz", 11.17], ["animal", 10.13]], [["livestock, farm animals, working animals", 52.16], ["cattle, bovinae", 22.86], ["moo", 18.49]], null, [["frog", 75.35], ["croak", 7.48], ["insect", 3.88]], [["speech", 25.04], ["frog", 15.88], ["hum", 12.85]], null, null, null, null], "duration": [3.65, 1.94, 0.66, 8.09, 1.99, 2.21, 2.51, 3.12, 12.93, 2.98, 3.3, 1.27, 8.37, 3.03, 4.93, 0.07, 3.71, 1.38]} \ No newline at end of file diff --git a/annotations_filtered/bTeYncx1xmI_filtered.json b/annotations_filtered/bTeYncx1xmI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec788a640f3a8301ac90aca115917df61d555a00 --- /dev/null +++ b/annotations_filtered/bTeYncx1xmI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.39], [17.0, 19.08], [21.0, 21.12], [25.0, 33.93], [36.0, 36.76], [38.0, 39.28], [46.0, 50.28], [55.0, 55.14], [57.0, 58.68], [60.0, 63.8], [66.0, 69.36], [71.0, 72.12], [75.0, 75.91], [78.0, 81.01], [81.0, 82.17], [83.0, 83.46], [87.0, 87.52], [97.0, 97.36], [98.0, 99.25], [102.0, 104.31], [105.0, 105.85], [114.0, 114.78], [120.0, 121.98], [123.0, 123.2], [130.0, 132.88], [134.0, 134.27], [135.0, 135.45], [138.0, 138.43], [144.0, 149.2], [150.0, 150.69], [152.0, 153.82], [154.0, 156.15], [162.0, 163.26], [168.0, 169.35], [170.0, 171.56], [175.0, 176.08]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 60.42, 0.0, 33.87, 0.0, 0.0, 34.02, 0.0, 0.0, 99.95, 76.7, 0.0, 0.0, 56.48, 0.0, 0.0, 0.0, 0.0, 0.0, 77.03, 0.0, 0.0, 0.0, 0.0, 68.93, 0.0, 0.0, 0.0, 87.74, 0.0, 0.0, 92.15, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 74.43], ["radio", 5.63], ["whack, thwack", 2.88]], null, null, [["speech", 43.14], ["speech synthesizer", 16.94], ["boing", 7.77]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.39, 2.08, 0.12, 8.93, 0.76, 1.28, 4.28, 0.14, 1.68, 3.8, 3.36, 1.12, 0.91, 3.01, 1.17, 0.46, 0.52, 0.36, 1.25, 2.31, 0.85, 0.78, 1.98, 0.2, 2.88, 0.27, 0.45, 0.43, 5.2, 0.69, 1.82, 2.15, 1.26, 1.35, 1.56, 1.08]} \ No newline at end of file diff --git a/annotations_filtered/bTrFBrULLmM_filtered.json b/annotations_filtered/bTrFBrULLmM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0c6bc8d474c3e89152779b6f90084d779fa119d6 --- /dev/null +++ b/annotations_filtered/bTrFBrULLmM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.51], [11.0, 14.74], [21.0, 21.57], [23.0, 23.5], [26.0, 27.77], [29.0, 29.29], [37.0, 38.01], [42.0, 42.75], [44.0, 44.17], [49.0, 49.17], [51.0, 51.27], [55.0, 58.45], [63.0, 64.84], [66.0, 73.41], [80.0, 80.52], [83.0, 84.69], [86.0, 97.98], [102.0, 103.82], [104.0, 110.94], [112.0, 113.64], [114.0, 117.12], [118.0, 124.88], [125.0, 128.17], [133.0, 134.86], [135.0, 137.13], [138.0, 139.18], [141.0, 141.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 81.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.11, 0.0, 74.92, 0.0, 0.0, 38.31, 0.0, 65.32, 0.0, 83.52, 38.03, 48.14, 0.0, 35.52, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 32.35], ["speech", 30.76], ["throbbing", 6.36]], null, null, null, null, [["music", 48.86], ["theremin", 7.42], ["hum", 6.77]], [["music", 31.78], ["hum", 18.74], ["speech", 17.33]], null, [["speech", 55.77], ["radio", 8.01], ["music", 7.09]], null, null], "duration": [0.51, 3.74, 0.57, 0.5, 1.77, 0.29, 1.01, 0.75, 0.17, 0.17, 0.27, 3.45, 1.84, 7.41, 0.52, 1.69, 11.98, 1.82, 6.94, 1.64, 3.12, 6.88, 3.17, 1.86, 2.13, 1.18, 0.71]} \ No newline at end of file diff --git a/annotations_filtered/bVKJscj58DI_filtered.json b/annotations_filtered/bVKJscj58DI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e9e2af983fbc2c5cadebfacfcf1c303ea48747f2 --- /dev/null +++ b/annotations_filtered/bVKJscj58DI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 30.64], [31.0, 31.68], [35.0, 35.51], [36.0, 36.83], [37.0, 37.79], [47.0, 50.04], [51.0, 56.4], [58.0, 58.46], [61.0, 61.32], [63.0, 64.22], [65.0, 66.07], [66.0, 71.81], [73.0, 77.26], [78.0, 79.02], [79.0, 92.43], [97.0, 107.59], [124.0, 123.97], [140.0, 140.49], [142.0, 142.2], [153.0, 154.63], [164.0, 164.69], [172.0, 172.23]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false], "silence_prob": [29.93, 0.0, 0.0, 0.0, 0.0, 43.43, 36.61, 0.0, 0.0, 0.0, 0.0, 30.74, 29.0, 0.0, 29.19, 29.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 31.91], ["music", 23.72], ["breaking", 7.1]], null, null, null, null, [["speech", 72.02], ["thunk", 2.12], ["fly, housefly", 1.96]], [["speech", 62.39], ["beatboxing", 18.25], ["frog", 3.45]], null, null, null, null, [["speech", 30.77], ["whale vocalization", 11.01], ["cattle, bovinae", 10.4]], [["cattle, bovinae", 32.14], ["moo", 23.08], ["livestock, farm animals, working animals", 21.1]], null, [["music", 40.88], ["speech", 11.75], ["moo", 5.96]], [["music", 39.39], ["speech", 35.79], ["foghorn", 3.56]], null, null, null, null, null, null], "duration": [24.64, 0.68, 0.51, 0.83, 0.79, 3.04, 5.4, 0.46, 0.32, 1.22, 1.07, 5.81, 4.26, 1.02, 13.43, 10.59, -0.03, 0.49, 0.2, 1.63, 0.69, 0.23]} \ No newline at end of file diff --git a/annotations_filtered/bW0aNTB523c_filtered.json b/annotations_filtered/bW0aNTB523c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3968fac313e18464a44a1a4a2549d03500367341 --- /dev/null +++ b/annotations_filtered/bW0aNTB523c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 43.06], [44.0, 57.89], [58.0, 65.23], [70.0, 71.47]], "keep_status": [false, false, true, false], "silence_prob": [45.43, 63.74, 38.11, 0.0], "audiomae_on_audioset": [[["speech", 48.05], ["hum", 17.13], ["mains hum", 10.15]], null, [["sidetone", 23.81], ["speech", 18.54], ["hum", 16.31]], null], "duration": [19.06, 13.89, 7.23, 1.47]} \ No newline at end of file diff --git a/annotations_filtered/bWJkPbBOXL4_filtered.json b/annotations_filtered/bWJkPbBOXL4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ebd559b6dbbda9800c6499867d9c999d927906db --- /dev/null +++ b/annotations_filtered/bWJkPbBOXL4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.33], [13.0, 14.44], [17.0, 17.81], [19.0, 19.43], [22.0, 22.47], [27.0, 28.21], [29.0, 31.26], [32.0, 35.41], [39.0, 39.95], [41.0, 41.76], [43.0, 43.61], [44.0, 43.87], [45.0, 46.41], [50.0, 50.67], [52.0, 52.93], [60.0, 60.54], [63.0, 63.81], [65.0, 65.87], [66.0, 67.41], [69.0, 70.33], [71.0, 71.37], [73.0, 73.26], [82.0, 82.88], [85.0, 87.0], [91.0, 92.74], [103.0, 103.77], [105.0, 106.81], [108.0, 109.02], [112.0, 112.95], [118.0, 118.1], [121.0, 121.61], [122.0, 122.32], [124.0, 124.21]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.87, 50.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["hum", 12.19], ["fly, housefly", 10.51], ["throbbing", 5.93]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 64.16], ["fly, housefly", 2.33], ["animal", 2.18]], null, null, null, null, null, null, null, null, null], "duration": [1.33, 1.44, 0.81, 0.43, 0.47, 1.21, 2.26, 3.41, 0.95, 0.76, 0.61, -0.13, 1.41, 0.67, 0.93, 0.54, 0.81, 0.87, 1.41, 1.33, 0.37, 0.26, 0.88, 2.0, 1.74, 0.77, 1.81, 1.02, 0.95, 0.1, 0.61, 0.32, 0.21]} \ No newline at end of file diff --git a/annotations_filtered/bWQ1ekGzhwU_filtered.json b/annotations_filtered/bWQ1ekGzhwU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb7fd7fd3f0c5832add7e99727151cef41f0a38d --- /dev/null +++ b/annotations_filtered/bWQ1ekGzhwU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 20.41], [24.0, 25.34], [28.0, 28.54], [29.0, 38.2], [39.0, 53.76], [57.0, 61.26], [62.0, 74.22], [75.0, 75.98], [79.0, 106.76], [110.0, 110.76]], "keep_status": [true, false, false, false, true, false, true, false, true, false], "silence_prob": [29.32, 0.0, 0.0, 29.56, 28.64, 30.99, 28.5, 0.0, 28.38, 0.0], "audiomae_on_audioset": [[["music", 36.74], ["musical instrument", 10.0], ["didgeridoo", 8.18]], null, null, [["speech", 45.89], ["vehicle", 32.93], ["car", 3.6]], [["speech", 40.83], ["vehicle", 11.64], ["civil defense siren", 5.89]], [["speech", 64.78], ["vehicle", 14.57], ["aircraft", 3.4]], [["music", 53.59], ["hum", 4.23], ["cacophony", 3.09]], null, [["speech", 26.04], ["music", 16.97], ["vehicle", 14.3]], null], "duration": [9.41, 1.34, 0.54, 9.2, 14.76, 4.26, 12.22, 0.98, 27.76, 0.76]} \ No newline at end of file diff --git a/annotations_filtered/bWaxWtgjY1g_filtered.json b/annotations_filtered/bWaxWtgjY1g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c4d1ce92c578274192b093670f25285af40f8d4c --- /dev/null +++ b/annotations_filtered/bWaxWtgjY1g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.53], [12.0, 12.55], [35.0, 36.15], [41.0, 43.55], [45.0, 46.5], [54.0, 56.4], [59.0, 59.37], [66.0, 73.53], [75.0, 74.97], [76.0, 77.01], [78.0, 78.44], [80.0, 84.54], [104.0, 103.87], [104.0, 105.9], [107.0, 106.78], [107.0, 107.69], [108.0, 109.73], [112.0, 113.26], [114.0, 115.32], [116.0, 115.87], [116.0, 117.76], [122.0, 126.01]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 44.96, 0.0, 53.91, 0.0, 38.45, 0.0, 0.0, 0.0, 39.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.33], "audiomae_on_audioset": [null, null, null, [["hum", 33.91], ["mains hum", 29.84], ["whale vocalization", 9.99]], null, null, null, [["music", 54.18], ["musical instrument", 7.35], ["guitar", 6.25]], null, null, null, [["music", 56.99], ["hum", 5.88], ["musical instrument", 5.57]], null, null, null, null, null, null, null, null, null, [["music", 58.74], ["hum", 7.65], ["synthesizer", 5.28]]], "duration": [0.53, 0.55, 1.15, 2.55, 1.5, 2.4, 0.37, 7.53, -0.03, 1.01, 0.44, 4.54, -0.13, 1.9, -0.22, 0.69, 1.73, 1.26, 1.32, -0.13, 1.76, 4.01]} \ No newline at end of file diff --git a/annotations_filtered/bWm1GC01kGo_filtered.json b/annotations_filtered/bWm1GC01kGo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aea8b98011133894461796b333db5e5b260d95b1 --- /dev/null +++ b/annotations_filtered/bWm1GC01kGo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.94], [7.0, 8.46], [9.0, 9.21], [11.0, 11.42], [12.0, 12.41], [13.0, 14.81], [18.0, 18.18], [19.0, 20.28], [21.0, 21.56], [22.0, 23.46], [24.0, 24.39], [26.0, 26.27], [29.0, 30.06], [31.0, 32.41], [34.0, 34.99], [38.0, 39.01], [42.0, 45.44], [46.0, 53.55], [55.0, 56.13], [57.0, 58.33], [59.0, 58.97], [59.0, 65.52], [66.0, 66.85], [68.0, 68.67], [70.0, 70.97], [74.0, 75.9], [77.0, 79.32], [80.0, 85.4], [86.0, 86.04], [88.0, 88.3], [89.0, 89.48], [90.0, 90.26], [91.0, 91.81], [93.0, 103.27], [104.0, 105.27], [108.0, 110.86], [113.0, 114.76], [116.0, 116.23], [120.0, 120.24], [124.0, 124.44], [125.0, 143.26], [145.0, 145.49], [146.0, 145.67], [148.0, 148.27], [150.0, 150.43], [152.0, 154.25], [156.0, 156.03], [160.0, 162.06], [164.0, 168.0], [168.0, 169.52], [175.0, 177.62], [178.0, 182.66], [185.0, 185.52], [188.0, 188.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.37, 47.23, 0.0, 0.0, 0.0, 60.23, 0.0, 0.0, 0.0, 0.0, 90.6, 70.02, 0.0, 0.0, 0.0, 0.0, 0.0, 54.36, 0.0, 56.33, 0.0, 0.0, 0.0, 0.0, 31.72, 0.0, 0.0, 0.0, 0.0, 41.68, 0.0, 36.34, 46.15, 0.0, 54.56, 48.69, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 15.51], ["fly, housefly", 11.51], ["radio", 11.48]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["animal", 12.18], ["siren", 10.72], ["noise", 10.54]], null, null, null, null, [["mains hum", 19.42], ["speech", 11.64], ["hum", 10.32]], null, [["bark", 29.13], ["dog", 14.78], ["animal", 11.0]], [["speech", 50.9], ["sidetone", 15.42], ["radio", 7.05]], null, null, [["speech", 61.36], ["whale vocalization", 3.69], ["stomach rumble", 3.26]], null, null], "duration": [1.94, 1.46, 0.21, 0.42, 0.41, 1.81, 0.18, 1.28, 0.56, 1.46, 0.39, 0.27, 1.06, 1.41, 0.99, 1.01, 3.44, 7.55, 1.13, 1.33, -0.03, 6.52, 0.85, 0.67, 0.97, 1.9, 2.32, 5.4, 0.04, 0.3, 0.48, 0.26, 0.81, 10.27, 1.27, 2.86, 1.76, 0.23, 0.24, 0.44, 18.26, 0.49, -0.33, 0.27, 0.43, 2.25, 0.03, 2.06, 4.0, 1.52, 2.62, 4.66, 0.52, 0.32]} \ No newline at end of file diff --git a/annotations_filtered/bWo3nlFcH5k_filtered.json b/annotations_filtered/bWo3nlFcH5k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a8cae889245a729228224d4ab9f33d59410a3118 --- /dev/null +++ b/annotations_filtered/bWo3nlFcH5k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.21], [8.0, 8.45], [9.0, 10.15], [16.0, 18.42], [19.0, 20.38], [22.0, 23.09], [26.0, 26.2], [27.0, 26.86], [30.0, 30.62], [31.0, 33.49], [39.0, 39.85], [44.0, 44.96], [46.0, 46.31], [48.0, 49.64], [53.0, 52.95], [54.0, 54.45], [58.0, 58.33], [60.0, 60.49], [61.0, 61.69], [63.0, 63.51], [67.0, 68.82], [72.0, 73.82], [74.0, 80.77], [83.0, 83.32], [84.0, 85.21], [86.0, 87.37], [92.0, 93.02], [96.0, 96.62], [97.0, 97.19], [98.0, 98.61], [99.0, 99.37], [100.0, 100.48], [101.0, 106.74], [108.0, 109.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.95, 0.0, 0.0, 0.0, 0.0, 0.0, 85.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.66, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.21, 0.45, 1.15, 2.42, 1.38, 1.09, 0.2, -0.14, 0.62, 2.49, 0.85, 0.96, 0.31, 1.64, -0.05, 0.45, 0.33, 0.49, 0.69, 0.51, 1.82, 1.82, 6.77, 0.32, 1.21, 1.37, 1.02, 0.62, 0.19, 0.61, 0.37, 0.48, 5.74, 1.75]} \ No newline at end of file diff --git a/annotations_filtered/bWr67LK9-Uo_filtered.json b/annotations_filtered/bWr67LK9-Uo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/bWr67LK9-Uo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/bX-o8WaWp2Q_filtered.json b/annotations_filtered/bX-o8WaWp2Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a26918239f8c2e7e075ce3f82a95ac986ccdf58f --- /dev/null +++ b/annotations_filtered/bX-o8WaWp2Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.26], [31.0, 31.43], [44.0, 48.93], [53.0, 53.84], [56.0, 56.96], [58.0, 59.29], [60.0, 61.75], [73.0, 72.84], [73.0, 73.53], [76.0, 76.79], [78.0, 78.56], [80.0, 82.17], [85.0, 87.42], [89.0, 95.67], [99.0, 129.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 52.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.93, 43.56, 35.22, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 64.91], ["electronic music", 5.64], ["throbbing", 4.16]], [["music", 67.57], ["house music", 4.4], ["electronic music", 3.92]], null], "duration": [0.26, 0.43, 4.93, 0.84, 0.96, 1.29, 1.75, -0.16, 0.53, 0.79, 0.56, 2.17, 2.42, 6.67, 30.51]} \ No newline at end of file diff --git a/annotations_filtered/bX6BKxFkU78_filtered.json b/annotations_filtered/bX6BKxFkU78_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8f1674b3748178ddaaa508bf8e83130f653d35d2 --- /dev/null +++ b/annotations_filtered/bX6BKxFkU78_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.04], [9.0, 11.3], [12.0, 11.82], [12.0, 13.95], [14.0, 14.59], [15.0, 15.62], [18.0, 19.82], [22.0, 22.91], [25.0, 26.62], [28.0, 28.81], [32.0, 33.02], [39.0, 39.18], [43.0, 44.15], [47.0, 47.51], [50.0, 50.94], [53.0, 53.62], [73.0, 73.01], [75.0, 75.37], [76.0, 76.23], [78.0, 79.44], [80.0, 82.75], [84.0, 84.87], [87.0, 92.2], [94.0, 95.0], [97.0, 97.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 39.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.57, 0.0, 88.46, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 56.79], ["sidetone", 14.6], ["hum", 5.56]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.04, 2.3, -0.18, 1.95, 0.59, 0.62, 1.82, 0.91, 1.62, 0.81, 1.02, 0.18, 1.15, 0.51, 0.94, 0.62, 0.01, 0.37, 0.23, 1.44, 2.75, 0.87, 5.2, 1.0, 0.17]} \ No newline at end of file diff --git a/annotations_filtered/bXEglx-or6k_filtered.json b/annotations_filtered/bXEglx-or6k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..01c3b6488dac0125ea8994e6e84dde709a42ab90 --- /dev/null +++ b/annotations_filtered/bXEglx-or6k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.8], [25.0, 25.79], [29.0, 29.4], [37.0, 38.48]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [0.8, 0.79, 0.4, 1.48]} \ No newline at end of file diff --git a/annotations_filtered/bXRv0TjJQZ0_filtered.json b/annotations_filtered/bXRv0TjJQZ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d2fc74658e766164ecbefc6f47c43710fcebd58 --- /dev/null +++ b/annotations_filtered/bXRv0TjJQZ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 24.34], [26.0, 29.3], [30.0, 30.86], [32.0, 35.53], [36.0, 49.82], [51.0, 52.89], [54.0, 54.18], [55.0, 56.96], [58.0, 68.17], [69.0, 74.88], [76.0, 79.19], [80.0, 86.16], [87.0, 91.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 100.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 100.0, 100.0, 100.0, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.34, 3.3, 0.86, 3.53, 13.82, 1.89, 0.18, 1.96, 10.17, 5.88, 3.19, 6.16, 4.29]} \ No newline at end of file diff --git a/annotations_filtered/bXS1LMaU7TM_filtered.json b/annotations_filtered/bXS1LMaU7TM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c481025b8da7d043296eaf212dcbb0b079533b65 --- /dev/null +++ b/annotations_filtered/bXS1LMaU7TM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.51], [5.0, 7.69], [8.0, 11.21], [13.0, 13.95], [15.0, 15.16], [16.0, 18.99], [21.0, 21.73], [28.0, 29.52], [42.0, 42.5], [44.0, 45.82], [47.0, 48.24], [52.0, 51.9], [52.0, 52.39], [63.0, 62.99], [67.0, 67.73], [69.0, 70.12], [72.0, 72.76], [82.0, 82.44], [99.0, 99.72], [102.0, 103.13], [109.0, 108.99], [110.0, 110.66], [115.0, 115.92], [118.0, 118.64], [124.0, 125.64], [131.0, 132.81], [133.0, 133.59], [134.0, 136.75], [139.0, 139.08], [141.0, 141.89], [145.0, 147.45], [152.0, 157.89], [159.0, 162.84], [164.0, 165.01]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, true, false], "silence_prob": [0.0, 60.14, 61.47, 0.0, 0.0, 39.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.47, 0.0, 0.0, 29.86, 30.41, 29.65, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 43.36], ["theremin", 6.95], ["musical instrument", 6.72]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 16.57], ["moo", 10.22], ["mosquito", 7.96]], null, null, [["music", 47.79], ["theremin", 4.3], ["didgeridoo", 2.15]], [["music", 63.42], ["theremin", 27.6], ["didgeridoo", 0.89]], [["music", 46.1], ["chant", 7.53], ["opera", 5.65]], null], "duration": [0.51, 2.69, 3.21, 0.95, 0.16, 2.99, 0.73, 1.52, 0.5, 1.82, 1.24, -0.1, 0.39, -0.01, 0.73, 1.12, 0.76, 0.44, 0.72, 1.13, -0.01, 0.66, 0.92, 0.64, 1.64, 1.81, 0.59, 2.75, 0.08, 0.89, 2.45, 5.89, 3.84, 1.01]} \ No newline at end of file diff --git a/annotations_filtered/bXYobuaTjNs_filtered.json b/annotations_filtered/bXYobuaTjNs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3efe80e835470b66113397d7efa8b1d52cc8032 --- /dev/null +++ b/annotations_filtered/bXYobuaTjNs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.28], [21.0, 21.84], [26.0, 47.12], [48.0, 70.6], [71.0, 73.03]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.72, 31.15, 32.28], "audiomae_on_audioset": [null, null, [["music", 48.22], ["speech", 25.85], ["hum", 5.46]], [["music", 56.99], ["throbbing", 13.44], ["hum", 12.47]], [["music", 81.06], ["musical instrument", 4.05], ["guitar", 3.49]]], "duration": [1.28, 0.84, 21.12, 22.6, 2.03]} \ No newline at end of file diff --git a/annotations_filtered/bXZFFinWVYw_filtered.json b/annotations_filtered/bXZFFinWVYw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..46868c3a39018767b5b6764340bc2768282faf2c --- /dev/null +++ b/annotations_filtered/bXZFFinWVYw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.64], [8.0, 10.29], [12.0, 11.89], [16.0, 16.31], [18.0, 18.62], [20.0, 20.28], [29.0, 29.64], [30.0, 30.45], [32.0, 31.82], [34.0, 34.23], [35.0, 35.99], [37.0, 37.42], [39.0, 40.15], [41.0, 41.2], [44.0, 44.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.1, 92.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.64, 2.29, -0.11, 0.31, 0.62, 0.28, 0.64, 0.45, -0.18, 0.23, 0.99, 0.42, 1.15, 0.2, 0.61]} \ No newline at end of file diff --git a/annotations_filtered/bXq3dytL6ZA_filtered.json b/annotations_filtered/bXq3dytL6ZA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..190e18bbd6ddab1d2d55577b9c1d23534a31b5c7 --- /dev/null +++ b/annotations_filtered/bXq3dytL6ZA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 9.54], [10.0, 12.01], [13.0, 14.08], [15.0, 15.89], [17.0, 19.62], [22.0, 22.27], [23.0, 24.43], [26.0, 27.13], [29.0, 29.84], [35.0, 35.77], [38.0, 40.0], [41.0, 42.23], [46.0, 47.71], [49.0, 50.03], [52.0, 54.72], [56.0, 87.61], [89.0, 89.85], [92.0, 106.98], [111.0, 130.71], [131.0, 130.82], [131.0, 130.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [73.36, 70.86, 0.0, 0.0, 59.51, 0.0, 0.0, 0.0, 0.0, 0.0, 64.97, 0.0, 0.0, 0.0, 44.29, 0.0, 0.0, 29.13, 29.55, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 65.46], ["theremin", 4.24], ["synthesizer", 3.59]], null, null, [["vehicle", 13.13], ["car", 10.31], ["music", 7.9]], [["music", 49.24], ["cacophony", 6.95], ["throbbing", 5.81]], null, null], "duration": [4.54, 2.01, 1.08, 0.89, 2.62, 0.27, 1.43, 1.13, 0.84, 0.77, 2.0, 1.23, 1.71, 1.03, 2.72, 31.61, 0.85, 14.98, 19.71, -0.18, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/bXt-KqvrSh0_filtered.json b/annotations_filtered/bXt-KqvrSh0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..212ec3ccf045e8a9c3be152fb78d1b1c6c48e5cb --- /dev/null +++ b/annotations_filtered/bXt-KqvrSh0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.02], [5.0, 5.31], [14.0, 15.75], [16.0, 16.97], [19.0, 20.17], [21.0, 20.95], [23.0, 29.59], [33.0, 33.22], [34.0, 35.68]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [90.25, 0.0, 0.0, 0.0, 0.0, 0.0, 53.22, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [2.02, 0.31, 1.75, 0.97, 1.17, -0.05, 6.59, 0.22, 1.68]} \ No newline at end of file diff --git a/annotations_filtered/bXtvpRR4VbA_filtered.json b/annotations_filtered/bXtvpRR4VbA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f9705c6bb72997472d6a2dee778c09c90249f271 --- /dev/null +++ b/annotations_filtered/bXtvpRR4VbA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.79], [3.0, 4.35], [9.0, 10.17], [20.0, 19.87], [29.0, 29.79], [30.0, 30.75], [32.0, 32.31], [35.0, 36.41], [38.0, 39.65], [42.0, 41.93], [42.0, 43.77], [44.0, 46.01], [51.0, 53.11], [55.0, 55.98], [57.0, 61.87], [79.0, 78.85], [80.0, 79.71], [81.0, 80.65], [88.0, 89.21], [92.0, 92.72], [97.0, 97.8], [99.0, 99.99], [106.0, 107.06], [108.0, 108.58], [110.0, 112.5], [113.0, 114.08], [115.0, 116.46], [121.0, 121.27], [124.0, 124.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.76, 69.61, 0.0, 81.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.8, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.79, 1.35, 1.17, -0.13, 0.79, 0.75, 0.31, 1.41, 1.65, -0.07, 1.77, 2.01, 2.11, 0.98, 4.87, -0.15, -0.29, -0.35, 1.21, 0.72, 0.8, 0.99, 1.06, 0.58, 2.5, 1.08, 1.46, 0.27, 0.73]} \ No newline at end of file diff --git a/annotations_filtered/bXy8AgE7jBo_filtered.json b/annotations_filtered/bXy8AgE7jBo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cae6a6215bfd326263d6d9ff45e7d16eebfba194 --- /dev/null +++ b/annotations_filtered/bXy8AgE7jBo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 31.77], [33.0, 33.61], [35.0, 35.94], [37.0, 37.07], [39.0, 43.46], [49.0, 49.13], [51.0, 52.07], [55.0, 56.69], [58.0, 61.47], [63.0, 64.13], [65.0, 70.8], [71.0, 73.97], [75.0, 79.95], [82.0, 86.09], [88.0, 88.57], [90.0, 92.38], [95.0, 95.52], [98.0, 99.62], [100.0, 110.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 82.07, 0.0, 0.0, 0.0, 52.16, 0.0, 51.99, 40.34, 40.02, 44.87, 0.0, 45.02, 0.0, 0.0, 36.56], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 38.26], ["hum", 11.55], ["mains hum", 4.36]], [["insect", 33.7], ["fly, housefly", 30.82], ["bee, wasp, etc.", 8.85]], [["speech", 19.31], ["fly, housefly", 16.35], ["hum", 8.43]], null, [["speech", 28.33], ["sidetone", 26.1], ["radio", 13.68]], null, null, [["speech", 48.38], ["burst, pop", 9.04], ["explosion", 5.59]]], "duration": [0.77, 0.61, 0.94, 0.07, 4.46, 0.13, 1.07, 1.69, 3.47, 1.13, 5.8, 2.97, 4.95, 4.09, 0.57, 2.38, 0.52, 1.62, 10.4]} \ No newline at end of file diff --git a/annotations_filtered/bXzp-98u468_filtered.json b/annotations_filtered/bXzp-98u468_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a8eb0d68318feca463d00b3301a9bb6c179fb057 --- /dev/null +++ b/annotations_filtered/bXzp-98u468_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.0], [10.0, 11.21], [16.0, 16.73], [23.0, 24.38], [26.0, 26.43], [29.0, 29.44], [30.0, 30.92], [34.0, 34.32], [36.0, 36.69], [39.0, 39.83], [41.0, 42.25], [46.0, 45.82], [49.0, 49.22], [50.0, 51.19], [54.0, 54.51], [57.0, 57.69], [75.0, 75.37], [82.0, 83.35], [90.0, 90.21], [92.0, 94.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.16], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.0, 1.21, 0.73, 1.38, 0.43, 0.44, 0.92, 0.32, 0.69, 0.83, 1.25, -0.18, 0.22, 1.19, 0.51, 0.69, 0.37, 1.35, 0.21, 2.47]} \ No newline at end of file diff --git a/annotations_filtered/bY-jTccddQo_filtered.json b/annotations_filtered/bY-jTccddQo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..521ed3a25d9068d6f4da269d19c721f942bfa4ba --- /dev/null +++ b/annotations_filtered/bY-jTccddQo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.52], [5.0, 13.91], [15.0, 18.05], [19.0, 19.6], [26.0, 30.21], [41.0, 41.54], [46.0, 47.04], [48.0, 54.14], [58.0, 63.19], [66.0, 66.65], [73.0, 77.04], [79.0, 80.84], [94.0, 95.42]], "keep_status": [false, true, true, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 29.33, 28.67, 0.0, 28.71, 0.0, 0.0, 28.17, 36.14, 0.0, 50.26, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 33.54], ["speech", 27.53], ["electric shaver, electric razor", 5.26]], [["music", 25.0], ["throbbing", 10.21], ["hum", 8.52]], null, [["speech", 85.74], ["music", 3.67], ["sound effect", 0.95]], null, null, [["livestock, farm animals, working animals", 35.21], ["cattle, bovinae", 20.76], ["speech", 10.04]], [["hum", 38.21], ["mains hum", 22.91], ["throbbing", 11.81]], null, null, null, null], "duration": [0.52, 8.91, 3.05, 0.6, 4.21, 0.54, 1.04, 6.14, 5.19, 0.65, 4.04, 1.84, 1.42]} \ No newline at end of file diff --git a/annotations_filtered/bY6jLt3owBQ_filtered.json b/annotations_filtered/bY6jLt3owBQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45fdde5c2c2909e09907360a60475143461a2b9c --- /dev/null +++ b/annotations_filtered/bY6jLt3owBQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.34], [8.0, 8.77], [23.0, 23.31], [27.0, 27.4], [29.0, 37.07], [48.0, 48.41], [53.0, 101.02], [106.0, 124.43]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 43.69, 0.0, 0.0, 31.62], "audiomae_on_audioset": [null, null, null, null, [["music", 61.21], ["synthesizer", 9.79], ["electronic music", 2.81]], null, null, [["music", 79.77], ["electronic music", 1.25], ["musical instrument", 1.16]]], "duration": [1.34, 0.77, 0.31, 0.4, 8.07, 0.41, 48.02, 18.43]} \ No newline at end of file diff --git a/annotations_filtered/bYO_AhZaG24_filtered.json b/annotations_filtered/bYO_AhZaG24_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eff6993b7ecabc56ad16a378b550dae922803203 --- /dev/null +++ b/annotations_filtered/bYO_AhZaG24_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.28], [22.0, 22.57], [24.0, 27.28], [30.0, 31.08], [33.0, 35.36], [39.0, 60.39], [63.0, 87.49], [94.0, 102.74], [106.0, 113.63], [115.0, 119.28], [124.0, 136.04]], "keep_status": [false, false, false, false, true, false, false, false, true, true, true], "silence_prob": [0.0, 0.0, 32.08, 0.0, 31.32, 30.47, 31.22, 32.75, 31.33, 32.06, 33.56], "audiomae_on_audioset": [null, null, [["speech", 51.74], ["music", 16.84], ["musical instrument", 3.63]], null, [["whoosh, swoosh, swish", 12.17], ["fly, housefly", 11.62], ["whip", 10.87]], [["music", 62.78], ["speech", 13.09], ["boing", 6.44]], [["music", 58.28], ["throbbing", 8.47], ["electronic music", 6.75]], [["music", 34.66], ["sidetone", 28.68], ["speech", 15.71]], [["music", 56.65], ["buzz", 6.33], ["boing", 5.59]], [["music", 23.7], ["explosion", 16.08], ["speech", 11.56]], [["music", 60.99], ["theremin", 3.61], ["synthesizer", 3.53]]], "duration": [1.28, 0.57, 3.28, 1.08, 2.36, 21.39, 24.49, 8.74, 7.63, 4.28, 12.04]} \ No newline at end of file diff --git a/annotations_filtered/bYQjcjDeGF4_filtered.json b/annotations_filtered/bYQjcjDeGF4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..642b18c5663813326ad500762a93c151ad2f2284 --- /dev/null +++ b/annotations_filtered/bYQjcjDeGF4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.68], [13.0, 15.18], [16.0, 21.09], [22.0, 25.84], [27.0, 27.26], [29.0, 29.94], [32.0, 33.44], [35.0, 36.17], [39.0, 40.02], [43.0, 43.09], [45.0, 45.5], [47.0, 48.69], [52.0, 54.01], [55.0, 57.94], [59.0, 66.78], [68.0, 70.38], [72.0, 71.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 99.78, 99.4, 98.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.78, 99.91, 97.83, 95.37, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.68, 2.18, 5.09, 3.84, 0.26, 0.94, 1.44, 1.17, 1.02, 0.09, 0.5, 1.69, 2.01, 2.94, 7.78, 2.38, -0.05]} \ No newline at end of file diff --git a/annotations_filtered/bYUJuCsymVM_filtered.json b/annotations_filtered/bYUJuCsymVM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..474b3a6788d270011d34edc6c82087645b6ed359 --- /dev/null +++ b/annotations_filtered/bYUJuCsymVM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 16.34], [17.0, 25.86], [27.0, 37.03], [41.0, 41.62], [45.0, 44.73], [47.0, 49.33], [52.0, 55.16], [59.0, 77.14], [80.0, 105.71]], "keep_status": [false, false, false, false, false, false, true, true, true], "silence_prob": [45.88, 33.96, 64.41, 0.0, 0.0, 88.83, 30.29, 29.52, 30.93], "audiomae_on_audioset": [[["music", 36.45], ["speech", 29.79], ["didgeridoo", 7.92]], [["music", 73.99], ["synthesizer", 7.3], ["didgeridoo", 1.83]], null, null, null, null, [["music", 30.11], ["cacophony", 12.74], ["throbbing", 8.4]], [["speech", 31.82], ["music", 24.77], ["hum", 6.4]], [["music", 45.4], ["hum", 17.31], ["mains hum", 7.21]]], "duration": [2.34, 8.86, 10.03, 0.62, -0.27, 2.33, 3.16, 18.14, 25.71]} \ No newline at end of file diff --git a/annotations_filtered/bYVsnJR_f80_filtered.json b/annotations_filtered/bYVsnJR_f80_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ffc3d37e4582c0a09a9fabf3551b71240d9a2a1 --- /dev/null +++ b/annotations_filtered/bYVsnJR_f80_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.13], [10.0, 10.2], [12.0, 13.05], [15.0, 18.69], [24.0, 24.53], [25.0, 29.19], [31.0, 33.27], [41.0, 45.35], [45.0, 45.5], [46.0, 46.26], [52.0, 55.29], [56.0, 59.36], [61.0, 63.78], [66.0, 66.34], [71.0, 71.12], [77.0, 81.41], [105.0, 106.89], [112.0, 112.31], [115.0, 120.87], [122.0, 126.57], [132.0, 134.13], [143.0, 142.99], [144.0, 150.99], [152.0, 152.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 47.74, 0.0, 34.86, 38.23, 30.45, 0.0, 0.0, 31.25, 33.68, 40.45, 0.0, 0.0, 30.23, 0.0, 0.0, 31.06, 30.45, 33.27, 0.0, 37.03, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 53.06], ["speech", 9.98], ["hum", 8.7]], null, [["speech", 39.56], ["music", 27.85], ["hum", 4.45]], [["music", 68.47], ["throbbing", 10.75], ["didgeridoo", 5.95]], [["speech", 38.67], ["music", 30.25], ["boing", 4.49]], null, null, [["speech", 40.41], ["music", 35.59], ["mains hum", 3.47]], [["speech", 41.22], ["music", 39.19], ["breaking", 3.97]], [["music", 49.25], ["theremin", 21.81], ["didgeridoo", 10.44]], null, null, [["speech", 33.88], ["music", 30.84], ["dubstep", 5.14]], null, null, [["music", 62.65], ["speech", 17.0], ["hum", 4.04]], [["hum", 50.19], ["mains hum", 32.98], ["throbbing", 6.71]], [["hum", 43.0], ["mains hum", 12.85], ["music", 9.7]], null, [["music", 38.49], ["hum", 13.41], ["throbbing", 10.11]], null], "duration": [0.13, 0.2, 1.05, 3.69, 0.53, 4.19, 2.27, 4.35, 0.5, 0.26, 3.29, 3.36, 2.78, 0.34, 0.12, 4.41, 1.89, 0.31, 5.87, 4.57, 2.13, -0.01, 6.99, 0.58]} \ No newline at end of file diff --git a/annotations_filtered/bYt5SAF0M3I_filtered.json b/annotations_filtered/bYt5SAF0M3I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..06e421d8867b8c9d5fff774f212322b039eef086 --- /dev/null +++ b/annotations_filtered/bYt5SAF0M3I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.48], [11.0, 12.82], [15.0, 15.74], [17.0, 18.86], [20.0, 20.14], [21.0, 24.43], [26.0, 29.49], [30.0, 31.7], [33.0, 36.17], [37.0, 38.15], [39.0, 41.1], [43.0, 48.64], [50.0, 52.22], [54.0, 54.6], [56.0, 57.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 47.86, 44.23, 0.0, 41.74, 0.0, 52.56, 95.09, 66.88, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 72.38], ["radio", 7.54], ["sidetone", 4.19]], [["speech", 32.24], ["stomach rumble", 20.87], ["radio", 17.77]], null, [["speech", 42.45], ["radio", 41.6], ["sidetone", 9.95]], null, null, null, null, null, null], "duration": [1.48, 1.82, 0.74, 1.86, 0.14, 3.43, 3.49, 1.7, 3.17, 1.15, 2.1, 5.64, 2.22, 0.6, 1.54]} \ No newline at end of file diff --git a/annotations_filtered/bZ0jZaH48b8_filtered.json b/annotations_filtered/bZ0jZaH48b8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b2ba11299785f0138f8f7b96690571ec4b68dc7c --- /dev/null +++ b/annotations_filtered/bZ0jZaH48b8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.94], [10.0, 15.33], [19.0, 33.4], [36.0, 37.81], [40.0, 41.12], [44.0, 44.98], [46.0, 48.29], [49.0, 51.44], [53.0, 54.26], [55.0, 79.03], [79.0, 124.17]], "keep_status": [false, true, false, false, false, false, false, false, false, true, false], "silence_prob": [37.13, 37.98, 32.85, 0.0, 0.0, 0.0, 98.36, 41.81, 0.0, 36.87, 0.0], "audiomae_on_audioset": [[["throbbing", 35.27], ["music", 31.1], ["hum", 12.25]], [["music", 40.01], ["scary music", 8.16], ["hum", 6.33]], [["music", 73.84], ["scary music", 2.77], ["buzz", 1.76]], null, null, null, null, [["speech", 52.64], ["music", 10.51], ["noise", 7.78]], null, [["hum", 29.86], ["livestock, farm animals, working animals", 21.14], ["mains hum", 13.16]], null], "duration": [4.94, 5.33, 14.4, 1.81, 1.12, 0.98, 2.29, 2.44, 1.26, 24.03, 45.17]} \ No newline at end of file diff --git a/annotations_filtered/bZ7ZsN1FXuI_filtered.json b/annotations_filtered/bZ7ZsN1FXuI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..756e5aa1fbac2a83bf83a1653375d68818c915de --- /dev/null +++ b/annotations_filtered/bZ7ZsN1FXuI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.91], [3.0, 3.06], [3.0, 13.53], [16.0, 18.94], [20.0, 42.6], [43.0, 79.81], [83.0, 97.66]], "keep_status": [false, false, true, true, true, false, false], "silence_prob": [0.0, 0.0, 46.9, 34.44, 31.57, 0.0, 30.06], "audiomae_on_audioset": [null, null, [["speech", 36.0], ["hum", 12.69], ["whale vocalization", 6.24]], [["dog", 32.49], ["animal", 17.98], ["bark", 14.56]], [["rumble", 10.69], ["fly, housefly", 9.81], ["mosquito", 7.43]], null, [["mains hum", 65.94], ["hum", 20.09], ["buzz", 1.82]]], "duration": [0.91, 0.06, 10.53, 2.94, 22.6, 36.81, 14.66]} \ No newline at end of file diff --git a/annotations_filtered/bZhBhpm6m_A_filtered.json b/annotations_filtered/bZhBhpm6m_A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f2a6648fc590a22eea0fbdf1f4b81afdc5835c0 --- /dev/null +++ b/annotations_filtered/bZhBhpm6m_A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.29], [14.0, 14.4], [15.0, 15.87], [18.0, 18.18], [26.0, 27.51], [28.0, 29.27], [36.0, 37.86], [38.0, 41.35], [46.0, 45.81], [49.0, 50.04], [52.0, 53.4], [56.0, 56.46], [64.0, 64.62], [67.0, 67.41], [68.0, 70.68], [71.0, 81.38], [82.0, 83.66], [84.0, 84.92], [86.0, 86.24], [89.0, 89.31], [90.0, 91.02], [93.0, 93.92], [101.0, 101.63], [104.0, 105.19], [107.0, 107.55], [111.0, 112.78], [113.0, 115.13], [118.0, 120.16], [123.0, 122.99], [128.0, 129.83], [131.0, 131.53], [132.0, 135.9], [137.0, 164.17], [169.0, 170.18], [170.0, 171.26], [172.0, 172.64], [174.0, 173.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.86, 30.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.54, 99.94, 0.0, 0.0, 0.0, 45.65, 30.86, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 57.31], ["gunshot, gunfire", 7.89], ["explosion", 7.04]], null, null, null, null, null, null, null, [["speech", 46.58], ["explosion", 23.09], ["gunshot, gunfire", 9.43]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 32.85], ["hum", 29.83], ["mains hum", 12.99]], [["music", 25.6], ["hum", 11.11], ["crushing", 6.33]], null, null, null, null], "duration": [0.29, 0.4, 0.87, 0.18, 1.51, 1.27, 1.86, 3.35, -0.19, 1.04, 1.4, 0.46, 0.62, 0.41, 2.68, 10.38, 1.66, 0.92, 0.24, 0.31, 1.02, 0.92, 0.63, 1.19, 0.55, 1.78, 2.13, 2.16, -0.01, 1.83, 0.53, 3.9, 27.17, 1.18, 1.26, 0.64, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/b_BA368IluE_filtered.json b/annotations_filtered/b_BA368IluE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..49ff2f8437ca163a140ca33e0784f32c3d17eba8 --- /dev/null +++ b/annotations_filtered/b_BA368IluE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 21.81], [25.0, 26.47], [27.0, 30.84], [42.0, 42.72], [55.0, 55.46], [61.0, 62.46], [64.0, 65.33], [71.0, 70.68], [74.0, 74.83], [87.0, 88.45], [90.0, 90.46]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [31.57, 0.0, 38.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 59.43], ["radio", 11.13], ["music", 2.86]], null, [["speech", 48.62], ["fly, housefly", 8.21], ["livestock, farm animals, working animals", 3.14]], null, null, null, null, null, null, null, null], "duration": [2.81, 1.47, 3.84, 0.72, 0.46, 1.46, 1.33, -0.32, 0.83, 1.45, 0.46]} \ No newline at end of file diff --git a/annotations_filtered/b_HhiU1mOwU_filtered.json b/annotations_filtered/b_HhiU1mOwU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4feb6baa091f32b49b12a271105baa9502b87ea7 --- /dev/null +++ b/annotations_filtered/b_HhiU1mOwU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.99], [1.0, 6.69], [9.0, 30.32], [31.0, 30.94], [31.0, 31.16], [32.0, 34.1], [42.0, 43.23], [45.0, 46.13], [53.0, 53.86], [55.0, 55.86], [69.0, 68.81], [70.0, 72.12], [75.0, 75.51], [84.0, 84.74], [86.0, 85.83], [87.0, 87.86], [90.0, 93.29], [98.0, 97.95], [98.0, 98.66], [99.0, 101.6]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 42.33, 34.43, 0.0, 0.0, 88.28, 0.0, 0.0, 0.0, 0.0, 0.0, 71.57, 0.0, 0.0, 0.0, 0.0, 88.46, 0.0, 0.0, 70.44], "audiomae_on_audioset": [null, [["speech", 21.42], ["hum", 15.33], ["vehicle", 7.63]], [["music", 32.75], ["mains hum", 15.99], ["hum", 12.33]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.99, 5.69, 21.32, -0.06, 0.16, 2.1, 1.23, 1.13, 0.86, 0.86, -0.19, 2.12, 0.51, 0.74, -0.17, 0.86, 3.29, -0.05, 0.66, 2.6]} \ No newline at end of file diff --git a/annotations_filtered/b_aJy2SE60E_filtered.json b/annotations_filtered/b_aJy2SE60E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f68b82da1e71fdaeb22bbbf50881af64cced368d --- /dev/null +++ b/annotations_filtered/b_aJy2SE60E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.48], [18.0, 18.98], [30.0, 30.42], [32.0, 31.92], [53.0, 53.6], [71.0, 71.46], [97.0, 98.1], [103.0, 103.17], [106.0, 105.7], [128.0, 129.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.48, 0.98, 0.42, -0.08, 0.6, 0.46, 1.1, 0.17, -0.3, 1.03]} \ No newline at end of file diff --git a/annotations_filtered/b_jYYdrSYBg_filtered.json b/annotations_filtered/b_jYYdrSYBg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..300e0d1fee396c1afe72d3223479212b8c003344 --- /dev/null +++ b/annotations_filtered/b_jYYdrSYBg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.21], [19.0, 20.12], [22.0, 23.08], [26.0, 35.73], [42.0, 82.49], [83.0, 84.37], [94.0, 97.87], [100.0, 101.82]], "keep_status": [true, false, false, false, false, false, true, false], "silence_prob": [37.95, 0.0, 0.0, 86.82, 0.0, 0.0, 32.55, 0.0], "audiomae_on_audioset": [[["speech", 29.83], ["music", 9.72], ["animal", 2.03]], null, null, null, null, null, [["speech", 29.81], ["music", 15.83], ["explosion", 11.24]], null], "duration": [2.21, 1.12, 1.08, 9.73, 40.49, 1.37, 3.87, 1.82]} \ No newline at end of file diff --git a/annotations_filtered/b_tZKOxNR7o_filtered.json b/annotations_filtered/b_tZKOxNR7o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dc95ccd28eebc2af8cf00f9a8f060ab385342c51 --- /dev/null +++ b/annotations_filtered/b_tZKOxNR7o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.94], [9.0, 9.95], [11.0, 11.55], [14.0, 15.01], [20.0, 21.07], [24.0, 81.55], [84.0, 88.21], [90.0, 100.6]], "keep_status": [false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.82, 30.03], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 31.23], ["effects unit", 30.3], ["distortion", 11.18]], [["hum", 35.68], ["cacophony", 16.25], ["mains hum", 15.33]]], "duration": [0.94, 0.95, 0.55, 1.01, 1.07, 57.55, 4.21, 10.6]} \ No newline at end of file diff --git a/annotations_filtered/b_uKO3N_JJQ_filtered.json b/annotations_filtered/b_uKO3N_JJQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73bad9a732c4e5b9897797bb482fdd49ff46628e --- /dev/null +++ b/annotations_filtered/b_uKO3N_JJQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.59], [12.0, 13.54], [14.0, 23.58], [27.0, 32.16]], "keep_status": [false, false, true, true], "silence_prob": [32.98, 0.0, 29.84, 45.27], "audiomae_on_audioset": [[["whale vocalization", 28.4], ["speech", 23.62], ["music", 19.76]], null, [["music", 24.81], ["speech", 20.47], ["whack, thwack", 5.75]], [["hum", 18.47], ["noise", 11.88], ["mains hum", 9.87]]], "duration": [5.59, 1.54, 9.58, 5.16]} \ No newline at end of file diff --git a/annotations_filtered/b_uXZZRpO-E_filtered.json b/annotations_filtered/b_uXZZRpO-E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5a008623dafa661efe63b2a087d03dc99c624e3f --- /dev/null +++ b/annotations_filtered/b_uXZZRpO-E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 21.32], [23.0, 23.5], [25.0, 25.49], [27.0, 33.94], [35.0, 35.04], [38.0, 38.91], [41.0, 41.66], [44.0, 44.27], [47.0, 47.44], [50.0, 51.27], [55.0, 56.57], [58.0, 59.0], [63.0, 64.25], [66.0, 66.63], [67.0, 67.78], [69.0, 70.24], [73.0, 74.83], [76.0, 76.91], [78.0, 79.03], [84.0, 84.62], [88.0, 88.16], [97.0, 98.17], [109.0, 109.93], [114.0, 114.98], [124.0, 126.03], [127.0, 129.12]], "keep_status": [true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [33.16, 0.0, 0.0, 33.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.76], "audiomae_on_audioset": [[["mains hum", 29.43], ["hum", 15.23], ["speech", 12.76]], null, null, [["speech", 22.99], ["sidetone", 19.33], ["mains hum", 14.73]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [9.32, 0.5, 0.49, 6.94, 0.04, 0.91, 0.66, 0.27, 0.44, 1.27, 1.57, 1.0, 1.25, 0.63, 0.78, 1.24, 1.83, 0.91, 1.03, 0.62, 0.16, 1.17, 0.93, 0.98, 2.03, 2.12]} \ No newline at end of file diff --git a/annotations_filtered/b_wnD6jxREU_filtered.json b/annotations_filtered/b_wnD6jxREU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..76d4b4d0afaaa24b318108745e5ab88dc4b7e72f --- /dev/null +++ b/annotations_filtered/b_wnD6jxREU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.83], [5.0, 8.5], [10.0, 12.63], [13.0, 16.12], [18.0, 21.88], [24.0, 28.22], [29.0, 29.25], [30.0, 34.48], [35.0, 38.04], [38.0, 57.06], [58.0, 64.15], [66.0, 72.13], [75.0, 86.58], [88.0, 99.45], [101.0, 104.79], [113.0, 116.88], [118.0, 121.51], [122.0, 139.26], [140.0, 139.8], [142.0, 149.59], [153.0, 158.33], [164.0, 165.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, true, true, false, false, false, false], "silence_prob": [0.0, 53.59, 57.09, 56.25, 58.64, 59.77, 0.0, 60.32, 57.01, 56.7, 58.38, 50.51, 39.43, 43.96, 37.31, 43.82, 39.7, 32.21, 0.0, 30.89, 31.61, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 48.38], ["cello", 7.62], ["double bass", 6.18]], [["music", 47.5], ["speech", 16.45], ["theremin", 8.59]], [["music", 42.52], ["theremin", 20.03], ["musical instrument", 5.73]], [["music", 57.9], ["theremin", 7.77], ["didgeridoo", 4.94]], [["music", 40.5], ["theremin", 9.62], ["musical instrument", 6.81]], [["music", 34.66], ["theremin", 14.8], ["speech", 8.76]], null, [["music", 41.03], ["theremin", 35.52], ["ambient music", 4.28]], [["music", 70.65], ["synthesizer", 5.76], ["theremin", 4.42]], null], "duration": [1.83, 3.5, 2.63, 3.12, 3.88, 4.22, 0.25, 4.48, 3.04, 19.06, 6.15, 6.13, 11.58, 11.45, 3.79, 3.88, 3.51, 17.26, -0.2, 7.59, 5.33, 1.33]} \ No newline at end of file diff --git a/annotations_filtered/ba-U_sXRFqg_filtered.json b/annotations_filtered/ba-U_sXRFqg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae7749542780673b32348da94e7b3ea33bb52d49 --- /dev/null +++ b/annotations_filtered/ba-U_sXRFqg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.27], [5.0, 5.91], [7.0, 7.4], [17.0, 18.22], [20.0, 20.97], [22.0, 22.2], [24.0, 26.43], [30.0, 30.59], [34.0, 35.29], [39.0, 40.12], [45.0, 46.04], [49.0, 49.28], [50.0, 50.6], [51.0, 52.02], [53.0, 53.65], [55.0, 57.54], [65.0, 67.24], [69.0, 69.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.38, 81.89, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 71.29], ["music", 5.67], ["busy signal", 4.13]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.27, 0.91, 0.4, 1.22, 0.97, 0.2, 2.43, 0.59, 1.29, 1.12, 1.04, 0.28, 0.6, 1.02, 0.65, 2.54, 2.24, 0.79]} \ No newline at end of file diff --git a/annotations_filtered/ba2VaalmijM_filtered.json b/annotations_filtered/ba2VaalmijM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2235131068f27e1fdd25826ef235cad8cae4db99 --- /dev/null +++ b/annotations_filtered/ba2VaalmijM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.78], [4.0, 5.49], [7.0, 8.68], [10.0, 14.54], [17.0, 30.18], [33.0, 33.84], [37.0, 38.1], [39.0, 39.5], [42.0, 42.7], [45.0, 45.1], [47.0, 48.03], [52.0, 53.08], [55.0, 55.46], [57.0, 59.1], [62.0, 62.33], [64.0, 64.84], [69.0, 75.46], [79.0, 82.29], [83.0, 84.13], [91.0, 91.17], [94.0, 105.39], [108.0, 108.65], [111.0, 115.1], [116.0, 117.17], [118.0, 118.99], [120.0, 121.91], [123.0, 123.69], [126.0, 130.06], [137.0, 138.01], [139.0, 140.19], [142.0, 142.55], [144.0, 169.33]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 90.78, 31.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.05, 0.0, 0.0, 99.96, 91.81, 0.0, 0.0, 93.29, 0.0, 88.64, 0.0, 0.0, 0.0, 0.0, 30.91, 0.0, 0.0, 0.0, 30.85], "audiomae_on_audioset": [null, null, null, null, [["vehicle", 13.6], ["speech", 12.14], ["music", 9.99]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 31.02], ["carnatic music", 8.07], ["musical instrument", 5.99]], null, null, null, [["fly, housefly", 36.97], ["music", 17.54], ["speech", 16.85]]], "duration": [0.78, 1.49, 1.68, 4.54, 13.18, 0.84, 1.1, 0.5, 0.7, 0.1, 1.03, 1.08, 0.46, 2.1, 0.33, 0.84, 6.46, 3.29, 1.13, 0.17, 11.39, 0.65, 4.1, 1.17, 0.99, 1.91, 0.69, 4.06, 1.01, 1.19, 0.55, 25.33]} \ No newline at end of file diff --git a/annotations_filtered/ba4niP3IwLQ_filtered.json b/annotations_filtered/ba4niP3IwLQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..68b6e636e6803e32588c4a1f02c754e195c8401f --- /dev/null +++ b/annotations_filtered/ba4niP3IwLQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 77.28]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [65.28]} \ No newline at end of file diff --git a/annotations_filtered/ba5F8G778C0_filtered.json b/annotations_filtered/ba5F8G778C0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b45cd67bd35719af5f3f204d7b3f265370170725 --- /dev/null +++ b/annotations_filtered/ba5F8G778C0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.43], [7.0, 8.5], [10.0, 10.88], [12.0, 12.06], [12.0, 12.73], [13.0, 14.91], [15.0, 15.55], [21.0, 21.68], [32.0, 33.12], [34.0, 34.7], [35.0, 35.82], [36.0, 36.91], [38.0, 37.81], [39.0, 39.18], [46.0, 45.79], [48.0, 47.97], [49.0, 49.71], [55.0, 55.11], [60.0, 63.58], [67.0, 67.78], [69.0, 77.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.39, 0.0, 99.26], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.43, 1.5, 0.88, 0.06, 0.73, 1.91, 0.55, 0.68, 1.12, 0.7, 0.82, 0.91, -0.19, 0.18, -0.21, -0.03, 0.71, 0.11, 3.58, 0.78, 8.67]} \ No newline at end of file diff --git a/annotations_filtered/ba9YG9xCC7A_filtered.json b/annotations_filtered/ba9YG9xCC7A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2bbb18add7f009f017d64cc331cafa4ba07b3a81 --- /dev/null +++ b/annotations_filtered/ba9YG9xCC7A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.36], [13.0, 42.72], [45.0, 61.21], [62.0, 71.27], [72.0, 72.55], [73.0, 73.2], [78.0, 83.34], [87.0, 87.4], [88.0, 88.89], [100.0, 101.92], [103.0, 113.44], [120.0, 122.67], [129.0, 133.12], [134.0, 150.01]], "keep_status": [false, false, true, true, false, false, true, false, false, false, false, true, false, true], "silence_prob": [0.0, 40.11, 44.12, 33.79, 0.0, 0.0, 31.46, 0.0, 0.0, 0.0, 32.96, 48.61, 89.72, 37.03], "audiomae_on_audioset": [null, [["music", 55.66], ["percussion", 13.65], ["musical instrument", 8.2]], [["music", 23.96], ["hum", 19.24], ["buzz", 17.27]], [["music", 52.79], ["livestock, farm animals, working animals", 6.5], ["didgeridoo", 5.88]], null, null, [["fly, housefly", 24.22], ["insect", 15.05], ["hum", 12.2]], null, null, null, [["music", 58.09], ["speech", 9.92], ["frog", 5.18]], [["music", 21.72], ["whale vocalization", 16.77], ["hum", 9.49]], null, [["music", 45.71], ["speech", 8.43], ["hum", 7.67]]], "duration": [1.36, 29.72, 16.21, 9.27, 0.55, 0.2, 5.34, 0.4, 0.89, 1.92, 10.44, 2.67, 4.12, 16.01]} \ No newline at end of file diff --git a/annotations_filtered/baNc64S4DHY_filtered.json b/annotations_filtered/baNc64S4DHY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cba8ae9719fc0d100daf16d6b0f26a1de696954a --- /dev/null +++ b/annotations_filtered/baNc64S4DHY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.9], [22.0, 23.95], [27.0, 27.65], [29.0, 30.65], [37.0, 38.06], [39.0, 39.66], [49.0, 49.22], [53.0, 53.84], [60.0, 61.05], [63.0, 63.9], [75.0, 76.79], [78.0, 78.66], [80.0, 80.16], [83.0, 83.78], [86.0, 88.37], [89.0, 89.34], [91.0, 91.64], [96.0, 96.47], [99.0, 100.25], [105.0, 105.46], [106.0, 108.65], [114.0, 115.21], [120.0, 121.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.66, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.9, 1.95, 0.65, 1.65, 1.06, 0.66, 0.22, 0.84, 1.05, 0.9, 1.79, 0.66, 0.16, 0.78, 2.37, 0.34, 0.64, 0.47, 1.25, 0.46, 2.65, 1.21, 1.54]} \ No newline at end of file diff --git a/annotations_filtered/bb9m4vvEkHc_filtered.json b/annotations_filtered/bb9m4vvEkHc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ad59fea881c7aa56c4f259ccb4b00bbd2b0ee44 --- /dev/null +++ b/annotations_filtered/bb9m4vvEkHc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.38], [5.0, 5.02], [7.0, 17.91], [20.0, 26.69], [32.0, 35.45], [36.0, 41.59], [43.0, 53.1], [54.0, 53.69], [56.0, 56.07], [58.0, 63.34], [68.0, 68.77], [70.0, 69.94], [78.0, 85.82], [88.0, 93.53], [95.0, 95.0], [97.0, 100.92], [115.0, 118.77], [119.0, 120.33], [123.0, 132.73], [136.0, 143.6], [145.0, 148.95], [149.0, 149.99], [151.0, 160.98], [162.0, 161.94], [162.0, 169.26], [172.0, 173.53], [176.0, 184.05], [185.0, 189.6], [190.0, 192.01], [200.0, 201.65], [202.0, 203.35], [207.0, 208.95]], "keep_status": [false, false, true, false, false, true, false, false, false, true, false, false, true, false, false, true, false, false, true, true, false, false, true, false, true, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 29.49, 28.92, 30.24, 29.15, 29.61, 0.0, 0.0, 29.06, 0.0, 0.0, 29.78, 29.86, 0.0, 29.15, 30.24, 0.0, 28.52, 29.95, 29.36, 0.0, 28.49, 0.0, 39.96, 0.0, 28.76, 29.67, 45.95, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 62.17], ["whack, thwack", 4.49], ["tuning fork", 2.4]], [["smash, crash", 44.81], ["music", 20.57], ["whack, thwack", 6.04]], [["music", 54.75], ["speech", 21.3], ["electronic music", 3.4]], [["music", 32.59], ["throbbing", 14.63], ["smash, crash", 11.5]], [["speech", 38.22], ["music", 32.94], ["whack, thwack", 9.0]], null, null, [["music", 46.3], ["speech", 14.6], ["clang", 3.54]], null, null, [["speech", 38.47], ["music", 22.61], ["whack, thwack", 5.54]], [["speech", 51.57], ["music", 18.28], ["whack, thwack", 9.77]], null, [["music", 28.99], ["burst, pop", 17.75], ["speech", 11.96]], [["music", 35.99], ["speech", 34.26], ["thunk", 4.49]], null, [["speech", 30.42], ["music", 29.98], ["bang", 7.93]], [["music", 35.17], ["livestock, farm animals, working animals", 8.92], ["throbbing", 8.59]], [["speech", 52.62], ["music", 32.73], ["thump, thud", 1.83]], null, [["music", 27.99], ["hum", 15.25], ["throbbing", 10.79]], null, [["speech", 36.39], ["hum", 16.78], ["throbbing", 10.64]], null, [["hum", 28.3], ["explosion", 17.31], ["mains hum", 10.22]], [["speech", 50.33], ["sound effect", 5.22], ["busy signal", 4.28]], [["animal", 37.91], ["dog", 22.94], ["domestic animals, pets", 11.28]], null, null, null], "duration": [0.38, 0.02, 10.91, 6.69, 3.45, 5.59, 10.1, -0.31, 0.07, 5.34, 0.77, -0.06, 7.82, 5.53, 0.0, 3.92, 3.77, 1.33, 9.73, 7.6, 3.95, 0.99, 9.98, -0.06, 7.26, 1.53, 8.05, 4.6, 2.01, 1.65, 1.35, 1.95]} \ No newline at end of file diff --git a/annotations_filtered/bbJEqSj7Wkk_filtered.json b/annotations_filtered/bbJEqSj7Wkk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43239a28e7893f7e47ec169cfc027f5364b97e25 --- /dev/null +++ b/annotations_filtered/bbJEqSj7Wkk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 17.46], [18.0, 18.91], [24.0, 24.73], [25.0, 25.69], [26.0, 32.76], [37.0, 37.56], [41.0, 48.24], [52.0, 68.08], [69.0, 80.45]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [82.07, 0.0, 0.0, 0.0, 41.74, 0.0, 34.67, 30.13, 30.12], "audiomae_on_audioset": [null, null, null, null, [["speech", 51.97], ["music", 24.06], ["synthesizer", 3.8]], null, [["music", 42.67], ["fart", 29.1], ["synthesizer", 5.35]], [["music", 50.14], ["theremin", 27.22], ["hum", 4.85]], [["music", 42.39], ["speech", 21.47], ["theremin", 16.99]]], "duration": [2.46, 0.91, 0.73, 0.69, 6.76, 0.56, 7.24, 16.08, 11.45]} \ No newline at end of file diff --git a/annotations_filtered/bbTgmSIDyn8_filtered.json b/annotations_filtered/bbTgmSIDyn8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f4d4aff9030985e17196bdfac81396bde941d4b --- /dev/null +++ b/annotations_filtered/bbTgmSIDyn8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.43], [8.0, 28.49], [29.0, 30.62], [32.0, 32.91], [37.0, 38.4], [41.0, 42.15], [43.0, 44.58], [45.0, 45.87], [48.0, 50.03], [50.0, 56.17], [57.0, 58.26], [59.0, 60.13], [65.0, 66.65], [72.0, 72.47], [76.0, 76.5], [78.0, 78.09], [80.0, 82.22], [83.0, 83.94], [85.0, 85.89], [87.0, 90.88], [92.0, 93.29], [104.0, 104.5], [110.0, 110.66], [117.0, 121.58], [124.0, 125.83], [129.0, 130.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 42.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.64, 44.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.74, 0.0, 0.0, 43.15, 0.0, 0.0, 0.0, 97.43, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 46.54], ["theremin", 25.57], ["radio", 5.72]], null, null, null, null, null, null, null, [["radio", 57.17], ["sidetone", 9.32], ["noise", 8.24]], null, null, null, null, null, null, [["speech", 70.67], ["radio", 22.9], ["sidetone", 1.38]], null, null, [["speech", 58.25], ["radio", 9.08], ["animal", 2.77]], null, null, null, null, null, null], "duration": [0.43, 20.49, 1.62, 0.91, 1.4, 1.15, 1.58, 0.87, 2.03, 6.17, 1.26, 1.13, 1.65, 0.47, 0.5, 0.09, 2.22, 0.94, 0.89, 3.88, 1.29, 0.5, 0.66, 4.58, 1.83, 1.11]} \ No newline at end of file diff --git a/annotations_filtered/bbVqciFRioA_filtered.json b/annotations_filtered/bbVqciFRioA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b750f9c74e0acf57e8ac9bb4d86f8531c7b5e43e --- /dev/null +++ b/annotations_filtered/bbVqciFRioA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 21.2], [24.0, 31.31], [38.0, 40.22], [43.0, 57.77], [61.0, 61.96], [63.0, 62.82], [67.0, 68.49], [80.0, 86.76], [95.0, 95.18], [99.0, 102.91]], "keep_status": [true, true, true, true, false, false, false, false, false, false], "silence_prob": [38.3, 34.97, 35.2, 34.48, 0.0, 0.0, 0.0, 37.82, 0.0, 42.53], "audiomae_on_audioset": [[["throbbing", 13.03], ["fly, housefly", 10.83], ["hum", 10.3]], [["music", 24.04], ["speech", 14.43], ["didgeridoo", 9.98]], [["music", 23.92], ["hum", 6.28], ["musical instrument", 5.23]], [["music", 28.33], ["speech", 18.13], ["fly, housefly", 6.5]], null, null, null, [["throbbing", 30.39], ["music", 26.55], ["hum", 25.65]], null, [["music", 66.82], ["electronic music", 3.86], ["hum", 2.09]]], "duration": [4.2, 7.31, 2.22, 14.77, 0.96, -0.18, 1.49, 6.76, 0.18, 3.91]} \ No newline at end of file diff --git a/annotations_filtered/bbX5KM0tFVk_filtered.json b/annotations_filtered/bbX5KM0tFVk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43afaa0eded760ba8f95f84e13af6e9d92041dc0 --- /dev/null +++ b/annotations_filtered/bbX5KM0tFVk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.96], [7.0, 10.32], [13.0, 17.51], [18.0, 19.85], [21.0, 24.71], [27.0, 29.27], [31.0, 35.94], [38.0, 40.05], [42.0, 45.01], [46.0, 57.43], [58.0, 59.97], [62.0, 132.66], [135.0, 139.7], [142.0, 144.98], [148.0, 156.1]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 90.95, 100.0, 0.0, 99.31, 47.46, 39.3, 100.0, 90.25, 50.26, 0.0, 0.0, 72.01, 64.63, 47.66], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 77.03], ["sidetone", 8.28], ["dial tone", 3.83]], [["hum", 14.74], ["mains hum", 12.77], ["fly, housefly", 10.1]], null, null, null, null, null, null, null, [["noise", 24.95], ["stomach rumble", 16.14], ["effects unit", 8.99]]], "duration": [0.96, 3.32, 4.51, 1.85, 3.71, 2.27, 4.94, 2.05, 3.01, 11.43, 1.97, 70.66, 4.7, 2.98, 8.1]} \ No newline at end of file diff --git a/annotations_filtered/bbnkw5RyiCI_filtered.json b/annotations_filtered/bbnkw5RyiCI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b7a4ab330a45435388726fdd73dd690668c9a4f --- /dev/null +++ b/annotations_filtered/bbnkw5RyiCI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 23.38], [25.0, 28.61], [29.0, 29.86], [30.0, 33.22], [37.0, 39.29], [54.0, 57.27], [77.0, 76.99], [81.0, 84.18], [103.0, 104.06], [106.0, 107.33], [114.0, 113.7], [114.0, 113.73], [114.0, 115.4], [117.0, 116.78], [118.0, 122.98], [124.0, 124.48], [125.0, 136.24], [138.0, 141.57], [144.0, 144.61], [146.0, 154.45], [157.0, 157.33]], "keep_status": [false, true, false, false, true, false, false, true, false, false, false, false, false, false, true, false, false, false, false, true, false], "silence_prob": [66.51, 42.74, 0.0, 63.85, 49.59, 34.36, 0.0, 33.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.56, 0.0, 69.74, 84.43, 0.0, 31.9, 0.0], "audiomae_on_audioset": [null, [["speech", 44.37], ["frog", 12.49], ["croak", 10.33]], null, null, [["speech", 39.4], ["cattle, bovinae", 7.27], ["music", 5.33]], [["livestock, farm animals, working animals", 41.73], ["moo", 27.84], ["cattle, bovinae", 19.13]], null, [["fly, housefly", 27.48], ["insect", 21.31], ["livestock, farm animals, working animals", 20.37]], null, null, null, null, null, null, [["speech", 31.07], ["sidetone", 23.53], ["noise", 12.82]], null, null, null, null, [["music", 37.48], ["speech", 16.22], ["buzz", 6.5]], null], "duration": [2.38, 3.61, 0.86, 3.22, 2.29, 3.27, -0.01, 3.18, 1.06, 1.33, -0.3, -0.27, 1.4, -0.22, 4.98, 0.48, 11.24, 3.57, 0.61, 8.45, 0.33]} \ No newline at end of file diff --git a/annotations_filtered/bbpQmRxCYUU_filtered.json b/annotations_filtered/bbpQmRxCYUU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aabf1935188569ee281d77890a508cf67cd14410 --- /dev/null +++ b/annotations_filtered/bbpQmRxCYUU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 14.28], [19.0, 22.08], [24.0, 24.26], [29.0, 28.98], [33.0, 33.66], [35.0, 36.49], [37.0, 40.19], [42.0, 43.31], [48.0, 49.52], [55.0, 55.34], [58.0, 59.53], [60.0, 61.1], [63.0, 63.0], [67.0, 67.83], [70.0, 70.61], [75.0, 78.48], [81.0, 81.04], [82.0, 86.97], [91.0, 91.44], [93.0, 96.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [80.82, 85.17, 0.0, 0.0, 0.0, 0.0, 93.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.04, 0.0, 94.66, 0.0, 97.22], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.28, 3.08, 0.26, -0.02, 0.66, 1.49, 3.19, 1.31, 1.52, 0.34, 1.53, 1.1, 0.0, 0.83, 0.61, 3.48, 0.04, 4.97, 0.44, 3.11]} \ No newline at end of file diff --git a/annotations_filtered/bbqRezPHMDQ_filtered.json b/annotations_filtered/bbqRezPHMDQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42f0113ca772888fc01fdaec5127d5dfb7415ad6 --- /dev/null +++ b/annotations_filtered/bbqRezPHMDQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 10.4], [11.0, 12.04], [13.0, 110.74], [111.0, 112.55]], "keep_status": [false, false, false, false], "silence_prob": [99.26, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [5.4, 1.04, 97.74, 1.55]} \ No newline at end of file diff --git a/annotations_filtered/bc2muGlQIlk_filtered.json b/annotations_filtered/bc2muGlQIlk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..63f740010de06cea03e1edb039f35b76cd2e317d --- /dev/null +++ b/annotations_filtered/bc2muGlQIlk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 10.3], [16.0, 17.2], [30.0, 31.01], [37.0, 38.13], [39.0, 39.87], [47.0, 47.43], [50.0, 50.8], [54.0, 54.63], [58.0, 58.72], [66.0, 70.06], [73.0, 76.1], [77.0, 77.87], [80.0, 80.76], [82.0, 83.05], [85.0, 86.8], [89.0, 89.55], [92.0, 92.67], [101.0, 103.99], [106.0, 126.84], [127.0, 127.67], [130.0, 130.03], [146.0, 147.07]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [34.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.2, 39.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.64, 46.68, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 60.51], ["radio", 7.79], ["hum", 6.57]], null, null, null, null, null, null, null, null, [["hum", 26.47], ["music", 15.56], ["mains hum", 8.92]], [["speech", 54.43], ["music", 8.5], ["sidetone", 2.93]], null, null, null, null, null, null, null, [["fly, housefly", 40.63], ["insect", 22.48], ["bee, wasp, etc.", 14.0]], null, null, null], "duration": [9.3, 1.2, 1.01, 1.13, 0.87, 0.43, 0.8, 0.63, 0.72, 4.06, 3.1, 0.87, 0.76, 1.05, 1.8, 0.55, 0.67, 2.99, 20.84, 0.67, 0.03, 1.07]} \ No newline at end of file diff --git a/annotations_filtered/bc84pYZICbk_filtered.json b/annotations_filtered/bc84pYZICbk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5cca376da84e6dc762dd1c0f40a27ae37520991b --- /dev/null +++ b/annotations_filtered/bc84pYZICbk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.44], [6.0, 6.79], [7.0, 12.06], [14.0, 14.23], [15.0, 15.31], [16.0, 18.0], [21.0, 21.27], [26.0, 60.27]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [1.44, 0.79, 5.06, 0.23, 0.31, 2.0, 0.27, 34.27]} \ No newline at end of file diff --git a/annotations_filtered/bcAACOrgVKE_filtered.json b/annotations_filtered/bcAACOrgVKE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f7f819647f79146cce0b89ce6ede1f70473a62bc --- /dev/null +++ b/annotations_filtered/bcAACOrgVKE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 63.21], [78.0, 78.17], [82.0, 82.7], [92.0, 91.89], [102.0, 102.34], [108.0, 108.6], [119.0, 120.51], [123.0, 123.92]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [31.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 70.15], ["throbbing", 4.68], ["electronic music", 3.9]], null, null, null, null, null, null, null], "duration": [28.21, 0.17, 0.7, -0.11, 0.34, 0.6, 1.51, 0.92]} \ No newline at end of file diff --git a/annotations_filtered/bcY4Lhb3yhI_filtered.json b/annotations_filtered/bcY4Lhb3yhI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f471bf7538086b3364de50e6742ab75f60774437 --- /dev/null +++ b/annotations_filtered/bcY4Lhb3yhI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.23], [11.0, 12.01], [13.0, 18.22], [36.0, 36.09], [36.0, 44.07], [45.0, 46.57], [47.0, 78.7], [81.0, 90.44], [92.0, 105.66]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 33.02, 0.0, 31.32, 0.0, 0.0, 29.73, 29.56], "audiomae_on_audioset": [null, null, [["music", 65.22], ["musical instrument", 5.31], ["synthesizer", 4.09]], null, [["music", 71.45], ["crowd", 5.97], ["cheering", 2.84]], null, null, [["music", 71.76], ["music of latin america", 7.98], ["salsa music", 5.36]], [["music", 88.82], ["salsa music", 1.55], ["music of latin america", 1.51]]], "duration": [1.23, 1.01, 5.22, 0.09, 8.07, 1.57, 31.7, 9.44, 13.66]} \ No newline at end of file diff --git a/annotations_filtered/bchPm7InHcg_filtered.json b/annotations_filtered/bchPm7InHcg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc3a1abde80416fd86e72f3f652fc7e7878e022b --- /dev/null +++ b/annotations_filtered/bchPm7InHcg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.38], [17.0, 17.1], [17.0, 18.3], [48.0, 49.44], [51.0, 52.3], [55.0, 55.7], [57.0, 58.33], [60.0, 60.44], [62.0, 62.77], [76.0, 76.06], [79.0, 80.74], [112.0, 113.51], [114.0, 113.76], [116.0, 118.54], [119.0, 119.26], [120.0, 120.26], [125.0, 127.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.51, 0.0, 0.0, 62.68], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.38, 0.1, 1.3, 1.44, 1.3, 0.7, 1.33, 0.44, 0.77, 0.06, 1.74, 1.51, -0.24, 2.54, 0.26, 0.26, 2.95]} \ No newline at end of file diff --git a/annotations_filtered/bcokL59jeqU_filtered.json b/annotations_filtered/bcokL59jeqU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5dca70bbccf071252d19e792c2f5cf65bd623983 --- /dev/null +++ b/annotations_filtered/bcokL59jeqU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.81], [4.0, 4.77], [6.0, 6.96], [8.0, 8.07], [13.0, 14.76], [16.0, 17.34], [18.0, 20.16], [21.0, 21.63], [24.0, 24.53], [26.0, 27.26], [29.0, 30.75], [31.0, 31.77], [33.0, 33.52], [34.0, 37.39], [38.0, 38.7], [45.0, 46.6], [49.0, 54.95], [55.0, 55.54], [56.0, 56.37], [59.0, 61.28], [62.0, 69.48], [70.0, 72.18], [73.0, 75.84], [77.0, 92.04], [94.0, 95.08], [99.0, 100.75], [101.0, 102.69], [109.0, 109.07], [110.0, 110.46], [112.0, 112.38], [114.0, 114.27], [115.0, 116.14], [117.0, 117.88], [118.0, 119.37], [120.0, 120.43], [121.0, 121.44], [125.0, 125.81], [127.0, 127.95], [131.0, 131.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.73, 0.0, 0.0, 35.47, 0.0, 0.0, 99.99, 71.72, 34.84, 41.83, 37.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 55.44], ["sidetone", 10.07], ["noise", 8.01]], null, null, null, null, [["sidetone", 48.58], ["speech", 41.83], ["dial tone", 1.67]], [["speech", 64.68], ["walk, footsteps", 6.05], ["stomach rumble", 4.06]], [["sidetone", 46.19], ["speech", 32.55], ["hum", 5.3]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.81, 0.77, 0.96, 0.07, 1.76, 1.34, 2.16, 0.63, 0.53, 1.26, 1.75, 0.77, 0.52, 3.39, 0.7, 1.6, 5.95, 0.54, 0.37, 2.28, 7.48, 2.18, 2.84, 15.04, 1.08, 1.75, 1.69, 0.07, 0.46, 0.38, 0.27, 1.14, 0.88, 1.37, 0.43, 0.44, 0.81, 0.95, 0.95]} \ No newline at end of file diff --git a/annotations_filtered/bcs2En6tGRw_filtered.json b/annotations_filtered/bcs2En6tGRw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b36ca7e16760550b56fc85627993b3405a8fd45d --- /dev/null +++ b/annotations_filtered/bcs2En6tGRw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 33.93], [35.0, 50.58], [54.0, 58.94], [61.0, 73.23], [76.0, 77.4], [80.0, 85.56]], "keep_status": [false, true, false, true, false, false], "silence_prob": [87.37, 41.07, 30.34, 34.55, 0.0, 53.16], "audiomae_on_audioset": [null, [["music", 40.2], ["singing bowl", 10.75], ["electronic music", 7.68]], [["music", 55.76], ["noise", 12.43], ["synthesizer", 10.04]], [["sound effect", 15.43], ["music", 13.94], ["fart", 12.1]], null, null], "duration": [27.93, 15.58, 4.94, 12.23, 1.4, 5.56]} \ No newline at end of file diff --git a/annotations_filtered/bd0IiiCDDGI_filtered.json b/annotations_filtered/bd0IiiCDDGI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c8815d9894606b069f3400eb6f727eb85e3c8475 --- /dev/null +++ b/annotations_filtered/bd0IiiCDDGI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.18], [7.0, 7.28], [8.0, 9.24], [11.0, 10.77], [11.0, 11.5], [12.0, 12.5], [14.0, 16.16], [20.0, 24.29], [25.0, 26.08], [28.0, 28.16], [28.0, 28.98], [34.0, 42.3], [44.0, 44.04], [45.0, 45.03], [47.0, 47.17], [52.0, 53.1], [54.0, 64.62], [65.0, 71.78], [73.0, 75.0], [78.0, 121.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.35, 78.04, 0.0, 0.0, 0.0, 84.98, 0.0, 0.0, 0.0, 0.0, 48.31, 47.35, 53.65, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 45.99], ["speech", 34.07], ["scary music", 1.2]], [["music", 63.4], ["carnatic music", 12.25], ["theremin", 4.73]], null, null], "duration": [0.18, 0.28, 1.24, -0.23, 0.5, 0.5, 2.16, 4.29, 1.08, 0.16, 0.98, 8.3, 0.04, 0.03, 0.17, 1.1, 10.62, 6.78, 2.0, 43.36]} \ No newline at end of file diff --git a/annotations_filtered/bd0ZO7Ewiq0_filtered.json b/annotations_filtered/bd0ZO7Ewiq0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb0117f03bbde4faab14d6db945cf64240c7e17d --- /dev/null +++ b/annotations_filtered/bd0ZO7Ewiq0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.22], [7.0, 8.88], [11.0, 12.97], [14.0, 20.29], [21.0, 22.4], [23.0, 27.92], [30.0, 33.94], [35.0, 36.81], [37.0, 43.09], [44.0, 49.28], [51.0, 52.08], [53.0, 54.53], [55.0, 55.51], [57.0, 57.72], [59.0, 60.08], [65.0, 65.69], [69.0, 78.53], [80.0, 82.54], [84.0, 84.65], [88.0, 88.67], [90.0, 91.37], [100.0, 99.84], [105.0, 105.73], [117.0, 118.89], [120.0, 122.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.99, 0.0, 0.0, 98.66, 0.0, 99.99, 100.0, 0.0, 95.09, 92.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.31, 98.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.19], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.22, 1.88, 1.97, 6.29, 1.4, 4.92, 3.94, 1.81, 6.09, 5.28, 1.08, 1.53, 0.51, 0.72, 1.08, 0.69, 9.53, 2.54, 0.65, 0.67, 1.37, -0.16, 0.73, 1.89, 2.17]} \ No newline at end of file diff --git a/annotations_filtered/bdFKfRmmbk0_filtered.json b/annotations_filtered/bdFKfRmmbk0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f769fd6f3d5e72e54195b4733255befd58218805 --- /dev/null +++ b/annotations_filtered/bdFKfRmmbk0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.4], [10.0, 10.71], [12.0, 12.45], [13.0, 15.36], [18.0, 17.96], [23.0, 23.48], [25.0, 26.5], [29.0, 30.59], [31.0, 33.88], [36.0, 37.47], [39.0, 41.2], [44.0, 46.35], [48.0, 50.89], [53.0, 56.02], [57.0, 61.11], [62.0, 69.21], [72.0, 73.89], [76.0, 77.55], [80.0, 80.11], [81.0, 85.09], [89.0, 90.58], [93.0, 93.01], [93.0, 93.83], [96.0, 99.81], [106.0, 107.87], [111.0, 112.28], [113.0, 117.0], [123.0, 126.86], [128.0, 129.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 71.57, 0.0, 0.0, 0.0, 0.0, 82.61, 0.0, 99.52, 95.37, 76.2, 72.75, 82.79, 91.81, 0.0, 0.0, 0.0, 68.54, 0.0, 0.0, 0.0, 53.1, 0.0, 0.0, 80.82, 71.29, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.4, 0.71, 0.45, 2.36, -0.04, 0.48, 1.5, 1.59, 2.88, 1.47, 2.2, 2.35, 2.89, 3.02, 4.11, 7.21, 1.89, 1.55, 0.11, 4.09, 1.58, 0.01, 0.83, 3.81, 1.87, 1.28, 4.0, 3.86, 1.42]} \ No newline at end of file diff --git a/annotations_filtered/bdFo-WtjOmA_filtered.json b/annotations_filtered/bdFo-WtjOmA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4cf2412325ba0f843d0d3f9a290a4992ec9b2021 --- /dev/null +++ b/annotations_filtered/bdFo-WtjOmA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[56.0, 60.74], [62.0, 82.09], [83.0, 87.44], [88.0, 89.18], [90.0, 92.53], [96.0, 97.58], [102.0, 109.07], [112.0, 114.12], [116.0, 116.28], [118.0, 121.34], [124.0, 126.18]], "keep_status": [true, false, false, false, false, false, false, true, false, false, true], "silence_prob": [48.14, 31.89, 34.87, 0.0, 33.36, 0.0, 31.3, 35.95, 0.0, 34.78, 30.83], "audiomae_on_audioset": [[["cough", 40.69], ["music", 17.73], ["throat clearing", 8.2]], [["hum", 33.52], ["mains hum", 33.49], ["music", 10.97]], [["hum", 34.23], ["mains hum", 29.35], ["music", 10.89]], null, [["whale vocalization", 82.03], ["music", 9.04], ["hum", 1.75]], null, [["music", 52.29], ["theremin", 21.8], ["noise", 1.87]], [["gong", 38.65], ["music", 19.78], ["didgeridoo", 10.65]], null, [["hum", 45.56], ["mains hum", 38.49], ["music", 4.76]], [["hum", 21.68], ["mains hum", 21.44], ["vehicle", 5.48]]], "duration": [4.74, 20.09, 4.44, 1.18, 2.53, 1.58, 7.07, 2.12, 0.28, 3.34, 2.18]} \ No newline at end of file diff --git a/annotations_filtered/bdJPnMKhsnY_filtered.json b/annotations_filtered/bdJPnMKhsnY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c9d5ce27a11f4f18c8b6b61e27e5991f15e84880 --- /dev/null +++ b/annotations_filtered/bdJPnMKhsnY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 9.86], [32.0, 32.31], [56.0, 56.25], [59.0, 60.2], [62.0, 62.6], [64.0, 64.88], [69.0, 72.59]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.82], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 77.37], ["hum", 3.71], ["electronic music", 1.97]]], "duration": [-0.14, 0.31, 0.25, 1.2, 0.6, 0.88, 3.59]} \ No newline at end of file diff --git a/annotations_filtered/bdJcCwoJ4KQ_filtered.json b/annotations_filtered/bdJcCwoJ4KQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..066b91ddb1f7cb886545a67e1fdbe47586bd0bbb --- /dev/null +++ b/annotations_filtered/bdJcCwoJ4KQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.89], [4.0, 6.37], [16.0, 21.39], [23.0, 23.7], [26.0, 26.03], [29.0, 28.95], [31.0, 31.72], [35.0, 36.32], [38.0, 49.03], [55.0, 64.13], [65.0, 66.66], [70.0, 80.05], [81.0, 81.08], [84.0, 86.91], [89.0, 92.16], [93.0, 96.74], [97.0, 99.05], [100.0, 100.92], [102.0, 104.68], [109.0, 117.49], [120.0, 140.16], [144.0, 146.79], [147.0, 157.71], [160.0, 175.27]], "keep_status": [false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 93.13, 36.18, 0.0, 0.0, 0.0, 0.0, 0.0, 46.83, 29.04, 0.0, 49.04, 0.0, 80.82, 75.72, 73.21, 51.12, 0.0, 39.5, 39.47, 42.3, 39.02, 50.91, 43.48], "audiomae_on_audioset": [null, null, [["chirp tone", 22.74], ["tuning fork", 15.5], ["hum", 12.78]], null, null, null, null, null, [["music", 24.36], ["hum", 9.75], ["electric shaver, electric razor", 8.75]], [["quack", 37.27], ["duck", 24.82], ["music", 9.21]], null, [["music", 69.15], ["sonar", 8.18], ["buzz", 5.93]], null, null, null, null, null, null, [["music", 49.93], ["coin (dropping)", 13.37], ["throbbing", 8.9]], [["didgeridoo", 38.78], ["music", 32.69], ["musical instrument", 2.99]], [["music", 68.06], ["hum", 11.85], ["throbbing", 5.24]], [["hum", 46.43], ["throbbing", 14.63], ["mains hum", 12.83]], null, [["ding", 27.16], ["music", 24.59], ["speech", 10.5]]], "duration": [0.89, 2.37, 5.39, 0.7, 0.03, -0.05, 0.72, 1.32, 11.03, 9.13, 1.66, 10.05, 0.08, 2.91, 3.16, 3.74, 2.05, 0.92, 2.68, 8.49, 20.16, 2.79, 10.71, 15.27]} \ No newline at end of file diff --git a/annotations_filtered/bdYiJgwzumg_filtered.json b/annotations_filtered/bdYiJgwzumg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e9d7418b6762fdf1e8dd48b5f685567793086da6 --- /dev/null +++ b/annotations_filtered/bdYiJgwzumg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 29.78], [31.0, 35.77], [36.0, 49.15], [51.0, 106.78], [109.0, 109.71], [110.0, 111.99]], "keep_status": [false, false, false, false, false, false], "silence_prob": [30.45, 43.61, 30.48, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 44.87], ["foghorn", 26.62], ["brass instrument", 5.25]], [["music", 70.11], ["scary music", 4.49], ["soundtrack music", 3.01]], [["music", 67.0], ["didgeridoo", 13.95], ["musical instrument", 6.0]], null, null, null], "duration": [11.78, 4.77, 13.15, 55.78, 0.71, 1.99]} \ No newline at end of file diff --git a/annotations_filtered/bdft59iqlKQ_filtered.json b/annotations_filtered/bdft59iqlKQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..37b60521694e42698361d315688bf449115e4e9a --- /dev/null +++ b/annotations_filtered/bdft59iqlKQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.57], [10.0, 10.18], [14.0, 14.86], [16.0, 18.55], [20.0, 32.68], [33.0, 34.79], [37.0, 45.15], [51.0, 51.21], [52.0, 54.11], [56.0, 57.25], [61.0, 61.57], [67.0, 67.83], [70.0, 70.58], [71.0, 71.04], [71.0, 74.36], [85.0, 86.05], [87.0, 87.52], [89.0, 90.05], [91.0, 93.39], [96.0, 97.04], [98.0, 99.71], [101.0, 101.95], [104.0, 106.29], [107.0, 112.01], [113.0, 117.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.92, 0.0, 0.0, 98.51, 99.99, 0.0, 99.62, 0.0, 99.73, 0.0, 0.0, 0.0, 0.0, 0.0, 93.91, 0.0, 0.0, 0.0, 99.48, 0.0, 0.0, 0.0, 99.76, 99.76, 98.59], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.57, 0.18, 0.86, 2.55, 12.68, 1.79, 8.15, 0.21, 2.11, 1.25, 0.57, 0.83, 0.58, 0.04, 3.36, 1.05, 0.52, 1.05, 2.39, 1.04, 1.71, 0.95, 2.29, 5.01, 4.41]} \ No newline at end of file diff --git a/annotations_filtered/bdm9LVNbuNg_filtered.json b/annotations_filtered/bdm9LVNbuNg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ec3d25f5fb45fd18dad09deede269ddee3ed1e7 --- /dev/null +++ b/annotations_filtered/bdm9LVNbuNg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.83], [3.0, 2.88], [3.0, 3.0], [3.0, 3.6], [6.0, 6.98], [16.0, 19.01], [32.0, 31.73], [41.0, 43.26], [55.0, 55.58], [67.0, 66.73], [73.0, 73.03], [87.0, 87.34], [92.0, 92.13], [100.0, 102.57], [111.0, 115.01], [116.0, 116.82], [121.0, 123.28]], "keep_status": [false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 42.55, 0.0, 44.9, 0.0, 0.0, 0.0, 0.0, 0.0, 40.84, 55.53, 0.0, 40.14], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 53.48], ["cattle, bovinae", 9.22], ["moo", 4.65]], null, [["speech", 30.76], ["music", 7.58], ["hum", 6.82]], null, null, null, null, null, [["didgeridoo", 34.22], ["speech", 23.79], ["fart", 13.98]], null, null, [["speech", 17.27], ["hum", 14.25], ["mains hum", 13.86]]], "duration": [-0.17, -0.12, 0.0, 0.6, 0.98, 3.01, -0.27, 2.26, 0.58, -0.27, 0.03, 0.34, 0.13, 2.57, 4.01, 0.82, 2.28]} \ No newline at end of file diff --git a/annotations_filtered/be-Ou9Xkh48_filtered.json b/annotations_filtered/be-Ou9Xkh48_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0b408abc70ea60cbbc2981b46f2a24aeaeb1f0b1 --- /dev/null +++ b/annotations_filtered/be-Ou9Xkh48_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.93], [4.0, 5.95], [9.0, 9.88], [12.0, 12.16], [14.0, 15.97], [17.0, 18.27], [21.0, 20.8], [23.0, 24.27], [25.0, 25.46], [26.0, 26.57], [28.0, 28.38], [30.0, 30.47], [32.0, 33.49], [35.0, 36.68], [38.0, 39.07], [40.0, 41.94], [44.0, 48.05], [49.0, 50.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.93, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["effects unit", 15.73], ["music", 7.34], ["fart", 6.07]], null], "duration": [0.93, 1.95, 0.88, 0.16, 1.97, 1.27, -0.2, 1.27, 0.46, 0.57, 0.38, 0.47, 1.49, 1.68, 1.07, 1.94, 4.05, 1.08]} \ No newline at end of file diff --git a/annotations_filtered/be9FJeol_aQ_filtered.json b/annotations_filtered/be9FJeol_aQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aafdb4af0ce764f96bf70de37e51645d3f1ba2d4 --- /dev/null +++ b/annotations_filtered/be9FJeol_aQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 97.8], [101.0, 124.55]], "keep_status": [false, true], "silence_prob": [0.0, 31.25], "audiomae_on_audioset": [null, [["music", 44.97], ["livestock, farm animals, working animals", 12.63], ["moo", 8.59]]], "duration": [93.8, 23.55]} \ No newline at end of file diff --git a/annotations_filtered/beAc5oqxBHw_filtered.json b/annotations_filtered/beAc5oqxBHw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4622573536de3387fe48e5e163b1cda4d75a412d --- /dev/null +++ b/annotations_filtered/beAc5oqxBHw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 18.69], [22.0, 68.76]], "keep_status": [false, false], "silence_prob": [31.84, 0.0], "audiomae_on_audioset": [[["music", 57.76], ["throbbing", 9.75], ["theme music", 3.93]], null], "duration": [2.69, 46.76]} \ No newline at end of file diff --git a/annotations_filtered/bfKu5Jc8TjA_filtered.json b/annotations_filtered/bfKu5Jc8TjA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b251b5c00589f6529dc550b5722f26b01c0cc3e --- /dev/null +++ b/annotations_filtered/bfKu5Jc8TjA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.58], [15.0, 27.62], [31.0, 35.5], [39.0, 40.46], [44.0, 52.61], [54.0, 56.03], [56.0, 59.0], [64.0, 64.72], [72.0, 109.44], [112.0, 114.29], [116.0, 118.22], [118.0, 118.66], [121.0, 123.04], [126.0, 129.66], [130.0, 135.11], [135.0, 135.68], [136.0, 137.27], [138.0, 143.63]], "keep_status": [false, true, false, false, true, true, true, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 34.57, 32.77, 0.0, 33.07, 33.76, 32.91, 0.0, 0.0, 34.8, 93.6, 0.0, 97.54, 77.7, 93.29, 0.0, 0.0, 49.5], "audiomae_on_audioset": [null, [["music", 38.92], ["sidetone", 12.8], ["speech", 10.62]], [["music", 50.07], ["boing", 17.49], ["didgeridoo", 7.1]], null, [["fart", 25.55], ["fly, housefly", 10.51], ["vehicle", 8.69]], [["music", 32.75], ["hum", 10.38], ["mains hum", 6.97]], [["speech", 43.47], ["music", 19.45], ["radio", 5.03]], null, null, [["music", 34.73], ["throbbing", 26.13], ["hum", 6.37]], null, null, null, null, null, null, null, [["music", 73.88], ["didgeridoo", 7.9], ["musical instrument", 4.5]]], "duration": [0.58, 12.62, 4.5, 1.46, 8.61, 2.03, 3.0, 0.72, 37.44, 2.29, 2.22, 0.66, 2.04, 3.66, 5.11, 0.68, 1.27, 5.63]} \ No newline at end of file diff --git a/annotations_filtered/bfzJMOBenVA_filtered.json b/annotations_filtered/bfzJMOBenVA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cdcb6fe286592c67d31a7805a8fb714083adff27 --- /dev/null +++ b/annotations_filtered/bfzJMOBenVA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.58], [8.0, 9.24], [36.0, 36.34], [37.0, 40.27], [51.0, 51.49], [52.0, 56.73], [57.0, 56.78], [58.0, 60.93], [80.0, 80.86], [83.0, 85.02], [90.0, 90.75], [91.0, 91.13], [91.0, 94.9], [95.0, 95.82], [97.0, 97.87], [99.0, 99.62], [101.0, 102.05], [105.0, 106.39]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 60.6, 0.0, 56.86, 0.0, 39.58, 0.0, 53.59, 0.0, 0.0, 39.96, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 14.65], ["speech", 12.24], ["throbbing", 9.8]], null, null, null, null, [["speech", 71.36], ["sidetone", 4.9], ["music", 4.43]], null, null, null, null, null], "duration": [0.58, 1.24, 0.34, 3.27, 0.49, 4.73, -0.22, 2.93, 0.86, 2.02, 0.75, 0.13, 3.9, 0.82, 0.87, 0.62, 1.05, 1.39]} \ No newline at end of file diff --git a/annotations_filtered/bg5SLBapMiI_filtered.json b/annotations_filtered/bg5SLBapMiI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f910170454c73a02e83d7ab4d75d128f9e208dca --- /dev/null +++ b/annotations_filtered/bg5SLBapMiI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [1.0, 0.84], [3.0, 5.37], [7.0, 8.8], [12.0, 28.21], [28.0, 41.0], [41.0, 45.44], [47.0, 52.1], [52.0, 52.19], [53.0, 126.76]], "keep_status": [false, false, false, false, true, true, true, true, false, false], "silence_prob": [0.0, 0.0, 35.95, 0.0, 30.68, 32.24, 32.37, 32.62, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 73.76], ["synthesizer", 2.72], ["electronic music", 2.25]], null, [["music", 22.43], ["smash, crash", 15.57], ["whack, thwack", 11.69]], [["music", 53.28], ["musical instrument", 7.37], ["effects unit", 5.91]], [["fly, housefly", 34.63], ["mosquito", 11.25], ["insect", 8.55]], [["music", 28.71], ["hum", 10.51], ["throbbing", 7.63]], null, null], "duration": [0.5, -0.16, 2.37, 1.8, 16.21, 13.0, 4.44, 5.1, 0.19, 73.76]} \ No newline at end of file diff --git a/annotations_filtered/bg9SuuzPdVE_filtered.json b/annotations_filtered/bg9SuuzPdVE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..82d638e6718e4d8c47645586f95f316158844db4 --- /dev/null +++ b/annotations_filtered/bg9SuuzPdVE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.55], [5.0, 5.41], [8.0, 12.12], [12.0, 16.36], [20.0, 20.56], [22.0, 23.52], [31.0, 32.17], [34.0, 35.61], [38.0, 38.87], [39.0, 39.45], [42.0, 42.11], [42.0, 50.03], [55.0, 56.39], [65.0, 65.23], [67.0, 73.87], [76.0, 77.67], [80.0, 86.56], [89.0, 89.06], [93.0, 93.41], [96.0, 96.52], [97.0, 99.06], [100.0, 100.62], [103.0, 103.92], [107.0, 107.32], [108.0, 109.05], [115.0, 115.4], [116.0, 117.1], [118.0, 121.47], [123.0, 128.55], [129.0, 129.12], [131.0, 132.46]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 52.8, 36.32, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.92, 0.0, 0.0, 50.06, 0.0, 39.34, 0.0, 0.0, 0.0, 45.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.21, 42.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 36.59], ["speech", 19.46], ["sidetone", 10.05]], null, null, null, null, null, null, null, [["speech", 26.1], ["music", 16.63], ["sidetone", 7.06]], null, null, null, null, [["music", 28.12], ["hum", 22.2], ["throbbing", 21.13]], null, null, null, [["music", 24.22], ["fly, housefly", 13.21], ["musical instrument", 7.36]], null, null, null, null, null, null, [["music", 37.89], ["speech", 34.41], ["fart", 3.99]], [["music", 44.02], ["musical instrument", 10.28], ["speech", 8.55]], null, null], "duration": [0.55, 0.41, 4.12, 4.36, 0.56, 1.52, 1.17, 1.61, 0.87, 0.45, 0.11, 8.03, 1.39, 0.23, 6.87, 1.67, 6.56, 0.06, 0.41, 0.52, 2.06, 0.62, 0.92, 0.32, 1.05, 0.4, 1.1, 3.47, 5.55, 0.12, 1.46]} \ No newline at end of file diff --git a/annotations_filtered/bgS0GPQhzHg_filtered.json b/annotations_filtered/bgS0GPQhzHg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2d1c8dc45f731258472ebd42d81191a2f1d6eb6e --- /dev/null +++ b/annotations_filtered/bgS0GPQhzHg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.02], [10.0, 11.38], [12.0, 39.9], [41.0, 40.78], [45.0, 48.3], [49.0, 72.05]], "keep_status": [false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 28.91, 0.0, 29.82, 28.7], "audiomae_on_audioset": [null, null, [["music", 56.12], ["throbbing", 9.19], ["synthesizer", 8.08]], null, [["music", 50.85], ["throbbing", 8.08], ["ambient music", 5.27]], [["music", 83.81], ["ambient music", 3.72], ["synthesizer", 2.2]]], "duration": [1.02, 1.38, 27.9, -0.22, 3.3, 23.05]} \ No newline at end of file diff --git a/annotations_filtered/bgXlHdBRpjs_filtered.json b/annotations_filtered/bgXlHdBRpjs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e9193bb1bc267a3f749bfdab5df2c215fa11c30e --- /dev/null +++ b/annotations_filtered/bgXlHdBRpjs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 10.03], [12.0, 35.5], [45.0, 45.79]], "keep_status": [true, true, false], "silence_prob": [36.84, 30.78, 0.0], "audiomae_on_audioset": [[["music", 29.53], ["theremin", 15.33], ["fly, housefly", 10.11]], [["music", 37.68], ["moo", 15.75], ["cattle, bovinae", 13.68]], null], "duration": [4.03, 23.5, 0.79]} \ No newline at end of file diff --git a/annotations_filtered/bgZWbi1o8bY_filtered.json b/annotations_filtered/bgZWbi1o8bY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d7363af14b5fd809faf8a97c0ecf00cea3aff1b3 --- /dev/null +++ b/annotations_filtered/bgZWbi1o8bY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.0], [11.0, 23.18], [49.0, 48.84], [81.0, 86.48], [97.0, 97.66], [107.0, 107.49], [110.0, 111.35], [112.0, 112.11], [113.0, 113.04], [114.0, 114.67], [116.0, 117.68], [121.0, 121.76], [122.0, 142.18], [152.0, 152.2], [155.0, 163.44], [172.0, 172.52]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 30.0, 0.0, 29.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.6, 0.0, 29.75, 0.0], "audiomae_on_audioset": [null, [["music", 34.42], ["speech", 31.63], ["electric shaver, electric razor", 10.98]], null, [["speech", 20.03], ["cattle, bovinae", 16.32], ["livestock, farm animals, working animals", 14.87]], null, null, null, null, null, null, null, null, [["music", 50.07], ["speech", 29.77], ["cattle, bovinae", 4.2]], null, [["music", 29.21], ["whip", 8.97], ["groan", 8.94]], null], "duration": [0.0, 12.18, -0.16, 5.48, 0.66, 0.49, 1.35, 0.11, 0.04, 0.67, 1.68, 0.76, 20.18, 0.2, 8.44, 0.52]} \ No newline at end of file diff --git a/annotations_filtered/bh2ShAQ4lw0_filtered.json b/annotations_filtered/bh2ShAQ4lw0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6e64e0c09402274e6ec808d7bb6b565aad9af4f7 --- /dev/null +++ b/annotations_filtered/bh2ShAQ4lw0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.56], [9.0, 8.55], [9.0, 12.04], [13.0, 13.81], [15.0, 18.08], [29.0, 29.52], [35.0, 39.14], [40.0, 41.27], [44.0, 45.05], [47.0, 49.49], [59.0, 64.69], [68.0, 70.14], [74.0, 76.79], [82.0, 84.15], [102.0, 103.62], [118.0, 118.18]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [73.36, 0.0, 87.0, 0.0, 44.15, 0.0, 89.54, 0.0, 0.0, 56.25, 75.23, 94.52, 39.44, 35.46, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 29.76], ["speech", 11.4], ["synthesizer", 6.21]], null, null, null, null, null, null, null, [["music", 24.2], ["hum", 13.32], ["musical instrument", 6.76]], [["speech", 35.07], ["music", 14.92], ["synthesizer", 2.37]], null, null], "duration": [2.56, -0.45, 3.04, 0.81, 3.08, 0.52, 4.14, 1.27, 1.05, 2.49, 5.69, 2.14, 2.79, 2.15, 1.62, 0.18]} \ No newline at end of file diff --git a/annotations_filtered/bhGFCS11OR8_filtered.json b/annotations_filtered/bhGFCS11OR8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..656d80595ad4afa10bb82cb55f273b5a1ce20180 --- /dev/null +++ b/annotations_filtered/bhGFCS11OR8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.2], [17.0, 17.31], [19.0, 19.41], [21.0, 21.63], [23.0, 23.73], [25.0, 24.93], [35.0, 35.53], [39.0, 63.95], [69.0, 70.7], [73.0, 78.6], [81.0, 80.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.68, 0.0, 33.59, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["fly, housefly", 44.39], ["insect", 40.65], ["bee, wasp, etc.", 5.69]], null, [["speech", 51.48], ["vehicle", 28.46], ["boat, water vehicle", 3.07]], null], "duration": [0.2, 0.31, 0.41, 0.63, 0.73, -0.07, 0.53, 24.95, 1.7, 5.6, -0.08]} \ No newline at end of file diff --git a/annotations_filtered/bhGfpwfae-k_filtered.json b/annotations_filtered/bhGfpwfae-k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..216e9373b843fe6ae1d16de4086585e952b5c00b --- /dev/null +++ b/annotations_filtered/bhGfpwfae-k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.14], [8.0, 10.07], [12.0, 22.84], [41.0, 57.11], [58.0, 69.58]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 80.29, 76.37, 36.37, 71.87], "audiomae_on_audioset": [null, null, null, [["hum", 55.57], ["mains hum", 21.97], ["throbbing", 10.77]], null], "duration": [0.14, 2.07, 10.84, 16.11, 11.58]} \ No newline at end of file diff --git a/annotations_filtered/bhYOGuozHd4_filtered.json b/annotations_filtered/bhYOGuozHd4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..40da39c3c44893d828889c46360bd604cdbcea60 --- /dev/null +++ b/annotations_filtered/bhYOGuozHd4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 16.19], [18.0, 18.49], [20.0, 23.43], [25.0, 30.96], [33.0, 33.74], [36.0, 46.8], [49.0, 55.12], [58.0, 60.94], [62.0, 62.24], [66.0, 69.01], [70.0, 70.36], [75.0, 77.21], [77.0, 77.95], [80.0, 88.43], [93.0, 97.71], [101.0, 106.47], [110.0, 119.33], [125.0, 137.81], [140.0, 140.68], [144.0, 144.63], [148.0, 148.88]], "keep_status": [false, false, false, true, false, false, false, true, false, false, false, true, false, true, true, true, true, true, false, false, false], "silence_prob": [70.3, 0.0, 59.51, 49.54, 0.0, 39.91, 49.64, 47.05, 0.0, 71.57, 0.0, 36.21, 0.0, 30.95, 29.12, 30.98, 31.36, 30.4, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 28.8], ["hum", 9.08], ["throbbing", 6.41]], null, [["speech", 45.75], ["music", 23.13], ["whack, thwack", 2.27]], [["speech", 47.33], ["music", 17.38], ["fart", 6.29]], [["speech", 19.24], ["music", 17.87], ["carnatic music", 6.29]], null, null, null, [["speech", 26.46], ["music", 17.77], ["livestock, farm animals, working animals", 3.72]], null, [["music", 24.27], ["speech", 22.5], ["electric shaver, electric razor", 6.6]], [["speech", 24.8], ["music", 20.73], ["electric shaver, electric razor", 4.61]], [["speech", 47.31], ["cattle, bovinae", 7.3], ["livestock, farm animals, working animals", 6.74]], [["electric shaver, electric razor", 25.77], ["speech", 10.29], ["livestock, farm animals, working animals", 7.65]], [["music", 40.84], ["speech", 15.01], ["fart", 7.61]], null, null, null], "duration": [2.19, 0.49, 3.43, 5.96, 0.74, 10.8, 6.12, 2.94, 0.24, 3.01, 0.36, 2.21, 0.95, 8.43, 4.71, 5.47, 9.33, 12.81, 0.68, 0.63, 0.88]} \ No newline at end of file diff --git a/annotations_filtered/bhtJNsUfHIM_filtered.json b/annotations_filtered/bhtJNsUfHIM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..985cef5348713349bd081f33085b81214eef080b --- /dev/null +++ b/annotations_filtered/bhtJNsUfHIM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.41], [7.0, 7.28], [13.0, 13.96], [15.0, 17.39], [19.0, 22.25], [23.0, 25.98], [27.0, 27.3], [29.0, 29.29], [29.0, 30.47], [33.0, 34.8], [36.0, 36.0], [38.0, 39.51], [45.0, 45.39], [48.0, 47.97], [54.0, 54.58], [56.0, 56.47], [60.0, 61.13], [64.0, 63.66], [66.0, 66.16], [67.0, 67.34], [70.0, 72.17], [74.0, 74.07], [76.0, 77.6], [81.0, 81.8], [83.0, 84.6], [94.0, 94.34], [98.0, 99.5], [101.0, 101.82], [102.0, 104.63], [107.0, 107.25], [109.0, 110.07], [111.0, 111.62], [121.0, 121.88], [123.0, 123.52], [127.0, 128.17], [130.0, 130.38], [134.0, 136.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 86.64, 99.62, 99.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.18], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 30.45], ["throbbing", 19.41], ["hum", 13.63]]], "duration": [1.41, 0.28, 0.96, 2.39, 3.25, 2.98, 0.3, 0.29, 1.47, 1.8, 0.0, 1.51, 0.39, -0.03, 0.58, 0.47, 1.13, -0.34, 0.16, 0.34, 2.17, 0.07, 1.6, 0.8, 1.6, 0.34, 1.5, 0.82, 2.63, 0.25, 1.07, 0.62, 0.88, 0.52, 1.17, 0.38, 2.66]} \ No newline at end of file diff --git a/annotations_filtered/biYVl18JAFM_filtered.json b/annotations_filtered/biYVl18JAFM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..767d4080ea254fa772e754975c25de8ab6e221f6 --- /dev/null +++ b/annotations_filtered/biYVl18JAFM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.12], [7.0, 10.25], [11.0, 11.7], [14.0, 14.86], [17.0, 18.06], [25.0, 29.73], [34.0, 35.7], [36.0, 37.45], [43.0, 48.83], [50.0, 51.56], [54.0, 54.6], [60.0, 72.77], [74.0, 76.32], [77.0, 80.67], [82.0, 82.83], [85.0, 92.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [91.13, 95.78, 0.0, 0.0, 0.0, 93.91, 0.0, 0.0, 63.85, 0.0, 0.0, 50.41, 62.99, 43.66, 0.0, 29.56], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 35.7], ["hum", 16.97], ["mains hum", 9.73]], null, [["music", 19.94], ["noise", 14.66], ["hum", 9.84]]], "duration": [4.12, 3.25, 0.7, 0.86, 1.06, 4.73, 1.7, 1.45, 5.83, 1.56, 0.6, 12.77, 2.32, 3.67, 0.83, 7.82]} \ No newline at end of file diff --git a/annotations_filtered/bjLdEjOL1s8_filtered.json b/annotations_filtered/bjLdEjOL1s8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/bjLdEjOL1s8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/bjaJxs12l44_filtered.json b/annotations_filtered/bjaJxs12l44_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..156ae6b4501cec25860ec1d8cde58b6145a5c7e8 --- /dev/null +++ b/annotations_filtered/bjaJxs12l44_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 37.29], [38.0, 59.53], [60.0, 64.59], [65.0, 70.68]], "keep_status": [false, false, true, true], "silence_prob": [59.59, 57.81, 46.47, 41.7], "audiomae_on_audioset": [null, null, [["music", 38.91], ["hum", 15.7], ["sonar", 5.99]], [["music", 30.56], ["hum", 14.61], ["whale vocalization", 11.61]]], "duration": [7.29, 21.53, 4.59, 5.68]} \ No newline at end of file diff --git a/annotations_filtered/bjqjgoiV6BQ_filtered.json b/annotations_filtered/bjqjgoiV6BQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..39d6576da24b6f3e41ba6a5a5ed613babe7be7c5 --- /dev/null +++ b/annotations_filtered/bjqjgoiV6BQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.4], [6.0, 5.98], [7.0, 7.74], [10.0, 10.93], [13.0, 15.31], [16.0, 17.1], [19.0, 21.17], [25.0, 26.16], [30.0, 31.63], [33.0, 61.08], [61.0, 61.86], [65.0, 65.23], [66.0, 70.28], [73.0, 73.47], [75.0, 75.54], [77.0, 76.94], [77.0, 101.29]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.26, 0.0, 99.99, 0.0, 0.0, 47.7, 0.0, 0.0, 57.01, 0.0, 0.0, 0.0, 52.51], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 45.9], ["speech", 9.93], ["musical instrument", 8.77]], null, null, null, null, null, null, null], "duration": [0.4, -0.02, 0.74, 0.93, 2.31, 1.1, 2.17, 1.16, 1.63, 28.08, 0.86, 0.23, 4.28, 0.47, 0.54, -0.06, 24.29]} \ No newline at end of file diff --git a/annotations_filtered/bjqsWtO5Xjg_filtered.json b/annotations_filtered/bjqsWtO5Xjg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7bef0c86e393c951c4f4fd4bad9f28ffbb575f81 --- /dev/null +++ b/annotations_filtered/bjqsWtO5Xjg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 22.0], [26.0, 37.79], [39.0, 39.43], [40.0, 54.77], [56.0, 67.58], [68.0, 80.49], [84.0, 84.11], [85.0, 86.66], [89.0, 89.48], [90.0, 90.64], [91.0, 93.14], [94.0, 95.22], [96.0, 98.29], [99.0, 99.03]], "keep_status": [true, true, false, true, true, false, false, false, false, false, true, false, true, false], "silence_prob": [28.5, 29.16, 0.0, 28.68, 33.65, 32.57, 0.0, 0.0, 0.0, 0.0, 37.08, 0.0, 35.59, 0.0], "audiomae_on_audioset": [[["music", 22.88], ["rumble", 11.0], ["hum", 9.25]], [["speech", 49.34], ["music", 14.11], ["mains hum", 6.08]], null, [["music", 54.86], ["rumble", 6.13], ["breaking", 4.98]], [["music", 38.17], ["boing", 20.8], ["smash, crash", 10.17]], [["music", 57.62], ["throbbing", 11.89], ["speech", 9.09]], null, null, null, null, [["music", 28.26], ["hum", 17.84], ["speech", 14.45]], null, [["music", 58.39], ["speech", 5.14], ["electronic music", 4.1]], null], "duration": [6.0, 11.79, 0.43, 14.77, 11.58, 12.49, 0.11, 1.66, 0.48, 0.64, 2.14, 1.22, 2.29, 0.03]} \ No newline at end of file diff --git a/annotations_filtered/bk9oFLFDsfE_filtered.json b/annotations_filtered/bk9oFLFDsfE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8d85e1ed58a0230fa4272772e6ad4b956452872 --- /dev/null +++ b/annotations_filtered/bk9oFLFDsfE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 27.53], [39.0, 39.95], [43.0, 43.39], [47.0, 47.82], [51.0, 52.76], [61.0, 61.99], [74.0, 74.95], [77.0, 77.13], [79.0, 80.65], [89.0, 89.46], [93.0, 93.63], [95.0, 96.67], [98.0, 98.85], [105.0, 106.1], [109.0, 110.49], [111.0, 112.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [33.49, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 42.59], ["trombone", 21.32], ["brass instrument", 8.02]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.53, 0.95, 0.39, 0.82, 1.76, 0.99, 0.95, 0.13, 1.65, 0.46, 0.63, 1.67, 0.85, 1.1, 1.49, 1.94]} \ No newline at end of file diff --git a/annotations_filtered/bkeLkORd2y4_filtered.json b/annotations_filtered/bkeLkORd2y4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f4ed95d07fdb63119092363df98e7302b4235122 --- /dev/null +++ b/annotations_filtered/bkeLkORd2y4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.1], [3.0, 8.58], [10.0, 14.3], [15.0, 15.42], [31.0, 31.87], [35.0, 35.28], [42.0, 43.17], [48.0, 48.59], [53.0, 56.93]], "keep_status": [false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 52.45, 32.48, 0.0, 0.0, 0.0, 0.0, 0.0, 41.64], "audiomae_on_audioset": [null, null, [["speech", 52.41], ["breaking", 11.52], ["boing", 4.65]], null, null, null, null, null, [["music", 63.67], ["speech", 5.75], ["electronic music", 4.05]]], "duration": [1.1, 5.58, 4.3, 0.42, 0.87, 0.28, 1.17, 0.59, 3.93]} \ No newline at end of file diff --git a/annotations_filtered/bkhUe1txLoc_filtered.json b/annotations_filtered/bkhUe1txLoc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..135af6e52794f0bc2b20c51d7278bca5d8374e9d --- /dev/null +++ b/annotations_filtered/bkhUe1txLoc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.52], [6.0, 6.61], [8.0, 8.24], [9.0, 9.91], [10.0, 10.25], [10.0, 10.3], [10.0, 10.34], [10.0, 10.83], [11.0, 12.46], [13.0, 14.23], [15.0, 18.1], [19.0, 21.69], [24.0, 24.9], [31.0, 31.43], [36.0, 37.29], [41.0, 42.38], [42.0, 43.33], [51.0, 51.31], [55.0, 55.54], [62.0, 61.7], [68.0, 68.71], [76.0, 78.36], [79.0, 80.22], [83.0, 84.05], [91.0, 91.56], [105.0, 105.39], [118.0, 119.28], [123.0, 123.87], [126.0, 126.84], [128.0, 131.26], [131.0, 133.83], [142.0, 143.16], [146.0, 146.91], [150.0, 150.38], [151.0, 152.05], [153.0, 154.67], [157.0, 158.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.97, 60.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.14, 99.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.52, 0.61, 0.24, 0.91, 0.25, 0.3, 0.34, 0.83, 1.46, 1.23, 3.1, 2.69, 0.9, 0.43, 1.29, 1.38, 1.33, 0.31, 0.54, -0.3, 0.71, 2.36, 1.22, 1.05, 0.56, 0.39, 1.28, 0.87, 0.84, 3.26, 2.83, 1.16, 0.91, 0.38, 1.05, 1.67, 1.65]} \ No newline at end of file diff --git a/annotations_filtered/bkpuLB3ftow_filtered.json b/annotations_filtered/bkpuLB3ftow_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..62de798dbc2ce3de579f49dd4bc3930b430f1e77 --- /dev/null +++ b/annotations_filtered/bkpuLB3ftow_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 7.53], [10.0, 10.76], [21.0, 24.17], [25.0, 25.42], [26.0, 26.42], [29.0, 29.52], [30.0, 43.61], [47.0, 52.12], [54.0, 63.96], [66.0, 75.41], [77.0, 77.73], [80.0, 80.92], [82.0, 82.21], [83.0, 87.72], [93.0, 93.95], [96.0, 98.34], [101.0, 107.35], [108.0, 112.01], [116.0, 115.99], [119.0, 119.08]], "keep_status": [false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [47.31, 0.0, 36.91, 0.0, 0.0, 0.0, 61.18, 99.59, 49.87, 98.36, 0.0, 0.0, 0.0, 58.81, 0.0, 85.54, 71.72, 69.47, 0.0, 0.0], "audiomae_on_audioset": [[["clarinet", 50.06], ["music", 26.59], ["musical instrument", 7.78]], null, [["music", 34.39], ["speech", 29.94], ["musical instrument", 5.5]], null, null, null, null, null, [["music", 32.18], ["speech", 15.59], ["noise", 9.8]], null, null, null, null, null, null, null, null, null, null, null], "duration": [7.53, 0.76, 3.17, 0.42, 0.42, 0.52, 13.61, 5.12, 9.96, 9.41, 0.73, 0.92, 0.21, 4.72, 0.95, 2.34, 6.35, 4.01, -0.01, 0.08]} \ No newline at end of file diff --git a/annotations_filtered/bkxVMf2ozrs_filtered.json b/annotations_filtered/bkxVMf2ozrs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3cf71f56b6b2c9f3688add0a34d3997159489203 --- /dev/null +++ b/annotations_filtered/bkxVMf2ozrs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 20.29], [21.0, 23.4], [25.0, 27.01], [28.0, 30.05], [31.0, 33.3], [37.0, 52.12], [57.0, 59.21], [60.0, 61.06], [70.0, 70.87], [72.0, 77.46], [78.0, 79.84], [81.0, 86.0], [87.0, 87.57], [89.0, 89.77], [95.0, 95.98], [97.0, 101.66], [102.0, 107.57], [109.0, 115.7], [118.0, 119.03], [119.0, 125.95], [127.0, 127.52], [129.0, 131.75], [133.0, 133.39], [135.0, 136.04], [137.0, 138.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [99.87, 99.92, 99.78, 81.17, 99.4, 99.31, 100.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0, 100.0, 38.16, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["breaking", 20.87], ["explosion", 13.12], ["burst, pop", 6.89]], null, null, null, null, null, null, null], "duration": [9.29, 2.4, 2.01, 2.05, 2.3, 15.12, 2.21, 1.06, 0.87, 5.46, 1.84, 5.0, 0.57, 0.77, 0.98, 4.66, 5.57, 6.7, 1.03, 6.95, 0.52, 2.75, 0.39, 1.04, 1.7]} \ No newline at end of file diff --git a/annotations_filtered/blDYzZvYAak_filtered.json b/annotations_filtered/blDYzZvYAak_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3813c885db2415dc5e36c3f1d217cbd288842f74 --- /dev/null +++ b/annotations_filtered/blDYzZvYAak_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.47], [19.0, 19.72], [31.0, 38.65], [53.0, 54.09], [57.0, 57.4], [65.0, 66.14], [67.0, 67.54], [73.0, 75.19], [79.0, 81.99], [85.0, 85.35], [97.0, 97.61], [104.0, 105.39], [111.0, 112.65], [120.0, 120.53]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 40.82, 0.0, 0.0, 0.0, 0.0, 37.73, 55.46, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 77.83], ["synthesizer", 8.5], ["musical instrument", 2.42]], null, null, null, null, [["music", 52.54], ["musical instrument", 8.66], ["synthesizer", 6.48]], null, null, null, null, null, null], "duration": [0.47, 0.72, 7.65, 1.09, 0.4, 1.14, 0.54, 2.19, 2.99, 0.35, 0.61, 1.39, 1.65, 0.53]} \ No newline at end of file diff --git a/annotations_filtered/blQ8Wi0VAn0_filtered.json b/annotations_filtered/blQ8Wi0VAn0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b3cdbffb233ec404be08d37d1c8de6ef1af4c28f --- /dev/null +++ b/annotations_filtered/blQ8Wi0VAn0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[40.0, 42.03], [54.0, 64.29], [64.0, 64.44], [65.0, 67.53], [69.0, 69.48], [70.0, 72.79], [74.0, 77.45], [81.0, 80.87], [92.0, 93.28], [96.0, 96.77], [101.0, 103.94], [108.0, 115.87], [120.0, 120.5], [122.0, 122.52], [125.0, 126.6], [129.0, 130.28], [132.0, 132.36]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [36.46, 93.29, 0.0, 87.92, 0.0, 94.22, 75.55, 0.0, 0.0, 0.0, 98.73, 99.76, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 20.01], ["fart", 20.01], ["musical instrument", 8.23]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.03, 10.29, 0.44, 2.53, 0.48, 2.79, 3.45, -0.13, 1.28, 0.77, 2.94, 7.87, 0.5, 0.52, 1.6, 1.28, 0.36]} \ No newline at end of file diff --git a/annotations_filtered/blWBATSOCtA_filtered.json b/annotations_filtered/blWBATSOCtA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e36f4b3e6c334287bc93bc7cd6ccb797f7497614 --- /dev/null +++ b/annotations_filtered/blWBATSOCtA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.57], [3.0, 4.24], [6.0, 6.24], [12.0, 13.76], [15.0, 15.79], [17.0, 18.18], [20.0, 21.41], [22.0, 121.07], [121.0, 122.98]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [1.57, 1.24, 0.24, 1.76, 0.79, 1.18, 1.41, 99.07, 1.98]} \ No newline at end of file diff --git a/annotations_filtered/blbqbdPFfns_filtered.json b/annotations_filtered/blbqbdPFfns_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a6b3eee09fa2312270e896c9f14d233e3ff283f --- /dev/null +++ b/annotations_filtered/blbqbdPFfns_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 10.79], [17.0, 21.57], [22.0, 29.15], [31.0, 37.86], [39.0, 40.34], [42.0, 47.44], [51.0, 54.01], [58.0, 64.66], [67.0, 67.46], [68.0, 78.48], [83.0, 82.98]], "keep_status": [true, false, false, true, false, true, true, false, false, true, false], "silence_prob": [31.76, 36.31, 33.8, 39.85, 0.0, 30.81, 33.34, 60.6, 0.0, 31.16, 0.0], "audiomae_on_audioset": [[["music", 31.35], ["livestock, farm animals, working animals", 14.46], ["cattle, bovinae", 12.27]], [["music", 70.11], ["speech", 13.07], ["electronic music", 1.52]], [["music", 58.4], ["speech", 24.86], ["hum", 4.49]], [["music", 25.18], ["speech", 11.7], ["horse", 10.44]], null, [["speech", 22.81], ["buzz", 16.16], ["fly, housefly", 7.39]], [["mosquito", 15.88], ["crowd", 15.35], ["speech", 11.08]], null, null, [["buzz", 26.04], ["music", 14.94], ["livestock, farm animals, working animals", 10.57]], null], "duration": [8.79, 4.57, 7.15, 6.86, 1.34, 5.44, 3.01, 6.66, 0.46, 10.48, -0.02]} \ No newline at end of file diff --git a/annotations_filtered/bllBC-ThwjQ_filtered.json b/annotations_filtered/bllBC-ThwjQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf962a5336de816c61099d9613adb11687a3e190 --- /dev/null +++ b/annotations_filtered/bllBC-ThwjQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [6.0, 6.91], [8.0, 9.39], [15.0, 15.89], [17.0, 17.09], [28.0, 28.19], [30.0, 30.7], [31.0, 30.97], [32.0, 32.22], [32.0, 32.41], [33.0, 33.93], [35.0, 37.42], [40.0, 41.84], [42.0, 43.95], [44.0, 48.2], [49.0, 49.42], [50.0, 53.23], [55.0, 55.98], [60.0, 61.16], [66.0, 70.92], [72.0, 72.08], [77.0, 77.63], [86.0, 87.51], [89.0, 90.12], [92.0, 103.11], [105.0, 108.23], [108.0, 112.21], [114.0, 115.77], [116.0, 116.55], [117.0, 116.9], [117.0, 117.56], [121.0, 120.97], [122.0, 122.15], [129.0, 130.33], [132.0, 133.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, true, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.08, 0.0, 0.0, 32.22, 0.0, 40.61, 0.0, 0.0, 31.48, 0.0, 0.0, 0.0, 0.0, 31.74, 29.12, 30.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 13.77], ["whale vocalization", 11.43], ["mosquito", 10.96]], null, [["music", 32.46], ["synthesizer", 9.7], ["hum", 7.16]], null, null, [["whale vocalization", 25.52], ["music", 19.94], ["hum", 8.21]], null, null, null, null, [["music", 53.41], ["noise", 8.07], ["insect", 3.8]], [["electric shaver, electric razor", 24.72], ["music", 18.4], ["mains hum", 7.45]], [["electric shaver, electric razor", 47.37], ["speech", 24.16], ["music", 6.66]], null, null, null, null, null, null, null, null], "duration": [0.5, 0.91, 1.39, 0.89, 0.09, 0.19, 0.7, -0.03, 0.22, 0.41, 0.93, 2.42, 1.84, 1.95, 4.2, 0.42, 3.23, 0.98, 1.16, 4.92, 0.08, 0.63, 1.51, 1.12, 11.11, 3.23, 4.21, 1.77, 0.55, -0.1, 0.56, -0.03, 0.15, 1.33, 1.41]} \ No newline at end of file diff --git a/annotations_filtered/bmBh8DSdcnU_filtered.json b/annotations_filtered/bmBh8DSdcnU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..001a548147b11a1e5caed444525dcf0c37cd0c76 --- /dev/null +++ b/annotations_filtered/bmBh8DSdcnU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[96.0, 140.12], [140.0, 145.22], [145.0, 159.75]], "keep_status": [false, true, true], "silence_prob": [0.0, 29.41, 33.96], "audiomae_on_audioset": [null, [["speech", 31.59], ["explosion", 9.38], ["groan", 6.83]], [["speech", 28.81], ["groan", 17.32], ["outside, rural or natural", 5.86]]], "duration": [44.12, 5.22, 14.75]} \ No newline at end of file diff --git a/annotations_filtered/bmJ4doOPxd8_filtered.json b/annotations_filtered/bmJ4doOPxd8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4119064d796d170a992922e38fdf1690273b8a85 --- /dev/null +++ b/annotations_filtered/bmJ4doOPxd8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.21], [14.0, 15.82], [17.0, 17.71], [19.0, 18.69], [19.0, 21.15], [23.0, 23.38], [25.0, 25.41], [31.0, 36.56], [43.0, 43.51], [47.0, 47.43], [53.0, 56.59], [59.0, 60.42], [61.0, 64.2], [67.0, 67.71], [77.0, 78.68], [82.0, 84.13], [90.0, 90.04], [92.0, 101.71], [102.0, 103.25], [105.0, 105.11], [106.0, 106.79]], "keep_status": [false, false, false, false, true, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [34.91, 0.0, 0.0, 0.0, 41.34, 0.0, 0.0, 43.87, 0.0, 0.0, 38.56, 0.0, 58.89, 0.0, 0.0, 51.77, 0.0, 32.3, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["sidetone", 37.1], ["speech", 21.18], ["sine wave", 16.9]], null, null, null, [["sidetone", 37.5], ["speech", 14.66], ["radio", 3.96]], null, null, [["music", 53.39], ["speech", 5.82], ["cattle, bovinae", 4.74]], null, null, [["speech", 30.13], ["sidetone", 11.55], ["music", 10.57]], null, null, null, null, null, null, [["music", 76.41], ["didgeridoo", 8.54], ["musical instrument", 2.22]], null, null, null], "duration": [2.21, 1.82, 0.71, -0.31, 2.15, 0.38, 0.41, 5.56, 0.51, 0.43, 3.59, 1.42, 3.2, 0.71, 1.68, 2.13, 0.04, 9.71, 1.25, 0.11, 0.79]} \ No newline at end of file diff --git a/annotations_filtered/bmdgHN34hnk_filtered.json b/annotations_filtered/bmdgHN34hnk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..540412f0e354f5353f49722935048f518cd8f6fa --- /dev/null +++ b/annotations_filtered/bmdgHN34hnk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.14], [24.0, 25.02], [31.0, 31.43], [37.0, 37.49], [50.0, 50.8], [53.0, 53.62], [56.0, 55.98], [62.0, 61.92], [67.0, 68.84], [70.0, 72.69], [73.0, 75.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.71, 75.55], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [0.14, 1.02, 0.43, 0.49, 0.8, 0.62, -0.02, -0.08, 1.84, 2.69, 2.71]} \ No newline at end of file diff --git a/annotations_filtered/bmeh1eFkyHg_filtered.json b/annotations_filtered/bmeh1eFkyHg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ccd84014f75aee263fd94c5c79288eafcd02b0c --- /dev/null +++ b/annotations_filtered/bmeh1eFkyHg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 37.59], [41.0, 87.61]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [35.59, 46.61]} \ No newline at end of file diff --git a/annotations_filtered/bmmxeZEnsL0_filtered.json b/annotations_filtered/bmmxeZEnsL0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e9662eee2f106c882a7ca03e800e3cce2c9343f --- /dev/null +++ b/annotations_filtered/bmmxeZEnsL0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.79], [8.0, 8.83], [16.0, 16.39], [18.0, 20.04], [32.0, 36.76], [68.0, 70.39], [72.0, 76.89], [81.0, 92.64]], "keep_status": [false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 37.19, 34.49, 32.73, 32.1, 32.94], "audiomae_on_audioset": [null, null, null, [["music", 58.05], ["speech", 12.26], ["electronic music", 5.04]], [["music", 74.59], ["musical instrument", 5.15], ["speech", 3.15]], [["music", 67.24], ["swing music", 3.99], ["speech", 3.18]], [["music", 57.02], ["swing music", 14.91], ["musical instrument", 3.57]], [["music", 48.47], ["speech", 11.72], ["drum kit", 3.99]]], "duration": [0.79, 0.83, 0.39, 2.04, 4.76, 2.39, 4.89, 11.64]} \ No newline at end of file diff --git a/annotations_filtered/bnLhMGzgfSM_filtered.json b/annotations_filtered/bnLhMGzgfSM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5cc5a4904a074f515969577d888334fd88d2b6e8 --- /dev/null +++ b/annotations_filtered/bnLhMGzgfSM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.13], [5.0, 6.29], [7.0, 20.58], [22.0, 25.57], [26.0, 29.46], [47.0, 50.46], [58.0, 68.76], [70.0, 71.07], [73.0, 73.23], [74.0, 74.78], [78.0, 83.22], [88.0, 94.1], [101.0, 103.2], [104.0, 105.0], [108.0, 109.98], [111.0, 112.08], [125.0, 126.4], [127.0, 128.39], [129.0, 131.65], [136.0, 137.15], [138.0, 139.4], [140.0, 145.32], [146.0, 148.54], [152.0, 153.55], [155.0, 155.63], [158.0, 163.63], [165.0, 168.57]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 88.46, 95.64, 78.72, 99.56, 42.79, 0.0, 0.0, 0.0, 100.0, 98.99, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 99.99, 100.0, 0.0, 0.0, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["fly, housefly", 40.4], ["insect", 16.01], ["frog", 8.73]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.13, 1.29, 13.58, 3.57, 3.46, 3.46, 10.76, 1.07, 0.23, 0.78, 5.22, 6.1, 2.2, 1.0, 1.98, 1.08, 1.4, 1.39, 2.65, 1.15, 1.4, 5.32, 2.54, 1.55, 0.63, 5.63, 3.57]} \ No newline at end of file diff --git a/annotations_filtered/bn_Df5UNy3s_filtered.json b/annotations_filtered/bn_Df5UNy3s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..40ad8b04ae5025a405beacda02a36d37148c429b --- /dev/null +++ b/annotations_filtered/bn_Df5UNy3s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 95.74], [96.0, 122.12]], "keep_status": [false, true], "silence_prob": [0.0, 29.41], "audiomae_on_audioset": [null, [["music", 30.13], ["cattle, bovinae", 10.11], ["moo", 9.72]]], "duration": [69.74, 26.12]} \ No newline at end of file diff --git a/annotations_filtered/bnitvEUDaBE_filtered.json b/annotations_filtered/bnitvEUDaBE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4746f6973b466d86d73654ba906607e42c91c7a5 --- /dev/null +++ b/annotations_filtered/bnitvEUDaBE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.3], [6.0, 6.2], [11.0, 14.0], [15.0, 16.88], [21.0, 21.83], [23.0, 24.11], [24.0, 36.83], [63.0, 63.73], [72.0, 72.08], [80.0, 80.76], [83.0, 86.54], [87.0, 87.67], [89.0, 89.02], [89.0, 92.15], [93.0, 94.0], [94.0, 94.93], [99.0, 99.84], [101.0, 101.78], [102.0, 112.63], [114.0, 119.25], [120.0, 126.91]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 85.54, 0.0, 0.0, 0.0, 31.84, 0.0, 0.0, 0.0, 54.7, 0.0, 0.0, 33.75, 0.0, 0.0, 0.0, 0.0, 51.99, 59.59, 35.76], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 47.15], ["sidetone", 10.68], ["electric shaver, electric razor", 9.32]], null, null, null, null, null, null, [["speech", 51.16], ["radio", 20.28], ["sidetone", 16.0]], null, null, null, null, null, null, [["fly, housefly", 29.07], ["speech", 19.36], ["insect", 17.55]]], "duration": [0.3, 0.2, 3.0, 1.88, 0.83, 1.11, 12.83, 0.73, 0.08, 0.76, 3.54, 0.67, 0.02, 3.15, 1.0, 0.93, 0.84, 0.78, 10.63, 5.25, 6.91]} \ No newline at end of file diff --git a/annotations_filtered/boCpijI2k5I_filtered.json b/annotations_filtered/boCpijI2k5I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e26404e8c87b0dc3369f427d86b2dcea11654197 --- /dev/null +++ b/annotations_filtered/boCpijI2k5I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.02], [3.0, 4.09], [8.0, 8.88], [11.0, 11.33], [12.0, 13.05], [15.0, 16.14], [18.0, 18.93], [21.0, 21.88], [27.0, 27.55], [29.0, 29.2], [30.0, 31.35], [34.0, 34.7], [38.0, 41.61], [43.0, 44.64], [50.0, 51.27], [54.0, 54.84], [58.0, 58.95], [61.0, 61.43], [62.0, 62.55], [67.0, 69.77], [71.0, 72.13], [83.0, 83.61], [86.0, 86.1], [86.0, 86.51], [87.0, 88.37], [89.0, 90.24], [93.0, 93.73], [95.0, 95.64], [100.0, 100.68], [104.0, 104.04], [105.0, 106.03], [109.0, 108.92], [110.0, 110.88], [111.0, 112.87], [128.0, 129.02], [129.0, 130.06], [132.0, 132.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.02, 1.09, 0.88, 0.33, 1.05, 1.14, 0.93, 0.88, 0.55, 0.2, 1.35, 0.7, 3.61, 1.64, 1.27, 0.84, 0.95, 0.43, 0.55, 2.77, 1.13, 0.61, 0.1, 0.51, 1.37, 1.24, 0.73, 0.64, 0.68, 0.04, 1.03, -0.08, 0.88, 1.87, 1.02, 1.06, 0.58]} \ No newline at end of file diff --git a/annotations_filtered/boGgXcQIe-8_filtered.json b/annotations_filtered/boGgXcQIe-8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..be56f0e5d1d7880cc4eccad73ce317c687288059 --- /dev/null +++ b/annotations_filtered/boGgXcQIe-8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.4], [5.0, 9.32], [11.0, 14.52], [16.0, 16.95], [20.0, 20.6], [21.0, 21.63], [22.0, 22.98], [24.0, 24.75], [29.0, 29.27], [32.0, 38.31], [40.0, 43.48], [47.0, 50.41], [51.0, 54.82], [57.0, 102.22], [109.0, 109.56], [112.0, 111.99], [113.0, 113.91], [121.0, 121.2]], "keep_status": [false, true, true, false, false, false, false, false, false, true, true, false, true, false, false, false, false, false], "silence_prob": [0.0, 30.93, 46.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.83, 40.61, 39.52, 40.24, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 24.61], ["music", 22.82], ["hum", 13.68]], [["hum", 27.71], ["music", 11.0], ["vehicle", 8.49]], null, null, null, null, null, null, [["speech", 14.4], ["music", 9.41], ["singing bowl", 6.8]], [["speech", 25.51], ["rumble", 21.17], ["whale vocalization", 21.07]], [["rumble", 29.51], ["whale vocalization", 25.7], ["speech", 14.94]], [["whale vocalization", 25.17], ["rumble", 20.52], ["hum", 8.81]], null, null, null, null, null], "duration": [1.4, 4.32, 3.52, 0.95, 0.6, 0.63, 0.98, 0.75, 0.27, 6.31, 3.48, 3.41, 3.82, 45.22, 0.56, -0.01, 0.91, 0.2]} \ No newline at end of file diff --git a/annotations_filtered/bolHm17q3ik_filtered.json b/annotations_filtered/bolHm17q3ik_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..10d1ea59a77762da37c9931191699c626840ccfd --- /dev/null +++ b/annotations_filtered/bolHm17q3ik_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[112.0, 114.42], [115.0, 116.72], [118.0, 118.5], [120.0, 131.85]], "keep_status": [true, false, false, true], "silence_prob": [38.8, 0.0, 0.0, 35.05], "audiomae_on_audioset": [[["speech", 39.64], ["music", 8.78], ["hum", 4.55]], null, null, [["music", 49.51], ["speech", 6.3], ["musical instrument", 5.61]]], "duration": [2.42, 1.72, 0.5, 11.85]} \ No newline at end of file diff --git a/annotations_filtered/bp5HRI2hEW0_filtered.json b/annotations_filtered/bp5HRI2hEW0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4fad258bdaa770845b3e2c6c08e1b0123fa3a111 --- /dev/null +++ b/annotations_filtered/bp5HRI2hEW0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[81.0, 85.4]], "keep_status": [false], "silence_prob": [65.67], "audiomae_on_audioset": [null], "duration": [4.4]} \ No newline at end of file diff --git a/annotations_filtered/bpNxVXA5dcQ_filtered.json b/annotations_filtered/bpNxVXA5dcQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..523497a2d713c03d9447d68a11d4e427b39049da --- /dev/null +++ b/annotations_filtered/bpNxVXA5dcQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.24], [9.0, 9.9], [10.0, 30.23], [35.0, 36.21], [37.0, 37.71], [38.0, 43.14], [52.0, 52.98], [54.0, 54.38], [55.0, 57.69], [58.0, 61.16], [62.0, 64.74], [66.0, 117.88], [121.0, 127.53]], "keep_status": [false, false, true, false, false, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 32.05, 0.0, 0.0, 33.64, 0.0, 0.0, 47.98, 42.15, 44.29, 0.0, 99.98], "audiomae_on_audioset": [null, null, [["music", 47.77], ["didgeridoo", 8.37], ["hum", 4.23]], null, null, [["music", 39.66], ["speech", 27.48], ["hum", 6.36]], null, null, [["music", 25.4], ["speech", 15.15], ["effects unit", 11.74]], [["music", 49.66], ["speech", 12.33], ["musical instrument", 11.29]], [["music", 51.92], ["bass guitar", 5.63], ["plucked string instrument", 5.48]], null, null], "duration": [1.24, 0.9, 20.23, 1.21, 0.71, 5.14, 0.98, 0.38, 2.69, 3.16, 2.74, 51.88, 6.53]} \ No newline at end of file diff --git a/annotations_filtered/bp_GxHYCq90_filtered.json b/annotations_filtered/bp_GxHYCq90_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d02476d694366b3f76ca12206e1c112e158bfb29 --- /dev/null +++ b/annotations_filtered/bp_GxHYCq90_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 4.26], [6.0, 7.05], [10.0, 10.37], [12.0, 13.37], [24.0, 29.96], [38.0, 40.71], [43.0, 43.55], [46.0, 51.27], [52.0, 52.27], [53.0, 63.14], [65.0, 77.04], [78.0, 78.85], [80.0, 92.58], [95.0, 99.13], [105.0, 107.15], [111.0, 112.68], [116.0, 119.55], [123.0, 124.53], [127.0, 130.03]], "keep_status": [true, false, false, false, true, false, false, false, false, false, false, false, true, true, true, false, true, false, true], "silence_prob": [29.28, 0.0, 0.0, 0.0, 29.11, 28.76, 0.0, 28.82, 0.0, 28.74, 29.69, 0.0, 28.44, 28.5, 29.16, 0.0, 28.29, 0.0, 28.11], "audiomae_on_audioset": [[["fart", 26.26], ["speech", 8.88], ["boing", 7.44]], null, null, null, [["music", 32.02], ["speech", 19.27], ["throbbing", 4.96]], [["speech", 72.76], ["music", 5.13], ["machine gun", 4.78]], null, [["music", 67.3], ["speech", 17.8], ["gunshot, gunfire", 1.93]], null, [["music", 46.45], ["speech", 27.14], ["whack, thwack", 4.12]], [["music", 33.99], ["speech", 27.36], ["throbbing", 20.34]], null, [["music", 30.96], ["hum", 21.71], ["mains hum", 10.4]], [["music", 52.9], ["throbbing", 10.6], ["musical instrument", 4.46]], [["mains hum", 30.11], ["hum", 25.63], ["speech", 7.28]], null, [["hum", 29.28], ["speech", 18.97], ["mains hum", 17.33]], null, [["music", 26.66], ["hum", 11.15], ["mains hum", 8.67]]], "duration": [4.26, 1.05, 0.37, 1.37, 5.96, 2.71, 0.55, 5.27, 0.27, 10.14, 12.04, 0.85, 12.58, 4.13, 2.15, 1.68, 3.55, 1.53, 3.03]} \ No newline at end of file diff --git a/annotations_filtered/bpc3TKhS6MU_filtered.json b/annotations_filtered/bpc3TKhS6MU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8b8a258b192f060a6ee3c188a51cfaaa74857e2b --- /dev/null +++ b/annotations_filtered/bpc3TKhS6MU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.13], [5.0, 11.91], [14.0, 14.79], [16.0, 22.23], [24.0, 30.32], [31.0, 32.54], [36.0, 37.5], [39.0, 40.93], [42.0, 43.16], [45.0, 48.56], [53.0, 54.24], [55.0, 58.36], [61.0, 70.04], [71.0, 84.72], [86.0, 94.76], [101.0, 110.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true], "silence_prob": [62.99, 93.6, 0.0, 96.42, 50.56, 0.0, 0.0, 0.0, 0.0, 65.2, 0.0, 54.36, 38.8, 35.34, 34.51, 35.4], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 82.82], ["musical instrument", 3.9], ["synthesizer", 3.02]], [["music", 46.48], ["wind instrument, woodwind instrument", 8.56], ["musical instrument", 7.7]], [["music", 46.57], ["brass instrument", 11.76], ["saxophone", 9.45]], [["music", 51.62], ["musical instrument", 5.82], ["percussion", 4.06]]], "duration": [2.13, 6.91, 0.79, 6.23, 6.32, 1.54, 1.5, 1.93, 1.16, 3.56, 1.24, 3.36, 9.04, 13.72, 8.76, 9.17]} \ No newline at end of file diff --git a/annotations_filtered/bpcwhWgWfCc_filtered.json b/annotations_filtered/bpcwhWgWfCc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..069154d0f09ff9e430c3b7d0e67fece89fb2d53f --- /dev/null +++ b/annotations_filtered/bpcwhWgWfCc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 18.32], [20.0, 25.35], [29.0, 45.5], [47.0, 48.63], [54.0, 55.46], [56.0, 56.49], [57.0, 57.77], [58.0, 59.31]], "keep_status": [false, true, true, false, false, false, false, false], "silence_prob": [76.7, 31.6, 49.87, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 16.76], ["cacophony", 10.17], ["reverberation", 8.41]], [["music", 43.12], ["didgeridoo", 13.85], ["effects unit", 5.72]], null, null, null, null, null], "duration": [16.32, 5.35, 16.5, 1.63, 1.46, 0.49, 0.77, 1.31]} \ No newline at end of file diff --git a/annotations_filtered/bqPbkGVa_wc_filtered.json b/annotations_filtered/bqPbkGVa_wc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..96a25360aece8fbbf5f06bc1374e93521a030770 --- /dev/null +++ b/annotations_filtered/bqPbkGVa_wc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 21.29], [22.0, 27.14], [28.0, 29.24], [32.0, 38.52], [39.0, 43.87], [45.0, 101.31], [105.0, 113.46], [116.0, 122.22], [124.0, 131.73]], "keep_status": [false, false, false, false, false, false, true, true, true], "silence_prob": [53.53, 60.98, 0.0, 80.64, 76.04, 0.0, 36.76, 36.15, 40.04], "audiomae_on_audioset": [null, null, null, null, null, null, [["sidetone", 21.59], ["speech", 11.88], ["siren", 7.65]], [["pulse", 29.75], ["hum", 24.07], ["throbbing", 10.69]], [["police car (siren)", 20.06], ["emergency vehicle", 16.31], ["siren", 9.19]]], "duration": [4.29, 5.14, 1.24, 6.52, 4.87, 56.31, 8.46, 6.22, 7.73]} \ No newline at end of file diff --git a/annotations_filtered/bq_WJS_HlPc_filtered.json b/annotations_filtered/bq_WJS_HlPc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f170d3ea159468659afeb3ecb8a67fe300dccd8b --- /dev/null +++ b/annotations_filtered/bq_WJS_HlPc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 44.2], [47.0, 51.34], [53.0, 55.68], [57.0, 61.32], [64.0, 67.46], [69.0, 72.62], [76.0, 88.6], [92.0, 148.34]], "keep_status": [true, true, false, true, true, true, false, false], "silence_prob": [28.71, 30.16, 29.97, 30.0, 29.01, 29.81, 29.33, 0.0], "audiomae_on_audioset": [[["music", 27.17], ["whack, thwack", 11.8], ["speech", 10.45]], [["livestock, farm animals, working animals", 21.95], ["music", 18.9], ["cattle, bovinae", 15.32]], [["music", 36.7], ["throbbing", 21.95], ["hum", 11.66]], [["mains hum", 32.11], ["hum", 16.92], ["music", 14.44]], [["music", 16.8], ["mains hum", 11.2], ["speech", 10.37]], [["music", 37.11], ["speech", 18.16], ["hum", 5.62]], [["music", 64.4], ["throbbing", 5.31], ["hum", 5.22]], null], "duration": [23.2, 4.34, 2.68, 4.32, 3.46, 3.62, 12.6, 56.34]} \ No newline at end of file diff --git a/annotations_filtered/bqvMCDQ3HEU_filtered.json b/annotations_filtered/bqvMCDQ3HEU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6e99468cbcf003ad6cd2cb379837878813e73e8 --- /dev/null +++ b/annotations_filtered/bqvMCDQ3HEU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.32], [10.0, 13.12], [14.0, 16.65], [35.0, 36.12], [38.0, 46.2], [50.0, 55.26], [55.0, 118.76], [119.0, 119.82], [122.0, 122.91], [126.0, 137.24], [138.0, 140.1], [144.0, 145.1], [146.0, 147.73], [152.0, 153.44]], "keep_status": [false, true, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 49.68, 60.14, 0.0, 53.97, 39.07, 0.0, 0.0, 0.0, 42.88, 54.76, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 38.4], ["music", 22.22], ["didgeridoo", 6.41]], null, null, null, [["animal", 17.2], ["music", 10.43], ["clip-clop", 7.73]], null, null, null, [["speech", 65.42], ["electric shaver, electric razor", 7.79], ["buzz", 6.91]], null, null, null, null], "duration": [0.32, 3.12, 2.65, 1.12, 8.2, 5.26, 63.76, 0.82, 0.91, 11.24, 2.1, 1.1, 1.73, 1.44]} \ No newline at end of file diff --git a/annotations_filtered/bqwH3cQUlNA_filtered.json b/annotations_filtered/bqwH3cQUlNA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a313e4ff942ae011d623be8b4311c4cc41c4ee3d --- /dev/null +++ b/annotations_filtered/bqwH3cQUlNA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 35.43], [36.0, 36.21], [39.0, 38.89], [43.0, 43.61], [44.0, 45.47], [46.0, 48.02], [49.0, 50.33], [51.0, 52.68], [54.0, 55.88], [66.0, 71.46], [72.0, 73.13], [75.0, 77.33], [92.0, 92.08], [97.0, 98.59], [101.0, 100.92], [102.0, 103.01], [107.0, 135.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true], "silence_prob": [30.77, 0.0, 0.0, 0.0, 0.0, 90.43, 0.0, 0.0, 0.0, 90.08, 0.0, 32.8, 0.0, 0.0, 0.0, 0.0, 30.75], "audiomae_on_audioset": [[["music", 54.43], ["throbbing", 10.0], ["hum", 6.01]], null, null, null, null, null, null, null, null, null, null, [["music", 55.59], ["singing bowl", 7.56], ["musical instrument", 3.36]], null, null, null, null, [["music", 38.25], ["speech", 23.45], ["hum", 6.0]]], "duration": [13.43, 0.21, -0.11, 0.61, 1.47, 2.02, 1.33, 1.68, 1.88, 5.46, 1.13, 2.33, 0.08, 1.59, -0.08, 1.01, 28.9]} \ No newline at end of file diff --git a/annotations_filtered/bqwS3qz3GhE_filtered.json b/annotations_filtered/bqwS3qz3GhE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d4afe153376a7af4f9588e533d51312b8f7cd9c --- /dev/null +++ b/annotations_filtered/bqwS3qz3GhE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[46.0, 48.69], [50.0, 51.44], [55.0, 55.8], [59.0, 60.22], [61.0, 61.38], [62.0, 149.35], [150.0, 153.69], [156.0, 156.47], [165.0, 167.51]], "keep_status": [false, false, false, false, false, false, true, false, false], "silence_prob": [72.31, 0.0, 0.0, 0.0, 0.0, 0.0, 45.72, 0.0, 82.61], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 30.73], ["fire", 13.45], ["mains hum", 9.79]], null, null], "duration": [2.69, 1.44, 0.8, 1.22, 0.38, 87.35, 3.69, 0.47, 2.51]} \ No newline at end of file diff --git a/annotations_filtered/bqxDIHYcp9g_filtered.json b/annotations_filtered/bqxDIHYcp9g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1302b7089c31bf5728a1ec25fba4ad6e88b05e8d --- /dev/null +++ b/annotations_filtered/bqxDIHYcp9g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 51.66], [54.0, 66.06], [68.0, 88.06], [89.0, 103.25], [104.0, 118.86]], "keep_status": [false, false, false, false, false], "silence_prob": [96.66, 91.47, 82.43, 86.64, 81.89], "audiomae_on_audioset": [null, null, null, null, null], "duration": [20.66, 12.06, 20.06, 14.25, 14.86]} \ No newline at end of file diff --git a/annotations_filtered/br2rj_3KW1A_filtered.json b/annotations_filtered/br2rj_3KW1A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ab79f635adc687793a69bfc55a998621129e90e --- /dev/null +++ b/annotations_filtered/br2rj_3KW1A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.71], [26.0, 26.49], [30.0, 30.48], [35.0, 35.75], [38.0, 38.69], [39.0, 39.18], [44.0, 45.87], [55.0, 55.7], [56.0, 57.45], [62.0, 65.82], [66.0, 68.84], [70.0, 91.86], [92.0, 103.32], [105.0, 107.59], [112.0, 114.3]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.0, 31.4, 29.16, 28.76, 30.16, 30.11], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 33.44], ["hum", 17.19], ["mains hum", 10.01]], [["music", 23.79], ["didgeridoo", 18.14], ["mains hum", 8.55]], [["music", 55.89], ["throbbing", 20.47], ["hum", 6.53]], [["music", 53.6], ["hum", 9.3], ["throbbing", 5.62]], [["music", 18.13], ["explosion", 7.92], ["groan", 7.25]], [["music", 34.33], ["speech", 28.46], ["boing", 11.52]]], "duration": [0.71, 0.49, 0.48, 0.75, 0.69, 0.18, 1.87, 0.7, 1.45, 3.82, 2.84, 21.86, 11.32, 2.59, 2.3]} \ No newline at end of file diff --git a/annotations_filtered/brTGAgUYnIc_filtered.json b/annotations_filtered/brTGAgUYnIc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..921df8c3ea480e9eee68c30676063e8a052ee009 --- /dev/null +++ b/annotations_filtered/brTGAgUYnIc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.18], [5.0, 5.66], [6.0, 7.52], [10.0, 10.66], [30.0, 31.53], [33.0, 33.61], [37.0, 37.79], [40.0, 40.05], [42.0, 42.84], [43.0, 45.23], [52.0, 57.57], [62.0, 62.28], [63.0, 72.89], [75.0, 78.87], [82.0, 82.26], [82.0, 88.01]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.86, 51.55, 0.0, 43.15, 45.33, 0.0, 41.44], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["whale vocalization", 40.39], ["frog", 18.7], ["radio", 5.34]], null, null, [["music", 51.12], ["speech", 19.73], ["synthesizer", 8.5]], [["music", 27.13], ["throbbing", 8.04], ["electronic music", 6.92]], null, [["music", 37.95], ["throbbing", 17.72], ["hum", 15.05]]], "duration": [0.18, 0.66, 1.52, 0.66, 1.53, 0.61, 0.79, 0.05, 0.84, 2.23, 5.57, 0.28, 9.89, 3.87, 0.26, 6.01]} \ No newline at end of file diff --git a/annotations_filtered/bryVfEK0U4k_filtered.json b/annotations_filtered/bryVfEK0U4k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0633f5b870ca60a99c20c0993aa25140d7fb55c4 --- /dev/null +++ b/annotations_filtered/bryVfEK0U4k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.21], [10.0, 10.08], [13.0, 13.64], [16.0, 17.83], [18.0, 18.57], [19.0, 20.82], [30.0, 30.45], [33.0, 32.9], [44.0, 44.88], [49.0, 48.81], [54.0, 53.91], [57.0, 57.89], [60.0, 59.95], [65.0, 65.37], [71.0, 71.27], [73.0, 73.18], [75.0, 76.71], [100.0, 100.3], [105.0, 105.02], [106.0, 106.29], [111.0, 111.11], [112.0, 112.8], [120.0, 122.82], [124.0, 125.91], [133.0, 133.79], [135.0, 135.41], [150.0, 150.35], [169.0, 169.87], [172.0, 173.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.21, 0.08, 0.64, 1.83, 0.57, 1.82, 0.45, -0.1, 0.88, -0.19, -0.09, 0.89, -0.05, 0.37, 0.27, 0.18, 1.71, 0.3, 0.02, 0.29, 0.11, 0.8, 2.82, 1.91, 0.79, 0.41, 0.35, 0.87, 1.57]} \ No newline at end of file diff --git a/annotations_filtered/bsaA903oxvc_filtered.json b/annotations_filtered/bsaA903oxvc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/bsaA903oxvc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/bt6-F11LZsQ_filtered.json b/annotations_filtered/bt6-F11LZsQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ada275c53672477f2143cf38ae325a85f110dcdf --- /dev/null +++ b/annotations_filtered/bt6-F11LZsQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 34.84], [42.0, 46.38]], "keep_status": [false, true], "silence_prob": [39.98, 33.85], "audiomae_on_audioset": [[["music", 83.33], ["electronic music", 1.97], ["funk", 1.48]], [["music", 43.36], ["sidetone", 13.76], ["boing", 11.3]]], "duration": [7.84, 4.38]} \ No newline at end of file diff --git a/annotations_filtered/btMisVovQKk_filtered.json b/annotations_filtered/btMisVovQKk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..088b21fb54c54f0a56713ea109d96ed996d809da --- /dev/null +++ b/annotations_filtered/btMisVovQKk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.87], [9.0, 8.68], [15.0, 14.82], [19.0, 19.41], [25.0, 25.25], [27.0, 27.6], [36.0, 37.08], [38.0, 38.26], [44.0, 44.44], [45.0, 46.75], [60.0, 60.24], [65.0, 65.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.13, -0.32, -0.18, 0.41, 0.25, 0.6, 1.08, 0.26, 0.44, 1.75, 0.24, 0.64]} \ No newline at end of file diff --git a/annotations_filtered/btRNa3CItMc_filtered.json b/annotations_filtered/btRNa3CItMc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a76d1dfb65a2e21ec6b8786bd5413abb59162e73 --- /dev/null +++ b/annotations_filtered/btRNa3CItMc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.18], [5.0, 5.93], [9.0, 11.47], [18.0, 44.29], [47.0, 47.73], [48.0, 49.62], [50.0, 65.96], [87.0, 90.02], [94.0, 94.71], [102.0, 102.57], [103.0, 105.27], [107.0, 108.18]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [51.07, 0.0, 91.47, 90.25, 0.0, 0.0, 98.86, 45.27, 0.0, 0.0, 53.28, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 34.71], ["speech", 19.01], ["musical instrument", 4.33]], null, null, null, null], "duration": [2.18, 0.93, 2.47, 26.29, 0.73, 1.62, 15.96, 3.02, 0.71, 0.57, 2.27, 1.18]} \ No newline at end of file diff --git a/annotations_filtered/btVoaFC1Aqk_filtered.json b/annotations_filtered/btVoaFC1Aqk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8c80f3a2eb803981b2c6a5d98a1f4fc60b613405 --- /dev/null +++ b/annotations_filtered/btVoaFC1Aqk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 38.03], [39.0, 40.78], [43.0, 49.84], [53.0, 55.76], [58.0, 62.21], [63.0, 75.71], [77.0, 76.94], [80.0, 88.6], [90.0, 92.08], [94.0, 94.37]], "keep_status": [false, false, false, true, false, false, false, true, true, false], "silence_prob": [30.24, 0.0, 29.51, 29.41, 30.88, 29.5, 0.0, 30.89, 30.02, 0.0], "audiomae_on_audioset": [[["music", 76.44], ["electronic music", 4.01], ["synthesizer", 3.06]], null, [["throbbing", 36.63], ["hum", 29.41], ["music", 7.2]], [["music", 44.3], ["speech", 17.48], ["breaking", 7.27]], [["hum", 37.69], ["music", 17.51], ["throbbing", 16.34]], [["music", 51.07], ["hum", 21.16], ["throbbing", 14.08]], null, [["speech", 39.19], ["bee, wasp, etc.", 14.43], ["fly, housefly", 11.64]], [["music", 20.44], ["didgeridoo", 17.86], ["speech", 8.56]], null], "duration": [23.03, 1.78, 6.84, 2.76, 4.21, 12.71, -0.06, 8.6, 2.08, 0.37]} \ No newline at end of file diff --git a/annotations_filtered/btWDXgrF-bo_filtered.json b/annotations_filtered/btWDXgrF-bo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..298ed84d3b8de9ed750177ab3c004b4f3611be7e --- /dev/null +++ b/annotations_filtered/btWDXgrF-bo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.89], [4.0, 5.24], [7.0, 30.1], [33.0, 44.31], [45.0, 46.18], [48.0, 48.57], [49.0, 50.19], [51.0, 53.72], [56.0, 56.46], [57.0, 62.53], [68.0, 68.15], [72.0, 73.79], [78.0, 82.68], [91.0, 91.94], [95.0, 102.03], [104.0, 103.62], [107.0, 107.69], [111.0, 111.64], [114.0, 114.22], [115.0, 115.72], [117.0, 117.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 36.13, 56.33, 0.0, 0.0, 0.0, 71.87, 0.0, 55.39, 0.0, 0.0, 49.92, 0.0, 46.57, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 88.42], ["singing", 1.01], ["guitar", 0.93]], null, null, null, null, null, null, null, null, null, [["music", 66.27], ["musical instrument", 3.84], ["throbbing", 2.74]], null, [["music", 73.53], ["throbbing", 2.96], ["sampler", 2.0]], null, null, null, null, null, null], "duration": [0.89, 1.24, 23.1, 11.31, 1.18, 0.57, 1.19, 2.72, 0.46, 5.53, 0.15, 1.79, 4.68, 0.94, 7.03, -0.38, 0.69, 0.64, 0.22, 0.72, 0.21]} \ No newline at end of file diff --git a/annotations_filtered/btfIH4Q2BQA_filtered.json b/annotations_filtered/btfIH4Q2BQA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..868faf3a54cea19e9c9504cf04edbf58ea1329da --- /dev/null +++ b/annotations_filtered/btfIH4Q2BQA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.72], [7.0, 8.13], [9.0, 12.18], [14.0, 17.74], [19.0, 20.12], [21.0, 23.16], [23.0, 27.03], [27.0, 27.53], [32.0, 32.05], [33.0, 33.89], [35.0, 35.92], [38.0, 38.52], [41.0, 41.96], [43.0, 44.12], [46.0, 45.77], [46.0, 48.73], [49.0, 50.55], [51.0, 51.51], [52.0, 52.74], [54.0, 55.17], [57.0, 57.54], [62.0, 63.14], [65.0, 66.6], [68.0, 68.93], [70.0, 70.88], [74.0, 74.09], [76.0, 78.26], [80.0, 80.1], [83.0, 91.22], [95.0, 95.2], [100.0, 104.35], [106.0, 106.78], [109.0, 112.16], [115.0, 116.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 45.95, 86.27, 0.0, 84.98, 31.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.37, 0.0, 58.81, 0.0, 48.82, 0.0, 57.25, 0.0], "audiomae_on_audioset": [null, null, [["speech", 65.33], ["hum", 4.18], ["inside, small room", 3.42]], null, null, null, [["breaking", 47.09], ["speech", 43.34], ["glass", 3.49]], null, null, null, null, null, null, null, null, [["music", 42.47], ["speech", 17.09], ["sidetone", 10.1]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 35.64], ["mains hum", 19.04], ["speech", 6.94]], null, null, null], "duration": [1.72, 1.13, 3.18, 3.74, 1.12, 2.16, 4.03, 0.53, 0.05, 0.89, 0.92, 0.52, 0.96, 1.12, -0.23, 2.73, 1.55, 0.51, 0.74, 1.17, 0.54, 1.14, 1.6, 0.93, 0.88, 0.09, 2.26, 0.1, 8.22, 0.2, 4.35, 0.78, 3.16, 1.51]} \ No newline at end of file diff --git a/annotations_filtered/btk4Wp0RssY_filtered.json b/annotations_filtered/btk4Wp0RssY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..501588b6822a9bc45785b0f8d0ccde3d49aff0be --- /dev/null +++ b/annotations_filtered/btk4Wp0RssY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.24], [5.0, 6.44], [8.0, 10.35], [12.0, 12.61], [16.0, 17.83], [20.0, 21.71], [25.0, 26.45], [29.0, 30.23], [33.0, 35.28], [36.0, 38.62], [40.0, 45.89], [48.0, 49.4], [51.0, 52.29], [54.0, 55.98], [58.0, 59.49], [60.0, 60.3], [63.0, 64.1], [66.0, 67.41], [69.0, 71.02], [73.0, 74.53], [79.0, 81.18], [88.0, 88.28], [90.0, 90.88], [92.0, 98.51], [100.0, 99.81], [106.0, 112.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, true], "silence_prob": [62.78, 0.0, 97.83, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 99.84, 87.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.64, 0.0, 43.69, 0.0, 0.0, 49.54, 0.0, 39.3], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["chirp tone", 51.7], ["speech", 7.81], ["sine wave", 7.49]], null, null, [["speech", 20.0], ["mains hum", 15.61], ["hum", 13.31]], null, [["music", 41.29], ["door", 8.81], ["speech", 7.76]]], "duration": [2.24, 1.44, 2.35, 0.61, 1.83, 1.71, 1.45, 1.23, 2.28, 2.62, 5.89, 1.4, 1.29, 1.98, 1.49, 0.3, 1.1, 1.41, 2.02, 1.53, 2.18, 0.28, 0.88, 6.51, -0.19, 6.62]} \ No newline at end of file diff --git a/annotations_filtered/btwtChuzeaA_filtered.json b/annotations_filtered/btwtChuzeaA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c145ebeaf570b1406632e66c5cda04075d3d1b3c --- /dev/null +++ b/annotations_filtered/btwtChuzeaA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.51], [11.0, 14.34], [15.0, 14.98], [16.0, 29.08], [32.0, 35.43], [36.0, 35.67], [36.0, 58.43], [60.0, 62.63], [64.0, 64.69], [68.0, 67.69], [68.0, 68.93], [70.0, 83.25]], "keep_status": [true, false, false, true, true, false, false, false, false, false, false, false], "silence_prob": [29.27, 28.67, 0.0, 29.01, 29.34, 0.0, 28.9, 33.92, 0.0, 0.0, 0.0, 29.25], "audiomae_on_audioset": [[["breaking", 27.77], ["thunk", 20.47], ["music", 13.52]], [["whack, thwack", 62.81], ["speech", 5.25], ["thump, thud", 5.22]], null, [["music", 53.75], ["whack, thwack", 6.07], ["sound effect", 3.34]], [["grunt", 26.51], ["music", 21.33], ["animal", 8.61]], null, [["music", 57.79], ["speech", 10.52], ["throbbing", 5.36]], [["music", 44.35], ["hum", 16.84], ["mains hum", 14.45]], null, null, null, [["speech", 43.02], ["music", 39.09], ["whack, thwack", 2.91]]], "duration": [3.51, 3.34, -0.02, 13.08, 3.43, -0.33, 22.43, 2.63, 0.69, -0.31, 0.93, 13.25]} \ No newline at end of file diff --git a/annotations_filtered/bu5m4sr6e6I_filtered.json b/annotations_filtered/bu5m4sr6e6I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec297489155df0fa8dccf5f0df4bb548633c3b1d --- /dev/null +++ b/annotations_filtered/bu5m4sr6e6I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 27.35], [30.0, 42.4], [48.0, 54.4], [56.0, 56.69], [58.0, 58.83], [63.0, 68.98], [81.0, 86.83], [100.0, 100.14], [108.0, 123.65]], "keep_status": [false, false, false, false, false, true, false, false, false], "silence_prob": [29.67, 29.81, 29.8, 0.0, 0.0, 29.94, 30.26, 0.0, 29.79], "audiomae_on_audioset": [[["music", 48.89], ["cacophony", 29.79], ["throbbing", 2.98]], [["music", 77.54], ["throbbing", 6.29], ["electronic music", 2.17]], [["music", 55.15], ["didgeridoo", 18.85], ["throbbing", 6.05]], null, null, [["music", 32.58], ["throbbing", 23.24], ["hum", 13.27]], [["music", 70.79], ["cacophony", 9.18], ["synthesizer", 2.79]], null, [["music", 40.44], ["throbbing", 20.4], ["synthesizer", 12.95]]], "duration": [19.35, 12.4, 6.4, 0.69, 0.83, 5.98, 5.83, 0.14, 15.65]} \ No newline at end of file diff --git a/annotations_filtered/bu83p1i0D1A_filtered.json b/annotations_filtered/bu83p1i0D1A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58ce1350113ba401fef1d85855befdc165442911 --- /dev/null +++ b/annotations_filtered/bu83p1i0D1A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.88], [13.0, 18.81], [22.0, 58.24], [69.0, 69.35], [70.0, 72.15], [76.0, 76.91], [78.0, 86.93]], "keep_status": [false, false, false, false, true, false, false], "silence_prob": [0.0, 31.34, 0.0, 0.0, 30.93, 0.0, 34.01], "audiomae_on_audioset": [null, [["music", 60.37], ["groan", 6.04], ["whack, thwack", 4.39]], null, null, [["speech", 55.9], ["sidetone", 7.42], ["sound effect", 4.8]], null, [["music", 67.02], ["synthesizer", 3.17], ["electronic music", 2.58]]], "duration": [1.88, 5.81, 36.24, 0.35, 2.15, 0.91, 8.93]} \ No newline at end of file diff --git a/annotations_filtered/bu9YxTb6gf8_filtered.json b/annotations_filtered/bu9YxTb6gf8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe43c86110e931023e356fa439d3f2d62ec3a9a5 --- /dev/null +++ b/annotations_filtered/bu9YxTb6gf8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.4], [10.0, 10.57], [23.0, 24.29], [27.0, 27.48], [32.0, 33.59], [38.0, 39.58], [42.0, 43.56], [46.0, 47.53], [53.0, 55.44], [60.0, 63.19], [68.0, 70.04], [71.0, 71.83], [75.0, 78.31], [79.0, 79.66], [82.0, 86.44], [92.0, 92.26], [97.0, 98.1], [105.0, 105.81], [111.0, 113.49], [118.0, 121.88], [125.0, 128.16], [133.0, 135.84]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.91, 30.38, 30.37, 0.0, 29.96, 0.0, 30.31, 0.0, 0.0, 0.0, 32.26, 30.08, 29.96, 30.05], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 51.79], ["throbbing", 7.45], ["cacophony", 4.64]], [["music", 73.92], ["sampler", 2.54], ["musical instrument", 2.18]], [["music", 84.15], ["guitar", 3.18], ["musical instrument", 2.93]], null, [["music", 58.51], ["throbbing", 8.3], ["hum", 7.57]], null, [["music", 66.3], ["guitar", 4.19], ["plucked string instrument", 3.73]], null, null, null, [["music", 57.27], ["musical instrument", 7.64], ["electronic music", 2.86]], [["music", 36.99], ["didgeridoo", 34.81], ["boing", 3.67]], [["music", 57.31], ["speech", 4.75], ["boing", 4.26]], [["music", 50.43], ["sampler", 5.04], ["synthesizer", 3.44]]], "duration": [0.4, 0.57, 1.29, 0.48, 1.59, 1.58, 1.56, 1.53, 2.44, 3.19, 2.04, 0.83, 3.31, 0.66, 4.44, 0.26, 1.1, 0.81, 2.49, 3.88, 3.16, 2.84]} \ No newline at end of file diff --git a/annotations_filtered/buH0CUEx-_Q_filtered.json b/annotations_filtered/buH0CUEx-_Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4ff61cb09a86185b65c9a74c07cbe18dc41b1b19 --- /dev/null +++ b/annotations_filtered/buH0CUEx-_Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 32.14], [32.0, 32.17], [33.0, 55.49], [59.0, 58.68], [59.0, 60.03], [61.0, 91.93], [97.0, 103.98], [104.0, 106.3]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [29.4, 0.0, 29.04, 0.0, 0.0, 0.0, 31.18, 37.15], "audiomae_on_audioset": [[["music", 54.11], ["throbbing", 16.71], ["hum", 6.16]], null, [["music", 44.74], ["throbbing", 18.85], ["hum", 10.13]], null, null, null, [["music", 67.15], ["throbbing", 9.79], ["angry music", 4.61]], [["music", 59.72], ["didgeridoo", 7.12], ["speech", 5.9]]], "duration": [22.14, 0.17, 22.49, -0.32, 1.03, 30.93, 6.98, 2.3]} \ No newline at end of file diff --git a/annotations_filtered/buIXWAgTUIU_filtered.json b/annotations_filtered/buIXWAgTUIU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ead5aeb3dc2c43b7d3b00cc77b178ecdc11213d1 --- /dev/null +++ b/annotations_filtered/buIXWAgTUIU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 57.99], [59.0, 60.4], [63.0, 65.3], [68.0, 84.57], [85.0, 89.11], [90.0, 93.16], [94.0, 95.01], [96.0, 99.4], [101.0, 105.0], [106.0, 106.62], [108.0, 108.21], [109.0, 109.75], [111.0, 111.91], [113.0, 113.53], [115.0, 114.94], [117.0, 117.76]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.45, 0.0, 30.22, 30.6, 41.32, 40.21, 0.0, 56.33, 56.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 40.6], ["didgeridoo", 37.22], ["throbbing", 2.88]], null, [["music", 72.72], ["didgeridoo", 5.09], ["screaming", 2.22]], [["music", 54.76], ["didgeridoo", 11.37], ["speech", 5.69]], [["music", 29.1], ["throbbing", 22.62], ["didgeridoo", 9.42]], [["music", 63.36], ["didgeridoo", 18.93], ["musical instrument", 4.41]], null, null, null, null, null, null, null, null, null, null], "duration": [21.99, 1.4, 2.3, 16.57, 4.11, 3.16, 1.01, 3.4, 4.0, 0.62, 0.21, 0.75, 0.91, 0.53, -0.06, 0.76]} \ No newline at end of file diff --git a/annotations_filtered/buNwwAximcE_filtered.json b/annotations_filtered/buNwwAximcE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..677d78407949fa309925c28c66df4dc81b3c5eb7 --- /dev/null +++ b/annotations_filtered/buNwwAximcE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 44.31], [52.0, 52.52], [54.0, 54.99], [66.0, 66.12], [76.0, 77.01], [79.0, 80.38], [86.0, 86.59], [92.0, 109.85], [112.0, 112.48]], "keep_status": [true, false, false, false, false, false, false, true, false], "silence_prob": [32.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.73, 0.0], "audiomae_on_audioset": [[["music", 40.27], ["thunk", 10.12], ["musical instrument", 4.68]], null, null, null, null, null, null, [["music", 58.67], ["throbbing", 5.52], ["musical instrument", 3.71]], null], "duration": [16.31, 0.52, 0.99, 0.12, 1.01, 1.38, 0.59, 17.85, 0.48]} \ No newline at end of file diff --git a/annotations_filtered/buRR_o85qhQ_filtered.json b/annotations_filtered/buRR_o85qhQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0630e29554472ab6b4f32265326a3bce1b31b870 --- /dev/null +++ b/annotations_filtered/buRR_o85qhQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.04], [14.0, 15.94], [17.0, 19.31], [21.0, 21.36], [23.0, 23.16], [26.0, 26.82], [29.0, 29.0], [31.0, 32.93], [34.0, 34.7], [38.0, 38.7], [41.0, 42.23], [47.0, 47.55], [49.0, 49.18], [54.0, 54.11], [56.0, 56.62], [59.0, 60.59], [62.0, 62.43], [63.0, 63.46], [64.0, 64.83], [66.0, 68.03], [69.0, 70.34], [75.0, 76.25], [81.0, 81.55], [84.0, 84.79], [85.0, 86.34], [87.0, 90.29], [92.0, 94.0], [95.0, 98.34], [100.0, 101.85], [105.0, 107.11], [108.0, 109.27], [110.0, 110.98], [113.0, 114.29], [116.0, 116.29], [118.0, 125.09]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [33.89, 0.0, 38.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.14, 0.0, 0.0, 0.0, 0.0, 0.0, 38.83, 32.11, 43.71, 0.0, 46.22, 0.0, 0.0, 0.0, 0.0, 33.3], "audiomae_on_audioset": [[["music", 49.0], ["speech", 21.66], ["theremin", 5.67]], null, [["music", 34.76], ["speech", 23.72], ["didgeridoo", 4.93]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 32.3], ["speech", 15.3], ["mains hum", 6.69]], null, null, null, null, null, [["music", 72.15], ["theremin", 16.62], ["musical instrument", 1.68]], [["music", 57.41], ["theremin", 8.02], ["synthesizer", 4.19]], [["music", 54.96], ["theremin", 19.9], ["effects unit", 3.73]], null, [["music", 51.95], ["quack", 11.68], ["theremin", 9.13]], null, null, null, null, [["music", 55.1], ["theremin", 26.93], ["musical instrument", 4.18]]], "duration": [2.04, 1.94, 2.31, 0.36, 0.16, 0.82, 0.0, 1.93, 0.7, 0.7, 1.23, 0.55, 0.18, 0.11, 0.62, 1.59, 0.43, 0.46, 0.83, 2.03, 1.34, 1.25, 0.55, 0.79, 1.34, 3.29, 2.0, 3.34, 1.85, 2.11, 1.27, 0.98, 1.29, 0.29, 7.09]} \ No newline at end of file diff --git a/annotations_filtered/buoodeEt_hM_filtered.json b/annotations_filtered/buoodeEt_hM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b541207e05a524f89377faef3869ab9534cc0944 --- /dev/null +++ b/annotations_filtered/buoodeEt_hM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 17.1], [19.0, 52.02], [54.0, 65.45], [67.0, 88.1], [89.0, 107.05], [108.0, 109.16], [110.0, 112.73], [119.0, 123.92]], "keep_status": [true, false, true, true, false, false, true, false], "silence_prob": [36.52, 0.0, 32.75, 32.86, 35.42, 0.0, 39.04, 54.17], "audiomae_on_audioset": [[["hum", 28.58], ["music", 25.24], ["mains hum", 6.92]], null, [["speech", 37.38], ["music", 24.57], ["cacophony", 5.87]], [["music", 22.2], ["throbbing", 17.88], ["hum", 10.89]], [["speech", 56.78], ["music", 26.95], ["musical instrument", 2.12]], null, [["mains hum", 21.25], ["music", 16.67], ["hum", 16.64]], null], "duration": [6.1, 33.02, 11.45, 21.1, 18.05, 1.16, 2.73, 4.92]} \ No newline at end of file diff --git a/annotations_filtered/bvEJjjYbgtk_filtered.json b/annotations_filtered/bvEJjjYbgtk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ed900c0d874c2788c6fc3980315e391095429c3 --- /dev/null +++ b/annotations_filtered/bvEJjjYbgtk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[52.0, 52.74], [55.0, 58.26], [69.0, 96.79]], "keep_status": [false, false, false], "silence_prob": [0.0, 37.01, 47.16], "audiomae_on_audioset": [null, [["speech", 38.64], ["music", 23.38], ["rumble", 10.65]], [["music", 60.77], ["hum", 13.36], ["buzz", 4.49]]], "duration": [0.74, 3.26, 27.79]} \ No newline at end of file diff --git a/annotations_filtered/bvITByUy5fA_filtered.json b/annotations_filtered/bvITByUy5fA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1036a1315cfb3213224eff453bd1c84142cb08b0 --- /dev/null +++ b/annotations_filtered/bvITByUy5fA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.51], [43.0, 43.23], [44.0, 44.24], [56.0, 59.21], [65.0, 65.3], [71.0, 72.52], [74.0, 74.65], [76.0, 76.86], [78.0, 78.19], [93.0, 96.06], [97.0, 106.64], [108.0, 108.08], [109.0, 110.22], [113.0, 118.56], [126.0, 129.98], [131.0, 131.19], [143.0, 143.88], [145.0, 147.07], [150.0, 150.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 96.66, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 50.71, 0.0, 0.0, 92.15, 99.98, 0.0, 0.0, 91.81, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.51, 0.23, 0.24, 3.21, 0.3, 1.52, 0.65, 0.86, 0.19, 3.06, 9.64, 0.08, 1.22, 5.56, 3.98, 0.19, 0.88, 2.07, 0.52]} \ No newline at end of file diff --git a/annotations_filtered/bvRS9b2nhh4_filtered.json b/annotations_filtered/bvRS9b2nhh4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..132395c93dc3c67bebfc6997627db41b14b48270 --- /dev/null +++ b/annotations_filtered/bvRS9b2nhh4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.84], [10.0, 10.18], [11.0, 14.27], [16.0, 17.49], [18.0, 21.15], [23.0, 35.14], [51.0, 55.53], [58.0, 67.19]], "keep_status": [false, false, false, false, false, true, true, true], "silence_prob": [0.0, 0.0, 84.98, 0.0, 62.78, 46.83, 28.93, 33.18], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 46.01], ["rowboat, canoe, kayak", 18.61], ["insect", 4.67]], [["music", 27.67], ["hum", 7.92], ["buzz", 7.9]], [["speech", 34.0], ["hum", 16.84], ["mains hum", 9.52]]], "duration": [0.84, 0.18, 3.27, 1.49, 3.15, 12.14, 4.53, 9.19]} \ No newline at end of file diff --git a/annotations_filtered/bvjLvggrYUo_filtered.json b/annotations_filtered/bvjLvggrYUo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f72d74c7b69d304e48e7a0075bc84382595df543 --- /dev/null +++ b/annotations_filtered/bvjLvggrYUo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.83], [17.0, 18.0], [20.0, 20.31], [21.0, 23.94], [25.0, 38.62], [42.0, 42.52], [46.0, 47.16], [49.0, 50.18], [51.0, 52.19], [53.0, 53.35], [54.0, 54.35], [56.0, 58.01], [59.0, 59.24], [60.0, 59.88], [61.0, 61.18], [63.0, 63.32], [64.0, 65.75], [67.0, 67.96], [68.0, 68.89], [70.0, 70.19], [71.0, 74.09], [76.0, 78.75], [81.0, 82.51], [84.0, 84.54], [86.0, 88.05], [90.0, 90.39], [93.0, 93.93], [96.0, 96.82], [100.0, 100.99], [102.0, 103.01], [106.0, 106.08], [107.0, 107.65], [109.0, 110.24], [112.0, 113.04], [116.0, 118.35], [120.0, 120.56], [122.0, 122.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 99.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.29, 97.83, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.83, 1.0, 0.31, 2.94, 13.62, 0.52, 1.16, 1.18, 1.19, 0.35, 0.35, 2.01, 0.24, -0.12, 0.18, 0.32, 1.75, 0.96, 0.89, 0.19, 3.09, 2.75, 1.51, 0.54, 2.05, 0.39, 0.93, 0.82, 0.99, 1.01, 0.08, 0.65, 1.24, 1.04, 2.35, 0.56, 0.89]} \ No newline at end of file diff --git a/annotations_filtered/bvl-DxX9N8g_filtered.json b/annotations_filtered/bvl-DxX9N8g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9403c74bd8e4ca0deac7830538633f0a88970aea --- /dev/null +++ b/annotations_filtered/bvl-DxX9N8g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.36], [6.0, 6.32], [7.0, 7.77], [8.0, 11.91], [13.0, 13.44], [16.0, 16.5], [19.0, 19.7], [22.0, 22.08], [25.0, 26.23], [27.0, 28.49], [29.0, 30.3], [33.0, 34.25], [36.0, 36.48], [39.0, 39.93], [46.0, 46.95], [57.0, 58.09], [65.0, 74.22], [75.0, 79.73], [80.0, 83.05], [85.0, 85.99], [87.0, 89.29], [93.0, 94.71], [98.0, 104.58], [105.0, 120.48], [122.0, 123.09], [126.0, 127.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 35.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 100.0, 97.33, 0.0, 87.92, 0.0, 61.57, 85.9, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 63.22], ["sidetone", 8.48], ["radio", 3.55]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.36, 0.32, 0.77, 3.91, 0.44, 0.5, 0.7, 0.08, 1.23, 1.49, 1.3, 1.25, 0.48, 0.93, 0.95, 1.09, 9.22, 4.73, 3.05, 0.99, 2.29, 1.71, 6.58, 15.48, 1.09, 1.26]} \ No newline at end of file diff --git a/annotations_filtered/bvnOqxRHjuc_filtered.json b/annotations_filtered/bvnOqxRHjuc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8eb47eb89949f9b3e357f0ce59b29e7ee536b5b2 --- /dev/null +++ b/annotations_filtered/bvnOqxRHjuc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[64.0, 107.11], [108.0, 108.67], [114.0, 115.01]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [43.11, 0.67, 1.01]} \ No newline at end of file diff --git a/annotations_filtered/bw4xDTQYIfE_filtered.json b/annotations_filtered/bw4xDTQYIfE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0ccff04a38bb49a4099c053de82606583f0c1b81 --- /dev/null +++ b/annotations_filtered/bw4xDTQYIfE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.36], [15.0, 15.09], [25.0, 25.37], [41.0, 40.78], [48.0, 48.22], [53.0, 52.83], [62.0, 62.16], [70.0, 70.95], [82.0, 81.6], [82.0, 81.65], [83.0, 83.46], [94.0, 94.36], [114.0, 114.52], [115.0, 116.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.36, 0.09, 0.37, -0.22, 0.22, -0.17, 0.16, 0.95, -0.4, -0.35, 0.46, 0.36, 0.52, 1.26]} \ No newline at end of file diff --git a/annotations_filtered/bw7GnKjkThQ_filtered.json b/annotations_filtered/bw7GnKjkThQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f632fdf94ec040ef31801660dd8f8443af29293 --- /dev/null +++ b/annotations_filtered/bw7GnKjkThQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 27.8], [29.0, 57.4], [58.0, 67.31], [69.0, 74.8], [76.0, 86.09], [88.0, 88.47], [91.0, 112.11]], "keep_status": [true, true, false, true, false, false, false], "silence_prob": [44.69, 44.4, 36.67, 41.93, 43.48, 0.0, 39.21], "audiomae_on_audioset": [[["music", 48.22], ["boing", 5.35], ["ding", 4.53]], [["music", 38.74], ["synthesizer", 10.71], ["effects unit", 10.04]], [["music", 39.36], ["boing", 21.1], ["speech", 10.33]], [["music", 53.44], ["musical instrument", 3.73], ["didgeridoo", 3.72]], [["music", 73.24], ["synthesizer", 3.86], ["musical instrument", 3.19]], null, [["music", 65.82], ["thunk", 5.27], ["synthesizer", 2.29]]], "duration": [24.8, 28.4, 9.31, 5.8, 10.09, 0.47, 21.11]} \ No newline at end of file diff --git a/annotations_filtered/bwKwR3hV0zA_filtered.json b/annotations_filtered/bwKwR3hV0zA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..21bb9f194a5dc198e48be58a91fe1febea7d8a93 --- /dev/null +++ b/annotations_filtered/bwKwR3hV0zA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.93], [24.0, 34.28], [35.0, 37.2], [39.0, 46.2], [50.0, 66.06], [68.0, 76.99], [78.0, 85.62], [86.0, 95.69], [97.0, 134.15], [136.0, 137.05], [139.0, 140.7], [143.0, 144.8], [146.0, 145.93], [146.0, 158.94], [160.0, 160.88], [161.0, 162.87], [166.0, 166.62], [172.0, 172.88], [177.0, 177.57], [183.0, 183.24], [183.0, 183.9], [185.0, 196.43], [199.0, 199.64], [200.0, 201.21], [203.0, 203.0], [211.0, 211.45], [213.0, 213.83], [216.0, 218.86], [219.0, 219.67]], "keep_status": [false, true, true, false, true, true, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 31.11, 37.14, 28.97, 29.77, 44.6, 32.2, 29.95, 0.0, 0.0, 0.0, 0.0, 0.0, 29.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.18, 0.0, 0.0, 0.0, 0.0, 0.0, 34.87, 0.0], "audiomae_on_audioset": [null, [["music", 47.56], ["speech", 16.5], ["didgeridoo", 3.52]], [["music", 47.16], ["throbbing", 7.21], ["musical instrument", 5.65]], [["music", 38.91], ["speech", 16.49], ["throbbing", 14.69]], [["music", 43.29], ["hum", 14.45], ["theremin", 7.09]], [["cattle, bovinae", 22.12], ["animal", 17.04], ["moo", 9.66]], [["music", 31.2], ["noise", 10.08], ["speech", 9.17]], [["music", 53.26], ["throbbing", 13.4], ["hum", 8.44]], null, null, null, null, null, [["speech", 48.1], ["music", 10.61], ["breaking", 5.96]], null, null, null, null, null, null, null, [["speech", 65.14], ["fart", 18.94], ["music", 5.91]], null, null, null, null, null, [["music", 44.45], ["theremin", 13.26], ["grunt", 9.55]], null], "duration": [1.93, 10.28, 2.2, 7.2, 16.06, 8.99, 7.62, 9.69, 37.15, 1.05, 1.7, 1.8, -0.07, 12.94, 0.88, 1.87, 0.62, 0.88, 0.57, 0.24, 0.9, 11.43, 0.64, 1.21, 0.0, 0.45, 0.83, 2.86, 0.67]} \ No newline at end of file diff --git a/annotations_filtered/bwTe_vZ_2dg_filtered.json b/annotations_filtered/bwTe_vZ_2dg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c70d12d4625555a9d70b10fff0f7fed41f0c8a3c --- /dev/null +++ b/annotations_filtered/bwTe_vZ_2dg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 38.06], [42.0, 77.06], [79.0, 79.15], [81.0, 82.32], [86.0, 86.83], [88.0, 88.57], [91.0, 97.24], [98.0, 100.53], [102.0, 103.67], [107.0, 111.81]], "keep_status": [false, false, false, false, false, false, false, true, false, false], "silence_prob": [32.52, 0.0, 0.0, 0.0, 0.0, 0.0, 92.31, 41.64, 0.0, 56.78], "audiomae_on_audioset": [[["music", 60.43], ["musical instrument", 10.63], ["wind instrument, woodwind instrument", 4.77]], null, null, null, null, null, null, [["mains hum", 23.3], ["hum", 21.82], ["speech", 17.35]], null, null], "duration": [7.06, 35.06, 0.15, 1.32, 0.83, 0.57, 6.24, 2.53, 1.67, 4.81]} \ No newline at end of file diff --git a/annotations_filtered/bwf_EFTMZ9k_filtered.json b/annotations_filtered/bwf_EFTMZ9k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5038cef0db717b17f4399def1388bd3ebd91936b --- /dev/null +++ b/annotations_filtered/bwf_EFTMZ9k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[46.0, 57.4], [58.0, 95.22], [100.0, 119.94], [122.0, 121.66], [122.0, 122.01], [122.0, 131.75], [134.0, 134.74], [140.0, 139.8], [143.0, 143.85], [145.0, 153.99], [159.0, 159.83], [163.0, 163.98], [171.0, 172.99], [175.0, 175.69], [177.0, 181.57], [186.0, 186.49]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false, false, false, false, true, false], "silence_prob": [100.0, 0.0, 33.99, 0.0, 0.0, 31.61, 0.0, 0.0, 0.0, 33.02, 0.0, 0.0, 0.0, 0.0, 31.39, 0.0], "audiomae_on_audioset": [null, null, [["music", 68.77], ["musical instrument", 2.21], ["speech", 2.09]], null, null, [["music", 46.81], ["cacophony", 6.91], ["didgeridoo", 6.64]], null, null, null, [["music", 45.01], ["hum", 8.65], ["whale vocalization", 8.14]], null, null, null, null, [["music", 44.38], ["noise", 9.55], ["synthesizer", 6.6]], null], "duration": [11.4, 37.22, 19.94, -0.34, 0.01, 9.75, 0.74, -0.2, 0.85, 8.99, 0.83, 0.98, 1.99, 0.69, 4.57, 0.49]} \ No newline at end of file diff --git a/annotations_filtered/bwzuMk8SRzY_filtered.json b/annotations_filtered/bwzuMk8SRzY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d08ecb9c296904d3fb8434555aede182fad7a43 --- /dev/null +++ b/annotations_filtered/bwzuMk8SRzY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.72], [17.0, 19.21], [21.0, 35.82], [46.0, 58.72], [59.0, 62.04], [64.0, 105.34]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 88.46, 29.1, 28.81, 33.02, 0.0], "audiomae_on_audioset": [null, null, [["hum", 46.13], ["mains hum", 22.46], ["rumble", 5.87]], [["music", 52.82], ["hum", 18.31], ["throbbing", 11.67]], [["hum", 27.23], ["music", 26.84], ["throbbing", 22.17]], null], "duration": [0.72, 2.21, 14.82, 12.72, 3.04, 41.34]} \ No newline at end of file diff --git a/annotations_filtered/bx50ueZJgns_filtered.json b/annotations_filtered/bx50ueZJgns_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..90bdb9fa4ba225109db838cbbc333de6cbfd66de --- /dev/null +++ b/annotations_filtered/bx50ueZJgns_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.37], [23.0, 26.4], [27.0, 32.19], [33.0, 33.4], [34.0, 39.68], [41.0, 43.28], [44.0, 69.89], [70.0, 77.13], [77.0, 77.16], [80.0, 80.35], [81.0, 100.47], [104.0, 110.78], [116.0, 138.08], [142.0, 170.21], [171.0, 190.49]], "keep_status": [false, true, false, false, true, false, false, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 30.24, 30.76, 0.0, 29.53, 33.46, 32.17, 30.05, 0.0, 0.0, 31.32, 30.3, 29.91, 30.2, 30.57], "audiomae_on_audioset": [null, [["whack, thwack", 20.9], ["mosquito", 16.53], ["fly, housefly", 13.94]], [["speech", 74.28], ["music", 13.56], ["throbbing", 1.04]], null, [["speech", 15.27], ["creak", 13.9], ["music", 13.69]], [["throbbing", 35.08], ["music", 34.07], ["hum", 17.66]], [["throbbing", 43.25], ["hum", 32.1], ["speech", 14.78]], [["music", 30.15], ["speech", 13.21], ["hum", 10.34]], null, null, [["hum", 36.6], ["throbbing", 29.29], ["mains hum", 16.63]], [["speech", 48.24], ["fart", 11.25], ["thump, thud", 8.4]], [["speech", 49.03], ["music", 17.72], ["breaking", 10.47]], [["speech", 37.05], ["music", 25.35], ["whack, thwack", 17.43]], [["music", 40.45], ["speech", 23.89], ["fart", 6.0]]], "duration": [1.37, 3.4, 5.19, 0.4, 5.68, 2.28, 25.89, 7.13, 0.16, 0.35, 19.47, 6.78, 22.08, 28.21, 19.49]} \ No newline at end of file diff --git a/annotations_filtered/bxAiioYl1bw_filtered.json b/annotations_filtered/bxAiioYl1bw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..98c0bb26af097fc8632a01a1ec6997efcbbddd66 --- /dev/null +++ b/annotations_filtered/bxAiioYl1bw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[55.0, 64.74], [65.0, 107.16]], "keep_status": [true, false], "silence_prob": [39.17, 0.0], "audiomae_on_audioset": [[["hum", 17.84], ["music", 9.04], ["noise", 8.94]], null], "duration": [9.74, 42.16]} \ No newline at end of file diff --git a/annotations_filtered/bxEqg39v9Ec_filtered.json b/annotations_filtered/bxEqg39v9Ec_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..264ea9dad80a0598369f93f7ad45936001ca925f --- /dev/null +++ b/annotations_filtered/bxEqg39v9Ec_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.54], [3.0, 3.52], [4.0, 4.51], [5.0, 5.68], [6.0, 8.55], [9.0, 10.93], [12.0, 12.9], [14.0, 16.23], [17.0, 18.86], [20.0, 22.33], [24.0, 23.94], [25.0, 26.72], [27.0, 26.96], [28.0, 28.93], [30.0, 30.11], [31.0, 32.73], [33.0, 34.08], [36.0, 36.37], [37.0, 37.81], [40.0, 40.37], [41.0, 42.6], [44.0, 44.25], [45.0, 46.41], [48.0, 48.29], [49.0, 51.58], [53.0, 53.64], [54.0, 56.2], [58.0, 58.56], [60.0, 69.2], [70.0, 76.84], [80.0, 81.4], [85.0, 85.14], [89.0, 89.18], [94.0, 95.23], [96.0, 96.31], [99.0, 99.1], [102.0, 102.32], [104.0, 104.99], [107.0, 107.87], [109.0, 109.39], [111.0, 111.64], [116.0, 116.24], [120.0, 120.01], [121.0, 121.41], [122.0, 122.61], [125.0, 126.06], [127.0, 127.82], [129.0, 129.47], [130.0, 130.03], [130.0, 131.36], [133.0, 135.26], [136.0, 136.14], [137.0, 138.4], [139.0, 139.97], [140.0, 141.27], [142.0, 146.25], [148.0, 148.71], [151.0, 151.43], [154.0, 154.16], [157.0, 157.17], [158.0, 161.4], [163.0, 165.06], [167.0, 169.72], [170.0, 171.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.82, 0.0, 0.0, 77.2, 0.0, 99.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.88, 0.0, 99.1, 0.0, 99.85, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 92.97, 97.73, 94.22, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.54, 0.52, 0.51, 0.68, 2.55, 1.93, 0.9, 2.23, 1.86, 2.33, -0.06, 1.72, -0.04, 0.93, 0.11, 1.73, 1.08, 0.37, 0.81, 0.37, 1.6, 0.25, 1.41, 0.29, 2.58, 0.64, 2.2, 0.56, 9.2, 6.84, 1.4, 0.14, 0.18, 1.23, 0.31, 0.1, 0.32, 0.99, 0.87, 0.39, 0.64, 0.24, 0.01, 0.41, 0.61, 1.06, 0.82, 0.47, 0.03, 1.36, 2.26, 0.14, 1.4, 0.97, 1.27, 4.25, 0.71, 0.43, 0.16, 0.17, 3.4, 2.06, 2.72, 1.02]} \ No newline at end of file diff --git a/annotations_filtered/bx_rua3EXFc_filtered.json b/annotations_filtered/bx_rua3EXFc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..313bf9a16676015ae287ac50ce313941de7b7e17 --- /dev/null +++ b/annotations_filtered/bx_rua3EXFc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.26], [14.0, 14.59], [18.0, 19.04], [22.0, 23.33], [30.0, 30.32], [31.0, 32.17], [34.0, 33.93], [34.0, 34.97], [39.0, 44.85], [47.0, 50.14], [54.0, 86.66], [88.0, 92.58], [93.0, 98.46], [99.0, 101.95], [102.0, 103.57], [106.0, 108.43], [109.0, 172.15], [175.0, 177.2], [178.0, 178.51], [185.0, 185.26], [187.0, 188.89], [190.0, 190.16], [206.0, 206.0]], "keep_status": [true, false, false, false, false, false, false, false, true, true, false, true, true, true, false, true, false, true, false, false, false, false, false], "silence_prob": [28.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.78, 28.44, 0.0, 30.0, 31.08, 30.42, 0.0, 38.49, 0.0, 29.49, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["rumble", 14.19], ["speech", 11.4], ["music", 8.99]], null, null, null, null, null, null, null, [["music", 51.8], ["speech", 12.66], ["whack, thwack", 5.03]], [["music", 36.87], ["theremin", 9.22], ["vehicle", 4.23]], null, [["whack, thwack", 36.7], ["speech", 25.13], ["boing", 6.49]], [["music", 27.09], ["mains hum", 17.36], ["hum", 16.54]], [["music", 36.61], ["speech", 12.3], ["moo", 8.56]], null, [["music", 35.54], ["musical instrument", 7.98], ["theremin", 4.83]], null, [["music", 51.58], ["speech", 11.37], ["musical instrument", 3.9]], null, null, null, null, null], "duration": [3.26, 0.59, 1.04, 1.33, 0.32, 1.17, -0.07, 0.97, 5.85, 3.14, 32.66, 4.58, 5.46, 2.95, 1.57, 2.43, 63.15, 2.2, 0.51, 0.26, 1.89, 0.16, 0.0]} \ No newline at end of file diff --git a/annotations_filtered/bxegamvM8ME_filtered.json b/annotations_filtered/bxegamvM8ME_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ba6c333d427f630c3e86b5c81a2c0585742429f --- /dev/null +++ b/annotations_filtered/bxegamvM8ME_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.5], [16.0, 15.82], [17.0, 19.45], [20.0, 22.35], [28.0, 31.45], [37.0, 37.4], [41.0, 46.11], [48.0, 47.93], [48.0, 52.3], [59.0, 59.07], [73.0, 75.12], [75.0, 80.7], [91.0, 90.98], [97.0, 101.97], [105.0, 106.91], [108.0, 108.51], [110.0, 112.01], [121.0, 121.24], [123.0, 125.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [79.94, 0.0, 81.0, 87.37, 94.66, 0.0, 84.25, 0.0, 80.29, 0.0, 99.31, 44.4, 0.0, 99.52, 0.0, 0.0, 100.0, 0.0, 99.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 37.05], ["music", 13.38], ["arrow", 6.05]], null, null, null, null, null, null, null], "duration": [2.5, -0.18, 2.45, 2.35, 3.45, 0.4, 5.11, -0.07, 4.3, 0.07, 2.12, 5.7, -0.02, 4.97, 1.91, 0.51, 2.01, 0.24, 2.04]} \ No newline at end of file diff --git a/annotations_filtered/bxgZWv4Db5I_filtered.json b/annotations_filtered/bxgZWv4Db5I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a03e8fe580a0d8c424d1253a952762bfe6e651e --- /dev/null +++ b/annotations_filtered/bxgZWv4Db5I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.3], [4.0, 4.16], [5.0, 5.66], [17.0, 18.0], [28.0, 28.0], [35.0, 36.04], [47.0, 48.27], [63.0, 74.33], [75.0, 76.05], [79.0, 80.08], [81.0, 81.95], [83.0, 85.94], [86.0, 103.77], [108.0, 108.16], [109.0, 109.0], [109.0, 110.51], [118.0, 121.07], [128.0, 129.3], [140.0, 139.73], [148.0, 148.34], [154.0, 155.06], [156.0, 157.98], [163.0, 165.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.35, 0.0, 0.0, 0.0, 30.3, 31.94, 0.0, 0.0, 0.0, 32.2, 0.0, 0.0, 0.0, 0.0, 0.0, 32.2], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 80.52], ["whistling", 4.75], ["speech", 4.21]], null, null, null, [["music", 45.74], ["didgeridoo", 9.4], ["throbbing", 7.46]], [["music", 77.51], ["fart", 9.13], ["speech", 1.72]], null, null, null, [["music", 66.63], ["quack", 7.21], ["theremin", 2.8]], null, null, null, null, null, [["music", 80.55], ["musical instrument", 3.8], ["brass instrument", 2.27]]], "duration": [0.3, 0.16, 0.66, 1.0, 0.0, 1.04, 1.27, 11.33, 1.05, 1.08, 0.95, 2.94, 17.77, 0.16, 0.0, 1.51, 3.07, 1.3, -0.27, 0.34, 1.06, 1.98, 2.62]} \ No newline at end of file diff --git a/annotations_filtered/bxs77K1DkD0_filtered.json b/annotations_filtered/bxs77K1DkD0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c1881b40b79dd3182eba0e9d42d297ba238bd19 --- /dev/null +++ b/annotations_filtered/bxs77K1DkD0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.12], [17.0, 17.88], [18.0, 28.41], [29.0, 30.72], [33.0, 32.95], [34.0, 34.57], [35.0, 35.58], [39.0, 39.77], [40.0, 42.43], [44.0, 46.89], [48.0, 49.28], [52.0, 54.58], [55.0, 57.01], [58.0, 60.91], [71.0, 133.86], [134.0, 135.41], [136.0, 140.53], [142.0, 145.32], [146.0, 146.92], [150.0, 150.16], [151.0, 150.69], [152.0, 152.36], [158.0, 158.21], [159.0, 160.17], [161.0, 162.58], [164.0, 168.02], [170.0, 175.05], [177.0, 178.8], [179.0, 179.04], [179.0, 179.07], [179.0, 179.1], [180.0, 181.99], [182.0, 182.55], [183.0, 184.08], [184.0, 184.35], [185.0, 193.38]], "keep_status": [true, false, true, false, false, false, false, false, true, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [34.03, 0.0, 39.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.55, 39.19, 0.0, 37.83, 51.23, 65.09, 0.0, 0.0, 56.4, 48.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.92, 38.32, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.96], "audiomae_on_audioset": [[["throbbing", 25.65], ["hum", 25.63], ["music", 14.28]], null, [["hum", 38.02], ["speech", 15.23], ["throbbing", 15.14]], null, null, null, null, null, [["sine wave", 46.35], ["chirp tone", 12.69], ["singing bowl", 6.12]], [["sine wave", 16.59], ["chirp tone", 6.7], ["dog", 6.23]], null, [["chirp tone", 40.01], ["sine wave", 23.13], ["music", 9.52]], null, null, null, null, null, [["gong", 25.01], ["music", 14.44], ["hum", 9.25]], null, null, null, null, null, null, null, [["hum", 22.12], ["mains hum", 17.65], ["speech", 15.92]], [["sine wave", 22.17], ["gong", 20.77], ["singing bowl", 12.38]], null, null, null, null, null, null, null, null, [["music", 51.58], ["speech", 13.05], ["didgeridoo", 5.92]]], "duration": [2.12, 0.88, 10.41, 1.72, -0.05, 0.57, 0.58, 0.77, 2.43, 2.89, 1.28, 2.58, 2.01, 2.91, 62.86, 1.41, 4.53, 3.32, 0.92, 0.16, -0.31, 0.36, 0.21, 1.17, 1.58, 4.02, 5.05, 1.8, 0.04, 0.07, 0.1, 1.99, 0.55, 1.08, 0.35, 8.38]} \ No newline at end of file diff --git a/annotations_filtered/bxxHPYFtbE4_filtered.json b/annotations_filtered/bxxHPYFtbE4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..093faee997b1f6584bc69b25e698e47ffc8d07a2 --- /dev/null +++ b/annotations_filtered/bxxHPYFtbE4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.88], [12.0, 12.01], [21.0, 20.82], [26.0, 26.33], [33.0, 34.03], [34.0, 38.38], [40.0, 42.28], [44.0, 45.57], [47.0, 47.51], [48.0, 50.19], [52.0, 51.76], [52.0, 53.81], [55.0, 55.86], [59.0, 59.29], [63.0, 63.58], [65.0, 65.6], [75.0, 74.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 98.19, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.88, 0.01, -0.18, 0.33, 1.03, 4.38, 2.28, 1.57, 0.51, 2.19, -0.24, 1.81, 0.86, 0.29, 0.58, 0.6, -0.08]} \ No newline at end of file diff --git a/annotations_filtered/byObeFcFXmo_filtered.json b/annotations_filtered/byObeFcFXmo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa6f25e45a8fc644eff46841553f77f6a31b5b40 --- /dev/null +++ b/annotations_filtered/byObeFcFXmo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.83], [37.0, 37.22], [40.0, 40.83], [48.0, 48.71], [50.0, 51.14]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [0.83, 0.22, 0.83, 0.71, 1.14]} \ No newline at end of file diff --git a/annotations_filtered/byPJ22JDFjI_filtered.json b/annotations_filtered/byPJ22JDFjI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ff2c21f190ee02b859d121bed2468be36bde46a --- /dev/null +++ b/annotations_filtered/byPJ22JDFjI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.19], [9.0, 24.29], [25.0, 34.21], [39.0, 41.12], [46.0, 47.61], [48.0, 48.41], [50.0, 52.1], [53.0, 54.06], [55.0, 61.37], [62.0, 71.42], [72.0, 91.96], [94.0, 98.19], [99.0, 99.25], [100.0, 106.05], [107.0, 108.03], [108.0, 112.68], [116.0, 120.95], [124.0, 124.38], [125.0, 141.94], [147.0, 149.94]], "keep_status": [true, false, false, false, false, false, true, false, false, false, false, false, false, true, false, true, false, false, false, true], "silence_prob": [38.16, 44.6, 38.17, 34.64, 0.0, 0.0, 38.55, 0.0, 35.72, 34.06, 31.9, 31.11, 0.0, 34.86, 0.0, 31.75, 31.96, 0.0, 30.26, 30.21], "audiomae_on_audioset": [[["music", 27.25], ["speech", 21.38], ["didgeridoo", 6.19]], [["speech", 31.72], ["music", 30.9], ["theremin", 13.1]], [["music", 65.16], ["theremin", 4.41], ["hum", 4.17]], [["speech", 40.76], ["music", 33.44], ["musical instrument", 3.82]], null, null, [["music", 52.23], ["speech", 11.71], ["synthesizer", 3.54]], null, [["music", 78.98], ["synthesizer", 3.36], ["didgeridoo", 2.14]], [["music", 67.82], ["mains hum", 7.73], ["hum", 3.23]], [["music", 63.58], ["didgeridoo", 7.74], ["fart", 4.88]], [["music", 42.27], ["speech", 20.85], ["musical instrument", 7.76]], null, [["music", 18.4], ["speech", 11.14], ["didgeridoo", 6.63]], null, [["electric shaver, electric razor", 22.71], ["music", 11.79], ["mosquito", 9.6]], [["music", 34.12], ["didgeridoo", 34.12], ["theremin", 14.86]], null, [["music", 58.76], ["synthesizer", 8.04], ["musical instrument", 6.86]], [["music", 17.87], ["cattle, bovinae", 10.51], ["moo", 8.14]]], "duration": [2.19, 15.29, 9.21, 2.12, 1.61, 0.41, 2.1, 1.06, 6.37, 9.42, 19.96, 4.19, 0.25, 6.05, 1.03, 4.68, 4.95, 0.38, 16.94, 2.94]} \ No newline at end of file diff --git a/annotations_filtered/bzGDMtX1IU0_filtered.json b/annotations_filtered/bzGDMtX1IU0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..547693e71221a839aed159a9b08d7db150295ba3 --- /dev/null +++ b/annotations_filtered/bzGDMtX1IU0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 42.21], [46.0, 46.84], [50.0, 66.23], [67.0, 67.46], [69.0, 78.76], [82.0, 82.56], [86.0, 120.82], [123.0, 133.71], [135.0, 145.02]], "keep_status": [false, false, false, false, true, false, false, false, false], "silence_prob": [51.02, 0.0, 37.82, 0.0, 34.57, 0.0, 0.0, 88.1, 65.44], "audiomae_on_audioset": [null, null, [["music", 54.52], ["thunk", 13.75], ["boing", 3.8]], null, [["music", 52.05], ["musical instrument", 7.08], ["livestock, farm animals, working animals", 3.37]], null, null, null, null], "duration": [15.21, 0.84, 16.23, 0.46, 9.76, 0.56, 34.82, 10.71, 10.02]} \ No newline at end of file diff --git a/annotations_filtered/bzSIHZcXwvQ_filtered.json b/annotations_filtered/bzSIHZcXwvQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..604d6d33085d65b9278754cdf02dc86a11abc641 --- /dev/null +++ b/annotations_filtered/bzSIHZcXwvQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.96], [4.0, 4.4], [5.0, 14.28], [15.0, 16.43], [17.0, 18.54], [19.0, 19.47], [20.0, 20.49], [21.0, 24.95], [29.0, 30.2], [31.0, 35.23], [36.0, 38.6], [40.0, 43.28], [45.0, 46.26], [48.0, 48.25], [48.0, 49.84], [51.0, 51.9], [53.0, 52.84], [53.0, 54.95], [56.0, 57.62], [58.0, 57.77], [59.0, 60.78], [61.0, 70.24], [71.0, 72.13], [75.0, 75.59], [77.0, 77.94], [79.0, 81.33], [83.0, 83.44], [84.0, 85.41], [86.0, 88.26], [91.0, 96.09], [97.0, 98.22], [99.0, 101.01], [102.0, 102.66], [104.0, 105.14], [106.0, 108.8], [110.0, 110.81], [111.0, 113.7], [114.0, 114.24], [115.0, 121.78], [123.0, 127.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.62, 0.0, 0.0, 0.0, 0.0, 98.86, 0.0, 98.66, 98.51, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.63, 0.0, 0.0, 0.0, 51.39, 0.0, 0.0, 53.47, 95.64, 0.0, 80.29, 0.0, 0.0, 61.18, 0.0, 54.9, 0.0, 91.81, 95.51], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["echo", 23.17], ["laughter", 8.51], ["snicker", 6.71]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.04, 0.4, 9.28, 1.43, 1.54, 0.47, 0.49, 3.95, 1.2, 4.23, 2.6, 3.28, 1.26, 0.25, 1.84, 0.9, -0.16, 1.95, 1.62, -0.23, 1.78, 9.24, 1.13, 0.59, 0.94, 2.33, 0.44, 1.41, 2.26, 5.09, 1.22, 2.01, 0.66, 1.14, 2.8, 0.81, 2.7, 0.24, 6.78, 4.35]} \ No newline at end of file