diff --git a/annotations_filtered/l-GbvgBXi18_filtered.json b/annotations_filtered/l-GbvgBXi18_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e3b0ab52be4ea68a3321f7283b4b70d5ab6b5dfe --- /dev/null +++ b/annotations_filtered/l-GbvgBXi18_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.6], [10.0, 13.85], [16.0, 16.63], [18.0, 23.73], [27.0, 26.89], [27.0, 28.32], [29.0, 30.75], [34.0, 37.71], [41.0, 41.62], [44.0, 46.57], [70.0, 71.1], [72.0, 76.99], [78.0, 87.88], [96.0, 96.42], [97.0, 97.51], [98.0, 99.82], [108.0, 133.25], [140.0, 145.94]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 55.04, 0.0, 35.0, 0.0, 0.0, 0.0, 42.44, 0.0, 99.92, 0.0, 87.55, 60.05, 0.0, 0.0, 0.0, 37.59, 99.65], "audiomae_on_audioset": [null, null, null, [["speech", 64.85], ["whack, thwack", 5.66], ["arrow", 2.1]], null, null, null, [["hum", 36.27], ["whale vocalization", 16.44], ["throbbing", 11.94]], null, null, null, null, null, null, null, null, [["whale vocalization", 81.95], ["rumble", 5.63], ["stomach rumble", 2.14]], null], "duration": [0.6, 3.85, 0.63, 5.73, -0.11, 1.32, 1.75, 3.71, 0.62, 2.57, 1.1, 4.99, 9.88, 0.42, 0.51, 1.82, 25.25, 5.94]} \ No newline at end of file diff --git a/annotations_filtered/l-PmluGC2wk_filtered.json b/annotations_filtered/l-PmluGC2wk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..423e7bc50131be066c6dd6d8ea42b8cd3aa8c51a --- /dev/null +++ b/annotations_filtered/l-PmluGC2wk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.06], [5.0, 5.76], [8.0, 9.76], [13.0, 13.46], [20.0, 20.95], [22.0, 22.52], [24.0, 25.05], [26.0, 27.09], [29.0, 28.83], [31.0, 32.8], [34.0, 35.5], [37.0, 37.56], [38.0, 39.06], [41.0, 41.47], [42.0, 42.33], [43.0, 43.87], [46.0, 46.23], [48.0, 49.47], [50.0, 50.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [52.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.06, 0.76, 1.76, 0.46, 0.95, 0.52, 1.05, 1.09, -0.17, 1.8, 1.5, 0.56, 1.06, 0.47, 0.33, 0.87, 0.23, 1.47, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/l-uqZJwOieA_filtered.json b/annotations_filtered/l-uqZJwOieA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/l-uqZJwOieA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/l-vk0fgFGd4_filtered.json b/annotations_filtered/l-vk0fgFGd4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b4c49134aed5e8bc22e1d95edbfac2e976b9a23b --- /dev/null +++ b/annotations_filtered/l-vk0fgFGd4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 15.9], [21.0, 22.49], [25.0, 25.15], [26.0, 31.36], [35.0, 35.58], [38.0, 37.84], [39.0, 39.19], [42.0, 42.72], [47.0, 47.24], [50.0, 49.87], [52.0, 54.36], [57.0, 57.97], [58.0, 58.78], [62.0, 62.73], [65.0, 64.74], [66.0, 66.58], [72.0, 73.52], [75.0, 76.74], [80.0, 79.95], [81.0, 81.48], [87.0, 87.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.26, 0.0, 0.0, 98.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.9, 1.49, 0.15, 5.36, 0.58, -0.16, 0.19, 0.72, 0.24, -0.13, 2.36, 0.97, 0.78, 0.73, -0.26, 0.58, 1.52, 1.74, -0.05, 0.48, 0.66]} \ No newline at end of file diff --git a/annotations_filtered/l081UdHizvg_filtered.json b/annotations_filtered/l081UdHizvg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58626b70210cb0020dbdf7a49eefead172f345a2 --- /dev/null +++ b/annotations_filtered/l081UdHizvg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.7], [10.0, 13.47], [15.0, 15.4], [20.0, 20.39], [23.0, 23.77], [25.0, 25.22], [27.0, 27.99], [29.0, 30.05], [31.0, 31.7], [35.0, 35.82], [39.0, 38.99], [51.0, 57.72], [62.0, 62.19], [64.0, 64.56], [65.0, 66.09], [69.0, 71.64], [72.0, 73.57], [74.0, 75.15], [76.0, 76.86], [79.0, 80.76], [86.0, 88.43], [89.0, 89.5], [91.0, 91.49], [100.0, 101.8], [103.0, 102.95], [104.0, 105.81], [106.0, 107.18], [108.0, 108.8], [110.0, 112.02], [113.0, 114.02], [117.0, 116.99], [122.0, 122.67], [125.0, 125.54], [129.0, 129.83], [133.0, 133.03], [135.0, 154.74], [173.0, 174.51]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 46.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.81, 0.0, 0.0, 0.0, 84.25, 0.0, 0.0, 0.0, 0.0, 75.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.47, 0.0], "audiomae_on_audioset": [null, [["music", 24.02], ["speech", 22.13], ["animal", 4.54]], null, null, null, null, null, null, null, null, null, [["hum", 22.94], ["livestock, farm animals, working animals", 12.7], ["cattle, bovinae", 11.34]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 67.94], ["foghorn", 7.79], ["musical instrument", 4.8]], null], "duration": [1.7, 3.47, 0.4, 0.39, 0.77, 0.22, 0.99, 1.05, 0.7, 0.82, -0.01, 6.72, 0.19, 0.56, 1.09, 2.64, 1.57, 1.15, 0.86, 1.76, 2.43, 0.5, 0.49, 1.8, -0.05, 1.81, 1.18, 0.8, 2.02, 1.02, -0.01, 0.67, 0.54, 0.83, 0.03, 19.74, 1.51]} \ No newline at end of file diff --git a/annotations_filtered/l0Io_aXWgkQ_filtered.json b/annotations_filtered/l0Io_aXWgkQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8d32847d2d20994e47c2808a8ade93ee7aeaf71e --- /dev/null +++ b/annotations_filtered/l0Io_aXWgkQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.17], [18.0, 18.0], [21.0, 33.61], [38.0, 48.63], [55.0, 55.66], [57.0, 79.15], [81.0, 81.5], [86.0, 86.48], [94.0, 94.09], [94.0, 95.08], [101.0, 101.01], [106.0, 106.61], [111.0, 111.16], [114.0, 113.95], [120.0, 120.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 29.94, 29.26, 0.0, 33.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["cattle, bovinae", 27.52], ["livestock, farm animals, working animals", 23.66], ["moo", 22.53]], [["cattle, bovinae", 40.19], ["livestock, farm animals, working animals", 37.6], ["moo", 19.68]], null, [["livestock, farm animals, working animals", 33.52], ["cattle, bovinae", 29.27], ["moo", 24.99]], null, null, null, null, null, null, null, null, null], "duration": [1.17, 0.0, 12.61, 10.63, 0.66, 22.15, 0.5, 0.48, 0.09, 1.08, 0.01, 0.61, 0.16, -0.05, 0.38]} \ No newline at end of file diff --git a/annotations_filtered/l0RkrxY9mH8_filtered.json b/annotations_filtered/l0RkrxY9mH8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6efe18aceff665ef3a9415d960a541c437809751 --- /dev/null +++ b/annotations_filtered/l0RkrxY9mH8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 29.73], [31.0, 48.68], [49.0, 52.52], [53.0, 55.11], [57.0, 59.27], [61.0, 63.31], [65.0, 66.95], [69.0, 75.57], [77.0, 78.24], [82.0, 82.68], [85.0, 87.67], [89.0, 91.23], [93.0, 95.13], [96.0, 98.31], [99.0, 108.03], [112.0, 112.95], [114.0, 116.21], [119.0, 119.55], [121.0, 127.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.99, 100.0, 98.19, 98.59, 99.95, 100.0, 0.0, 100.0, 0.0, 0.0, 100.0, 100.0, 100.0, 100.0, 100.0, 0.0, 100.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [12.73, 17.68, 3.52, 2.11, 2.27, 2.31, 1.95, 6.57, 1.24, 0.68, 2.67, 2.23, 2.13, 2.31, 9.03, 0.95, 2.21, 0.55, 6.4]} \ No newline at end of file diff --git a/annotations_filtered/l0VX6h8lP08_filtered.json b/annotations_filtered/l0VX6h8lP08_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..76b28f4474f6efd79ebe28e5fbd9fee656926eee --- /dev/null +++ b/annotations_filtered/l0VX6h8lP08_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 43.92], [45.0, 45.76], [47.0, 47.83], [72.0, 84.45], [88.0, 89.56], [92.0, 92.99], [93.0, 94.2], [102.0, 104.35], [109.0, 111.4], [114.0, 114.89], [115.0, 118.99], [122.0, 122.54]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 33.22, 0.0, 0.0, 0.0, 38.31, 39.94, 0.0, 37.15, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 51.78], ["speech", 16.91], ["throbbing", 2.96]], null, null, null, [["music", 61.89], ["didgeridoo", 5.62], ["musical instrument", 3.64]], [["frog", 33.3], ["music", 16.99], ["croak", 10.56]], null, [["music", 28.84], ["speech", 8.34], ["hum", 6.57]], null], "duration": [42.92, 0.76, 0.83, 12.45, 1.56, 0.99, 1.2, 2.35, 2.4, 0.89, 3.99, 0.54]} \ No newline at end of file diff --git a/annotations_filtered/l0zmCUVB0Yw_filtered.json b/annotations_filtered/l0zmCUVB0Yw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e7a5c806a6229708f9063d41ab8b399166e8280b --- /dev/null +++ b/annotations_filtered/l0zmCUVB0Yw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.4], [1.0, 5.49], [12.0, 12.66], [26.0, 25.68], [27.0, 27.46], [41.0, 42.52], [54.0, 53.82], [66.0, 66.01], [72.0, 72.57], [86.0, 86.7], [91.0, 91.45], [93.0, 94.9], [97.0, 97.38], [98.0, 99.45], [100.0, 100.8], [116.0, 116.51], [120.0, 120.8], [122.0, 122.44], [124.0, 124.61], [128.0, 127.89], [132.0, 132.21], [143.0, 143.43], [144.0, 143.95], [145.0, 144.76], [145.0, 145.66], [152.0, 161.81], [172.0, 172.57], [174.0, 174.8]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 32.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.18, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 49.72], ["musical instrument", 5.08], ["speech", 3.57]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 34.24], ["synthesizer", 16.42], ["speech", 15.84]], null, null], "duration": [0.4, 4.49, 0.66, -0.32, 0.46, 1.52, -0.18, 0.01, 0.57, 0.7, 0.45, 1.9, 0.38, 1.45, 0.8, 0.51, 0.8, 0.44, 0.61, -0.11, 0.21, 0.43, -0.05, -0.24, 0.66, 9.81, 0.57, 0.8]} \ No newline at end of file diff --git a/annotations_filtered/l17e0M4TTBA_filtered.json b/annotations_filtered/l17e0M4TTBA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d0d3b73326501caf13173162dfbc4de2a7c4f49d --- /dev/null +++ b/annotations_filtered/l17e0M4TTBA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.29], [17.0, 17.44], [19.0, 20.68], [22.0, 22.79], [24.0, 28.0], [30.0, 32.7], [33.0, 36.27], [38.0, 43.34], [44.0, 45.54], [50.0, 51.41], [52.0, 54.48], [57.0, 57.3], [69.0, 70.6], [71.0, 88.65], [91.0, 95.96], [99.0, 104.23], [109.0, 111.72], [116.0, 117.9], [121.0, 122.81], [124.0, 125.85], [130.0, 133.51], [134.0, 135.68], [137.0, 138.23], [144.0, 147.04], [150.0, 151.31], [153.0, 158.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 96.54, 53.59, 97.92, 75.88, 0.0, 0.0, 72.01, 0.0, 0.0, 59.15, 88.46, 99.21, 54.97, 0.0, 0.0, 0.0, 83.34, 0.0, 0.0, 59.33, 0.0, 99.65], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.29, 0.44, 1.68, 0.79, 4.0, 2.7, 3.27, 5.34, 1.54, 1.41, 2.48, 0.3, 1.6, 17.65, 4.96, 5.23, 2.72, 1.9, 1.81, 1.85, 3.51, 1.68, 1.23, 3.04, 1.31, 5.25]} \ No newline at end of file diff --git a/annotations_filtered/l1B1_jQnlFk_filtered.json b/annotations_filtered/l1B1_jQnlFk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..36a43c94aa7d3aa95330f4201c8233c809b20291 --- /dev/null +++ b/annotations_filtered/l1B1_jQnlFk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.19], [8.0, 9.71], [11.0, 11.37], [13.0, 14.2], [22.0, 24.14], [25.0, 26.86], [27.0, 30.01], [31.0, 31.7], [34.0, 34.26], [47.0, 49.72], [50.0, 51.19], [52.0, 52.76], [54.0, 56.46], [59.0, 59.64], [70.0, 98.29], [101.0, 103.42], [105.0, 107.35], [112.0, 111.94], [114.0, 115.35], [116.0, 116.75], [119.0, 120.65], [122.0, 122.66], [124.0, 125.31], [126.0, 126.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 72.16, 0.0, 76.37, 0.0, 0.0, 30.91, 0.0, 0.0, 99.76, 0.0, 49.82, 49.18, 98.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 54.3], ["beatboxing", 13.17], ["fart", 7.43]], null, null, null, null, [["speech", 48.32], ["frog", 12.16], ["boing", 12.08]], [["speech", 77.95], ["boing", 2.87], ["laughter", 2.56]], null, null, null, null, null, null, null, null], "duration": [1.19, 1.71, 0.37, 1.2, 2.14, 1.86, 3.01, 0.7, 0.26, 2.72, 1.19, 0.76, 2.46, 0.64, 28.29, 2.42, 2.35, -0.06, 1.35, 0.75, 1.65, 0.66, 1.31, 0.25]} \ No newline at end of file diff --git a/annotations_filtered/l1NB8NQc7wU_filtered.json b/annotations_filtered/l1NB8NQc7wU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da1011293a79b765dbebc97437adadba69e0f305 --- /dev/null +++ b/annotations_filtered/l1NB8NQc7wU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[39.0, 69.7], [73.0, 73.55]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [30.7, 0.55]} \ No newline at end of file diff --git a/annotations_filtered/l1OgTkhFJn8_filtered.json b/annotations_filtered/l1OgTkhFJn8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1268b5f1503634aa33277d56e331b418da41b253 --- /dev/null +++ b/annotations_filtered/l1OgTkhFJn8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.35], [15.0, 31.35], [45.0, 45.47], [48.0, 49.28], [50.0, 51.29], [54.0, 56.81], [57.0, 57.94], [59.0, 59.46], [63.0, 63.48], [66.0, 67.27], [71.0, 71.96], [81.0, 81.13], [85.0, 85.92], [87.0, 87.74], [89.0, 90.37], [92.0, 92.8], [97.0, 98.14], [101.0, 101.95], [102.0, 105.09], [108.0, 110.93], [115.0, 117.14], [120.0, 124.83], [126.0, 128.36], [136.0, 136.44], [141.0, 145.42], [147.0, 148.44], [152.0, 152.34], [153.0, 154.52], [155.0, 156.09], [157.0, 158.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 55.18, 0.0, 0.0, 0.0, 74.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.17, 68.02, 100.0, 78.04, 39.54, 0.0, 59.07, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 71.82], ["thunk", 2.3], ["music", 2.01]], null, null, null, null, null, null, null], "duration": [0.35, 16.35, 0.47, 1.28, 1.29, 2.81, 0.94, 0.46, 0.48, 1.27, 0.96, 0.13, 0.92, 0.74, 1.37, 0.8, 1.14, 0.95, 3.09, 2.93, 2.14, 4.83, 2.36, 0.44, 4.42, 1.44, 0.34, 1.52, 1.09, 1.3]} \ No newline at end of file diff --git a/annotations_filtered/l1SZ4ccagFQ_filtered.json b/annotations_filtered/l1SZ4ccagFQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..efb606081199a93eb33c39a74272d80295a442a7 --- /dev/null +++ b/annotations_filtered/l1SZ4ccagFQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.66], [7.0, 22.3], [22.0, 38.26], [40.0, 40.44], [40.0, 52.02], [52.0, 52.05], [59.0, 95.88], [102.0, 109.46], [112.0, 112.29], [116.0, 119.77]], "keep_status": [false, true, true, false, true, false, false, true, false, false], "silence_prob": [0.0, 34.61, 31.06, 0.0, 31.34, 0.0, 0.0, 33.26, 0.0, 98.01], "audiomae_on_audioset": [null, [["music", 22.16], ["hum", 13.46], ["speech", 12.07]], [["speech", 21.07], ["throbbing", 15.61], ["music", 12.57]], null, [["music", 39.76], ["speech", 7.23], ["whack, thwack", 4.67]], null, null, [["whip", 20.46], ["whack, thwack", 16.94], ["hum", 16.13]], null, null], "duration": [0.66, 15.3, 16.26, 0.44, 12.02, 0.05, 36.88, 7.46, 0.29, 3.77]} \ No newline at end of file diff --git a/annotations_filtered/l1jCg_FmQmQ_filtered.json b/annotations_filtered/l1jCg_FmQmQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f4b5a5feb31e15bfbd783fbc779f47b266030c4 --- /dev/null +++ b/annotations_filtered/l1jCg_FmQmQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 35.78], [37.0, 40.32], [41.0, 56.37], [57.0, 62.97], [65.0, 66.93], [68.0, 73.01], [74.0, 75.15], [81.0, 96.36], [96.0, 96.45], [98.0, 98.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 99.73, 99.73, 0.0, 100.0, 0.0, 89.01, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.78, 3.32, 15.37, 5.97, 1.93, 5.01, 1.15, 15.36, 0.45, 0.46]} \ No newline at end of file diff --git a/annotations_filtered/l24yOwR9saU_filtered.json b/annotations_filtered/l24yOwR9saU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac3604692c878c26e84129e467868ad1108d0221 --- /dev/null +++ b/annotations_filtered/l24yOwR9saU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.62], [12.0, 16.56], [19.0, 22.49], [23.0, 24.33], [28.0, 28.24], [36.0, 36.1], [39.0, 39.5], [40.0, 45.72], [67.0, 70.24], [72.0, 73.2], [76.0, 85.99], [90.0, 95.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 50.86, 52.1, 0.0, 0.0, 0.0, 0.0, 59.15, 65.09, 0.0, 52.56, 47.9], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 30.8], ["speech", 22.93], ["hum", 22.33]]], "duration": [1.62, 4.56, 3.49, 1.33, 0.24, 0.1, 0.5, 5.72, 3.24, 1.2, 9.99, 5.76]} \ No newline at end of file diff --git a/annotations_filtered/l2IJxv1lbAc_filtered.json b/annotations_filtered/l2IJxv1lbAc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec40d79f0aac79e1fbd555c89351fc2cf37ec33b --- /dev/null +++ b/annotations_filtered/l2IJxv1lbAc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.87], [6.0, 6.99], [11.0, 12.14], [13.0, 14.17], [25.0, 25.46], [26.0, 25.86], [28.0, 30.4], [35.0, 35.26], [36.0, 36.53], [39.0, 42.87], [45.0, 45.81], [46.0, 47.22], [48.0, 48.95], [50.0, 50.63], [52.0, 52.62], [55.0, 92.21], [101.0, 101.95], [106.0, 107.43], [108.0, 108.3], [112.0, 112.43], [113.0, 113.07], [119.0, 120.77], [124.0, 126.62]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.78, 0.0, 0.0, 37.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.99], "audiomae_on_audioset": [null, null, null, null, null, null, [["quack", 17.71], ["music", 9.24], ["speech", 6.88]], null, null, [["mains hum", 32.6], ["hum", 27.43], ["music", 20.32]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 24.73], ["hum", 24.04], ["throbbing", 11.77]]], "duration": [0.87, 0.99, 1.14, 1.17, 0.46, -0.14, 2.4, 0.26, 0.53, 3.87, 0.81, 1.22, 0.95, 0.63, 0.62, 37.21, 0.95, 1.43, 0.3, 0.43, 0.07, 1.77, 2.62]} \ No newline at end of file diff --git a/annotations_filtered/l2K4Fw-pmLw_filtered.json b/annotations_filtered/l2K4Fw-pmLw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2679a72d255b30f61a23fc1af88bc8f7646beb6c --- /dev/null +++ b/annotations_filtered/l2K4Fw-pmLw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.29], [14.0, 15.2], [17.0, 17.98], [18.0, 18.87], [28.0, 32.56], [34.0, 35.11], [40.0, 40.49], [45.0, 45.39], [55.0, 57.67], [61.0, 63.91], [64.0, 67.86], [69.0, 69.15], [73.0, 73.43], [87.0, 87.62], [92.0, 93.51], [101.0, 101.87], [103.0, 103.94], [105.0, 105.6], [107.0, 107.89], [110.0, 111.67], [113.0, 113.43], [119.0, 119.26], [122.0, 123.45], [125.0, 125.39]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 30.43, 36.47, 50.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 43.51], ["music", 18.43], ["boing", 4.59]], [["speech", 57.27], ["sneeze", 7.77], ["inside, small room", 3.53]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.29, 1.2, 0.98, 0.87, 4.56, 1.11, 0.49, 0.39, 2.67, 2.91, 3.86, 0.15, 0.43, 0.62, 1.51, 0.87, 0.94, 0.6, 0.89, 1.67, 0.43, 0.26, 1.45, 0.39]} \ No newline at end of file diff --git a/annotations_filtered/l2g7v4DYYik_filtered.json b/annotations_filtered/l2g7v4DYYik_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e01c411ba3a206a97556a8105b6de352b627089a --- /dev/null +++ b/annotations_filtered/l2g7v4DYYik_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[66.0, 107.99], [114.0, 114.84], [132.0, 132.61], [140.0, 140.78]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [41.99, 0.84, 0.61, 0.78]} \ No newline at end of file diff --git a/annotations_filtered/l2zrJ_LZrhg_filtered.json b/annotations_filtered/l2zrJ_LZrhg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2478a921ad33eb0eb2471972ab4cb2837d6222c2 --- /dev/null +++ b/annotations_filtered/l2zrJ_LZrhg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.25], [22.0, 26.7], [30.0, 31.02], [32.0, 33.84], [41.0, 41.71], [46.0, 48.88], [59.0, 59.75], [60.0, 65.45], [68.0, 78.95], [86.0, 87.83], [88.0, 89.95], [92.0, 94.49], [98.0, 98.02], [99.0, 103.5], [113.0, 113.46], [117.0, 120.11], [123.0, 131.89], [146.0, 147.12], [151.0, 152.14], [155.0, 157.84], [158.0, 162.06], [165.0, 167.04]], "keep_status": [false, true, false, false, false, true, false, true, false, false, false, true, false, true, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 33.61, 0.0, 0.0, 0.0, 33.9, 0.0, 30.07, 33.22, 0.0, 0.0, 42.74, 0.0, 31.58, 0.0, 90.6, 51.18, 0.0, 0.0, 39.46, 34.79, 39.3], "audiomae_on_audioset": [null, [["speech", 34.27], ["thunk", 17.83], ["whack, thwack", 10.15]], null, null, null, [["hum", 32.05], ["speech", 29.31], ["mains hum", 8.42]], null, [["speech", 36.88], ["sidetone", 14.05], ["music", 13.06]], [["speech", 56.79], ["music", 22.23], ["fart", 4.71]], null, null, [["hum", 17.38], ["throbbing", 16.39], ["music", 14.13]], null, [["livestock, farm animals, working animals", 24.58], ["cattle, bovinae", 20.05], ["moo", 18.87]], null, null, null, null, null, [["music", 53.96], ["musical instrument", 7.06], ["didgeridoo", 4.37]], [["music", 65.83], ["musical instrument", 3.32], ["guitar", 2.0]], [["music", 47.04], ["cello", 10.83], ["double bass", 8.04]]], "duration": [1.25, 4.7, 1.02, 1.84, 0.71, 2.88, 0.75, 5.45, 10.95, 1.83, 1.95, 2.49, 0.02, 4.5, 0.46, 3.11, 8.89, 1.12, 1.14, 2.84, 4.06, 2.04]} \ No newline at end of file diff --git a/annotations_filtered/l38Qliee6VE_filtered.json b/annotations_filtered/l38Qliee6VE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a567293154f755fce37d62314e80f91ebf1c54d8 --- /dev/null +++ b/annotations_filtered/l38Qliee6VE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 8.6], [10.0, 15.33], [18.0, 19.43], [20.0, 20.38], [25.0, 27.9], [49.0, 51.92], [61.0, 61.3], [62.0, 62.94], [64.0, 65.42], [67.0, 69.18], [70.0, 71.02], [71.0, 87.2], [87.0, 87.37], [87.0, 87.71], [88.0, 87.74], [88.0, 87.98], [88.0, 95.86], [107.0, 108.51], [112.0, 112.11], [113.0, 113.46], [119.0, 127.38], [129.0, 132.38], [134.0, 136.65], [143.0, 151.14], [152.0, 156.39]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 55.25, 0.0, 0.0, 38.11, 59.96, 0.0, 0.0, 0.0, 40.99, 0.0, 31.57, 0.0, 0.0, 0.0, 0.0, 31.75, 0.0, 0.0, 0.0, 40.19, 39.22, 75.23, 78.38, 49.18], "audiomae_on_audioset": [null, null, null, null, [["speech", 29.2], ["wail, moan", 19.16], ["fart", 11.28]], null, null, null, null, [["music", 33.31], ["hum", 6.27], ["musical instrument", 3.69]], null, [["music", 56.52], ["speech", 10.06], ["synthesizer", 9.18]], null, null, null, null, [["music", 56.53], ["sidetone", 14.12], ["speech", 5.12]], null, null, null, [["music", 82.44], ["speech", 4.41], ["musical instrument", 2.06]], [["music", 56.16], ["musical instrument", 4.13], ["hum", 2.77]], null, null, [["music", 28.34], ["speech", 17.1], ["sidetone", 11.26]]], "duration": [-0.4, 5.33, 1.43, 0.38, 2.9, 2.92, 0.3, 0.94, 1.42, 2.18, 1.02, 16.2, 0.37, 0.71, -0.26, -0.02, 7.86, 1.51, 0.11, 0.46, 8.38, 3.38, 2.65, 8.14, 4.39]} \ No newline at end of file diff --git a/annotations_filtered/l3t1ZSuwLzg_filtered.json b/annotations_filtered/l3t1ZSuwLzg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a95aaf805502c8e0a042a9996e726091c570a8ff --- /dev/null +++ b/annotations_filtered/l3t1ZSuwLzg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 18.4]], "keep_status": [false], "silence_prob": [71.14], "audiomae_on_audioset": [null], "duration": [2.4]} \ No newline at end of file diff --git a/annotations_filtered/l46yjkR0SqU_filtered.json b/annotations_filtered/l46yjkR0SqU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..38cd542ff5ea235a39c355dce17e2ac37de81320 --- /dev/null +++ b/annotations_filtered/l46yjkR0SqU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 14.69], [19.0, 20.33], [21.0, 21.47], [23.0, 22.98], [24.0, 36.44], [38.0, 84.97], [85.0, 86.39], [87.0, 100.45], [104.0, 115.13], [120.0, 122.1], [124.0, 125.63], [126.0, 126.79], [130.0, 130.27], [131.0, 134.03], [137.0, 137.24], [138.0, 140.02], [141.0, 158.82], [160.0, 160.37], [163.0, 167.86]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, true], "silence_prob": [35.42, 0.0, 0.0, 0.0, 53.53, 0.0, 0.0, 29.03, 30.52, 62.58, 0.0, 0.0, 0.0, 40.45, 0.0, 43.35, 39.89, 0.0, 37.35], "audiomae_on_audioset": [[["hum", 28.04], ["throbbing", 17.13], ["whale vocalization", 15.07]], null, null, null, null, null, null, [["music", 68.86], ["marimba, xylophone", 4.87], ["musical instrument", 2.74]], [["music", 69.46], ["theremin", 12.56], ["soundtrack music", 1.42]], null, null, null, null, [["cattle, bovinae", 9.82], ["fly, housefly", 9.7], ["speech", 9.15]], null, [["speech", 35.97], ["music", 5.78], ["hum", 4.73]], [["hum", 37.13], ["mains hum", 16.82], ["throbbing", 14.55]], null, [["speech", 32.24], ["music", 8.79], ["mains hum", 7.83]]], "duration": [10.69, 1.33, 0.47, -0.02, 12.44, 46.97, 1.39, 13.45, 11.13, 2.1, 1.63, 0.79, 0.27, 3.03, 0.24, 2.02, 17.82, 0.37, 4.86]} \ No newline at end of file diff --git a/annotations_filtered/l4AmSVb6Hew_filtered.json b/annotations_filtered/l4AmSVb6Hew_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..49a3b6268019a14270b4f08513710482c89d9f35 --- /dev/null +++ b/annotations_filtered/l4AmSVb6Hew_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.25], [11.0, 11.52], [16.0, 16.28], [30.0, 30.54], [42.0, 42.6], [45.0, 47.36], [48.0, 48.57], [52.0, 52.69], [54.0, 54.72], [61.0, 61.4], [67.0, 67.0], [70.0, 72.42], [96.0, 97.71], [99.0, 112.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 29.59], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 53.24], ["thunk", 3.96], ["livestock, farm animals, working animals", 3.31]]], "duration": [1.25, 0.52, 0.28, 0.54, 0.6, 2.36, 0.57, 0.69, 0.72, 0.4, 0.0, 2.42, 1.71, 13.45]} \ No newline at end of file diff --git a/annotations_filtered/l4L9Yi-lXbo_filtered.json b/annotations_filtered/l4L9Yi-lXbo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6856ef2961cde03bc9a252d1225d1c29e65a4af7 --- /dev/null +++ b/annotations_filtered/l4L9Yi-lXbo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 11.99], [13.0, 14.22], [17.0, 19.89], [22.0, 27.97], [29.0, 30.54], [33.0, 35.31], [37.0, 41.34], [46.0, 48.81], [52.0, 53.79], [56.0, 57.48], [60.0, 62.04], [67.0, 69.28], [73.0, 82.63], [87.0, 89.46], [92.0, 97.75], [99.0, 107.2], [108.0, 116.92], [118.0, 122.35]], "keep_status": [true, false, false, true, false, false, true, false, false, false, false, false, false, false, true, true, false, true], "silence_prob": [39.12, 0.0, 78.04, 31.18, 0.0, 56.48, 36.44, 70.3, 0.0, 0.0, 48.82, 95.51, 57.97, 51.99, 36.71, 37.52, 33.17, 37.28], "audiomae_on_audioset": [[["whale vocalization", 39.52], ["burping, eructation", 15.88], ["buzz", 7.06]], null, null, [["speech", 45.25], ["telephone", 7.51], ["fart", 6.38]], null, null, [["fart", 21.09], ["music", 15.31], ["speech", 14.87]], null, null, null, [["hum", 38.02], ["speech", 24.89], ["throbbing", 8.72]], null, null, null, [["hum", 28.91], ["speech", 21.43], ["mains hum", 13.65]], [["music", 30.29], ["theremin", 20.95], ["hum", 5.5]], [["hum", 45.83], ["mains hum", 21.13], ["music", 8.79]], [["hum", 32.82], ["music", 24.23], ["theremin", 11.33]]], "duration": [6.99, 1.22, 2.89, 5.97, 1.54, 2.31, 4.34, 2.81, 1.79, 1.48, 2.04, 2.28, 9.63, 2.46, 5.75, 8.2, 8.92, 4.35]} \ No newline at end of file diff --git a/annotations_filtered/l4S4IBACQCM_filtered.json b/annotations_filtered/l4S4IBACQCM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a558c0944860c39a9b177beca85e141e80213c26 --- /dev/null +++ b/annotations_filtered/l4S4IBACQCM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.93], [3.0, 7.15], [8.0, 8.94], [9.0, 10.83], [22.0, 22.69], [25.0, 25.02], [26.0, 26.47], [30.0, 31.56], [32.0, 32.66], [34.0, 34.13], [40.0, 41.39], [51.0, 51.46], [71.0, 108.7], [113.0, 134.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 31.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.85], "audiomae_on_audioset": [null, [["music", 53.16], ["brass instrument", 11.65], ["trombone", 9.66]], null, null, null, null, null, null, null, null, null, null, null, [["music", 62.04], ["buzz", 6.35], ["musical instrument", 4.06]]], "duration": [0.93, 4.15, 0.94, 1.83, 0.69, 0.02, 0.47, 1.56, 0.66, 0.13, 1.39, 0.46, 37.7, 21.6]} \ No newline at end of file diff --git a/annotations_filtered/l53Q1UXk2DE_filtered.json b/annotations_filtered/l53Q1UXk2DE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..10dc414a93f191195abcaa308e8ac3fe560b3b6e --- /dev/null +++ b/annotations_filtered/l53Q1UXk2DE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 37.69], [43.0, 46.4], [50.0, 54.51], [55.0, 54.89], [58.0, 80.86], [89.0, 173.99]], "keep_status": [false, true, true, false, true, false], "silence_prob": [0.0, 34.23, 33.9, 0.0, 35.08, 0.0], "audiomae_on_audioset": [null, [["music", 46.21], ["sampler", 8.77], ["boing", 6.26]], [["music", 53.37], ["throbbing", 8.39], ["synthesizer", 4.07]], null, [["music", 56.27], ["sampler", 4.85], ["synthesizer", 4.5]], null], "duration": [30.69, 3.4, 4.51, -0.11, 22.86, 84.99]} \ No newline at end of file diff --git a/annotations_filtered/l59t24vh3QI_filtered.json b/annotations_filtered/l59t24vh3QI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..53830d0f1a16c573eac51e04f7f28694daba06ea --- /dev/null +++ b/annotations_filtered/l59t24vh3QI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.82], [8.0, 7.86], [15.0, 16.07], [20.0, 21.41], [29.0, 29.71], [47.0, 47.68], [49.0, 50.13], [52.0, 53.92], [55.0, 64.52], [67.0, 67.31], [70.0, 80.15], [81.0, 85.53], [86.0, 88.21], [92.0, 92.84], [93.0, 109.58], [110.0, 116.87], [119.0, 119.25], [120.0, 126.42], [127.0, 129.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, true, false, true, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.11, 0.0, 32.24, 32.55, 30.09, 0.0, 32.85, 31.76, 0.0, 30.8, 31.04], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["hum", 31.24], ["mains hum", 30.3], ["music", 16.7]], null, [["music", 42.67], ["theremin", 11.75], ["hum", 9.61]], [["music", 33.04], ["mains hum", 9.78], ["hum", 8.58]], [["music", 15.87], ["didgeridoo", 11.19], ["fart", 4.53]], null, [["music", 34.11], ["synthesizer", 16.37], ["noise", 10.09]], [["music", 24.44], ["theremin", 16.95], ["mains hum", 14.25]], null, [["theremin", 42.21], ["music", 41.41], ["musical instrument", 2.89]], [["theremin", 30.74], ["music", 26.66], ["siren", 3.81]]], "duration": [0.82, -0.14, 1.07, 1.41, 0.71, 0.68, 1.13, 1.92, 9.52, 0.31, 10.15, 4.53, 2.21, 0.84, 16.58, 6.87, 0.25, 6.42, 2.19]} \ No newline at end of file diff --git a/annotations_filtered/l5s3_XV1rkA_filtered.json b/annotations_filtered/l5s3_XV1rkA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..156b303afcfa707243310f0b1bb70e8b8dca3674 --- /dev/null +++ b/annotations_filtered/l5s3_XV1rkA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 9.1], [14.0, 16.9], [20.0, 27.31], [30.0, 43.66], [45.0, 45.32], [46.0, 46.74], [52.0, 64.35], [67.0, 69.35], [80.0, 80.79], [83.0, 84.05], [84.0, 85.94], [87.0, 86.85], [89.0, 96.58], [98.0, 98.58], [100.0, 100.72]], "keep_status": [true, false, true, false, false, false, false, true, false, false, false, false, true, false, false], "silence_prob": [31.38, 31.12, 30.95, 30.95, 0.0, 0.0, 30.13, 31.77, 0.0, 0.0, 0.0, 0.0, 30.84, 0.0, 0.0], "audiomae_on_audioset": [[["music", 55.54], ["synthesizer", 6.75], ["ambient music", 6.19]], [["music", 79.54], ["synthesizer", 2.82], ["musical instrument", 2.42]], [["music", 45.58], ["didgeridoo", 11.6], ["synthesizer", 6.57]], [["brass instrument", 34.83], ["music", 34.34], ["trombone", 10.29]], null, null, [["music", 39.35], ["trombone", 27.12], ["brass instrument", 15.12]], [["hum", 31.78], ["mains hum", 20.32], ["throbbing", 6.21]], null, null, null, null, [["music", 44.77], ["musical instrument", 7.11], ["hum", 6.93]], null, null], "duration": [4.1, 2.9, 7.31, 13.66, 0.32, 0.74, 12.35, 2.35, 0.79, 1.05, 1.94, -0.15, 7.58, 0.58, 0.72]} \ No newline at end of file diff --git a/annotations_filtered/l65KNW2ZGV8_filtered.json b/annotations_filtered/l65KNW2ZGV8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..63914db13df8bf2019a54e21e7125dff4ee807f7 --- /dev/null +++ b/annotations_filtered/l65KNW2ZGV8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.78], [4.0, 4.78], [6.0, 6.96], [7.0, 8.92], [11.0, 11.13], [12.0, 12.43], [12.0, 13.91], [16.0, 17.02], [18.0, 17.95], [19.0, 19.94], [31.0, 32.07], [34.0, 34.32], [38.0, 38.82], [42.0, 43.09], [45.0, 45.2], [46.0, 50.03], [52.0, 52.73], [54.0, 53.59], [54.0, 55.68], [56.0, 67.44], [72.0, 72.49], [77.0, 77.16], [79.0, 79.68], [80.0, 80.84], [82.0, 83.3], [87.0, 88.23], [91.0, 91.2], [94.0, 94.36], [95.0, 96.26], [106.0, 106.62], [114.0, 115.86], [117.0, 119.1], [119.0, 120.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.6, 0.0, 0.0, 0.0, 99.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.78, 0.78, 0.96, 1.92, 0.13, 0.43, 1.91, 1.02, -0.05, 0.94, 1.07, 0.32, 0.82, 1.09, 0.2, 4.03, 0.73, -0.41, 1.68, 11.44, 0.49, 0.16, 0.68, 0.84, 1.3, 1.23, 0.2, 0.36, 1.26, 0.62, 1.86, 2.1, 1.41]} \ No newline at end of file diff --git a/annotations_filtered/l6NIVn6_m1c_filtered.json b/annotations_filtered/l6NIVn6_m1c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..10c03b224530aeecebbf96ff744c8a52cf98c316 --- /dev/null +++ b/annotations_filtered/l6NIVn6_m1c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.47], [9.0, 9.48], [11.0, 11.74], [12.0, 14.32], [16.0, 20.87], [21.0, 24.76], [34.0, 36.07], [45.0, 55.8], [59.0, 59.91], [61.0, 64.02], [65.0, 78.07], [85.0, 84.99], [87.0, 87.24], [103.0, 113.75], [116.0, 121.12], [123.0, 123.57], [125.0, 131.41], [134.0, 144.68], [147.0, 147.78], [149.0, 149.88], [151.0, 154.94], [156.0, 157.59], [161.0, 162.21], [164.0, 164.98], [167.0, 167.26], [170.0, 170.7], [171.0, 172.29], [173.0, 173.16]], "keep_status": [false, false, false, false, true, true, false, true, false, true, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 51.18, 35.93, 31.36, 31.73, 45.11, 0.0, 34.16, 31.58, 0.0, 0.0, 39.93, 39.35, 0.0, 33.81, 37.23, 0.0, 0.0, 32.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 49.32], ["theremin", 6.9], ["hum", 4.51]], [["music", 40.76], ["livestock, farm animals, working animals", 4.18], ["trombone", 3.16]], [["livestock, farm animals, working animals", 40.38], ["moo", 19.43], ["cattle, bovinae", 13.4]], [["music", 23.42], ["hum", 21.11], ["throbbing", 10.95]], null, [["speech", 27.41], ["music", 21.88], ["radio", 17.97]], [["music", 39.8], ["theremin", 33.28], ["synthesizer", 8.36]], null, null, [["hum", 50.56], ["mains hum", 20.53], ["throbbing", 11.8]], [["music", 60.11], ["theremin", 12.69], ["musical instrument", 1.7]], null, [["music", 75.75], ["musical instrument", 8.78], ["synthesizer", 1.24]], [["music", 37.06], ["musical instrument", 18.03], ["brass instrument", 8.7]], null, null, [["music", 26.4], ["theremin", 9.04], ["noise", 8.98]], null, null, null, null, null, null, null], "duration": [0.47, 0.48, 0.74, 2.32, 4.87, 3.76, 2.07, 10.8, 0.91, 3.02, 13.07, -0.01, 0.24, 10.75, 5.12, 0.57, 6.41, 10.68, 0.78, 0.88, 3.94, 1.59, 1.21, 0.98, 0.26, 0.7, 1.29, 0.16]} \ No newline at end of file diff --git a/annotations_filtered/l6StIaMaRsg_filtered.json b/annotations_filtered/l6StIaMaRsg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bc009e46c4aee969ae959c5637f0d39426676deb --- /dev/null +++ b/annotations_filtered/l6StIaMaRsg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 30.25], [33.0, 37.1], [38.0, 40.74], [42.0, 47.93], [50.0, 50.28], [50.0, 50.77], [52.0, 53.65], [58.0, 64.42], [66.0, 71.41], [72.0, 72.44], [73.0, 73.31], [76.0, 76.44], [79.0, 79.68], [91.0, 96.99], [97.0, 102.32], [104.0, 107.69], [110.0, 111.67]], "keep_status": [false, true, true, true, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [61.97, 37.81, 37.3, 36.98, 0.0, 0.0, 0.0, 35.39, 90.78, 0.0, 0.0, 0.0, 0.0, 62.99, 47.94, 82.43, 0.0], "audiomae_on_audioset": [null, [["hum", 16.67], ["fly, housefly", 11.46], ["music", 10.78]], [["mains hum", 31.58], ["hum", 23.01], ["music", 14.88]], [["hum", 24.06], ["mains hum", 18.55], ["music", 9.55]], null, null, null, [["hum", 53.18], ["mains hum", 22.64], ["music", 9.57]], null, null, null, null, null, null, [["music", 36.9], ["speech", 26.42], ["musical instrument", 6.03]], null, null], "duration": [2.25, 4.1, 2.74, 5.93, 0.28, 0.77, 1.65, 6.42, 5.41, 0.44, 0.31, 0.44, 0.68, 5.99, 5.32, 3.69, 1.67]} \ No newline at end of file diff --git a/annotations_filtered/l6TGERgrXmA_filtered.json b/annotations_filtered/l6TGERgrXmA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f0477d3030c9f5b3f24fe2ccab26ab3f38baddc3 --- /dev/null +++ b/annotations_filtered/l6TGERgrXmA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.76], [2.0, 5.68], [19.0, 19.84], [25.0, 26.74], [35.0, 36.02], [38.0, 38.2], [43.0, 45.15], [46.0, 46.57], [54.0, 61.33], [64.0, 64.56], [65.0, 67.07], [68.0, 68.5], [71.0, 71.22], [74.0, 75.03], [82.0, 84.2], [95.0, 98.25], [102.0, 103.13], [115.0, 124.48], [127.0, 130.47], [131.0, 132.68], [133.0, 144.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 90.95, 0.0, 0.0, 0.0, 0.0, 62.58, 0.0, 61.97, 0.0, 53.84, 0.0, 0.0, 0.0, 56.25, 99.92, 0.0, 90.95, 92.8, 0.0, 96.42], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.24, 3.68, 0.84, 1.74, 1.02, 0.2, 2.15, 0.57, 7.33, 0.56, 2.07, 0.5, 0.22, 1.03, 2.2, 3.25, 1.13, 9.48, 3.47, 1.68, 11.15]} \ No newline at end of file diff --git a/annotations_filtered/l6cFM5Ubilw_filtered.json b/annotations_filtered/l6cFM5Ubilw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e71855a6005db18fc127236e99cd291de4634b03 --- /dev/null +++ b/annotations_filtered/l6cFM5Ubilw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 5.91], [12.0, 16.92], [19.0, 20.43], [24.0, 25.32], [28.0, 29.02], [30.0, 36.22], [37.0, 43.92], [44.0, 43.95], [44.0, 47.01], [47.0, 47.04], [56.0, 57.2], [61.0, 64.81], [68.0, 69.26], [73.0, 80.45], [86.0, 107.87], [110.0, 130.01]], "keep_status": [false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 49.73, 0.0, 0.0, 0.0, 58.47, 39.91, 0.0, 32.6, 0.0, 0.0, 41.07, 0.0, 31.61, 29.03, 44.04], "audiomae_on_audioset": [null, [["speech", 37.02], ["music", 34.49], ["foghorn", 3.37]], null, null, null, null, [["music", 37.81], ["speech", 14.96], ["singing bowl", 6.91]], null, [["speech", 28.81], ["music", 20.96], ["whale vocalization", 19.75]], null, null, [["whale vocalization", 43.99], ["music", 38.61], ["speech", 9.2]], null, [["music", 60.17], ["speech", 13.45], ["hum", 2.59]], [["speech", 45.77], ["music", 23.68], ["buzz", 4.08]], [["music", 40.34], ["hum", 15.37], ["mains hum", 8.31]]], "duration": [-0.09, 4.92, 1.43, 1.32, 1.02, 6.22, 6.92, -0.05, 3.01, 0.04, 1.2, 3.81, 1.26, 7.45, 21.87, 20.01]} \ No newline at end of file diff --git a/annotations_filtered/l6e1M2d4BJ0_filtered.json b/annotations_filtered/l6e1M2d4BJ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..74bfc2c6d08b11934cee3b548ddfc1166fa836f7 --- /dev/null +++ b/annotations_filtered/l6e1M2d4BJ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.94], [5.0, 7.5], [10.0, 10.5], [11.0, 12.39], [16.0, 16.98], [18.0, 21.34], [25.0, 25.81], [27.0, 28.73], [30.0, 31.75], [33.0, 35.04], [37.0, 39.85], [42.0, 42.52], [45.0, 46.68], [47.0, 51.12], [54.0, 55.65], [57.0, 57.65], [62.0, 64.61], [68.0, 68.89], [71.0, 72.17], [76.0, 77.82], [82.0, 84.1], [85.0, 86.22], [88.0, 88.72], [90.0, 90.78], [92.0, 94.63], [95.0, 95.81], [98.0, 99.25], [101.0, 102.3], [104.0, 104.87], [107.0, 108.4], [111.0, 111.27], [112.0, 112.8], [117.0, 117.22], [119.0, 120.51], [124.0, 127.14], [127.0, 128.9], [131.0, 132.9], [135.0, 135.78], [138.0, 138.72], [140.0, 147.95], [150.0, 151.68], [154.0, 154.41], [156.0, 157.69], [159.0, 162.75], [163.0, 164.91], [165.0, 166.08], [168.0, 170.13], [172.0, 175.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 87.55, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 100.0, 98.01, 0.0, 0.0, 84.43, 0.0, 0.0, 98.1, 0.0, 0.0, 0.0, 92.48, 0.0, 0.0, 0.0, 99.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.52, 0.0, 0.0, 0.0, 0.0, 86.09, 0.0, 0.0, 0.0, 87.74, 0.0, 0.0, 84.8, 73.67], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.94, 2.5, 0.5, 1.39, 0.98, 3.34, 0.81, 1.73, 1.75, 2.04, 2.85, 0.52, 1.68, 4.12, 1.65, 0.65, 2.61, 0.89, 1.17, 1.82, 2.1, 1.22, 0.72, 0.78, 2.63, 0.81, 1.25, 1.3, 0.87, 1.4, 0.27, 0.8, 0.22, 1.51, 3.14, 1.9, 1.9, 0.78, 0.72, 7.95, 1.68, 0.41, 1.69, 3.75, 1.91, 1.08, 2.13, 3.83]} \ No newline at end of file diff --git a/annotations_filtered/l6uaxfye2Ig_filtered.json b/annotations_filtered/l6uaxfye2Ig_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ca999be2621d01d977a5deb47bac6320fc79f2e --- /dev/null +++ b/annotations_filtered/l6uaxfye2Ig_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.72], [7.0, 7.47], [12.0, 13.0], [14.0, 16.44], [23.0, 22.99], [44.0, 44.58], [48.0, 48.2], [51.0, 51.68], [60.0, 60.69], [62.0, 62.63], [65.0, 65.94], [69.0, 70.34], [74.0, 75.68], [86.0, 87.76], [89.0, 90.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 37.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 69.16], ["beatboxing", 3.82], ["fart", 3.41]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.72, 0.47, 1.0, 2.44, -0.01, 0.58, 0.2, 0.68, 0.69, 0.63, 0.94, 1.34, 1.68, 1.76, 1.49]} \ No newline at end of file diff --git a/annotations_filtered/l6zm1uCb30w_filtered.json b/annotations_filtered/l6zm1uCb30w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0191d06c5189ea27035995a49a0eada1d890a016 --- /dev/null +++ b/annotations_filtered/l6zm1uCb30w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.73], [3.0, 3.7], [6.0, 8.14], [10.0, 10.4], [11.0, 10.98], [11.0, 11.97], [13.0, 14.37], [18.0, 19.16], [21.0, 22.25], [22.0, 22.94], [24.0, 24.34], [27.0, 27.87]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 44.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["hum", 24.58], ["mains hum", 8.74], ["speech", 6.41]], null, null, null, null, null, null, null, null, null], "duration": [0.73, 0.7, 2.14, 0.4, -0.02, 0.97, 1.37, 1.16, 1.25, 0.94, 0.34, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/l7FkN4ooYvA_filtered.json b/annotations_filtered/l7FkN4ooYvA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a584a05e954f9425d0c9d1535c245c1840f5e41e --- /dev/null +++ b/annotations_filtered/l7FkN4ooYvA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.3], [13.0, 13.07], [28.0, 27.82], [28.0, 28.24], [28.0, 28.29], [35.0, 38.47], [43.0, 59.8], [61.0, 69.09], [69.0, 69.16], [69.0, 70.78], [77.0, 79.84], [84.0, 95.12], [102.0, 101.88], [108.0, 107.94], [108.0, 108.26], [116.0, 116.51], [119.0, 118.94], [124.0, 129.41], [130.0, 139.38], [142.0, 144.83], [166.0, 169.23], [172.0, 174.31]], "keep_status": [true, false, false, false, false, true, false, false, false, false, true, true, false, false, false, false, false, false, false, false, true, true], "silence_prob": [43.08, 0.0, 0.0, 0.0, 0.0, 33.77, 32.13, 31.81, 0.0, 0.0, 29.05, 32.61, 0.0, 0.0, 0.0, 0.0, 0.0, 37.37, 32.2, 35.53, 29.39, 29.62], "audiomae_on_audioset": [[["music", 41.04], ["bow-wow", 11.26], ["speech", 8.64]], null, null, null, null, [["vehicle", 12.32], ["motorcycle", 12.29], ["siren", 11.47]], [["music", 53.36], ["boing", 32.63], ["speech", 4.03]], [["music", 67.0], ["boing", 10.35], ["scratching (performance technique)", 3.59]], null, null, [["speech", 26.34], ["sidetone", 11.01], ["music", 10.72]], [["music", 55.98], ["theremin", 10.15], ["buzz", 3.46]], null, null, null, null, null, [["music", 71.55], ["speech", 11.47], ["sidetone", 3.01]], [["music", 67.5], ["speech", 6.65], ["groan", 4.84]], [["groan", 34.29], ["music", 23.55], ["boing", 18.51]], [["music", 53.34], ["electronic music", 3.58], ["effects unit", 3.02]], [["music", 23.69], ["speech", 4.54], ["musical instrument", 2.28]]], "duration": [2.3, 0.07, -0.18, 0.24, 0.29, 3.47, 16.8, 8.09, 0.16, 1.78, 2.84, 11.12, -0.12, -0.06, 0.26, 0.51, -0.06, 5.41, 9.38, 2.83, 3.23, 2.31]} \ No newline at end of file diff --git a/annotations_filtered/l83CcqhP-kY_filtered.json b/annotations_filtered/l83CcqhP-kY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..edc8db578b6b5521bbd4acd1584d122671e1526e --- /dev/null +++ b/annotations_filtered/l83CcqhP-kY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.2], [15.0, 15.63], [19.0, 19.31], [19.0, 19.45], [47.0, 47.83], [62.0, 63.04], [64.0, 69.01], [69.0, 69.96], [72.0, 77.46], [79.0, 79.32], [80.0, 80.28], [81.0, 82.8], [96.0, 96.35], [97.0, 97.63], [100.0, 102.44], [103.0, 103.55], [108.0, 107.79], [117.0, 117.86], [119.0, 119.85]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.96, 0.0, 29.63, 0.0, 0.0, 0.0, 0.0, 0.0, 34.16, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 70.34], ["sidetone", 8.07], ["noise", 4.93]], null, [["explosion", 23.21], ["whack, thwack", 16.38], ["speech", 9.62]], null, null, null, null, null, [["speech", 29.3], ["coin (dropping)", 23.43], ["dishes, pots, and pans", 16.08]], null, null, null, null], "duration": [0.2, 0.63, 0.31, 0.45, 0.83, 1.04, 5.01, 0.96, 5.46, 0.32, 0.28, 1.8, 0.35, 0.63, 2.44, 0.55, -0.21, 0.86, 0.85]} \ No newline at end of file diff --git a/annotations_filtered/l8MFxT9ILKY_filtered.json b/annotations_filtered/l8MFxT9ILKY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c5c0933f535b9b625257a6c481f8d7308d96e896 --- /dev/null +++ b/annotations_filtered/l8MFxT9ILKY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.26], [15.0, 26.89], [31.0, 34.96], [37.0, 38.3], [39.0, 46.01], [47.0, 53.87], [60.0, 60.45], [63.0, 74.66], [78.0, 79.2], [80.0, 81.51], [83.0, 89.67], [93.0, 104.14], [106.0, 107.42], [108.0, 144.15], [146.0, 146.11], [148.0, 147.75], [149.0, 160.91], [162.0, 163.76], [165.0, 166.13]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 30.45, 30.18, 0.0, 33.63, 44.32, 0.0, 41.36, 0.0, 0.0, 34.3, 30.33, 0.0, 0.0, 0.0, 0.0, 30.44, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 36.47], ["vehicle", 8.92], ["hum", 8.59]], [["speech", 45.64], ["hubbub, speech noise, speech babble", 11.15], ["cattle, bovinae", 3.68]], null, [["speech", 64.71], ["theremin", 5.02], ["music", 4.38]], [["speech", 37.49], ["music", 30.69], ["hum", 3.35]], null, [["mains hum", 55.52], ["hum", 38.39], ["speech", 1.05]], null, null, [["music", 67.67], ["hum", 2.68], ["scary music", 2.54]], [["music", 56.25], ["hum", 9.0], ["buzz", 8.47]], null, null, null, null, [["music", 53.96], ["hum", 20.39], ["mains hum", 12.97]], null, null], "duration": [0.26, 11.89, 3.96, 1.3, 7.01, 6.87, 0.45, 11.66, 1.2, 1.51, 6.67, 11.14, 1.42, 36.15, 0.11, -0.25, 11.91, 1.76, 1.13]} \ No newline at end of file diff --git a/annotations_filtered/l8aozWddbPA_filtered.json b/annotations_filtered/l8aozWddbPA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5a17508219176969edaacfed7952a89d309ad98d --- /dev/null +++ b/annotations_filtered/l8aozWddbPA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.77], [13.0, 13.29], [14.0, 16.19], [20.0, 20.38], [22.0, 24.09], [28.0, 28.39], [36.0, 37.4], [40.0, 40.51], [43.0, 45.64], [48.0, 48.22], [51.0, 50.87], [53.0, 53.33], [55.0, 57.43], [60.0, 60.12], [61.0, 61.62], [63.0, 66.06], [68.0, 68.98], [72.0, 72.89], [76.0, 77.08], [80.0, 84.43], [85.0, 88.94], [113.0, 113.02], [113.0, 113.24], [114.0, 116.77]], "keep_status": [true, false, false, false, true, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true], "silence_prob": [32.76, 0.0, 38.63, 0.0, 45.36, 0.0, 0.0, 0.0, 34.01, 0.0, 0.0, 0.0, 40.64, 0.0, 0.0, 39.5, 0.0, 0.0, 0.0, 39.63, 34.56, 0.0, 0.0, 33.52], "audiomae_on_audioset": [[["music", 25.36], ["animal", 6.72], ["speech", 6.36]], null, [["speech", 61.69], ["baby laughter", 6.46], ["laughter", 3.63]], null, [["speech", 24.83], ["sidetone", 14.98], ["frog", 10.32]], null, null, null, [["noise", 15.62], ["speech", 11.84], ["whale vocalization", 11.6]], null, null, null, [["mosquito", 35.81], ["frog", 30.79], ["croak", 9.93]], null, null, [["music", 33.54], ["speech", 14.09], ["animal", 10.0]], null, null, null, [["music", 51.21], ["speech", 17.89], ["didgeridoo", 5.08]], [["speech", 47.15], ["music", 18.45], ["radio", 5.41]], null, null, [["frog", 39.4], ["music", 13.37], ["boing", 6.73]]], "duration": [3.77, 0.29, 2.19, 0.38, 2.09, 0.39, 1.4, 0.51, 2.64, 0.22, -0.13, 0.33, 2.43, 0.12, 0.62, 3.06, 0.98, 0.89, 1.08, 4.43, 3.94, 0.02, 0.24, 2.77]} \ No newline at end of file diff --git a/annotations_filtered/l94geYuwNJg_filtered.json b/annotations_filtered/l94geYuwNJg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17ab885ea5eab14dd8a67a2f68be6f2d0ecec6c4 --- /dev/null +++ b/annotations_filtered/l94geYuwNJg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.33]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [0.33]} \ No newline at end of file diff --git a/annotations_filtered/l97NtEMUx0M_filtered.json b/annotations_filtered/l97NtEMUx0M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..157db7304f0d82c9ee51024670edb292f5becd27 --- /dev/null +++ b/annotations_filtered/l97NtEMUx0M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 31.62], [32.0, 40.46], [42.0, 43.09], [50.0, 51.07], [53.0, 57.6], [61.0, 64.42], [67.0, 67.74], [69.0, 71.61], [72.0, 72.57], [73.0, 74.24], [80.0, 82.76], [88.0, 89.83]], "keep_status": [false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [29.42, 29.83, 0.0, 0.0, 28.78, 49.22, 0.0, 75.07, 0.0, 0.0, 74.44, 0.0], "audiomae_on_audioset": [[["buzz", 44.5], ["music", 24.7], ["speech", 7.74]], [["music", 37.74], ["speech", 23.11], ["buzz", 18.34]], null, null, [["music", 38.5], ["hum", 18.33], ["throbbing", 11.99]], [["hum", 20.6], ["music", 17.27], ["mains hum", 8.07]], null, null, null, null, null, null], "duration": [12.62, 8.46, 1.09, 1.07, 4.6, 3.42, 0.74, 2.61, 0.57, 1.24, 2.76, 1.83]} \ No newline at end of file diff --git a/annotations_filtered/l9LOKUiY0Dg_filtered.json b/annotations_filtered/l9LOKUiY0Dg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..860268a00825975aed32b6996ad85508557a053f --- /dev/null +++ b/annotations_filtered/l9LOKUiY0Dg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.12], [32.0, 33.59], [36.0, 45.67], [46.0, 45.77], [47.0, 47.21], [57.0, 59.31], [72.0, 73.85], [84.0, 107.38], [109.0, 110.84], [112.0, 113.24], [123.0, 124.43], [125.0, 126.15], [126.0, 127.63], [128.0, 129.41], [134.0, 134.92], [137.0, 138.11], [147.0, 148.15], [149.0, 151.48], [153.0, 153.52], [155.0, 158.8]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.85, 0.0, 32.5, 0.0, 0.0, 44.84, 0.0, 34.06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.78, 0.0, 50.11], "audiomae_on_audioset": [[["music", 16.07], ["speech", 14.51], ["hum", 6.83]], null, [["music", 35.37], ["throbbing", 29.57], ["speech", 9.58]], null, null, [["throbbing", 31.82], ["hum", 29.31], ["music", 20.48]], null, [["music", 49.62], ["throbbing", 18.95], ["hum", 10.41]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.12, 1.59, 9.67, -0.23, 0.21, 2.31, 1.85, 23.38, 1.84, 1.24, 1.43, 1.15, 1.63, 1.41, 0.92, 1.11, 1.15, 2.48, 0.52, 3.8]} \ No newline at end of file diff --git a/annotations_filtered/l9c1k_m6POA_filtered.json b/annotations_filtered/l9c1k_m6POA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d992d990e22532c6fa872eb0c198699cf1d491f7 --- /dev/null +++ b/annotations_filtered/l9c1k_m6POA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.47], [4.0, 4.53], [7.0, 8.34], [12.0, 15.5], [16.0, 17.83], [18.0, 25.64], [27.0, 29.02], [30.0, 30.4], [31.0, 31.62], [32.0, 35.97], [37.0, 40.74], [42.0, 46.36], [52.0, 53.74], [54.0, 55.29], [58.0, 58.95], [69.0, 69.48], [72.0, 73.52], [75.0, 76.2], [79.0, 80.57], [81.0, 83.51], [85.0, 86.31], [89.0, 89.14], [92.0, 92.62], [96.0, 98.32], [101.0, 101.97], [103.0, 109.07], [110.0, 110.46], [115.0, 115.5], [118.0, 121.78], [126.0, 130.54], [132.0, 133.19], [134.0, 147.19], [149.0, 149.61], [155.0, 155.83], [157.0, 163.44], [164.0, 165.01], [166.0, 167.46]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 49.0, 0.0, 35.47, 92.64, 0.0, 0.0, 81.71, 99.95, 85.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.9, 0.0, 0.0, 0.0, 65.91, 0.0, 83.34, 0.0, 0.0, 99.94, 63.74, 0.0, 96.17, 0.0, 0.0, 89.9, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 41.68], ["synthesizer", 14.41], ["musical instrument", 10.82]], null, [["music", 58.13], ["speech", 26.66], ["thunk", 3.56]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.47, 0.53, 1.34, 3.5, 1.83, 7.64, 2.02, 0.4, 0.62, 3.97, 3.74, 4.36, 1.74, 1.29, 0.95, 0.48, 1.52, 1.2, 1.57, 2.51, 1.31, 0.14, 0.62, 2.32, 0.97, 6.07, 0.46, 0.5, 3.78, 4.54, 1.19, 13.19, 0.61, 0.83, 6.44, 1.01, 1.46]} \ No newline at end of file diff --git a/annotations_filtered/l9k9_K8Tea0_filtered.json b/annotations_filtered/l9k9_K8Tea0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84f22ef651713cd9e2e6aba1f22093ee3ce561fb --- /dev/null +++ b/annotations_filtered/l9k9_K8Tea0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 46.72], [49.0, 49.76], [51.0, 52.56], [60.0, 60.34], [65.0, 66.33], [67.0, 67.93], [69.0, 75.69]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [35.33, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97], "audiomae_on_audioset": [[["speech", 72.77], ["music", 12.71], ["sidetone", 2.7]], null, null, null, null, null, null], "duration": [19.72, 0.76, 1.56, 0.34, 1.33, 0.93, 6.69]} \ No newline at end of file diff --git a/annotations_filtered/lAIJ6Twk8aQ_filtered.json b/annotations_filtered/lAIJ6Twk8aQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f41188876d3676235f0b39218d7fdea75e01d1ad --- /dev/null +++ b/annotations_filtered/lAIJ6Twk8aQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.19], [8.0, 8.48], [11.0, 11.91], [16.0, 36.22], [37.0, 52.08], [53.0, 54.16], [56.0, 59.09], [61.0, 61.96], [63.0, 64.81], [67.0, 76.27], [77.0, 78.11], [81.0, 81.84], [83.0, 84.77], [88.0, 88.7], [91.0, 100.2], [102.0, 102.93], [106.0, 112.5], [113.0, 113.88], [117.0, 117.93], [121.0, 121.61], [123.0, 123.13], [125.0, 128.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 65.91, 80.82, 0.0, 99.26, 0.0, 0.0, 99.52, 0.0, 0.0, 0.0, 0.0, 97.92, 0.0, 89.01, 0.0, 0.0, 0.0, 0.0, 98.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.19, 0.48, 0.91, 20.22, 15.08, 1.16, 3.09, 0.96, 1.81, 9.27, 1.11, 0.84, 1.77, 0.7, 9.2, 0.93, 6.5, 0.88, 0.93, 0.61, 0.13, 3.76]} \ No newline at end of file diff --git a/annotations_filtered/lAcZxn1DeHs_filtered.json b/annotations_filtered/lAcZxn1DeHs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..463d034606e7e21e4e6b968ed16f570832fabf1c --- /dev/null +++ b/annotations_filtered/lAcZxn1DeHs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.53], [14.0, 57.25], [59.0, 66.51], [70.0, 84.43]], "keep_status": [true, false, true, true], "silence_prob": [31.8, 0.0, 32.98, 30.72], "audiomae_on_audioset": [[["music", 37.34], ["synthesizer", 22.43], ["didgeridoo", 8.34]], null, [["music", 34.77], ["synthesizer", 16.58], ["speech", 9.15]], [["music", 57.25], ["speech", 7.79], ["trance music", 4.39]]], "duration": [2.53, 43.25, 7.51, 14.43]} \ No newline at end of file diff --git a/annotations_filtered/lAgPsmTxBfc_filtered.json b/annotations_filtered/lAgPsmTxBfc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..53aa80ece9177fa90faebe611f39c23217e158aa --- /dev/null +++ b/annotations_filtered/lAgPsmTxBfc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.51], [17.0, 18.66], [21.0, 23.09], [27.0, 27.68], [28.0, 29.08], [31.0, 33.29], [37.0, 37.18], [39.0, 40.86], [45.0, 45.17], [49.0, 50.5], [58.0, 61.28], [72.0, 72.5], [84.0, 84.81], [94.0, 94.44], [94.0, 94.71], [96.0, 98.73], [100.0, 99.93], [110.0, 110.47], [116.0, 116.53], [117.0, 118.0], [119.0, 119.65], [124.0, 124.88], [128.0, 129.12]], "keep_status": [false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 33.61, 0.0, 0.0, 32.72, 0.0, 0.0, 0.0, 0.0, 54.17, 0.0, 0.0, 0.0, 0.0, 31.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["burping, eructation", 29.83], ["cough", 21.97], ["boing", 3.78]], null, null, [["boing", 31.77], ["speech", 19.78], ["didgeridoo", 8.49]], null, null, null, null, null, null, null, null, null, [["speech", 57.7], ["laughter", 14.41], ["fart", 3.73]], null, null, null, null, null, null, null], "duration": [0.51, 1.66, 2.09, 0.68, 1.08, 2.29, 0.18, 1.86, 0.17, 1.5, 3.28, 0.5, 0.81, 0.44, 0.71, 2.73, -0.07, 0.47, 0.53, 1.0, 0.65, 0.88, 1.12]} \ No newline at end of file diff --git a/annotations_filtered/lAhQbCN-Zvg_filtered.json b/annotations_filtered/lAhQbCN-Zvg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..33710ee968b2362cb2cad8ffcea5a2cf368dc6ca --- /dev/null +++ b/annotations_filtered/lAhQbCN-Zvg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.02], [5.0, 5.49], [8.0, 8.95], [11.0, 13.78], [15.0, 14.96], [16.0, 16.88], [18.0, 18.47], [19.0, 19.85], [21.0, 22.15], [23.0, 24.6], [28.0, 27.99], [29.0, 32.59], [33.0, 34.5], [38.0, 39.24], [40.0, 40.91], [47.0, 47.38], [62.0, 63.17], [68.0, 68.64], [72.0, 73.35], [77.0, 78.65], [88.0, 91.84], [94.0, 97.04], [98.0, 99.2], [100.0, 101.12], [103.0, 105.48], [106.0, 107.99], [111.0, 115.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 100.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.02, 0.49, 0.95, 2.78, -0.04, 0.88, 0.47, 0.85, 1.15, 1.6, -0.01, 3.59, 1.5, 1.24, 0.91, 0.38, 1.17, 0.64, 1.35, 1.65, 3.84, 3.04, 1.2, 1.12, 2.48, 1.99, 4.2]} \ No newline at end of file diff --git a/annotations_filtered/lAklD2ULzh0_filtered.json b/annotations_filtered/lAklD2ULzh0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18af370fef8bf8bc5458e486ab503f2342ae9fea --- /dev/null +++ b/annotations_filtered/lAklD2ULzh0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.77], [20.0, 20.22], [22.0, 21.95], [26.0, 27.11], [36.0, 45.25], [46.0, 53.4], [55.0, 56.29], [57.0, 58.04], [60.0, 60.62], [63.0, 64.93], [68.0, 76.67], [78.0, 81.24], [84.0, 88.8], [90.0, 92.35], [93.0, 96.65], [97.0, 101.7], [108.0, 116.48], [118.0, 120.99], [121.0, 121.71], [122.0, 123.9], [126.0, 135.7], [136.0, 135.78]], "keep_status": [false, false, false, false, true, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 35.17, 38.08, 0.0, 0.0, 0.0, 0.0, 75.39, 49.18, 67.63, 58.89, 50.97, 53.28, 69.74, 76.7, 0.0, 0.0, 37.03, 0.0], "audiomae_on_audioset": [null, null, null, null, [["synthesizer", 10.28], ["radio", 9.77], ["music", 8.57]], [["speech", 28.01], ["radio", 18.78], ["sidetone", 12.99]], null, null, null, null, null, [["speech", 34.88], ["music", 18.26], ["whale vocalization", 9.4]], null, null, null, null, null, null, null, null, [["singing bowl", 52.9], ["music", 14.66], ["gong", 7.93]], null], "duration": [0.77, 0.22, -0.05, 1.11, 9.25, 7.4, 1.29, 1.04, 0.62, 1.93, 8.67, 3.24, 4.8, 2.35, 3.65, 4.7, 8.48, 2.99, 0.71, 1.9, 9.7, -0.22]} \ No newline at end of file diff --git a/annotations_filtered/lB6Gk5EtunI_filtered.json b/annotations_filtered/lB6Gk5EtunI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe44b4dc4674441d8cb239c01f6d78443534f3f6 --- /dev/null +++ b/annotations_filtered/lB6Gk5EtunI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.41], [10.0, 11.57], [14.0, 15.47], [17.0, 17.91], [18.0, 19.36], [20.0, 20.76], [21.0, 21.98], [24.0, 24.88], [27.0, 27.08], [29.0, 33.27], [36.0, 54.77], [56.0, 65.03], [68.0, 68.89], [71.0, 70.88], [77.0, 78.41], [85.0, 86.07], [96.0, 96.01], [119.0, 121.83], [135.0, 149.39], [163.0, 163.81], [167.0, 168.62], [174.0, 174.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [87.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.87, 100.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 39.96, 34.77, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 28.19], ["crowd", 11.19], ["cheering", 6.38]], [["insect", 19.47], ["livestock, farm animals, working animals", 12.7], ["fly, housefly", 10.82]], null, null, null], "duration": [2.41, 1.57, 1.47, 0.91, 1.36, 0.76, 0.98, 0.88, 0.08, 4.27, 18.77, 9.03, 0.89, -0.12, 1.41, 1.07, 0.01, 2.83, 14.39, 0.81, 1.62, 0.83]} \ No newline at end of file diff --git a/annotations_filtered/lBS9AHilxg0_filtered.json b/annotations_filtered/lBS9AHilxg0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..667e30564b0296dccb1dfc2c81bacdfb29d7f54a --- /dev/null +++ b/annotations_filtered/lBS9AHilxg0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.31], [17.0, 18.17], [19.0, 25.1], [28.0, 29.19], [33.0, 33.42], [35.0, 43.26], [44.0, 44.91], [47.0, 52.46], [54.0, 56.25], [57.0, 57.82], [59.0, 59.51], [60.0, 64.3], [66.0, 66.24], [68.0, 74.36], [76.0, 75.9], [76.0, 77.03], [80.0, 82.93], [84.0, 85.26], [86.0, 87.89], [90.0, 94.02], [98.0, 122.5], [124.0, 124.51], [126.0, 126.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 81.0, 0.0, 0.0, 99.8, 0.0, 96.29, 99.98, 0.0, 0.0, 100.0, 0.0, 67.38, 0.0, 0.0, 37.31, 0.0, 0.0, 62.68, 58.3, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["noise", 21.25], ["music", 11.85], ["throbbing", 7.23]], null, null, null, null, null, null], "duration": [1.31, 1.17, 6.1, 1.19, 0.42, 8.26, 0.91, 5.46, 2.25, 0.82, 0.51, 4.3, 0.24, 6.36, -0.1, 1.03, 2.93, 1.26, 1.89, 4.02, 24.5, 0.51, 0.59]} \ No newline at end of file diff --git a/annotations_filtered/lBeh1jkanrE_filtered.json b/annotations_filtered/lBeh1jkanrE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..578305ff2e647b4a008815342ca152e3c178e61c --- /dev/null +++ b/annotations_filtered/lBeh1jkanrE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[49.0, 57.86], [58.0, 59.59], [60.0, 85.6], [86.0, 87.86], [91.0, 91.49], [92.0, 93.9], [98.0, 99.15], [100.0, 101.61], [102.0, 103.25], [104.0, 104.94], [105.0, 105.76], [106.0, 107.65], [108.0, 109.56], [111.0, 112.67], [114.0, 115.47], [116.0, 116.97], [117.0, 118.23], [119.0, 120.09], [121.0, 121.76], [125.0, 126.15], [129.0, 129.51], [137.0, 139.16], [140.0, 140.91], [143.0, 144.19], [145.0, 145.86], [147.0, 152.37], [154.0, 155.51], [157.0, 157.3], [158.0, 160.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.33, 0.0, 32.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.27, 0.0, 0.0, 0.0, 90.25, 0.0, 0.0, 58.81], "audiomae_on_audioset": [[["music", 84.53], ["musical instrument", 4.86], ["didgeridoo", 2.11]], null, [["music", 51.08], ["theremin", 17.04], ["musical instrument", 6.54]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.86, 1.59, 25.6, 1.86, 0.49, 1.9, 1.15, 1.61, 1.25, 0.94, 0.76, 1.65, 1.56, 1.67, 1.47, 0.97, 1.23, 1.09, 0.76, 1.15, 0.51, 2.16, 0.91, 1.19, 0.86, 5.37, 1.51, 0.3, 2.44]} \ No newline at end of file diff --git a/annotations_filtered/lBs_nLdio1M_filtered.json b/annotations_filtered/lBs_nLdio1M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c8e451ed483cc2033bd51f8234d2d5a430e32554 --- /dev/null +++ b/annotations_filtered/lBs_nLdio1M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 7.8], [15.0, 24.17], [26.0, 27.13], [27.0, 27.57], [32.0, 39.61], [45.0, 44.91], [46.0, 48.39], [56.0, 58.28], [60.0, 61.62], [62.0, 68.32], [73.0, 81.03], [86.0, 90.07], [92.0, 93.34], [96.0, 102.47], [103.0, 104.63]], "keep_status": [false, true, false, false, false, false, true, false, false, true, false, true, false, false, false], "silence_prob": [29.97, 28.92, 0.0, 0.0, 29.92, 0.0, 31.83, 29.47, 0.0, 31.0, 44.75, 30.15, 0.0, 32.6, 0.0], "audiomae_on_audioset": [[["throbbing", 41.22], ["music", 23.76], ["hum", 17.49]], [["music", 48.3], ["cacophony", 12.92], ["hum", 5.59]], null, null, [["music", 67.94], ["cacophony", 7.03], ["electronic music", 4.88]], null, [["hum", 24.4], ["music", 23.11], ["throbbing", 17.74]], [["music", 70.89], ["cacophony", 3.09], ["noise", 2.44]], null, [["hum", 23.73], ["music", 18.42], ["cacophony", 17.17]], [["music", 56.39], ["throbbing", 21.92], ["hum", 8.6]], [["music", 38.25], ["speech", 14.49], ["siren", 6.54]], null, [["music", 44.29], ["speech", 26.8], ["smash, crash", 11.8]], null], "duration": [5.8, 9.17, 1.13, 0.57, 7.61, -0.09, 2.39, 2.28, 1.62, 6.32, 8.03, 4.07, 1.34, 6.47, 1.63]} \ No newline at end of file diff --git a/annotations_filtered/lCF6_l8gtdA_filtered.json b/annotations_filtered/lCF6_l8gtdA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cce6e7183e28c6111d61f1e647e066888cb29f3a --- /dev/null +++ b/annotations_filtered/lCF6_l8gtdA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.66], [3.0, 4.01], [5.0, 5.34], [6.0, 6.54], [9.0, 11.89], [17.0, 17.2], [37.0, 39.51], [50.0, 51.02], [53.0, 53.27], [53.0, 53.91], [56.0, 56.03], [56.0, 59.31], [61.0, 62.72], [63.0, 65.06], [70.0, 76.52], [81.0, 88.11], [89.0, 89.14], [90.0, 90.29], [92.0, 92.84], [94.0, 94.29], [96.0, 96.3], [100.0, 100.63], [105.0, 107.92], [109.0, 110.42], [111.0, 111.52], [114.0, 114.96], [116.0, 117.9], [125.0, 128.41], [129.0, 133.59], [135.0, 135.31], [136.0, 137.3], [138.0, 139.67], [140.0, 141.02], [144.0, 145.89], [146.0, 146.82], [149.0, 149.23], [150.0, 153.35], [158.0, 163.36], [164.0, 165.27], [168.0, 167.83], [170.0, 170.7], [171.0, 173.18], [174.0, 174.43], [175.0, 176.28], [178.0, 179.64], [181.0, 183.95], [185.0, 185.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 76.04, 0.0, 60.32, 0.0, 0.0, 0.0, 0.0, 43.13, 0.0, 54.43, 76.7, 82.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.27, 0.0, 0.0, 0.0, 0.0, 50.26, 40.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.18, 41.95, 0.0, 0.0, 0.0, 42.88, 0.0, 0.0, 0.0, 53.28, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 14.98], ["noise", 10.72], ["radio", 6.16]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 38.17], ["music", 26.49], ["didgeridoo", 4.99]], null, null, null, null, null, null, null, [["mains hum", 39.35], ["hum", 27.28], ["music", 7.84]], [["hum", 38.88], ["mains hum", 27.15], ["music", 13.12]], null, null, null, [["speech", 17.05], ["mains hum", 17.01], ["sidetone", 15.06]], null, null, null, null, null], "duration": [0.66, 1.01, 0.34, 0.54, 2.89, 0.2, 2.51, 1.02, 0.27, 0.91, 0.03, 3.31, 1.72, 2.06, 6.52, 7.11, 0.14, 0.29, 0.84, 0.29, 0.3, 0.63, 2.92, 1.42, 0.52, 0.96, 1.9, 3.41, 4.59, 0.31, 1.3, 1.67, 1.02, 1.89, 0.82, 0.23, 3.35, 5.36, 1.27, -0.17, 0.7, 2.18, 0.43, 1.28, 1.64, 2.95, 0.97]} \ No newline at end of file diff --git a/annotations_filtered/lCL7DI3ah40_filtered.json b/annotations_filtered/lCL7DI3ah40_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f7b292f08ab79c96052665c7d7907d42e0b36f9 --- /dev/null +++ b/annotations_filtered/lCL7DI3ah40_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 16.29], [19.0, 20.28], [30.0, 81.67]], "keep_status": [false, false, false], "silence_prob": [32.33, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 34.42], ["mains hum", 23.92], ["speech", 13.76]], null, null], "duration": [3.29, 1.28, 51.67]} \ No newline at end of file diff --git a/annotations_filtered/lCUBQnsS9go_filtered.json b/annotations_filtered/lCUBQnsS9go_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7c89c6f0c8ea9b23a71cc5c2a2721b101537bddb --- /dev/null +++ b/annotations_filtered/lCUBQnsS9go_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.34], [11.0, 11.18], [16.0, 16.36], [17.0, 17.58], [19.0, 18.98], [19.0, 19.7], [20.0, 22.1], [25.0, 32.37], [34.0, 36.15], [38.0, 38.85], [41.0, 41.62], [43.0, 43.28], [44.0, 45.2], [47.0, 49.42], [53.0, 54.24], [62.0, 62.14], [66.0, 69.36], [72.0, 72.76], [78.0, 79.74], [81.0, 82.12], [83.0, 86.78], [87.0, 86.81], [87.0, 86.86], [90.0, 90.0], [95.0, 97.46], [99.0, 113.91], [115.0, 115.45], [116.0, 118.05], [119.0, 128.68], [129.0, 129.71], [131.0, 131.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.64, 100.0, 99.85, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 89.72, 0.0, 0.0, 0.0, 96.66, 98.8, 0.0, 92.97, 81.17, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.34, 0.18, 0.36, 0.58, -0.02, 0.7, 2.1, 7.37, 2.15, 0.85, 0.62, 0.28, 1.2, 2.42, 1.24, 0.14, 3.36, 0.76, 1.74, 1.12, 3.78, -0.19, -0.14, 0.0, 2.46, 14.91, 0.45, 2.05, 9.68, 0.71, 0.3]} \ No newline at end of file diff --git a/annotations_filtered/lCcWPDXqKi0_filtered.json b/annotations_filtered/lCcWPDXqKi0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..26aa7aa409eea55b45ddc8943b7a825e74760955 --- /dev/null +++ b/annotations_filtered/lCcWPDXqKi0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.93], [11.0, 19.18], [20.0, 19.92], [20.0, 23.84], [25.0, 35.29], [37.0, 38.99], [51.0, 52.98], [53.0, 54.13], [57.0, 60.07], [61.0, 60.66], [61.0, 60.79], [61.0, 60.94], [67.0, 69.25], [75.0, 76.0], [76.0, 79.2]], "keep_status": [false, false, false, true, true, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 42.79, 0.0, 45.56, 46.54, 0.0, 0.0, 0.0, 44.18, 0.0, 0.0, 0.0, 45.18, 0.0, 46.64], "audiomae_on_audioset": [null, [["music", 45.85], ["speech", 27.88], ["synthesizer", 2.4]], null, [["music", 20.04], ["hum", 17.55], ["throbbing", 17.11]], [["music", 51.14], ["throbbing", 6.83], ["speech", 5.94]], null, null, null, [["music", 75.25], ["speech", 4.12], ["electronic music", 2.32]], null, null, null, [["music", 42.43], ["frog", 21.2], ["croak", 18.89]], null, [["speech", 24.59], ["music", 23.52], ["animal", 14.34]]], "duration": [1.93, 8.18, -0.08, 3.84, 10.29, 1.99, 1.98, 1.13, 3.07, -0.34, -0.21, -0.06, 2.25, 1.0, 3.2]} \ No newline at end of file diff --git a/annotations_filtered/lChJz2DSpsE_filtered.json b/annotations_filtered/lChJz2DSpsE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb6b53fe821d7cbd0b6641a46589506d0f3d619d --- /dev/null +++ b/annotations_filtered/lChJz2DSpsE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.34]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [1.34]} \ No newline at end of file diff --git a/annotations_filtered/lCiravgbbJk_filtered.json b/annotations_filtered/lCiravgbbJk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb182c3443a6023789e96d397f97acc0c4009243 --- /dev/null +++ b/annotations_filtered/lCiravgbbJk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.22], [28.0, 28.65]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [0.22, 0.65]} \ No newline at end of file diff --git a/annotations_filtered/lClRzGmpFrs_filtered.json b/annotations_filtered/lClRzGmpFrs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3bbebf37e2dac6260546de4b9c4e24abb48884ee --- /dev/null +++ b/annotations_filtered/lClRzGmpFrs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 12.46], [13.0, 16.26], [17.0, 24.12], [29.0, 29.57], [31.0, 39.53], [40.0, 40.42], [41.0, 48.05], [49.0, 52.25], [58.0, 58.78], [59.0, 60.2], [65.0, 73.82], [75.0, 76.99], [80.0, 81.68], [85.0, 86.88], [91.0, 91.59], [96.0, 98.73], [100.0, 102.93]], "keep_status": [false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [52.16, 85.17, 56.33, 0.0, 30.61, 0.0, 33.28, 51.88, 0.0, 0.0, 60.14, 0.0, 0.0, 0.0, 0.0, 53.22, 99.97], "audiomae_on_audioset": [null, null, null, null, [["music", 52.93], ["thunk", 6.46], ["explosion", 6.17]], null, [["music", 27.18], ["explosion", 12.44], ["noise", 8.38]], null, null, null, null, null, null, null, null, null, null], "duration": [8.46, 3.26, 7.12, 0.57, 8.53, 0.42, 7.05, 3.25, 0.78, 1.2, 8.82, 1.99, 1.68, 1.88, 0.59, 2.73, 2.93]} \ No newline at end of file diff --git a/annotations_filtered/lCqHKRjIMu8_filtered.json b/annotations_filtered/lCqHKRjIMu8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dfa4890a1b2d8726937e732e5ac8005626273d8f --- /dev/null +++ b/annotations_filtered/lCqHKRjIMu8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.68], [6.0, 7.2], [9.0, 10.64], [14.0, 15.7], [17.0, 17.05], [18.0, 21.74], [26.0, 26.18], [27.0, 27.35], [28.0, 29.12], [30.0, 30.75], [33.0, 33.02], [35.0, 35.14], [35.0, 35.18], [35.0, 35.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 54.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.68, 1.2, 1.64, 1.7, 0.05, 3.74, 0.18, 0.35, 1.12, 0.75, 0.02, 0.14, 0.18, 0.97]} \ No newline at end of file diff --git a/annotations_filtered/lCs7qjJzoDg_filtered.json b/annotations_filtered/lCs7qjJzoDg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..903392a247289af8b43185fbb7df20be1b216e25 --- /dev/null +++ b/annotations_filtered/lCs7qjJzoDg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 14.08], [15.0, 15.45], [20.0, 22.65], [23.0, 24.97], [26.0, 38.08], [38.0, 39.09], [40.0, 44.73], [46.0, 45.99], [47.0, 47.87], [50.0, 50.82], [51.0, 52.57], [53.0, 53.96], [55.0, 55.73], [56.0, 59.36], [65.0, 76.38], [78.0, 79.98], [82.0, 82.88], [86.0, 87.56], [89.0, 90.07], [96.0, 98.79], [105.0, 106.34], [107.0, 107.97], [109.0, 109.7]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false], "silence_prob": [30.66, 0.0, 31.76, 0.0, 30.31, 0.0, 31.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.74, 32.51, 0.0, 0.0, 0.0, 0.0, 30.12, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 56.32], ["music", 12.21], ["mains hum", 10.23]], null, [["foghorn", 29.59], ["speech", 23.48], ["music", 17.7]], null, [["music", 42.94], ["speech", 28.55], ["hum", 4.13]], null, [["speech", 24.61], ["whale vocalization", 17.63], ["music", 16.32]], null, null, null, null, null, null, [["speech", 34.94], ["music", 25.87], ["throbbing", 14.25]], [["hum", 41.11], ["speech", 16.98], ["music", 11.71]], null, null, null, null, [["mains hum", 40.14], ["hum", 16.19], ["thunk", 8.31]], null, null, null], "duration": [10.08, 0.45, 2.65, 1.97, 12.08, 1.09, 4.73, -0.01, 0.87, 0.82, 1.57, 0.96, 0.73, 3.36, 11.38, 1.98, 0.88, 1.56, 1.07, 2.79, 1.34, 0.97, 0.7]} \ No newline at end of file diff --git a/annotations_filtered/lCyS2Gxxzfg_filtered.json b/annotations_filtered/lCyS2Gxxzfg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c8a1ecd82f9d299f9c3de6b1462c52558f8e3c84 --- /dev/null +++ b/annotations_filtered/lCyS2Gxxzfg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.0], [2.0, 11.47], [15.0, 15.84], [18.0, 18.18], [19.0, 41.18], [43.0, 44.76], [47.0, 48.3], [54.0, 54.82], [60.0, 60.67], [65.0, 66.41], [67.0, 69.79], [72.0, 76.47], [78.0, 80.01], [85.0, 86.68], [88.0, 90.78], [92.0, 92.74], [94.0, 99.39], [101.0, 101.9], [105.0, 105.36], [106.0, 108.08]], "keep_status": [false, true, false, false, true, false, false, false, false, false, true, false, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 42.08, 0.0, 0.0, 31.21, 0.0, 0.0, 0.0, 0.0, 0.0, 41.7, 35.29, 35.07, 0.0, 61.67, 0.0, 30.46, 0.0, 0.0, 40.07], "audiomae_on_audioset": [null, [["speech", 19.51], ["quack", 15.58], ["throbbing", 11.05]], null, null, [["whack, thwack", 37.61], ["thump, thud", 14.53], ["speech", 9.12]], null, null, null, null, null, [["music", 54.38], ["singing bowl", 9.84], ["musical instrument", 2.64]], [["music", 59.05], ["ambient music", 7.37], ["singing bowl", 3.65]], [["speech", 37.46], ["music", 21.73], ["hum", 8.83]], null, null, null, [["throbbing", 32.52], ["hum", 27.4], ["music", 13.17]], null, null, [["music", 21.97], ["speech", 9.76], ["didgeridoo", 4.04]]], "duration": [1.0, 9.47, 0.84, 0.18, 22.18, 1.76, 1.3, 0.82, 0.67, 1.41, 2.79, 4.47, 2.01, 1.68, 2.78, 0.74, 5.39, 0.9, 0.36, 2.08]} \ No newline at end of file diff --git a/annotations_filtered/lD1XDCbhtn0_filtered.json b/annotations_filtered/lD1XDCbhtn0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3de6ebb3b3765a027e0c667a3c1501321b53de0b --- /dev/null +++ b/annotations_filtered/lD1XDCbhtn0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 24.07], [25.0, 25.57], [27.0, 30.54], [43.0, 46.13]], "keep_status": [false, false, false, true], "silence_prob": [0.0, 0.0, 48.78, 42.13], "audiomae_on_audioset": [null, null, [["speech", 50.03], ["chirp tone", 15.91], ["whale vocalization", 5.19]], [["stomach rumble", 22.82], ["noise", 7.36], ["speech", 6.95]]], "duration": [0.07, 0.57, 3.54, 3.13]} \ No newline at end of file diff --git a/annotations_filtered/lD7Xo_FhL4s_filtered.json b/annotations_filtered/lD7Xo_FhL4s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..37575be00daf3228d2b10d3d7541409d932d7b6b --- /dev/null +++ b/annotations_filtered/lD7Xo_FhL4s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 26.64], [29.0, 39.63], [41.0, 41.39], [42.0, 43.21], [47.0, 47.28], [50.0, 51.12], [55.0, 61.8], [62.0, 63.69], [64.0, 64.56], [68.0, 68.45], [69.0, 69.36], [70.0, 70.14], [73.0, 73.74], [74.0, 74.68], [75.0, 76.32], [79.0, 83.05], [83.0, 84.82], [86.0, 86.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 45.56, 0.0, 0.0, 0.0, 0.0, 30.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.19, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 68.7], ["brass instrument", 4.91], ["musical instrument", 3.96]], null, null, null, null, [["speech", 80.28], ["applause", 3.66], ["clapping", 2.34]], null, null, null, null, null, null, null, null, [["beatboxing", 63.08], ["music", 5.18], ["fart", 4.62]], null, null], "duration": [1.64, 10.63, 0.39, 1.21, 0.28, 1.12, 6.8, 1.69, 0.56, 0.45, 0.36, 0.14, 0.74, 0.68, 1.32, 4.05, 1.82, 0.16]} \ No newline at end of file diff --git a/annotations_filtered/lDDtJ_J_hhw_filtered.json b/annotations_filtered/lDDtJ_J_hhw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..75976156f08d2b7092ab830dc5c0c56147aaa8dd --- /dev/null +++ b/annotations_filtered/lDDtJ_J_hhw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[45.0, 48.51], [50.0, 51.38], [54.0, 53.97], [55.0, 56.44], [59.0, 60.79], [62.0, 62.65], [64.0, 64.88], [71.0, 70.92], [71.0, 72.49], [73.0, 73.75], [74.0, 82.16], [83.0, 83.2], [83.0, 111.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [79.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 0.0, 99.52], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.51, 1.38, -0.03, 1.44, 1.79, 0.65, 0.88, -0.08, 1.49, 0.75, 8.16, 0.2, 28.27]} \ No newline at end of file diff --git a/annotations_filtered/lDRzG3mH-DQ_filtered.json b/annotations_filtered/lDRzG3mH-DQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..262201620f939606740fe66f9730b696bd662973 --- /dev/null +++ b/annotations_filtered/lDRzG3mH-DQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[40.0, 42.48], [45.0, 46.43], [48.0, 51.27], [53.0, 55.02], [56.0, 59.71], [61.0, 65.53], [68.0, 70.83], [72.0, 79.37], [80.0, 113.64], [117.0, 119.3], [123.0, 125.27], [126.0, 126.76], [128.0, 129.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [64.63, 0.0, 85.17, 41.52, 99.87, 98.27, 99.65, 91.81, 0.0, 51.34, 47.66, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 55.33], ["music", 24.5], ["musical instrument", 3.71]], null, null, null, null, null, null, [["music", 32.8], ["didgeridoo", 14.56], ["throbbing", 13.88]], null, null], "duration": [2.48, 1.43, 3.27, 2.02, 3.71, 4.53, 2.83, 7.37, 33.64, 2.3, 2.27, 0.76, 1.2]} \ No newline at end of file diff --git a/annotations_filtered/lDa6qc93nNs_filtered.json b/annotations_filtered/lDa6qc93nNs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a58ff00b845070cc287a0883ffd1239f56cacd91 --- /dev/null +++ b/annotations_filtered/lDa6qc93nNs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 22.2], [23.0, 33.45], [35.0, 38.64], [39.0, 39.31], [39.0, 39.5], [40.0, 39.53], [40.0, 41.54], [45.0, 73.33], [76.0, 112.24]], "keep_status": [false, false, true, false, false, false, false, true, false], "silence_prob": [30.8, 31.65, 31.08, 0.0, 0.0, 0.0, 0.0, 32.56, 0.0], "audiomae_on_audioset": [[["music", 60.39], ["reverberation", 5.93], ["hum", 4.07]], [["music", 49.4], ["speech", 29.34], ["throbbing", 3.91]], [["music", 43.91], ["synthesizer", 4.38], ["sound effect", 3.75]], null, null, null, null, [["music", 26.45], ["buzz", 14.76], ["noise", 13.66]], null], "duration": [7.2, 10.45, 3.64, 0.31, 0.5, -0.47, 1.54, 28.33, 36.24]} \ No newline at end of file diff --git a/annotations_filtered/lDduI2NkIsQ_filtered.json b/annotations_filtered/lDduI2NkIsQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..684855d87c63838a636ee28d99f165e857e71d69 --- /dev/null +++ b/annotations_filtered/lDduI2NkIsQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 32.26], [33.0, 45.71], [50.0, 78.02], [81.0, 81.26]], "keep_status": [true, true, false, false], "silence_prob": [31.07, 31.17, 32.22, 0.0], "audiomae_on_audioset": [[["music", 39.54], ["speech", 17.16], ["bow-wow", 10.82]], [["music", 35.61], ["speech", 13.89], ["fly, housefly", 10.09]], [["music", 48.52], ["speech", 37.0], ["didgeridoo", 2.17]], null], "duration": [28.26, 12.71, 28.02, 0.26]} \ No newline at end of file diff --git a/annotations_filtered/lDetwrOZPZg_filtered.json b/annotations_filtered/lDetwrOZPZg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..762a15b96b24dd7cd177d62bf368c84ee5a4cbc2 --- /dev/null +++ b/annotations_filtered/lDetwrOZPZg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.15], [22.0, 22.47], [24.0, 24.76], [27.0, 29.34], [31.0, 37.86], [40.0, 40.2], [43.0, 43.63], [50.0, 49.84], [51.0, 51.22], [52.0, 52.49], [54.0, 54.11], [56.0, 56.22], [59.0, 59.14], [61.0, 61.79], [63.0, 63.85], [65.0, 65.4], [68.0, 68.99], [70.0, 74.16], [75.0, 76.79], [78.0, 78.85], [81.0, 81.77], [83.0, 83.56], [84.0, 88.11]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 44.69, 33.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.52, 0.0, 0.0, 0.0, 0.0, 34.1], "audiomae_on_audioset": [null, null, null, [["speech", 21.72], ["police car (siren)", 17.05], ["siren", 11.21]], [["speech", 37.94], ["siren", 25.49], ["civil defense siren", 17.29]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 75.54], ["sidetone", 6.46], ["radio", 6.29]], null, null, null, null, [["sidetone", 46.15], ["speech", 9.75], ["fly, housefly", 8.77]]], "duration": [1.15, 0.47, 0.76, 2.34, 6.86, 0.2, 0.63, -0.16, 0.22, 0.49, 0.11, 0.22, 0.14, 0.79, 0.85, 0.4, 0.99, 4.16, 1.79, 0.85, 0.77, 0.56, 4.11]} \ No newline at end of file diff --git a/annotations_filtered/lEFx1qmW4ts_filtered.json b/annotations_filtered/lEFx1qmW4ts_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d930b6e6f92f4bdb413a91b6dc06e2f13db35fc1 --- /dev/null +++ b/annotations_filtered/lEFx1qmW4ts_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.48], [5.0, 55.04], [63.0, 74.95], [79.0, 80.67], [85.0, 100.13]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 29.9, 0.0, 30.96], "audiomae_on_audioset": [null, null, [["mains hum", 45.35], ["hum", 44.8], ["buzz", 3.17]], null, [["hum", 31.28], ["mains hum", 29.14], ["music", 12.15]]], "duration": [1.48, 50.04, 11.95, 1.67, 15.13]} \ No newline at end of file diff --git a/annotations_filtered/lEPfDu4pVqg_filtered.json b/annotations_filtered/lEPfDu4pVqg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7bf08a83acb0ac367c14fb683f7da80c2ea06fae --- /dev/null +++ b/annotations_filtered/lEPfDu4pVqg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.0], [73.0, 73.03]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [1.0, 0.03]} \ No newline at end of file diff --git a/annotations_filtered/lEiwqEMhS9E_filtered.json b/annotations_filtered/lEiwqEMhS9E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b3eca668334fa2c8d7d05e15ccd24a97b01dde55 --- /dev/null +++ b/annotations_filtered/lEiwqEMhS9E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.97], [11.0, 11.65], [16.0, 16.73], [22.0, 22.52], [26.0, 26.76], [31.0, 32.04], [35.0, 35.34], [37.0, 38.4], [40.0, 39.99], [41.0, 41.17], [43.0, 44.05], [48.0, 49.77], [51.0, 52.19], [55.0, 56.94], [61.0, 61.8], [62.0, 63.51], [72.0, 73.75], [75.0, 75.25], [76.0, 76.38], [78.0, 79.15], [79.0, 80.28], [84.0, 84.94], [91.0, 105.9], [107.0, 108.13], [109.0, 109.24], [110.0, 121.51], [125.0, 125.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [40.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.84, 0.0, 0.0, 29.59, 0.0], "audiomae_on_audioset": [[["music", 60.79], ["hum", 6.94], ["mains hum", 5.8]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 21.8], ["music", 20.92], ["sidetone", 15.98]], null, null, [["radio", 12.63], ["vehicle", 9.22], ["noise", 7.92]], null], "duration": [3.97, 0.65, 0.73, 0.52, 0.76, 1.04, 0.34, 1.4, -0.01, 0.17, 1.05, 1.77, 1.19, 1.94, 0.8, 1.51, 1.75, 0.25, 0.38, 1.15, 1.28, 0.94, 14.9, 1.13, 0.24, 11.51, 0.58]} \ No newline at end of file diff --git a/annotations_filtered/lEykI65QtSQ_filtered.json b/annotations_filtered/lEykI65QtSQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4a4fec14d85b7917572e05db8eda9c26dfe361d6 --- /dev/null +++ b/annotations_filtered/lEykI65QtSQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 32.7], [47.0, 46.95], [59.0, 59.44], [61.0, 60.74], [66.0, 66.19], [67.0, 68.57], [81.0, 82.04], [82.0, 82.7], [85.0, 88.57], [96.0, 97.28], [98.0, 98.34], [99.0, 99.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.31, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["thunk", 66.8], ["speech", 17.16], ["music", 6.64]], null, null, null], "duration": [1.7, -0.05, 0.44, -0.26, 0.19, 1.57, 1.04, 0.7, 3.57, 1.28, 0.34, 0.74]} \ No newline at end of file diff --git a/annotations_filtered/lF3IIOXn5qU_filtered.json b/annotations_filtered/lF3IIOXn5qU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cfeb210152b1c91560cfb68a2734bc9a194753d8 --- /dev/null +++ b/annotations_filtered/lF3IIOXn5qU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.08], [13.0, 15.72], [18.0, 18.28], [21.0, 21.71], [33.0, 34.8], [36.0, 37.4], [41.0, 41.66], [53.0, 53.33], [55.0, 55.46], [56.0, 58.99], [73.0, 73.21], [75.0, 75.76], [82.0, 86.48], [88.0, 88.94], [92.0, 94.47], [95.0, 96.25], [102.0, 103.15], [107.0, 108.01], [114.0, 115.25], [116.0, 117.31], [144.0, 145.57], [146.0, 146.84], [153.0, 156.56], [159.0, 158.82]], "keep_status": [false, true, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 29.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.53, 0.0, 0.0, 31.34, 0.0, 31.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.25, 0.0], "audiomae_on_audioset": [null, [["music", 32.21], ["boing", 11.13], ["speech", 9.18]], null, null, null, null, null, null, null, [["music", 22.56], ["livestock, farm animals, working animals", 15.21], ["moo", 9.85]], null, null, [["speech", 24.95], ["whack, thwack", 10.32], ["boing", 9.45]], null, [["music", 31.96], ["sidetone", 27.96], ["speech", 16.69]], null, null, null, null, null, null, null, [["music", 14.66], ["speech", 8.86], ["sheep", 3.7]], null], "duration": [1.08, 2.72, 0.28, 0.71, 1.8, 1.4, 0.66, 0.33, 0.46, 2.99, 0.21, 0.76, 4.48, 0.94, 2.47, 1.25, 1.15, 1.01, 1.25, 1.31, 1.57, 0.84, 3.56, -0.18]} \ No newline at end of file diff --git a/annotations_filtered/lFGfoPuKx9o_filtered.json b/annotations_filtered/lFGfoPuKx9o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fef17c86b77d3050e280236e05f07672ca21f905 --- /dev/null +++ b/annotations_filtered/lFGfoPuKx9o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.6], [6.0, 10.49], [11.0, 11.5], [12.0, 13.24], [14.0, 14.93], [16.0, 26.01], [28.0, 44.02], [45.0, 48.37]], "keep_status": [false, true, false, false, false, true, false, true], "silence_prob": [0.0, 30.3, 0.0, 0.0, 0.0, 31.51, 31.76, 32.48], "audiomae_on_audioset": [null, [["music", 39.88], ["whale vocalization", 10.44], ["hum", 5.13]], null, null, null, [["throbbing", 29.39], ["music", 16.72], ["hum", 15.6]], [["mains hum", 33.06], ["hum", 29.15], ["throbbing", 16.85]], [["music", 27.2], ["hum", 17.34], ["mains hum", 9.63]]], "duration": [1.6, 4.49, 0.5, 1.24, 0.93, 10.01, 16.02, 3.37]} \ No newline at end of file diff --git a/annotations_filtered/lFHLE24hDQY_filtered.json b/annotations_filtered/lFHLE24hDQY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1c00125a8a55e89813ea0b8da61f648b045893c7 --- /dev/null +++ b/annotations_filtered/lFHLE24hDQY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.84], [9.0, 10.5], [12.0, 12.12], [17.0, 23.68], [25.0, 26.62], [27.0, 29.19], [30.0, 30.2], [31.0, 32.21], [33.0, 33.93], [45.0, 45.0], [45.0, 47.07], [47.0, 48.91], [62.0, 63.71], [65.0, 65.37], [67.0, 67.32], [69.0, 71.29], [74.0, 73.82], [75.0, 84.65], [86.0, 93.82], [94.0, 98.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 63.74, 0.0, 56.78, 0.0, 0.0, 0.0, 0.0, 61.87, 0.0, 0.0, 0.0, 0.0, 61.27, 0.0, 61.57, 57.56, 57.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.84, 1.5, 0.12, 6.68, 1.62, 2.19, 0.2, 1.21, 0.93, 0.0, 2.07, 1.91, 1.71, 0.37, 0.32, 2.29, -0.18, 9.65, 7.82, 4.04]} \ No newline at end of file diff --git a/annotations_filtered/lFyh5QCd6kw_filtered.json b/annotations_filtered/lFyh5QCd6kw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..72f7e761e8d142e0e3282fe918bc8b22e6c07166 --- /dev/null +++ b/annotations_filtered/lFyh5QCd6kw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[81.0, 85.82]], "keep_status": [false], "silence_prob": [30.89], "audiomae_on_audioset": [[["music", 64.87], ["explosion", 3.29], ["brass instrument", 1.94]]], "duration": [4.82]} \ No newline at end of file diff --git a/annotations_filtered/lGAADj8laqo_filtered.json b/annotations_filtered/lGAADj8laqo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9425b52c9b8b94c7e9b4e1d0f8dccc5d3a36ceb --- /dev/null +++ b/annotations_filtered/lGAADj8laqo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.71], [10.0, 11.82], [13.0, 16.11], [19.0, 22.13], [23.0, 25.27], [26.0, 28.66], [30.0, 32.12], [33.0, 36.54], [37.0, 38.26], [39.0, 46.67], [48.0, 50.33], [51.0, 54.5], [58.0, 61.86], [63.0, 66.14], [68.0, 72.15], [74.0, 77.5], [83.0, 83.29], [84.0, 84.27], [85.0, 87.59], [89.0, 95.64], [97.0, 105.27], [106.0, 109.21], [111.0, 114.13], [115.0, 123.03]], "keep_status": [false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [84.62, 0.0, 72.75, 98.86, 49.27, 53.16, 44.52, 59.96, 0.0, 98.19, 99.52, 84.43, 56.55, 70.72, 98.66, 64.18, 0.0, 0.0, 99.05, 99.48, 48.39, 50.46, 88.28, 90.6], "audiomae_on_audioset": [null, null, null, null, [["speech", 56.11], ["dial tone", 8.87], ["busy signal", 4.73]], null, [["speech", 39.74], ["music", 8.28], ["hum", 7.42]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 22.03], ["hum", 18.35], ["heart sounds, heartbeat", 8.34]], null, null, null], "duration": [3.71, 1.82, 3.11, 3.13, 2.27, 2.66, 2.12, 3.54, 1.26, 7.67, 2.33, 3.5, 3.86, 3.14, 4.15, 3.5, 0.29, 0.27, 2.59, 6.64, 8.27, 3.21, 3.13, 8.03]} \ No newline at end of file diff --git a/annotations_filtered/lGFrkYzbfoU_filtered.json b/annotations_filtered/lGFrkYzbfoU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc7cc39b01b5352505fe6949bdc49051cd9fc9b7 --- /dev/null +++ b/annotations_filtered/lGFrkYzbfoU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[46.0, 46.9], [49.0, 85.99], [87.0, 94.64], [95.0, 98.37], [99.0, 100.08], [101.0, 111.38], [113.0, 114.74], [117.0, 118.69], [122.0, 122.94], [124.0, 126.08], [129.0, 130.99], [132.0, 133.47], [143.0, 145.2], [147.0, 147.38], [149.0, 150.45], [153.0, 153.64], [154.0, 156.44], [163.0, 165.21], [167.0, 168.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 61.18, 74.13, 0.0, 84.8, 0.0, 0.0, 0.0, 88.83, 0.0, 0.0, 89.19, 0.0, 0.0, 0.0, 99.78, 71.72, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.9, 36.99, 7.64, 3.37, 1.08, 10.38, 1.74, 1.69, 0.94, 2.08, 1.99, 1.47, 2.2, 0.38, 1.45, 0.64, 2.44, 2.21, 1.32]} \ No newline at end of file diff --git a/annotations_filtered/lGlvNt-N140_filtered.json b/annotations_filtered/lGlvNt-N140_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..03196dc47fb90213c38543fe96db9a043dd0ba1f --- /dev/null +++ b/annotations_filtered/lGlvNt-N140_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.92], [15.0, 19.25], [21.0, 21.84], [26.0, 29.39], [31.0, 33.71], [35.0, 36.53], [38.0, 38.18], [39.0, 41.96], [42.0, 42.52], [44.0, 45.23], [46.0, 57.84], [59.0, 75.24], [76.0, 77.36], [78.0, 90.48], [92.0, 101.16], [102.0, 113.36]], "keep_status": [false, false, false, true, true, false, false, true, false, false, true, true, false, true, false, true], "silence_prob": [0.0, 33.17, 0.0, 31.18, 32.1, 0.0, 0.0, 32.09, 0.0, 0.0, 31.04, 35.01, 0.0, 35.57, 33.03, 30.52], "audiomae_on_audioset": [null, [["whale vocalization", 35.87], ["livestock, farm animals, working animals", 23.33], ["moo", 15.32]], null, [["synthesizer", 14.61], ["music", 11.92], ["musical instrument", 8.61]], [["music", 33.64], ["didgeridoo", 27.65], ["synthesizer", 3.23]], null, null, [["music", 32.31], ["musical instrument", 9.62], ["guitar", 7.1]], null, null, [["music", 24.07], ["hum", 21.92], ["mains hum", 8.34]], [["cattle, bovinae", 21.1], ["hum", 19.17], ["livestock, farm animals, working animals", 16.27]], null, [["music", 18.52], ["didgeridoo", 10.84], ["whale vocalization", 9.82]], [["whale vocalization", 48.11], ["hum", 17.82], ["throbbing", 13.4]], [["cattle, bovinae", 20.29], ["livestock, farm animals, working animals", 15.92], ["didgeridoo", 14.96]]], "duration": [0.92, 4.25, 0.84, 3.39, 2.71, 1.53, 0.18, 2.96, 0.52, 1.23, 11.84, 16.24, 1.36, 12.48, 9.16, 11.36]} \ No newline at end of file diff --git a/annotations_filtered/lGqBJx2xbqQ_filtered.json b/annotations_filtered/lGqBJx2xbqQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f6967e81ced68d7994bfebfc517de73a82c74dd1 --- /dev/null +++ b/annotations_filtered/lGqBJx2xbqQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.79], [5.0, 5.41], [12.0, 13.0], [15.0, 55.54], [58.0, 72.44]], "keep_status": [false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.96], "audiomae_on_audioset": [null, null, null, null, [["music", 24.98], ["speech", 13.52], ["fart", 11.68]]], "duration": [0.79, 0.41, 1.0, 40.54, 14.44]} \ No newline at end of file diff --git a/annotations_filtered/lGuivq-6xrw_filtered.json b/annotations_filtered/lGuivq-6xrw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0c31b49e1fd45fa617f95e69757a23ed635b18d4 --- /dev/null +++ b/annotations_filtered/lGuivq-6xrw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 2.54], [14.0, 17.29], [32.0, 34.25], [42.0, 44.51], [49.0, 54.36], [66.0, 69.63], [72.0, 80.62], [81.0, 81.38], [83.0, 83.96], [100.0, 100.5], [117.0, 118.4], [136.0, 137.13], [147.0, 150.03], [164.0, 166.45], [171.0, 171.0], [176.0, 192.7], [193.0, 214.46], [223.0, 240.81], [250.0, 254.82], [270.0, 276.57]], "keep_status": [true, true, false, true, true, false, false, false, false, false, false, false, true, false, false, true, false, true, false, false], "silence_prob": [29.77, 30.32, 31.86, 32.28, 29.37, 31.3, 29.83, 0.0, 0.0, 0.0, 0.0, 0.0, 35.42, 28.58, 0.0, 28.79, 29.18, 28.7, 30.48, 29.85], "audiomae_on_audioset": [[["music", 60.46], ["didgeridoo", 2.76], ["theremin", 2.54]], [["speech", 35.78], ["music", 30.68], ["mains hum", 3.48]], [["music", 60.6], ["synthesizer", 8.64], ["speech", 6.23]], [["whack, thwack", 20.16], ["speech", 13.04], ["clang", 12.71]], [["speech", 19.9], ["music", 18.36], ["hum", 17.94]], [["music", 77.24], ["speech", 3.43], ["whale vocalization", 3.03]], [["music", 63.86], ["didgeridoo", 14.09], ["fart", 7.5]], null, null, null, null, null, [["music", 38.01], ["snicker", 12.32], ["speech", 9.38]], [["speech", 52.15], ["music", 14.36], ["vehicle", 6.57]], null, [["music", 40.66], ["speech", 17.0], ["sound effect", 8.15]], [["music", 33.22], ["boing", 25.63], ["synthesizer", 12.91]], [["music", 60.4], ["throbbing", 4.92], ["cacophony", 2.82]], [["speech", 46.63], ["music", 24.54], ["sound effect", 3.84]], [["speech", 52.33], ["music", 17.35], ["explosion", 4.49]]], "duration": [2.54, 3.29, 2.25, 2.51, 5.36, 3.63, 8.62, 0.38, 0.96, 0.5, 1.4, 1.13, 3.03, 2.45, 0.0, 16.7, 21.46, 17.81, 4.82, 6.57]} \ No newline at end of file diff --git a/annotations_filtered/lH7EYLWHT4Q_filtered.json b/annotations_filtered/lH7EYLWHT4Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af426a951222a96ee9cbf957105ab176417e3bff --- /dev/null +++ b/annotations_filtered/lH7EYLWHT4Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.13], [9.0, 10.05], [13.0, 14.1], [19.0, 20.8], [25.0, 25.44], [31.0, 31.8], [33.0, 48.98], [51.0, 58.26], [64.0, 64.29], [68.0, 71.61], [74.0, 75.84], [77.0, 78.29], [82.0, 108.28], [109.0, 109.49], [111.0, 112.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.89, 31.98, 0.0, 87.19, 0.0, 0.0, 31.95, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 46.15], ["speech", 26.48], ["noise", 2.16]], [["electric shaver, electric razor", 70.35], ["speech", 19.94], ["animal", 4.82]], null, null, null, null, [["whale vocalization", 39.5], ["speech", 29.98], ["fart", 5.9]], null, null], "duration": [1.13, 1.05, 1.1, 1.8, 0.44, 0.8, 15.98, 7.26, 0.29, 3.61, 1.84, 1.29, 26.28, 0.49, 1.56]} \ No newline at end of file diff --git a/annotations_filtered/lHNgUHi-WPM_filtered.json b/annotations_filtered/lHNgUHi-WPM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d69cd71670f0769c1cf58e203088f9911299abd --- /dev/null +++ b/annotations_filtered/lHNgUHi-WPM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.55], [7.0, 16.8], [20.0, 34.2], [36.0, 49.38], [53.0, 57.97], [59.0, 74.02], [74.0, 75.73], [79.0, 79.51], [83.0, 83.54], [86.0, 86.86], [96.0, 96.6], [99.0, 109.83], [113.0, 113.16], [116.0, 117.36], [120.0, 130.71], [134.0, 138.74], [142.0, 147.8], [150.0, 151.61], [155.0, 159.95]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 34.06, 31.11, 32.98, 98.19, 59.59, 0.0, 0.0, 0.0, 0.0, 0.0, 35.29, 0.0, 0.0, 33.53, 34.16, 35.78, 0.0, 33.63], "audiomae_on_audioset": [null, [["music", 42.32], ["sidetone", 7.06], ["speech", 7.03]], [["music", 76.97], ["speech", 4.72], ["buzz", 2.17]], [["music", 71.26], ["breaking", 14.71], ["speech", 2.55]], null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 24.94], ["cattle, bovinae", 24.15], ["moo", 23.88]], null, null, [["music", 77.52], ["song", 3.47], ["singing", 3.23]], [["music", 72.76], ["mantra", 2.6], ["sampler", 1.53]], [["music", 71.93], ["musical instrument", 3.94], ["guitar", 3.92]], null, [["music", 77.82], ["mantra", 2.24], ["soul music", 1.68]]], "duration": [1.55, 9.8, 14.2, 13.38, 4.97, 15.02, 1.73, 0.51, 0.54, 0.86, 0.6, 10.83, 0.16, 1.36, 10.71, 4.74, 5.8, 1.61, 4.95]} \ No newline at end of file diff --git a/annotations_filtered/lHodSSB_YpM_filtered.json b/annotations_filtered/lHodSSB_YpM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56b41a09b1c842ed25bbf033b1b8f94ea2cfee29 --- /dev/null +++ b/annotations_filtered/lHodSSB_YpM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.76], [41.0, 42.23], [43.0, 43.98], [45.0, 45.12], [53.0, 52.98], [56.0, 56.56], [64.0, 63.96], [65.0, 65.69], [68.0, 68.62], [70.0, 69.77], [70.0, 72.39], [73.0, 73.35], [74.0, 74.29], [75.0, 75.93], [79.0, 79.57], [87.0, 86.86], [91.0, 91.32], [93.0, 94.76], [98.0, 97.9], [101.0, 101.9], [103.0, 104.04], [106.0, 106.32], [109.0, 109.19], [110.0, 112.99], [122.0, 122.13], [124.0, 126.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.24, 0.0, 37.85], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 20.8], ["whale vocalization", 18.05], ["roaring cats (lions, tigers)", 11.81]]], "duration": [0.76, 1.23, 0.98, 0.12, -0.02, 0.56, -0.04, 0.69, 0.62, -0.23, 2.39, 0.35, 0.29, 0.93, 0.57, -0.14, 0.32, 1.76, -0.1, 0.9, 1.04, 0.32, 0.19, 2.99, 0.13, 2.59]} \ No newline at end of file diff --git a/annotations_filtered/lHqGIe8AZ1g_filtered.json b/annotations_filtered/lHqGIe8AZ1g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3457533b8fa0e504d29e96954ff577c50cdee492 --- /dev/null +++ b/annotations_filtered/lHqGIe8AZ1g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.4], [9.0, 9.76], [12.0, 12.65], [14.0, 14.64], [22.0, 22.06], [26.0, 25.78], [27.0, 28.0], [29.0, 30.18], [36.0, 37.59], [45.0, 46.45], [47.0, 48.71], [50.0, 51.12], [56.0, 57.28], [67.0, 68.69], [72.0, 71.64], [74.0, 76.3], [77.0, 77.08], [85.0, 86.54], [89.0, 88.97], [90.0, 91.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.07, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.4, 0.76, 0.65, 0.64, 0.06, -0.22, 1.0, 1.18, 1.59, 1.45, 1.71, 1.12, 1.28, 1.69, -0.36, 2.3, 0.08, 1.54, -0.03, 1.79]} \ No newline at end of file diff --git a/annotations_filtered/lHxzWs9NcS0_filtered.json b/annotations_filtered/lHxzWs9NcS0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..df7410f076f221d2f091ed63ea06eedb8147c97e --- /dev/null +++ b/annotations_filtered/lHxzWs9NcS0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 20.51], [21.0, 24.87], [31.0, 31.9], [35.0, 37.39], [47.0, 50.79], [57.0, 57.7], [62.0, 62.13], [75.0, 74.8], [83.0, 84.89], [87.0, 88.32], [89.0, 88.52], [89.0, 90.1], [96.0, 96.25], [107.0, 109.07], [122.0, 122.69], [127.0, 127.06], [129.0, 128.75], [131.0, 131.06], [137.0, 137.88], [139.0, 148.2], [149.0, 151.02], [156.0, 157.05]], "keep_status": [true, true, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false], "silence_prob": [41.66, 42.88, 0.0, 33.75, 31.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.59, 0.0, 0.0, 0.0, 0.0, 0.0, 29.31, 29.63, 0.0], "audiomae_on_audioset": [[["sidetone", 19.22], ["noise", 16.32], ["speech", 13.5]], [["speech", 36.16], ["beatboxing", 22.28], ["music", 9.35]], null, [["speech", 75.54], ["music", 9.95], ["boing", 1.55]], [["bleat", 16.38], ["sheep", 15.38], ["music", 14.62]], null, null, null, null, null, null, null, null, [["speech", 49.79], ["music", 6.75], ["livestock, farm animals, working animals", 6.52]], null, null, null, null, null, [["music", 80.2], ["whack, thwack", 4.76], ["speech", 2.68]], [["music", 31.24], ["cattle, bovinae", 9.87], ["moo", 9.49]], null], "duration": [8.51, 3.87, 0.9, 2.39, 3.79, 0.7, 0.13, -0.2, 1.89, 1.32, -0.48, 1.1, 0.25, 2.07, 0.69, 0.06, -0.25, 0.06, 0.88, 9.2, 2.02, 1.05]} \ No newline at end of file diff --git a/annotations_filtered/lI-ty9MfICM_filtered.json b/annotations_filtered/lI-ty9MfICM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ca413f8b2b94e9be4ce99f88ab253943e315b31 --- /dev/null +++ b/annotations_filtered/lI-ty9MfICM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 9.63], [10.0, 9.78], [10.0, 9.9], [12.0, 12.93], [16.0, 21.71], [24.0, 27.18], [27.0, 32.09], [34.0, 34.35], [37.0, 37.59], [44.0, 45.76]], "keep_status": [true, false, false, false, true, false, true, false, false, false], "silence_prob": [32.14, 0.0, 0.0, 0.0, 31.79, 31.56, 31.64, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 30.41], ["speech", 22.73], ["throbbing", 14.65]], null, null, null, [["music", 36.06], ["brass instrument", 9.85], ["trombone", 7.28]], [["speech", 40.87], ["music", 22.16], ["vehicle", 7.02]], [["music", 61.34], ["theremin", 4.31], ["musical instrument", 3.34]], null, null, null], "duration": [8.63, -0.22, -0.1, 0.93, 5.71, 3.18, 5.09, 0.35, 0.59, 1.76]} \ No newline at end of file diff --git a/annotations_filtered/lISBP_fPg1s_filtered.json b/annotations_filtered/lISBP_fPg1s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..612dbac8c65033c1322a0e19cfcfeb2198c55531 --- /dev/null +++ b/annotations_filtered/lISBP_fPg1s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.48], [18.0, 19.89], [21.0, 21.9], [25.0, 25.46], [29.0, 30.08], [31.0, 31.67], [35.0, 36.26], [37.0, 38.62], [39.0, 40.36], [43.0, 43.71], [46.0, 47.07], [48.0, 50.97], [51.0, 51.06], [51.0, 64.35], [67.0, 68.72], [69.0, 69.45], [71.0, 71.49], [74.0, 74.04], [76.0, 78.46], [82.0, 82.24], [89.0, 92.69], [96.0, 96.87], [99.0, 99.57], [100.0, 100.63], [104.0, 104.52], [109.0, 110.02], [114.0, 115.96], [124.0, 124.39], [126.0, 125.91], [127.0, 127.75], [129.0, 129.37], [132.0, 145.72], [148.0, 148.93], [150.0, 151.48], [153.0, 157.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.97, 0.0, 55.39, 0.0, 0.0, 0.0, 0.0, 60.7, 0.0, 76.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.54, 0.0, 0.0, 40.88], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 43.01], ["musical instrument", 14.3], ["synthesizer", 5.68]]], "duration": [0.48, 1.89, 0.9, 0.46, 1.08, 0.67, 1.26, 1.62, 1.36, 0.71, 1.07, 2.97, 0.06, 13.35, 1.72, 0.45, 0.49, 0.04, 2.46, 0.24, 3.69, 0.87, 0.57, 0.63, 0.52, 1.02, 1.96, 0.39, -0.09, 0.75, 0.37, 13.72, 0.93, 1.48, 4.67]} \ No newline at end of file diff --git a/annotations_filtered/lISiW7wcIVc_filtered.json b/annotations_filtered/lISiW7wcIVc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d37f053f32c06e542ee35c4210ea20f08a5abd35 --- /dev/null +++ b/annotations_filtered/lISiW7wcIVc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.66], [15.0, 17.29], [21.0, 26.06], [34.0, 34.82], [39.0, 39.38], [43.0, 45.25], [46.0, 46.89], [58.0, 59.16], [60.0, 60.47], [65.0, 67.83], [68.0, 68.28], [80.0, 88.64], [95.0, 102.86], [103.0, 102.95], [103.0, 104.14], [111.0, 111.7], [116.0, 116.14], [117.0, 123.47], [126.0, 139.99], [140.0, 145.94], [151.0, 162.99], [169.0, 169.45], [178.0, 181.95], [186.0, 189.3], [190.0, 190.93], [192.0, 193.63], [195.0, 205.7], [207.0, 207.44], [208.0, 207.94], [212.0, 218.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 74.44, 68.93, 0.0, 0.0, 72.16, 0.0, 0.0, 0.0, 60.23, 0.0, 60.89, 39.0, 0.0, 0.0, 0.0, 0.0, 77.7, 46.83, 49.09, 39.28, 0.0, 36.22, 35.39, 0.0, 0.0, 56.48, 0.0, 0.0, 64.29], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 54.73], ["speech", 14.9], ["synthesizer", 9.77]], null, null, null, null, null, [["music", 51.19], ["speech", 13.2], ["mains hum", 9.44]], [["hum", 32.36], ["mains hum", 14.82], ["sidetone", 9.13]], [["mains hum", 45.75], ["hum", 28.22], ["fly, housefly", 2.86]], null, [["speech", 56.27], ["sidetone", 5.61], ["music", 3.31]], [["insect", 36.38], ["fly, housefly", 30.12], ["mosquito", 14.42]], null, null, null, null, null, null], "duration": [0.66, 2.29, 5.06, 0.82, 0.38, 2.25, 0.89, 1.16, 0.47, 2.83, 0.28, 8.64, 7.86, -0.05, 1.14, 0.7, 0.14, 6.47, 13.99, 5.94, 11.99, 0.45, 3.95, 3.3, 0.93, 1.63, 10.7, 0.44, -0.06, 6.47]} \ No newline at end of file diff --git a/annotations_filtered/lIVO6oEk4Hk_filtered.json b/annotations_filtered/lIVO6oEk4Hk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..713ae9e1a525d5dde4444ea174b71bfc5eaab79e --- /dev/null +++ b/annotations_filtered/lIVO6oEk4Hk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.34], [10.0, 19.77], [22.0, 29.29], [35.0, 36.0], [38.0, 38.38], [44.0, 45.86], [47.0, 48.37], [74.0, 74.39], [78.0, 80.38]], "keep_status": [false, false, false, false, false, false, false, false, true], "silence_prob": [100.0, 98.59, 30.54, 0.0, 0.0, 0.0, 0.0, 0.0, 31.09], "audiomae_on_audioset": [null, null, [["mains hum", 48.68], ["hum", 36.69], ["throbbing", 5.8]], null, null, null, null, null, [["music", 23.01], ["throbbing", 15.15], ["hum", 9.76]]], "duration": [2.34, 9.77, 7.29, 1.0, 0.38, 1.86, 1.37, 0.39, 2.38]} \ No newline at end of file diff --git a/annotations_filtered/lIbBAWzE6H8_filtered.json b/annotations_filtered/lIbBAWzE6H8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1c01b1aa87e805a43e980ae77c694cf0d9249666 --- /dev/null +++ b/annotations_filtered/lIbBAWzE6H8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[47.0, 71.24], [75.0, 75.29], [80.0, 86.16], [100.0, 100.48], [120.0, 122.49], [125.0, 124.83], [134.0, 134.01], [136.0, 136.66], [149.0, 148.83], [155.0, 155.92], [158.0, 180.27], [180.0, 189.97], [197.0, 203.23], [204.0, 204.96]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [30.73, 0.0, 31.27, 0.0, 29.84, 0.0, 0.0, 0.0, 0.0, 0.0, 29.0, 28.93, 31.77, 0.0], "audiomae_on_audioset": [[["music", 72.98], ["throbbing", 3.16], ["musical instrument", 1.96]], null, [["speech", 37.52], ["music", 21.79], ["hum", 8.29]], null, [["music", 53.44], ["crack", 11.16], ["speech", 6.97]], null, null, null, null, null, [["throbbing", 40.9], ["music", 23.35], ["hum", 19.29]], [["music", 38.17], ["livestock, farm animals, working animals", 11.93], ["cattle, bovinae", 6.75]], [["livestock, farm animals, working animals", 47.72], ["cattle, bovinae", 32.51], ["moo", 19.4]], null], "duration": [24.24, 0.29, 6.16, 0.48, 2.49, -0.17, 0.01, 0.66, -0.17, 0.92, 22.27, 9.97, 6.23, 0.96]} \ No newline at end of file diff --git a/annotations_filtered/lIbKD5ovjok_filtered.json b/annotations_filtered/lIbKD5ovjok_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b993e544e8de19f220e6a4e0f7f0578e1b51482f --- /dev/null +++ b/annotations_filtered/lIbKD5ovjok_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.76], [10.0, 12.23], [13.0, 15.03], [16.0, 22.86], [24.0, 25.51], [26.0, 26.96], [28.0, 28.63], [29.0, 31.36], [32.0, 34.08], [35.0, 38.72], [39.0, 43.41], [44.0, 47.46], [49.0, 50.04], [52.0, 57.54], [60.0, 72.52], [75.0, 77.41], [79.0, 81.9], [86.0, 87.59], [88.0, 92.99], [94.0, 95.01], [95.0, 96.01], [97.0, 98.49], [100.0, 102.3], [104.0, 105.06], [105.0, 106.12], [108.0, 112.77], [114.0, 149.37], [152.0, 164.61], [166.0, 166.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [68.28, 52.51, 99.82, 84.8, 0.0, 0.0, 0.0, 74.44, 66.15, 99.44, 46.94, 61.87, 0.0, 94.81, 38.43, 59.07, 55.53, 0.0, 30.03, 0.0, 0.0, 0.0, 86.27, 0.0, 0.0, 99.68, 0.0, 68.93, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 32.49], ["music", 9.56], ["hum", 8.84]], null, null, null, [["breaking", 46.51], ["speech", 36.26], ["crack", 4.58]], null, null, null, [["fart", 17.1], ["crushing", 16.16], ["crunch", 11.3]], null, null, null, null, null, null, null, null, null, null], "duration": [3.76, 2.23, 2.03, 6.86, 1.51, 0.96, 0.63, 2.36, 2.08, 3.72, 4.41, 3.46, 1.04, 5.54, 12.52, 2.41, 2.9, 1.59, 4.99, 1.01, 1.01, 1.49, 2.3, 1.06, 1.12, 4.77, 35.37, 12.61, 0.45]} \ No newline at end of file diff --git a/annotations_filtered/lIk-3o2CkM8_filtered.json b/annotations_filtered/lIk-3o2CkM8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6fc83e2e1eb6049bf57facacfc4fd8dc4fa3156b --- /dev/null +++ b/annotations_filtered/lIk-3o2CkM8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.22], [20.0, 23.21], [29.0, 30.3], [43.0, 43.9], [51.0, 52.81], [55.0, 55.81], [58.0, 58.01], [61.0, 61.43], [67.0, 67.76], [77.0, 77.48], [83.0, 83.89], [86.0, 86.61], [103.0, 104.28], [113.0, 112.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [66.27, 54.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.22, 3.21, 1.3, 0.9, 1.81, 0.81, 0.01, 0.43, 0.76, 0.48, 0.89, 0.61, 1.28, -0.08]} \ No newline at end of file diff --git a/annotations_filtered/lJ7F2kWLGuE_filtered.json b/annotations_filtered/lJ7F2kWLGuE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1df98e9800131dec1792704ae53f6a527cb4f4f1 --- /dev/null +++ b/annotations_filtered/lJ7F2kWLGuE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.0], [1.0, 1.21], [3.0, 2.91], [7.0, 7.99], [14.0, 15.16], [18.0, 21.52], [24.0, 24.44], [27.0, 27.65], [32.0, 33.44], [36.0, 36.37], [58.0, 64.91], [68.0, 69.13], [71.0, 72.08], [79.0, 81.19], [82.0, 83.78], [89.0, 89.82], [94.0, 94.1], [99.0, 100.47], [105.0, 107.91], [109.0, 110.29], [116.0, 117.95], [128.0, 130.49], [131.0, 132.51], [142.0, 143.83], [147.0, 146.82], [148.0, 148.9], [149.0, 151.55], [152.0, 163.14], [165.0, 166.53], [169.0, 171.76], [173.0, 188.01], [191.0, 191.34], [193.0, 198.1], [199.0, 199.72], [202.0, 205.14], [209.0, 211.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 37.85, 0.0, 0.0, 0.0, 0.0, 34.55, 0.0, 0.0, 32.3, 0.0, 0.0, 0.0, 0.0, 38.97, 0.0, 0.0, 36.95, 0.0, 0.0, 0.0, 0.0, 33.83, 28.67, 0.0, 32.56, 28.68, 0.0, 50.46, 0.0, 74.76, 36.59], "audiomae_on_audioset": [null, null, null, null, null, [["music", 61.8], ["synthesizer", 17.46], ["musical instrument", 2.25]], null, null, null, null, [["music", 60.66], ["synthesizer", 6.59], ["cacophony", 4.17]], null, null, [["music", 59.99], ["synthesizer", 14.03], ["cacophony", 2.83]], null, null, null, null, [["music", 76.31], ["synthesizer", 4.57], ["musical instrument", 2.7]], null, null, [["music", 40.27], ["speech", 34.79], ["liquid", 1.85]], null, null, null, null, [["speech", 33.99], ["music", 33.52], ["hum", 7.05]], [["music", 65.02], ["hum", 7.37], ["throbbing", 7.03]], null, [["music", 49.81], ["electronic music", 4.48], ["house music", 2.7]], [["music", 77.89], ["throbbing", 8.92], ["hum", 4.47]], null, null, null, null, [["insect", 26.52], ["fly, housefly", 23.37], ["bee, wasp, etc.", 15.11]]], "duration": [0.0, 0.21, -0.09, 0.99, 1.16, 3.52, 0.44, 0.65, 1.44, 0.37, 6.91, 1.13, 1.08, 2.19, 1.78, 0.82, 0.1, 1.47, 2.91, 1.29, 1.95, 2.49, 1.51, 1.83, -0.18, 0.9, 2.55, 11.14, 1.53, 2.76, 15.01, 0.34, 5.1, 0.72, 3.14, 2.22]} \ No newline at end of file diff --git a/annotations_filtered/lJ83ILGA8yI_filtered.json b/annotations_filtered/lJ83ILGA8yI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f2832ab32e7f3b4d56670d0f554e4fa10a38390 --- /dev/null +++ b/annotations_filtered/lJ83ILGA8yI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.98], [16.0, 19.13], [22.0, 23.21], [25.0, 26.33], [31.0, 36.73], [40.0, 43.33], [44.0, 45.08], [48.0, 48.81], [50.0, 52.22], [56.0, 58.23], [60.0, 61.72], [63.0, 65.33], [73.0, 74.16], [75.0, 77.55], [81.0, 81.57], [85.0, 87.1], [92.0, 99.33], [101.0, 103.2], [105.0, 107.28], [108.0, 108.55], [109.0, 109.81], [110.0, 130.13], [134.0, 138.54], [141.0, 142.35], [145.0, 170.18], [171.0, 175.96], [177.0, 183.22], [185.0, 186.63], [188.0, 189.84], [190.0, 191.4]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 96.29, 0.0, 0.0, 44.23, 94.37, 0.0, 0.0, 79.24, 68.15, 0.0, 42.98, 0.0, 49.68, 0.0, 69.61, 40.52, 99.21, 99.88, 0.0, 0.0, 49.54, 91.98, 0.0, 68.41, 67.13, 71.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 43.09], ["hum", 9.05], ["mains hum", 6.4]], null, null, null, null, null, null, [["music", 53.57], ["speech", 11.8], ["hum", 7.8]], null, [["music", 44.42], ["sonar", 7.86], ["soundtrack music", 6.66]], null, null, [["music", 41.07], ["speech", 18.4], ["hum", 15.75]], null, null, null, null, [["speech", 38.55], ["music", 20.73], ["hum", 17.48]], null, null, null, null, null, null, null, null], "duration": [1.98, 3.13, 1.21, 1.33, 5.73, 3.33, 1.08, 0.81, 2.22, 2.23, 1.72, 2.33, 1.16, 2.55, 0.57, 2.1, 7.33, 2.2, 2.28, 0.55, 0.81, 20.13, 4.54, 1.35, 25.18, 4.96, 6.22, 1.63, 1.84, 1.4]} \ No newline at end of file diff --git a/annotations_filtered/lJIPM69YQNY_filtered.json b/annotations_filtered/lJIPM69YQNY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e0578440c5747dbc003a4ed1aa1936320542495f --- /dev/null +++ b/annotations_filtered/lJIPM69YQNY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 34.55], [56.0, 57.23], [61.0, 69.74], [72.0, 80.6], [82.0, 83.57], [87.0, 88.15], [93.0, 93.31], [101.0, 102.39], [109.0, 109.19], [111.0, 111.32], [119.0, 119.26], [120.0, 120.55], [123.0, 122.88], [126.0, 126.28]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 54.36, 34.41, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 43.69], ["drum machine", 6.93], ["synthesizer", 6.93]], null, null, null, null, null, null, null, null, null, null], "duration": [0.55, 1.23, 8.74, 8.6, 1.57, 1.15, 0.31, 1.39, 0.19, 0.32, 0.26, 0.55, -0.12, 0.28]} \ No newline at end of file diff --git a/annotations_filtered/lJVIu_wNm4g_filtered.json b/annotations_filtered/lJVIu_wNm4g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..66766dddcbb1283ea3fbbd22d704b587a21b35ca --- /dev/null +++ b/annotations_filtered/lJVIu_wNm4g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.75], [9.0, 14.71], [15.0, 15.6], [17.0, 33.56], [37.0, 71.44], [73.0, 107.32], [109.0, 115.38]], "keep_status": [false, false, false, true, false, false, true], "silence_prob": [0.0, 34.02, 0.0, 31.09, 0.0, 0.0, 31.09], "audiomae_on_audioset": [null, [["speech", 43.7], ["music", 20.3], ["animal", 12.45]], null, [["livestock, farm animals, working animals", 24.54], ["music", 23.52], ["cattle, bovinae", 6.99]], null, null, [["music", 55.72], ["musical instrument", 8.61], ["synthesizer", 3.22]]], "duration": [0.75, 5.71, 0.6, 16.56, 34.44, 34.32, 6.38]} \ No newline at end of file diff --git a/annotations_filtered/lJf8EW9800o_filtered.json b/annotations_filtered/lJf8EW9800o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5552831fbbfc2f56927b1286c2ba7e556e471295 --- /dev/null +++ b/annotations_filtered/lJf8EW9800o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 26.79], [28.0, 39.23], [43.0, 47.97], [57.0, 71.59], [74.0, 80.4], [82.0, 112.55], [115.0, 115.74], [119.0, 118.71], [119.0, 120.9], [125.0, 129.64], [130.0, 137.44], [142.0, 149.88], [150.0, 154.21], [155.0, 158.5], [159.0, 161.23], [162.0, 162.63]], "keep_status": [true, true, true, true, true, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [29.97, 30.66, 29.52, 29.87, 29.11, 0.0, 0.0, 0.0, 0.0, 54.5, 40.4, 32.41, 61.27, 63.96, 46.09, 0.0], "audiomae_on_audioset": [[["music", 49.89], ["mains hum", 8.81], ["hum", 6.01]], [["music", 41.29], ["vehicle", 7.29], ["hum", 7.04]], [["speech", 40.55], ["vehicle", 23.46], ["car", 5.68]], [["vehicle", 33.56], ["car", 22.07], ["race car, auto racing", 14.02]], [["speech", 37.17], ["vehicle", 10.71], ["foghorn", 7.81]], null, null, null, null, null, [["music", 29.39], ["throbbing", 23.21], ["hum", 8.37]], [["music", 64.04], ["synthesizer", 14.03], ["musical instrument", 3.49]], null, null, [["music", 59.07], ["theremin", 7.11], ["singing bowl", 4.6]], null], "duration": [3.79, 11.23, 4.97, 14.59, 6.4, 30.55, 0.74, -0.29, 1.9, 4.64, 7.44, 7.88, 4.21, 3.5, 2.23, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/lJiMlgvygvc_filtered.json b/annotations_filtered/lJiMlgvygvc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/lJiMlgvygvc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/lJjxm4xTVKk_filtered.json b/annotations_filtered/lJjxm4xTVKk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dbd09f4b2bf30ee0f11dd2e1f7523f5f3695e177 --- /dev/null +++ b/annotations_filtered/lJjxm4xTVKk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.76], [4.0, 8.04], [9.0, 10.3], [13.0, 15.92], [17.0, 19.18], [24.0, 23.7], [25.0, 25.44], [28.0, 29.74], [32.0, 33.24], [35.0, 36.61], [45.0, 46.53], [48.0, 60.25], [61.0, 64.45], [65.0, 65.84], [66.0, 67.19], [68.0, 69.08], [72.0, 76.23], [77.0, 77.8], [84.0, 85.09], [86.0, 85.95], [88.0, 89.36], [90.0, 90.68], [98.0, 98.17], [99.0, 99.67], [103.0, 102.91], [104.0, 104.28], [105.0, 105.0], [108.0, 108.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 38.79, 0.0, 42.19, 48.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.4, 30.91, 0.0, 0.0, 0.0, 52.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 54.12], ["hum", 16.16], ["throbbing", 8.9]], null, [["music", 50.84], ["hum", 14.53], ["throbbing", 7.46]], [["hum", 35.78], ["music", 24.08], ["gong", 11.15]], null, null, null, null, null, null, [["speech", 43.23], ["music", 14.02], ["burst, pop", 9.33]], [["explosion", 18.2], ["music", 12.43], ["hum", 9.66]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.76, 4.04, 1.3, 2.92, 2.18, -0.3, 0.44, 1.74, 1.24, 1.61, 1.53, 12.25, 3.45, 0.84, 1.19, 1.08, 4.23, 0.8, 1.09, -0.05, 1.36, 0.68, 0.17, 0.67, -0.09, 0.28, 0.0, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/lJuxU-aVeT4_filtered.json b/annotations_filtered/lJuxU-aVeT4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d3e412244d86b67f3c109c0d09e083dd948d0ca --- /dev/null +++ b/annotations_filtered/lJuxU-aVeT4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.91], [24.0, 24.41], [26.0, 47.24], [48.0, 48.57], [49.0, 55.65], [57.0, 57.23], [59.0, 72.71], [76.0, 78.63], [82.0, 92.1], [101.0, 105.66], [107.0, 107.64], [110.0, 114.57]], "keep_status": [false, false, true, false, false, false, false, false, true, true, false, true], "silence_prob": [0.0, 0.0, 37.02, 0.0, 38.23, 0.0, 40.09, 45.62, 35.5, 35.2, 0.0, 31.14], "audiomae_on_audioset": [null, null, [["noise", 37.56], ["music", 18.5], ["theremin", 13.79]], null, [["music", 51.73], ["speech", 24.25], ["thunk", 8.88]], null, [["music", 41.54], ["speech", 29.78], ["knock", 6.06]], [["music", 26.87], ["hum", 25.66], ["mains hum", 23.36]], [["music", 57.08], ["speech", 6.61], ["knock", 2.46]], [["music", 39.1], ["carnatic music", 8.84], ["drum", 6.99]], null, [["music", 17.29], ["speech", 14.53], ["foghorn", 7.97]]], "duration": [0.91, 0.41, 21.24, 0.57, 6.65, 0.23, 13.71, 2.63, 10.1, 4.66, 0.64, 4.57]} \ No newline at end of file diff --git a/annotations_filtered/lKBbFHMEvDc_filtered.json b/annotations_filtered/lKBbFHMEvDc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92910403568e0c5a347b55a8cc2df572b5561299 --- /dev/null +++ b/annotations_filtered/lKBbFHMEvDc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.97], [7.0, 7.53], [9.0, 9.44], [11.0, 11.91], [13.0, 15.04], [16.0, 29.05], [30.0, 30.92], [33.0, 33.94], [36.0, 37.03], [38.0, 38.33], [39.0, 40.24], [42.0, 42.13], [43.0, 43.48], [44.0, 46.13], [49.0, 54.01], [55.0, 56.54], [57.0, 57.25], [58.0, 58.87], [59.0, 60.22], [61.0, 61.45], [62.0, 64.99], [66.0, 66.09], [67.0, 68.05], [68.0, 69.52], [71.0, 71.86], [73.0, 73.23], [75.0, 76.2], [80.0, 80.76], [83.0, 83.42], [86.0, 87.07], [88.0, 88.38], [89.0, 89.82], [92.0, 92.26], [100.0, 99.79], [102.0, 102.52], [104.0, 104.79], [109.0, 109.73], [112.0, 112.18], [116.0, 117.15], [119.0, 119.89], [121.0, 121.78], [123.0, 125.05], [127.0, 127.2], [129.0, 129.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 97.64, 91.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.7, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.25, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 58.15], ["sidetone", 9.87], ["dial tone", 5.39]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 34.93], ["speech", 20.39], ["didgeridoo", 8.48]], null, null], "duration": [0.97, 0.53, 0.44, 0.91, 2.04, 13.05, 0.92, 0.94, 1.03, 0.33, 1.24, 0.13, 0.48, 2.13, 5.01, 1.54, 0.25, 0.87, 1.22, 0.45, 2.99, 0.09, 1.05, 1.52, 0.86, 0.23, 1.2, 0.76, 0.42, 1.07, 0.38, 0.82, 0.26, -0.21, 0.52, 0.79, 0.73, 0.18, 1.15, 0.89, 0.78, 2.05, 0.2, 0.78]} \ No newline at end of file diff --git a/annotations_filtered/lKE3zh_Hxqw_filtered.json b/annotations_filtered/lKE3zh_Hxqw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6a7ddd8f099651a82aa8599b486bd828ab0e00ba --- /dev/null +++ b/annotations_filtered/lKE3zh_Hxqw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.48], [7.0, 10.29], [24.0, 25.12], [35.0, 35.26], [36.0, 39.31], [45.0, 50.18], [51.0, 69.69], [70.0, 71.96], [74.0, 75.91], [77.0, 80.84], [82.0, 82.59], [84.0, 84.33], [87.0, 87.1], [89.0, 91.86], [93.0, 93.46], [96.0, 97.77], [101.0, 102.49], [103.0, 105.38], [108.0, 109.41], [111.0, 112.29], [113.0, 113.83], [117.0, 117.59], [121.0, 124.04], [125.0, 126.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.31, 0.0, 0.0, 76.7, 33.43, 85.9, 0.0, 0.0, 97.64, 0.0, 0.0, 0.0, 95.23, 0.0, 0.0, 0.0, 67.63, 0.0, 0.0, 0.0, 0.0, 80.29, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 65.22], ["fart", 29.29], ["radio", 0.5]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.48, 3.29, 1.12, 0.26, 3.31, 5.18, 18.69, 1.96, 1.91, 3.84, 0.59, 0.33, 0.1, 2.86, 0.46, 1.77, 1.49, 2.38, 1.41, 1.29, 0.83, 0.59, 3.04, 1.22]} \ No newline at end of file diff --git a/annotations_filtered/lKEihcQaa_g_filtered.json b/annotations_filtered/lKEihcQaa_g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..362502cd49f0be92ad072c6cdcb122673e134b4a --- /dev/null +++ b/annotations_filtered/lKEihcQaa_g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.38], [14.0, 16.06], [16.0, 17.39], [19.0, 19.45], [20.0, 45.89], [50.0, 51.26], [53.0, 53.43], [57.0, 93.48], [96.0, 96.16]], "keep_status": [false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 36.24, 0.0, 0.0, 31.52, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 14.4], ["music", 11.56], ["vehicle", 3.17]], null, null, [["hum", 13.76], ["gong", 13.23], ["speech", 12.4]], null, null, null, null], "duration": [0.38, 2.06, 1.39, 0.45, 25.89, 1.26, 0.43, 36.48, 0.16]} \ No newline at end of file diff --git a/annotations_filtered/lKJ8pyN8Cm4_filtered.json b/annotations_filtered/lKJ8pyN8Cm4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8394dd9fc951a8731036897af36fdfae0450663d --- /dev/null +++ b/annotations_filtered/lKJ8pyN8Cm4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.27], [4.0, 6.47], [8.0, 8.51], [9.0, 9.42], [11.0, 11.91], [13.0, 14.81], [16.0, 19.03], [20.0, 21.81], [23.0, 26.65], [27.0, 28.51], [29.0, 30.21], [31.0, 33.22], [34.0, 37.47], [39.0, 41.52], [43.0, 43.68], [46.0, 46.53], [48.0, 48.63], [61.0, 61.91], [62.0, 63.37], [65.0, 65.38], [66.0, 66.92], [68.0, 68.35], [71.0, 72.01], [73.0, 73.95], [77.0, 77.41], [78.0, 78.75], [82.0, 81.77], [85.0, 85.46], [91.0, 91.25], [93.0, 93.24], [95.0, 95.59], [99.0, 99.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 98.59, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 84.43, 0.0, 0.0, 100.0, 99.95, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.27, 2.47, 0.51, 0.42, 0.91, 1.81, 3.03, 1.81, 3.65, 1.51, 1.21, 2.22, 3.47, 2.52, 0.68, 0.53, 0.63, 0.91, 1.37, 0.38, 0.92, 0.35, 1.01, 0.95, 0.41, 0.75, -0.23, 0.46, 0.25, 0.24, 0.59, 0.74]} \ No newline at end of file diff --git a/annotations_filtered/lKStI-3GHDc_filtered.json b/annotations_filtered/lKStI-3GHDc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d4091a82bce9b7b518bac37989e3e1236d4392d5 --- /dev/null +++ b/annotations_filtered/lKStI-3GHDc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.99], [9.0, 10.77], [12.0, 16.28], [19.0, 19.33], [25.0, 25.17], [25.0, 29.39], [34.0, 50.87], [55.0, 61.53], [67.0, 67.22], [68.0, 68.34], [70.0, 74.92], [79.0, 86.83], [87.0, 97.85], [104.0, 120.12], [122.0, 124.12]], "keep_status": [false, false, true, false, false, true, false, false, false, false, true, true, true, true, true], "silence_prob": [0.0, 0.0, 30.48, 0.0, 0.0, 29.56, 30.05, 30.03, 0.0, 0.0, 30.52, 29.88, 30.19, 30.34, 29.48], "audiomae_on_audioset": [null, null, [["music", 51.15], ["breaking", 5.47], ["noise", 3.27]], null, null, [["music", 30.41], ["throbbing", 28.9], ["hum", 5.75]], [["music", 51.91], ["throbbing", 17.71], ["hum", 3.71]], [["music", 43.9], ["speech", 20.96], ["throbbing", 11.48]], null, null, [["music", 22.79], ["speech", 19.01], ["fly, housefly", 10.14]], [["music", 37.99], ["cattle, bovinae", 9.1], ["speech", 5.43]], [["throbbing", 22.73], ["music", 14.78], ["hum", 13.85]], [["music", 12.25], ["speech", 11.9], ["hum", 11.21]], [["music", 27.76], ["speech", 7.77], ["electronic music", 6.5]]], "duration": [0.99, 1.77, 4.28, 0.33, 0.17, 4.39, 16.87, 6.53, 0.22, 0.34, 4.92, 7.83, 10.85, 16.12, 2.12]} \ No newline at end of file diff --git a/annotations_filtered/lKeaVq6fUpw_filtered.json b/annotations_filtered/lKeaVq6fUpw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1813f540793f70944fe92632c208ffcaad78c0e1 --- /dev/null +++ b/annotations_filtered/lKeaVq6fUpw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 26.47], [29.0, 35.21], [36.0, 38.3], [39.0, 40.24], [44.0, 44.49], [46.0, 46.55], [50.0, 50.13], [55.0, 55.44], [57.0, 59.31], [62.0, 62.88], [64.0, 64.52], [67.0, 67.86], [70.0, 70.26], [71.0, 72.06], [73.0, 75.84], [77.0, 78.6], [80.0, 80.6], [81.0, 83.42], [88.0, 88.53], [90.0, 90.93], [92.0, 93.92], [95.0, 96.04], [101.0, 101.21], [103.0, 104.41], [108.0, 110.46], [114.0, 115.28], [116.0, 117.49], [119.0, 119.89], [121.0, 124.44], [126.0, 127.48], [131.0, 132.6], [135.0, 134.84], [137.0, 138.64], [141.0, 141.83], [145.0, 147.06]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [47.35, 52.92, 54.23, 0.0, 0.0, 0.0, 0.0, 0.0, 59.42, 0.0, 0.0, 0.0, 0.0, 0.0, 59.86, 0.0, 0.0, 45.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.66, 0.0, 0.0, 0.0, 42.33, 0.0, 0.0, 0.0, 0.0, 0.0, 51.02], "audiomae_on_audioset": [[["mains hum", 22.08], ["hum", 21.12], ["fly, housefly", 6.56]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 25.96], ["mains hum", 17.8], ["music", 11.23]], null, null, null, null, null, null, null, null, null, null, [["rumble", 23.89], ["creak", 19.51], ["hum", 11.5]], null, null, null, null, null, null], "duration": [6.47, 6.21, 2.3, 1.24, 0.49, 0.55, 0.13, 0.44, 2.31, 0.88, 0.52, 0.86, 0.26, 1.06, 2.84, 1.6, 0.6, 2.42, 0.53, 0.93, 1.92, 1.04, 0.21, 1.41, 2.46, 1.28, 1.49, 0.89, 3.44, 1.48, 1.6, -0.16, 1.64, 0.83, 2.06]} \ No newline at end of file diff --git a/annotations_filtered/lKh7qSp6zIc_filtered.json b/annotations_filtered/lKh7qSp6zIc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2320cef9398ea52abca079cbb500148709bd274a --- /dev/null +++ b/annotations_filtered/lKh7qSp6zIc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.62], [15.0, 15.11], [17.0, 17.63], [19.0, 18.86], [23.0, 22.81], [25.0, 27.55], [31.0, 32.71], [35.0, 35.7], [42.0, 42.21], [43.0, 43.92], [45.0, 45.6], [46.0, 47.33], [51.0, 51.83], [53.0, 53.7], [57.0, 57.33], [59.0, 59.22], [62.0, 66.75], [68.0, 68.72], [71.0, 74.93], [76.0, 79.89], [84.0, 85.16], [95.0, 96.87]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 32.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.59, 0.0, 34.31, 58.38, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["explosion", 41.97], ["eruption", 13.05], ["burst, pop", 8.96]], null, null, null, null, null, null, null, null, null, null, [["effects unit", 18.09], ["noise", 15.11], ["synthesizer", 11.03]], null, [["explosion", 22.75], ["burst, pop", 18.67], ["gunshot, gunfire", 13.9]], null, null, null], "duration": [0.62, 0.11, 0.63, -0.14, -0.19, 2.55, 1.71, 0.7, 0.21, 0.92, 0.6, 1.33, 0.83, 0.7, 0.33, 0.22, 4.75, 0.72, 3.93, 3.89, 1.16, 1.87]} \ No newline at end of file diff --git a/annotations_filtered/lKqBsgfSSU8_filtered.json b/annotations_filtered/lKqBsgfSSU8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cbb691fe0507a25b221686c5a6d6c19842bc22c9 --- /dev/null +++ b/annotations_filtered/lKqBsgfSSU8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 9.12], [11.0, 13.73], [17.0, 17.74], [22.0, 23.65], [27.0, 32.56], [36.0, 37.18], [38.0, 39.45], [40.0, 42.18], [42.0, 45.15], [47.0, 56.08], [58.0, 62.85], [64.0, 77.65], [81.0, 82.39], [86.0, 88.74], [92.0, 96.75], [97.0, 102.63], [105.0, 108.19], [110.0, 111.13], [112.0, 113.63], [118.0, 122.69], [124.0, 130.33], [132.0, 137.27], [139.0, 141.0], [143.0, 148.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [99.87, 41.12, 0.0, 0.0, 94.37, 0.0, 0.0, 73.82, 50.86, 99.99, 62.17, 66.51, 0.0, 99.98, 89.54, 61.37, 87.74, 0.0, 0.0, 88.46, 63.96, 66.03, 70.02, 36.47], "audiomae_on_audioset": [null, [["sine wave", 45.11], ["speech", 21.99], ["dial tone", 14.31]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 30.0], ["singing bowl", 25.96], ["hum", 6.57]]], "duration": [7.12, 2.73, 0.74, 1.65, 5.56, 1.18, 1.45, 2.18, 3.15, 9.08, 4.85, 13.65, 1.39, 2.74, 4.75, 5.63, 3.19, 1.13, 1.63, 4.69, 6.33, 5.27, 2.0, 5.44]} \ No newline at end of file diff --git a/annotations_filtered/lKqS8lnlJsc_filtered.json b/annotations_filtered/lKqS8lnlJsc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c974ca75900f122971df7f9f54f5f095ff6523b --- /dev/null +++ b/annotations_filtered/lKqS8lnlJsc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 32.19], [46.0, 46.85], [59.0, 61.99], [67.0, 66.95], [75.0, 75.44], [76.0, 78.95], [79.0, 82.04], [83.0, 83.07], [86.0, 87.25], [89.0, 91.45], [93.0, 93.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 30.84, 0.0, 0.0, 29.94, 29.3, 0.0, 0.0, 29.61, 0.0], "audiomae_on_audioset": [null, null, [["cattle, bovinae", 46.5], ["moo", 29.88], ["livestock, farm animals, working animals", 18.5]], null, null, [["music", 75.13], ["electronic music", 5.2], ["drum machine", 4.77]], [["music", 74.39], ["drum machine", 5.43], ["synthesizer", 5.2]], null, null, [["music", 67.64], ["electronic music", 5.23], ["synthesizer", 2.75]], null], "duration": [0.19, 0.85, 2.99, -0.05, 0.44, 2.95, 3.04, 0.07, 1.25, 2.45, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/lKv7aGku2RQ_filtered.json b/annotations_filtered/lKv7aGku2RQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..66e6dd4c699fa7253316b2add17f7efaab485a4c --- /dev/null +++ b/annotations_filtered/lKv7aGku2RQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 21.0], [22.0, 22.89], [24.0, 26.72], [28.0, 28.92], [30.0, 30.89], [76.0, 79.0], [79.0, 79.84], [90.0, 90.96]], "keep_status": [false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 34.2, 0.0, 0.0, 29.48, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["animal", 41.42], ["dog", 17.26], ["domestic animals, pets", 14.02]], null, null, [["civil defense siren", 27.31], ["vehicle", 16.41], ["siren", 10.26]], null, null], "duration": [1.0, 0.89, 2.72, 0.92, 0.89, 3.0, 0.84, 0.96]} \ No newline at end of file diff --git a/annotations_filtered/lKwghMLo0AY_filtered.json b/annotations_filtered/lKwghMLo0AY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41af875f076b2ae587b35ade6c868fdd61bbb8b9 --- /dev/null +++ b/annotations_filtered/lKwghMLo0AY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.86], [12.0, 15.94], [20.0, 20.68], [22.0, 21.98], [25.0, 25.39], [26.0, 27.03], [28.0, 28.85], [29.0, 29.27], [30.0, 30.4], [37.0, 37.62], [38.0, 42.84], [44.0, 44.68], [45.0, 45.91], [47.0, 48.02], [51.0, 54.04], [58.0, 63.14], [68.0, 68.47], [79.0, 79.22], [85.0, 85.31], [86.0, 86.16], [88.0, 88.35], [89.0, 89.67], [93.0, 94.22], [106.0, 106.52], [107.0, 107.52], [114.0, 114.83], [119.0, 119.08], [122.0, 124.07], [128.0, 129.07], [130.0, 131.73], [138.0, 139.58], [148.0, 148.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 66.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.59, 0.0, 0.0, 0.0, 99.84, 94.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.56, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.86, 3.94, 0.68, -0.02, 0.39, 1.03, 0.85, 0.27, 0.4, 0.62, 4.84, 0.68, 0.91, 1.02, 3.04, 5.14, 0.47, 0.22, 0.31, 0.16, 0.35, 0.67, 1.22, 0.52, 0.52, 0.83, 0.08, 2.07, 1.07, 1.73, 1.58, 0.95]} \ No newline at end of file diff --git a/annotations_filtered/lLItY-Oyvt0_filtered.json b/annotations_filtered/lLItY-Oyvt0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..39c906b201ac1bc3eb3175d48d08652230059cff --- /dev/null +++ b/annotations_filtered/lLItY-Oyvt0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.7], [12.0, 12.7], [14.0, 16.53], [20.0, 30.57], [32.0, 42.13], [43.0, 44.78], [46.0, 67.95], [69.0, 94.04], [96.0, 103.45], [104.0, 103.94], [104.0, 104.45], [108.0, 129.36], [130.0, 143.63], [146.0, 150.79], [152.0, 152.17], [153.0, 153.86], [155.0, 157.11], [158.0, 167.34], [171.0, 172.0], [174.0, 190.43], [198.0, 201.43], [202.0, 201.53], [202.0, 201.58], [202.0, 201.63], [202.0, 201.75], [202.0, 204.3]], "keep_status": [false, false, true, true, true, false, true, true, true, false, false, false, true, true, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 29.75, 28.56, 29.53, 0.0, 30.38, 30.4, 30.29, 0.0, 0.0, 28.83, 29.17, 31.07, 0.0, 0.0, 33.83, 29.64, 0.0, 33.01, 32.83, 0.0, 0.0, 0.0, 0.0, 30.34], "audiomae_on_audioset": [null, null, [["rumble", 19.53], ["hum", 18.0], ["mains hum", 12.79]], [["buzz", 27.86], ["music", 12.68], ["vehicle", 11.43]], [["music", 28.05], ["buzz", 15.05], ["hum", 10.2]], null, [["music", 41.07], ["whack, thwack", 13.87], ["speech", 10.92]], [["music", 52.64], ["speech", 7.88], ["didgeridoo", 5.65]], [["music", 30.24], ["mains hum", 23.14], ["fly, housefly", 9.01]], null, null, [["music", 62.73], ["didgeridoo", 7.26], ["mains hum", 5.43]], [["music", 34.44], ["mains hum", 9.88], ["buzz", 7.82]], [["music", 15.8], ["speech", 15.1], ["didgeridoo", 11.91]], null, null, [["music", 72.51], ["speech", 7.2], ["hum", 1.76]], [["music", 32.84], ["buzz", 22.48], ["hum", 13.54]], null, [["music", 38.59], ["speech", 23.34], ["scary music", 11.99]], [["speech", 53.17], ["music", 16.7], ["foghorn", 3.71]], null, null, null, null, [["music", 53.52], ["theremin", 16.3], ["thunk", 9.87]]], "duration": [1.7, 0.7, 2.53, 10.57, 10.13, 1.78, 21.95, 25.04, 7.45, -0.06, 0.45, 21.36, 13.63, 4.79, 0.17, 0.86, 2.11, 9.34, 1.0, 16.43, 3.43, -0.47, -0.42, -0.37, -0.25, 2.3]} \ No newline at end of file diff --git a/annotations_filtered/lLX3wpgs32Y_filtered.json b/annotations_filtered/lLX3wpgs32Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..342716d5a10301b9233a35b31d4c7b73468e513a --- /dev/null +++ b/annotations_filtered/lLX3wpgs32Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.59], [16.0, 16.04], [17.0, 18.1], [27.0, 26.94], [27.0, 27.75], [46.0, 46.33], [57.0, 57.91], [62.0, 66.39]], "keep_status": [false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.79], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 42.0], ["fart", 13.27], ["livestock, farm animals, working animals", 4.2]]], "duration": [1.59, 0.04, 1.1, -0.06, 0.75, 0.33, 0.91, 4.39]} \ No newline at end of file diff --git a/annotations_filtered/lLbWBsRVUAU_filtered.json b/annotations_filtered/lLbWBsRVUAU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6baa86d373e0698e6070e4c235ab2b3c6045ecaa --- /dev/null +++ b/annotations_filtered/lLbWBsRVUAU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.67], [8.0, 9.12], [11.0, 11.25], [13.0, 19.52], [21.0, 24.11], [25.0, 26.35], [34.0, 36.02], [37.0, 37.54], [43.0, 43.71], [45.0, 45.08], [56.0, 56.49], [60.0, 60.4], [62.0, 62.24], [65.0, 65.11], [74.0, 74.83], [77.0, 77.58], [80.0, 80.54], [89.0, 89.38], [92.0, 92.3], [94.0, 94.14], [103.0, 103.91], [105.0, 105.65], [108.0, 108.43], [125.0, 124.8], [127.0, 127.21], [130.0, 131.65], [134.0, 135.01], [135.0, 135.99], [136.0, 145.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 53.22, 64.29, 0.0, 81.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.6], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.67, 1.12, 0.25, 6.52, 3.11, 1.35, 2.02, 0.54, 0.71, 0.08, 0.49, 0.4, 0.24, 0.11, 0.83, 0.58, 0.54, 0.38, 0.3, 0.14, 0.91, 0.65, 0.43, -0.2, 0.21, 1.65, 1.01, 0.99, 9.07]} \ No newline at end of file diff --git a/annotations_filtered/lLeY8-bhEuQ_filtered.json b/annotations_filtered/lLeY8-bhEuQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b98846df6e46877346c0c3241858b722087b2d3b --- /dev/null +++ b/annotations_filtered/lLeY8-bhEuQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 60.59], [62.0, 77.94]], "keep_status": [false, true], "silence_prob": [30.45, 29.75], "audiomae_on_audioset": [[["music", 41.32], ["hum", 24.57], ["mains hum", 12.34]], [["music", 44.43], ["livestock, farm animals, working animals", 10.96], ["whale vocalization", 5.23]]], "duration": [28.59, 15.94]} \ No newline at end of file diff --git a/annotations_filtered/lLepw8cs6eQ_filtered.json b/annotations_filtered/lLepw8cs6eQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb1f01af0cbbf4540eacae4e32bcfb6e42d1e5fa --- /dev/null +++ b/annotations_filtered/lLepw8cs6eQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 16.44], [18.0, 48.86], [49.0, 51.09], [52.0, 52.95], [54.0, 54.8], [57.0, 57.69], [58.0, 64.34], [65.0, 65.55], [66.0, 66.45], [67.0, 94.39], [95.0, 94.88], [98.0, 118.47], [121.0, 134.54], [138.0, 150.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.36, 0.0, 50.26, 0.0, 0.0, 0.0, 52.39, 0.0, 0.0, 50.66, 0.0, 54.63, 58.81, 56.33], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [9.44, 30.86, 2.09, 0.95, 0.8, 0.69, 6.34, 0.55, 0.45, 27.39, -0.12, 20.47, 13.54, 12.89]} \ No newline at end of file diff --git a/annotations_filtered/lLgOrvsA9tw_filtered.json b/annotations_filtered/lLgOrvsA9tw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9a0da1e033c78f0d5c7716ba1410ec700ee8127f --- /dev/null +++ b/annotations_filtered/lLgOrvsA9tw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 27.62], [31.0, 32.64], [48.0, 51.33], [57.0, 59.43], [78.0, 80.37], [112.0, 112.67]], "keep_status": [false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 31.31, 35.15, 32.58, 0.0], "audiomae_on_audioset": [null, null, [["music", 71.5], ["didgeridoo", 16.66], ["musical instrument", 2.84]], [["music", 37.99], ["timpani", 11.07], ["musical instrument", 6.93]], [["music", 50.63], ["didgeridoo", 13.74], ["musical instrument", 7.09]], null], "duration": [1.62, 1.64, 3.33, 2.43, 2.37, 0.67]} \ No newline at end of file diff --git a/annotations_filtered/lMA48vIxajE_filtered.json b/annotations_filtered/lMA48vIxajE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..23f6be0b61332a0b805815df49bfa8fd9a8c560d --- /dev/null +++ b/annotations_filtered/lMA48vIxajE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.45], [9.0, 9.86], [28.0, 27.78], [30.0, 30.03], [35.0, 34.64], [47.0, 48.25], [53.0, 52.91], [58.0, 58.36], [59.0, 60.74], [62.0, 63.1], [65.0, 67.51], [69.0, 69.85], [78.0, 77.62], [79.0, 85.78], [88.0, 88.59], [93.0, 93.72], [95.0, 95.15], [98.0, 98.31], [101.0, 101.7], [105.0, 105.27], [106.0, 106.66], [113.0, 113.53], [116.0, 116.28], [119.0, 118.88], [121.0, 121.37], [130.0, 130.44], [132.0, 132.68], [134.0, 137.47], [138.0, 138.47], [141.0, 144.34], [146.0, 145.94], [147.0, 147.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.64, 0.0, 0.0, 78.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.35, 0.0, 97.22, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.45, 0.86, -0.22, 0.03, -0.36, 1.25, -0.09, 0.36, 1.74, 1.1, 2.51, 0.85, -0.38, 6.78, 0.59, 0.72, 0.15, 0.31, 0.7, 0.27, 0.66, 0.53, 0.28, -0.12, 0.37, 0.44, 0.68, 3.47, 0.47, 3.34, -0.06, 0.48]} \ No newline at end of file diff --git a/annotations_filtered/lMXVWQCa_MY_filtered.json b/annotations_filtered/lMXVWQCa_MY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4266f95291d1113d6b8ee100f0bb5bc40af74ae1 --- /dev/null +++ b/annotations_filtered/lMXVWQCa_MY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 15.13], [19.0, 26.2], [26.0, 26.23], [28.0, 29.62], [30.0, 31.16], [33.0, 45.33], [46.0, 62.11], [62.0, 64.81], [65.0, 69.69], [72.0, 73.84], [76.0, 77.92], [82.0, 81.94], [82.0, 83.96], [85.0, 86.95], [110.0, 111.79], [113.0, 114.12], [116.0, 116.11], [117.0, 117.21], [118.0, 118.59], [119.0, 119.55], [120.0, 120.16], [121.0, 123.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [62.47, 52.27, 0.0, 0.0, 0.0, 86.09, 79.07, 49.78, 72.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.5], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["hum", 49.2], ["mains hum", 29.23], ["speech", 6.5]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 23.12], ["radio", 11.8], ["hum", 10.87]]], "duration": [10.13, 7.2, 0.23, 1.62, 1.16, 12.33, 16.11, 2.81, 4.69, 1.84, 1.92, -0.06, 1.96, 1.95, 1.79, 1.12, 0.11, 0.21, 0.59, 0.55, 0.16, 2.28]} \ No newline at end of file diff --git a/annotations_filtered/lMiVewLfZKI_filtered.json b/annotations_filtered/lMiVewLfZKI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cecff14033eb65dc8135b3a8e1e9cfe673afd832 --- /dev/null +++ b/annotations_filtered/lMiVewLfZKI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.39], [11.0, 11.37], [14.0, 25.46], [26.0, 26.47], [30.0, 30.54], [31.0, 158.09]], "keep_status": [false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 31.64, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["mains hum", 23.08], ["hum", 23.03], ["electric shaver, electric razor", 12.27]], null, null, null], "duration": [1.39, 0.37, 11.46, 0.47, 0.54, 127.09]} \ No newline at end of file diff --git a/annotations_filtered/lMilbGNSGtI_filtered.json b/annotations_filtered/lMilbGNSGtI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1bbc310a693b0a821d63c3bc5e4574a281824258 --- /dev/null +++ b/annotations_filtered/lMilbGNSGtI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.81], [9.0, 9.73], [11.0, 12.6], [13.0, 14.98], [16.0, 23.6], [25.0, 26.03], [30.0, 31.4], [32.0, 32.51], [34.0, 33.66], [34.0, 34.47], [38.0, 38.35], [43.0, 46.33], [47.0, 54.35], [56.0, 71.85], [81.0, 81.73], [83.0, 84.3], [87.0, 88.92], [94.0, 93.83], [94.0, 96.33], [98.0, 98.61], [99.0, 118.62], [126.0, 126.33], [127.0, 141.0], [142.0, 142.94], [144.0, 145.37], [147.0, 148.22], [152.0, 154.36], [156.0, 158.73], [161.0, 161.18], [162.0, 178.92], [180.0, 181.84], [187.0, 187.71], [189.0, 201.28], [202.0, 202.46], [204.0, 204.58], [206.0, 210.69], [212.0, 212.8], [214.0, 213.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 44.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.68, 43.58, 40.66, 0.0, 0.0, 0.0, 0.0, 45.72, 0.0, 33.27, 0.0, 91.3, 0.0, 0.0, 0.0, 96.17, 59.68, 0.0, 82.79, 0.0, 0.0, 47.46, 0.0, 0.0, 34.41, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 66.16], ["synthesizer", 8.61], ["effects unit", 6.47]], null, null, null, null, null, null, null, [["music", 25.11], ["speech", 12.59], ["theremin", 12.45]], [["music", 46.54], ["theremin", 35.45], ["didgeridoo", 5.6]], null, null, null, null, [["speech", 42.32], ["music", 13.89], ["field recording", 2.56]], null, [["music", 36.72], ["speech", 20.55], ["brass instrument", 10.45]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 56.06], ["music", 34.19], ["boing", 1.77]], null, null, [["hum", 47.93], ["music", 16.42], ["mains hum", 10.23]], null, null], "duration": [-0.19, 0.73, 1.6, 1.98, 7.6, 1.03, 1.4, 0.51, -0.34, 0.47, 0.35, 3.33, 7.35, 15.85, 0.73, 1.3, 1.92, -0.17, 2.33, 0.61, 19.62, 0.33, 14.0, 0.94, 1.37, 1.22, 2.36, 2.73, 0.18, 16.92, 1.84, 0.71, 12.28, 0.46, 0.58, 4.69, 0.8, -0.22]} \ No newline at end of file diff --git a/annotations_filtered/lMmTZ7oTDRI_filtered.json b/annotations_filtered/lMmTZ7oTDRI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed5676440c0772efd4b07dcce050d2c3ebf8826e --- /dev/null +++ b/annotations_filtered/lMmTZ7oTDRI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.82], [11.0, 32.49], [34.0, 37.94], [40.0, 40.71], [43.0, 47.07], [50.0, 51.53], [52.0, 55.53], [56.0, 58.26], [60.0, 67.76], [68.0, 72.67], [74.0, 76.1]], "keep_status": [false, true, true, false, true, false, false, true, true, false, false], "silence_prob": [0.0, 35.71, 46.33, 0.0, 40.59, 0.0, 49.0, 43.85, 42.6, 50.41, 61.27], "audiomae_on_audioset": [null, [["speech", 27.19], ["siren", 17.7], ["emergency vehicle", 14.57]], [["speech", 27.49], ["vehicle", 14.72], ["hum", 7.9]], null, [["mains hum", 21.14], ["hum", 20.6], ["vehicle", 6.47]], null, [["hum", 52.14], ["mains hum", 21.08], ["throbbing", 10.16]], [["hum", 18.47], ["music", 15.58], ["throbbing", 10.71]], [["hum", 28.39], ["speech", 19.34], ["music", 10.3]], null, null], "duration": [1.82, 21.49, 3.94, 0.71, 4.07, 1.53, 3.53, 2.26, 7.76, 4.67, 2.1]} \ No newline at end of file diff --git a/annotations_filtered/lMrKsKQWrl8_filtered.json b/annotations_filtered/lMrKsKQWrl8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..57948b577e37628db839a2ca2d292aab7d0c06e8 --- /dev/null +++ b/annotations_filtered/lMrKsKQWrl8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.26], [7.0, 8.29], [10.0, 10.64], [13.0, 13.74], [16.0, 16.6], [18.0, 19.21], [22.0, 22.76], [25.0, 39.11], [40.0, 41.82], [49.0, 49.76], [56.0, 56.52], [60.0, 67.83], [68.0, 70.38], [74.0, 74.63], [77.0, 79.08], [84.0, 84.28], [87.0, 88.16], [89.0, 106.34], [115.0, 118.02], [119.0, 122.86], [123.0, 122.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 99.84, 98.86, 0.0, 99.96, 0.0, 0.0, 95.91, 100.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.26, 1.29, 0.64, 0.74, 0.6, 1.21, 0.76, 14.11, 1.82, 0.76, 0.52, 7.83, 2.38, 0.63, 2.08, 0.28, 1.16, 17.34, 3.02, 3.86, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/lMtWWls4oas_filtered.json b/annotations_filtered/lMtWWls4oas_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d759de0d200e02a9fe92651f85bc58918801db1b --- /dev/null +++ b/annotations_filtered/lMtWWls4oas_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.25], [3.0, 4.4], [6.0, 6.88], [7.0, 7.94], [20.0, 21.61], [25.0, 25.22], [28.0, 28.98], [32.0, 32.36], [34.0, 35.63], [39.0, 39.28], [42.0, 62.36], [65.0, 86.97], [88.0, 88.79], [92.0, 104.65], [106.0, 107.28], [109.0, 109.19], [115.0, 115.55], [116.0, 116.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.03, 31.82, 0.0, 33.27, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["hum", 43.9], ["music", 34.22], ["throbbing", 7.26]], [["music", 37.16], ["speech", 33.01], ["foghorn", 4.24]], null, [["music", 59.89], ["hum", 11.82], ["mains hum", 7.74]], null, null, null, null], "duration": [0.25, 1.4, 0.88, 0.94, 1.61, 0.22, 0.98, 0.36, 1.63, 0.28, 20.36, 21.97, 0.79, 12.65, 1.28, 0.19, 0.55, 0.78]} \ No newline at end of file diff --git a/annotations_filtered/lN4oFlIKm7A_filtered.json b/annotations_filtered/lN4oFlIKm7A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..180ccf17ff4bb8dee556d75bca7f8ce362d4a71d --- /dev/null +++ b/annotations_filtered/lN4oFlIKm7A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.65], [5.0, 74.58], [75.0, 75.61], [87.0, 93.39]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 78.89], "audiomae_on_audioset": [null, null, null, null], "duration": [-0.35, 69.58, 0.61, 6.39]} \ No newline at end of file diff --git a/annotations_filtered/lNFbbWOM5FU_filtered.json b/annotations_filtered/lNFbbWOM5FU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6f454d902adf86650480ec3120cff697cc4ac83 --- /dev/null +++ b/annotations_filtered/lNFbbWOM5FU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 22.69], [24.0, 31.75], [34.0, 73.82], [74.0, 124.88], [132.0, 132.04], [138.0, 140.48], [141.0, 141.71], [146.0, 146.31], [156.0, 185.84]], "keep_status": [true, false, false, false, false, true, false, false, false], "silence_prob": [38.94, 37.08, 0.0, 0.0, 0.0, 34.04, 0.0, 0.0, 37.74], "audiomae_on_audioset": [[["music", 54.98], ["musical instrument", 6.87], ["vibraphone", 5.26]], [["music", 79.79], ["musical instrument", 6.44], ["synthesizer", 3.15]], null, null, null, [["music", 55.32], ["musical instrument", 7.42], ["theremin", 7.23]], null, null, [["music", 55.11], ["musical instrument", 9.68], ["brass instrument", 9.43]]], "duration": [13.69, 7.75, 39.82, 50.88, 0.04, 2.48, 0.71, 0.31, 29.84]} \ No newline at end of file diff --git a/annotations_filtered/lNHheEljm5s_filtered.json b/annotations_filtered/lNHheEljm5s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..057dd45c03e2ae3218dd91a2b555aae7574c797e --- /dev/null +++ b/annotations_filtered/lNHheEljm5s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[94.0, 125.81]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [31.81]} \ No newline at end of file diff --git a/annotations_filtered/lNVb-ZNIO-A_filtered.json b/annotations_filtered/lNVb-ZNIO-A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..483b74a6b1662aea32e0aa1b154600a8ad9ee957 --- /dev/null +++ b/annotations_filtered/lNVb-ZNIO-A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 76.42], [77.0, 77.5], [78.0, 79.84], [81.0, 93.8], [97.0, 107.92], [111.0, 111.45], [118.0, 118.15], [119.0, 119.31], [120.0, 133.66], [135.0, 135.6], [137.0, 138.91], [140.0, 141.62], [142.0, 145.69], [147.0, 148.73], [150.0, 150.5], [156.0, 155.95], [161.0, 162.03], [165.0, 169.69], [172.0, 174.65], [176.0, 178.06], [178.0, 186.0], [186.0, 186.19]], "keep_status": [false, false, false, true, true, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 47.82, 33.97, 0.0, 0.0, 0.0, 31.74, 0.0, 0.0, 0.0, 49.59, 0.0, 0.0, 0.0, 0.0, 38.59, 83.7, 67.76, 30.21, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 48.99], ["fart", 10.05], ["synthesizer", 4.58]], [["music", 30.45], ["speech", 22.84], ["throbbing", 10.04]], null, null, null, [["music", 32.69], ["hum", 22.43], ["throbbing", 18.35]], null, null, null, [["insect", 29.35], ["music", 15.33], ["fly, housefly", 8.45]], null, null, null, null, [["livestock, farm animals, working animals", 13.16], ["moo", 11.8], ["fly, housefly", 11.51]], null, null, [["whale vocalization", 23.94], ["livestock, farm animals, working animals", 18.95], ["speech", 14.03]], null], "duration": [60.42, 0.5, 1.84, 12.8, 10.92, 0.45, 0.15, 0.31, 13.66, 0.6, 1.91, 1.62, 3.69, 1.73, 0.5, -0.05, 1.03, 4.69, 2.65, 2.06, 8.0, 0.19]} \ No newline at end of file diff --git a/annotations_filtered/lNWV7T5KlRE_filtered.json b/annotations_filtered/lNWV7T5KlRE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..099587f7261383fa544ebdfd6fe57f43b9895e8a --- /dev/null +++ b/annotations_filtered/lNWV7T5KlRE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.47], [7.0, 10.72], [12.0, 13.68], [14.0, 15.04], [16.0, 16.66], [18.0, 19.74], [21.0, 40.2], [41.0, 41.22], [46.0, 48.0], [51.0, 51.71], [53.0, 56.52], [57.0, 58.21], [59.0, 59.75], [61.0, 62.85], [63.0, 70.5], [73.0, 73.6], [75.0, 76.55], [78.0, 78.6], [79.0, 78.7], [79.0, 79.49], [82.0, 82.39], [84.0, 88.03], [88.0, 89.29], [91.0, 93.26], [96.0, 96.52], [98.0, 100.9], [101.0, 101.38], [102.0, 104.38], [106.0, 106.61], [108.0, 110.66], [112.0, 112.19], [113.0, 114.76], [117.0, 117.34], [121.0, 122.42], [123.0, 127.55], [129.0, 129.63], [132.0, 132.7], [140.0, 143.68], [145.0, 145.35], [146.0, 146.53], [149.0, 149.35], [152.0, 160.22], [162.0, 162.57], [163.0, 167.56], [168.0, 168.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, true, false, true, false, true, false, true, false, false, false, false, true, false, false, true, false, false, false, true, false, true, false], "silence_prob": [58.89, 55.6, 0.0, 0.0, 0.0, 0.0, 74.44, 0.0, 81.35, 0.0, 85.17, 0.0, 0.0, 0.0, 32.24, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.26, 0.0, 34.67, 0.0, 33.91, 0.0, 31.83, 0.0, 31.01, 0.0, 0.0, 0.0, 0.0, 31.4, 0.0, 0.0, 30.68, 0.0, 0.0, 0.0, 30.94, 0.0, 33.37, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 34.38], ["mosquito", 14.3], ["insect", 7.66]], null, null, null, null, null, null, [["burst, pop", 12.94], ["music", 11.61], ["explosion", 11.06]], null, [["music", 32.46], ["shofar", 22.52], ["wind instrument, woodwind instrument", 11.06]], null, [["music", 25.19], ["mains hum", 6.65], ["didgeridoo", 5.94]], null, [["music", 34.94], ["mains hum", 13.95], ["hum", 11.43]], null, [["music", 54.33], ["electronic music", 4.36], ["synthesizer", 3.67]], null, null, null, null, [["speech", 29.53], ["music", 21.68], ["vehicle", 7.03]], null, null, [["hum", 21.79], ["mains hum", 10.31], ["music", 9.14]], null, null, null, [["music", 57.73], ["boing", 4.73], ["speech", 4.5]], null, [["hum", 21.93], ["mains hum", 17.1], ["music", 9.22]], null], "duration": [2.47, 3.72, 1.68, 1.04, 0.66, 1.74, 19.2, 0.22, 2.0, 0.71, 3.52, 1.21, 0.75, 1.85, 7.5, 0.6, 1.55, 0.6, -0.3, 0.49, 0.39, 4.03, 1.29, 2.26, 0.52, 2.9, 0.38, 2.38, 0.61, 2.66, 0.19, 1.76, 0.34, 1.42, 4.55, 0.63, 0.7, 3.68, 0.35, 0.53, 0.35, 8.22, 0.57, 4.56, 0.78]} \ No newline at end of file diff --git a/annotations_filtered/lNXTKVxOmfk_filtered.json b/annotations_filtered/lNXTKVxOmfk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..418986d5fb494324dd2bb026c537f562c4a5bac3 --- /dev/null +++ b/annotations_filtered/lNXTKVxOmfk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.83], [6.0, 7.15], [8.0, 10.34], [12.0, 12.7], [14.0, 18.5], [21.0, 28.83], [32.0, 32.56], [37.0, 37.91], [39.0, 43.41], [47.0, 48.52], [49.0, 54.16], [56.0, 69.89], [71.0, 79.68], [80.0, 81.99], [82.0, 87.47], [88.0, 117.98], [126.0, 144.83], [147.0, 150.13], [151.0, 152.91], [154.0, 156.54], [157.0, 162.04]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 44.52, 0.0, 82.07, 79.94, 0.0, 0.0, 77.87, 0.0, 65.67, 65.79, 51.66, 0.0, 65.91, 70.3, 74.13, 61.57, 0.0, 80.29, 38.27], "audiomae_on_audioset": [null, null, [["speech", 53.54], ["telephone", 12.16], ["busy signal", 3.81]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 35.78], ["speech", 14.78], ["musical instrument", 4.74]]], "duration": [1.83, 1.15, 2.34, 0.7, 4.5, 7.83, 0.56, 0.91, 4.41, 1.52, 5.16, 13.89, 8.68, 1.99, 5.47, 29.98, 18.83, 3.13, 1.91, 2.54, 5.04]} \ No newline at end of file diff --git a/annotations_filtered/lO8EJQzkYxg_filtered.json b/annotations_filtered/lO8EJQzkYxg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc043a433274180b9e787e4a0cb4f8abc083d8e6 --- /dev/null +++ b/annotations_filtered/lO8EJQzkYxg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 35.77], [39.0, 59.64], [61.0, 70.61], [74.0, 75.19], [76.0, 93.07]], "keep_status": [false, true, false, false, false], "silence_prob": [29.7, 28.98, 29.52, 0.0, 29.0], "audiomae_on_audioset": [[["music", 58.35], ["throbbing", 13.27], ["whack, thwack", 2.03]], [["vehicle", 17.13], ["car", 15.97], ["skidding", 12.27]], [["music", 46.11], ["throbbing", 25.61], ["hum", 6.63]], null, [["music", 39.42], ["throbbing", 26.2], ["hum", 25.21]]], "duration": [8.77, 20.64, 9.61, 1.19, 17.07]} \ No newline at end of file diff --git a/annotations_filtered/lOR8JBFySr8_filtered.json b/annotations_filtered/lOR8JBFySr8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73ea4aee6c7c0d3dc8bdc2e83dc054aa3e21c137 --- /dev/null +++ b/annotations_filtered/lOR8JBFySr8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 28.48], [28.0, 28.51], [30.0, 42.84], [45.0, 81.4], [82.0, 88.52], [91.0, 121.27], [125.0, 142.64]], "keep_status": [true, false, true, false, false, false, false], "silence_prob": [29.6, 0.0, 29.24, 0.0, 50.31, 0.0, 30.33], "audiomae_on_audioset": [[["speech", 24.08], ["fly, housefly", 13.11], ["music", 6.54]], null, [["music", 48.51], ["whack, thwack", 4.78], ["speech", 4.76]], null, null, null, [["music", 77.67], ["scary music", 5.17], ["hum", 2.18]]], "duration": [21.48, 0.51, 12.84, 36.4, 6.52, 30.27, 17.64]} \ No newline at end of file diff --git a/annotations_filtered/lOaaPz6E6ms_filtered.json b/annotations_filtered/lOaaPz6E6ms_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ff0c4701b67817bffbc94b0c5bbc086209e95ae --- /dev/null +++ b/annotations_filtered/lOaaPz6E6ms_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.7], [9.0, 10.91], [13.0, 13.76], [16.0, 18.82], [28.0, 33.52], [34.0, 36.26], [39.0, 39.75], [43.0, 44.66], [46.0, 46.9], [49.0, 50.3], [54.0, 66.93], [69.0, 71.36], [73.0, 74.38], [76.0, 83.05], [84.0, 85.75], [89.0, 92.89], [94.0, 94.98], [97.0, 97.83], [101.0, 106.79], [109.0, 111.18], [112.0, 116.41], [117.0, 120.12], [121.0, 122.99], [123.0, 128.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 100.0, 85.72, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 98.8, 0.0, 99.94, 0.0, 0.0, 100.0, 93.91, 97.92, 100.0, 0.0, 97.83], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.7, 1.91, 0.76, 2.82, 5.52, 2.26, 0.75, 1.66, 0.9, 1.3, 12.93, 2.36, 1.38, 7.05, 1.75, 3.89, 0.98, 0.83, 5.79, 2.18, 4.41, 3.12, 1.99, 5.75]} \ No newline at end of file diff --git a/annotations_filtered/lOgPGO4JnaA_filtered.json b/annotations_filtered/lOgPGO4JnaA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2764d9177a89692ccce462cb128a06dc3f5e5071 --- /dev/null +++ b/annotations_filtered/lOgPGO4JnaA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.68], [10.0, 12.82], [15.0, 18.45], [20.0, 20.58], [22.0, 23.85], [26.0, 26.28], [32.0, 32.54], [34.0, 38.04], [39.0, 39.97], [41.0, 41.77], [46.0, 47.09], [50.0, 51.98], [53.0, 57.64], [60.0, 59.68], [64.0, 65.16], [69.0, 73.55], [78.0, 79.64], [82.0, 83.22], [84.0, 90.44], [92.0, 94.51], [95.0, 96.92], [98.0, 99.23], [100.0, 100.9], [103.0, 103.45], [107.0, 107.08], [109.0, 112.36], [114.0, 120.9], [124.0, 127.16], [129.0, 129.49], [132.0, 134.0], [135.0, 136.83], [137.0, 137.83], [140.0, 140.98], [142.0, 142.55], [147.0, 147.95], [150.0, 151.48], [154.0, 156.2], [157.0, 160.37], [163.0, 165.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.48, 98.27, 99.05, 0.0, 0.0, 0.0, 0.0, 92.97, 0.0, 0.0, 0.0, 0.0, 65.44, 0.0, 0.0, 78.89, 0.0, 0.0, 53.04, 43.2, 0.0, 0.0, 0.0, 0.0, 0.0, 63.21, 64.75, 41.64, 0.0, 48.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.43, 56.18, 67.51], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 48.83], ["electronic music", 4.99], ["silence", 3.16]], null, null, null, null, null, null, null, [["music", 50.46], ["electronic music", 15.2], ["singing bowl", 12.96]], null, [["speech", 35.03], ["music", 20.03], ["whale vocalization", 16.99]], null, null, null, null, null, null, [["music", 49.02], ["singing bowl", 15.92], ["gong", 9.9]], null, null], "duration": [2.68, 2.82, 3.45, 0.58, 1.85, 0.28, 0.54, 4.04, 0.97, 0.77, 1.09, 1.98, 4.64, -0.32, 1.16, 4.55, 1.64, 1.22, 6.44, 2.51, 1.92, 1.23, 0.9, 0.45, 0.08, 3.36, 6.9, 3.16, 0.49, 2.0, 1.83, 0.83, 0.98, 0.55, 0.95, 1.48, 2.2, 3.37, 2.2]} \ No newline at end of file diff --git a/annotations_filtered/lOmeZW0N10k_filtered.json b/annotations_filtered/lOmeZW0N10k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6e08ba51b10261647d8fd7f6a038d1fb681bb5c7 --- /dev/null +++ b/annotations_filtered/lOmeZW0N10k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.05], [8.0, 10.3], [16.0, 16.56], [19.0, 19.77], [36.0, 37.34], [38.0, 43.66], [46.0, 46.84], [52.0, 52.68], [54.0, 54.97], [59.0, 61.26], [67.0, 69.74], [71.0, 81.18], [83.0, 83.34], [89.0, 89.82], [91.0, 92.97], [100.0, 100.92], [105.0, 106.42]], "keep_status": [false, true, false, false, false, true, false, false, false, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 45.72, 0.0, 0.0, 0.0, 43.53, 0.0, 0.0, 0.0, 36.1, 42.26, 44.43, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["throbbing", 27.73], ["hum", 25.42], ["music", 11.61]], null, null, null, [["music", 52.31], ["throbbing", 6.62], ["sampler", 6.51]], null, null, null, [["music", 32.67], ["throbbing", 23.08], ["hum", 15.7]], [["music", 53.01], ["throbbing", 3.2], ["electronica", 1.78]], [["music", 42.79], ["speech", 17.41], ["hum", 9.11]], null, null, null, null, null], "duration": [0.05, 2.3, 0.56, 0.77, 1.34, 5.66, 0.84, 0.68, 0.97, 2.26, 2.74, 10.18, 0.34, 0.82, 1.97, 0.92, 1.42]} \ No newline at end of file diff --git a/annotations_filtered/lP-A8UaVbLE_filtered.json b/annotations_filtered/lP-A8UaVbLE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..076e7aed57ba93abb208967bb855a2d9080368b3 --- /dev/null +++ b/annotations_filtered/lP-A8UaVbLE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.69], [9.0, 9.14], [10.0, 11.1], [12.0, 14.2], [16.0, 18.64], [20.0, 20.7], [21.0, 39.28], [46.0, 55.51], [59.0, 65.04], [67.0, 70.82], [71.0, 76.05], [79.0, 79.19], [83.0, 98.46], [105.0, 107.15], [114.0, 116.51], [118.0, 119.4], [123.0, 128.34], [130.0, 146.57], [149.0, 149.74], [150.0, 152.09], [158.0, 161.05], [163.0, 167.48], [173.0, 175.0]], "keep_status": [false, false, false, true, true, false, false, false, true, false, false, false, true, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 41.76, 41.64, 0.0, 29.62, 29.61, 45.4, 64.63, 55.11, 0.0, 38.58, 73.06, 75.07, 0.0, 85.17, 36.68, 0.0, 80.82, 87.74, 77.2, 55.46], "audiomae_on_audioset": [null, null, null, [["speech", 23.51], ["music", 14.15], ["pulse", 6.42]], [["hum", 33.2], ["rumble", 8.64], ["sonar", 8.55]], null, [["mains hum", 52.94], ["hum", 24.12], ["music", 4.66]], [["speech", 69.8], ["explosion", 6.54], ["music", 6.37]], [["sine wave", 18.53], ["chirp tone", 17.27], ["tuning fork", 8.97]], null, null, null, [["music", 20.65], ["throbbing", 19.78], ["hum", 14.96]], null, null, null, null, [["static", 14.44], ["white noise", 12.67], ["hum", 10.44]], null, null, null, null, null], "duration": [1.69, 0.14, 1.1, 2.2, 2.64, 0.7, 18.28, 9.51, 6.04, 3.82, 5.05, 0.19, 15.46, 2.15, 2.51, 1.4, 5.34, 16.57, 0.74, 2.09, 3.05, 4.48, 2.0]} \ No newline at end of file diff --git a/annotations_filtered/lP8EYYjPEmc_filtered.json b/annotations_filtered/lP8EYYjPEmc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae868302132c56f527f7d998b495f417339f18bd --- /dev/null +++ b/annotations_filtered/lP8EYYjPEmc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 31.48], [33.0, 34.72], [35.0, 37.39], [43.0, 43.34], [44.0, 45.93], [47.0, 48.29], [50.0, 58.48], [59.0, 60.34], [61.0, 61.69], [62.0, 63.59], [81.0, 81.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 97.33, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [1.48, 1.72, 2.39, 0.34, 1.93, 1.29, 8.48, 1.34, 0.69, 1.59, 0.57]} \ No newline at end of file diff --git a/annotations_filtered/lPB6exj8Kgo_filtered.json b/annotations_filtered/lPB6exj8Kgo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0aa201f3746c06c17e1fc08f0e9c925eb7f03825 --- /dev/null +++ b/annotations_filtered/lPB6exj8Kgo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[58.0, 76.94], [78.0, 175.56]], "keep_status": [true, false], "silence_prob": [41.93, 0.0], "audiomae_on_audioset": [[["animal", 38.49], ["music", 21.66], ["speech", 6.93]], null], "duration": [18.94, 97.56]} \ No newline at end of file diff --git a/annotations_filtered/lPCt2BBqR2k_filtered.json b/annotations_filtered/lPCt2BBqR2k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..96ab70f89780cd15024c41786c09fce035ab56e1 --- /dev/null +++ b/annotations_filtered/lPCt2BBqR2k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 10.25], [11.0, 11.85], [13.0, 13.63], [18.0, 18.96], [23.0, 24.06], [25.0, 25.42], [26.0, 26.89], [29.0, 37.27], [38.0, 38.99], [39.0, 43.68], [44.0, 46.01], [49.0, 53.69], [58.0, 60.94], [62.0, 62.02]], "keep_status": [false, false, false, false, false, false, false, true, false, false, true, false, true, false], "silence_prob": [54.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.91, 0.0, 50.86, 38.59, 35.12, 49.04, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 18.89], ["hum", 11.9], ["music", 7.86]], null, null, [["speech", 50.33], ["music", 7.63], ["clip-clop", 5.47]], [["speech", 69.18], ["music", 6.91], ["radio", 5.45]], [["music", 25.75], ["whale vocalization", 8.13], ["hum", 6.01]], null], "duration": [8.25, 0.85, 0.63, 0.96, 1.06, 0.42, 0.89, 8.27, 0.99, 4.68, 2.01, 4.69, 2.94, 0.02]} \ No newline at end of file diff --git a/annotations_filtered/lPE1uBdcB8Y_filtered.json b/annotations_filtered/lPE1uBdcB8Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..177a3bb8618059fb9058cf0f68c10b56b807b868 --- /dev/null +++ b/annotations_filtered/lPE1uBdcB8Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 36.34], [37.0, 42.38], [46.0, 91.42], [95.0, 117.19], [118.0, 125.88], [127.0, 128.49], [129.0, 129.32], [129.0, 130.79]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [57.48, 54.83, 0.0, 95.37, 96.04, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [9.34, 5.38, 45.42, 22.19, 7.88, 1.49, 0.32, 1.79]} \ No newline at end of file diff --git a/annotations_filtered/lPMSGTfK4Aw_filtered.json b/annotations_filtered/lPMSGTfK4Aw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..37094c444a5a48b539b8a23d23b6e17c392fe1a7 --- /dev/null +++ b/annotations_filtered/lPMSGTfK4Aw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 29.35], [31.0, 31.53], [33.0, 34.11], [36.0, 36.56], [39.0, 40.44], [44.0, 44.56], [48.0, 49.82], [51.0, 52.46], [54.0, 54.9], [58.0, 58.72], [73.0, 73.67], [78.0, 80.47], [82.0, 82.44], [84.0, 84.3], [87.0, 89.53], [92.0, 100.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [82.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.13, 0.0, 0.0, 85.17, 57.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.35, 0.53, 1.11, 0.56, 1.44, 0.56, 1.82, 1.46, 0.9, 0.72, 0.67, 2.47, 0.44, 0.3, 2.53, 8.82]} \ No newline at end of file diff --git a/annotations_filtered/lPOo7SzR7Sc_filtered.json b/annotations_filtered/lPOo7SzR7Sc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b741aa8c58bae2afd949325fd40c5b5636141a59 --- /dev/null +++ b/annotations_filtered/lPOo7SzR7Sc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.03], [13.0, 13.59], [14.0, 16.5], [22.0, 41.45], [43.0, 46.55], [49.0, 49.69], [50.0, 49.81], [50.0, 53.91], [55.0, 54.94], [55.0, 59.14], [62.0, 64.03], [69.0, 69.74], [71.0, 73.18], [82.0, 84.67], [85.0, 132.36], [133.0, 143.8], [144.0, 145.1], [146.0, 149.45]], "keep_status": [false, false, true, false, false, false, false, true, false, false, true, false, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 45.62, 38.06, 35.37, 0.0, 0.0, 32.83, 0.0, 28.92, 39.27, 0.0, 39.74, 45.36, 0.0, 29.74, 0.0, 50.46], "audiomae_on_audioset": [null, null, [["speech", 26.26], ["music", 20.21], ["hum", 16.81]], [["music", 37.73], ["hum", 25.61], ["throbbing", 14.8]], [["music", 35.2], ["burping, eructation", 32.43], ["grunt", 7.02]], null, null, [["music", 30.45], ["didgeridoo", 15.23], ["throbbing", 9.46]], null, [["speech", 52.31], ["music", 34.08], ["electric shaver, electric razor", 2.81]], [["croak", 25.18], ["frog", 18.02], ["music", 12.86]], null, [["didgeridoo", 22.66], ["music", 21.7], ["hum", 12.45]], [["music", 59.62], ["hum", 6.35], ["musical instrument", 4.77]], null, [["music", 20.56], ["sound effect", 8.33], ["explosion", 5.74]], null, null], "duration": [0.03, 0.59, 2.5, 19.45, 3.55, 0.69, -0.19, 3.91, -0.06, 4.14, 2.03, 0.74, 2.18, 2.67, 47.36, 10.8, 1.1, 3.45]} \ No newline at end of file diff --git a/annotations_filtered/lPe61El1_3E_filtered.json b/annotations_filtered/lPe61El1_3E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e22900a52e494dec19e87e7932a0f5a04b8861da --- /dev/null +++ b/annotations_filtered/lPe61El1_3E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.61], [15.0, 15.72], [21.0, 21.66], [61.0, 64.25], [65.0, 69.58], [73.0, 73.58], [76.0, 76.62], [81.0, 84.3], [96.0, 97.07], [99.0, 100.08], [106.0, 107.84], [110.0, 110.83], [113.0, 113.48], [115.0, 116.53], [123.0, 123.53]], "keep_status": [false, false, false, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 41.26, 32.88, 0.0, 0.0, 75.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 24.31], ["music", 10.9], ["livestock, farm animals, working animals", 8.17]], [["music", 24.65], ["livestock, farm animals, working animals", 9.74], ["animal", 8.47]], null, null, null, null, null, null, null, null, null, null], "duration": [0.61, 0.72, 0.66, 3.25, 4.58, 0.58, 0.62, 3.3, 1.07, 1.08, 1.84, 0.83, 0.48, 1.53, 0.53]} \ No newline at end of file diff --git a/annotations_filtered/lPfrzsQ2-Qo_filtered.json b/annotations_filtered/lPfrzsQ2-Qo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0076b9f168695dc9d08444ad9e6d69066bb6207f --- /dev/null +++ b/annotations_filtered/lPfrzsQ2-Qo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.18], [11.0, 14.15], [15.0, 22.81], [27.0, 29.12], [34.0, 35.68], [39.0, 47.26], [48.0, 49.65], [50.0, 58.92], [60.0, 64.64], [67.0, 70.78], [71.0, 74.22], [76.0, 82.05], [84.0, 86.05], [87.0, 103.71], [105.0, 113.75], [115.0, 118.12], [119.0, 121.54], [123.0, 125.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 100.0, 100.0, 100.0, 0.0, 100.0, 0.0, 100.0, 100.0, 100.0, 99.99, 100.0, 100.0, 100.0, 99.98, 100.0, 99.65, 97.83], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.18, 3.15, 7.81, 2.12, 1.68, 8.26, 1.65, 8.92, 4.64, 3.78, 3.22, 6.05, 2.05, 16.71, 8.75, 3.12, 2.54, 2.47]} \ No newline at end of file diff --git a/annotations_filtered/lPrJqB8ljAE_filtered.json b/annotations_filtered/lPrJqB8ljAE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56e42eed0f02a09636ade558223461841801526f --- /dev/null +++ b/annotations_filtered/lPrJqB8ljAE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 23.65], [24.0, 26.3], [28.0, 29.71], [32.0, 56.42], [58.0, 79.86], [81.0, 97.56], [98.0, 98.41], [98.0, 98.51], [99.0, 99.55], [101.0, 103.18], [104.0, 104.53], [107.0, 108.89], [110.0, 110.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [34.58, 37.53, 0.0, 29.76, 29.97, 31.2, 0.0, 0.0, 0.0, 50.51, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 41.57], ["music", 17.2], ["throbbing", 14.82]], [["hum", 43.84], ["throbbing", 34.28], ["mains hum", 12.94]], null, [["music", 68.57], ["throbbing", 13.76], ["hum", 8.17]], [["hum", 29.01], ["mains hum", 28.48], ["music", 17.81]], [["music", 53.55], ["speech", 19.8], ["sidetone", 4.4]], null, null, null, null, null, null, null], "duration": [2.65, 2.3, 1.71, 24.42, 21.86, 16.56, 0.41, 0.51, 0.55, 2.18, 0.53, 1.89, 0.98]} \ No newline at end of file diff --git a/annotations_filtered/lPrOstRqB1o_filtered.json b/annotations_filtered/lPrOstRqB1o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9314ba516e9961c17518dd288b4503056470800b --- /dev/null +++ b/annotations_filtered/lPrOstRqB1o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.26], [10.0, 40.07], [46.0, 79.54], [82.0, 87.42], [88.0, 87.57], [88.0, 93.07], [96.0, 110.61], [116.0, 127.45]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 59.42, 0.0, 62.89, 60.23, 57.09], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.26, 30.07, 33.54, 5.42, -0.43, 5.07, 14.61, 11.45]} \ No newline at end of file diff --git a/annotations_filtered/lPr_GBMu4O4_filtered.json b/annotations_filtered/lPr_GBMu4O4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..806cd0fc77df5bfa2e59f431a34e49b2ed4f8368 --- /dev/null +++ b/annotations_filtered/lPr_GBMu4O4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.85], [13.0, 15.09], [18.0, 19.09], [21.0, 21.51], [22.0, 23.04], [26.0, 28.09], [29.0, 51.17], [53.0, 54.21], [56.0, 59.93], [61.0, 62.16], [63.0, 64.15], [65.0, 65.96], [68.0, 68.62], [70.0, 72.49], [74.0, 74.51], [76.0, 77.84], [80.0, 83.93], [85.0, 86.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.98, 53.84, 0.0, 0.0, 0.0, 100.0, 60.23, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 99.95, 0.0, 0.0, 88.83, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.85, 2.09, 1.09, 0.51, 1.04, 2.09, 22.17, 1.21, 3.93, 1.16, 1.15, 0.96, 0.62, 2.49, 0.51, 1.84, 3.93, 1.73]} \ No newline at end of file diff --git a/annotations_filtered/lQ2RStfZii0_filtered.json b/annotations_filtered/lQ2RStfZii0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6684bf27926c319a19bb5307ab037d3f79b1cfa6 --- /dev/null +++ b/annotations_filtered/lQ2RStfZii0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.62], [4.0, 6.29], [8.0, 8.68], [9.0, 9.54], [12.0, 14.32], [16.0, 15.94], [16.0, 17.22], [20.0, 19.99], [23.0, 43.95], [53.0, 69.42], [71.0, 81.48], [82.0, 92.04], [95.0, 98.51], [110.0, 119.52], [121.0, 131.16], [136.0, 137.24], [149.0, 149.28], [153.0, 155.24], [158.0, 159.8]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 98.66, 0.0, 0.0, 78.55, 0.0, 0.0, 0.0, 38.63, 32.34, 42.58, 36.11, 39.28, 37.59, 39.75, 0.0, 0.0, 61.37, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 34.59], ["speech", 28.63], ["hum", 15.29]], [["hum", 27.76], ["music", 21.8], ["mains hum", 16.94]], [["music", 78.99], ["throbbing", 6.36], ["hum", 1.93]], [["music", 39.09], ["thump, thud", 27.04], ["whack, thwack", 7.0]], [["speech", 68.51], ["whack, thwack", 6.23], ["music", 2.92]], [["music", 40.91], ["whack, thwack", 7.85], ["noise", 7.55]], [["music", 37.1], ["speech", 15.9], ["throbbing", 14.08]], null, null, null, null], "duration": [-0.38, 2.29, 0.68, 0.54, 2.32, -0.06, 1.22, -0.01, 20.95, 16.42, 10.48, 10.04, 3.51, 9.52, 10.16, 1.24, 0.28, 2.24, 1.8]} \ No newline at end of file diff --git a/annotations_filtered/lQ8JIa98kAw_filtered.json b/annotations_filtered/lQ8JIa98kAw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa36845d09e021fe1e50f7b802a7b229315c52b3 --- /dev/null +++ b/annotations_filtered/lQ8JIa98kAw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.25], [11.0, 11.64], [15.0, 16.07], [23.0, 23.01], [23.0, 23.04], [26.0, 27.92], [29.0, 31.28], [32.0, 35.02], [37.0, 47.34], [52.0, 56.37], [57.0, 57.16], [58.0, 60.29], [63.0, 64.23], [69.0, 69.65], [70.0, 72.47], [73.0, 77.11], [79.0, 81.72], [83.0, 84.03], [84.0, 90.51]], "keep_status": [true, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [42.06, 0.0, 0.0, 0.0, 0.0, 0.0, 74.44, 77.36, 41.83, 34.4, 0.0, 37.37, 0.0, 0.0, 70.16, 46.29, 36.93, 0.0, 36.01], "audiomae_on_audioset": [[["speech", 31.68], ["music", 13.12], ["musical instrument", 3.7]], null, null, null, null, null, null, null, [["music", 15.15], ["livestock, farm animals, working animals", 13.22], ["cattle, bovinae", 12.87]], [["music", 41.3], ["musical instrument", 12.82], ["guitar", 11.29]], null, [["music", 55.5], ["musical instrument", 15.76], ["guitar", 8.74]], null, null, null, [["sidetone", 41.24], ["speech", 19.05], ["hum", 18.17]], [["fly, housefly", 50.08], ["insect", 13.13], ["mosquito", 7.33]], null, [["music", 75.11], ["musical instrument", 5.23], ["guitar", 3.82]]], "duration": [2.25, 0.64, 1.07, 0.01, 0.04, 1.92, 2.28, 3.02, 10.34, 4.37, 0.16, 2.29, 1.23, 0.65, 2.47, 4.11, 2.72, 1.03, 6.51]} \ No newline at end of file diff --git a/annotations_filtered/lQWvCntonxE_filtered.json b/annotations_filtered/lQWvCntonxE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b6ec96439a7217d1ad93a5cd5ffdf55f244fd9e7 --- /dev/null +++ b/annotations_filtered/lQWvCntonxE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 23.21], [24.0, 25.2], [26.0, 26.84], [28.0, 32.8], [35.0, 35.8], [36.0, 38.23], [40.0, 41.47], [43.0, 45.47], [46.0, 46.47], [47.0, 50.13], [51.0, 52.89], [53.0, 54.58], [55.0, 55.86], [58.0, 58.45], [61.0, 61.74], [63.0, 63.31], [64.0, 67.53], [68.0, 76.2]], "keep_status": [false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 37.4, 0.0, 44.93, 0.0, 31.87, 0.0, 53.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.76, 57.97], "audiomae_on_audioset": [null, null, null, [["whale vocalization", 40.55], ["frog", 17.8], ["animal", 11.88]], null, [["speech", 29.31], ["sidetone", 20.2], ["radio", 19.12]], null, [["speech", 29.3], ["animal", 27.36], ["dog", 8.61]], null, null, null, null, null, null, null, null, null, null], "duration": [1.21, 1.2, 0.84, 4.8, 0.8, 2.23, 1.47, 2.47, 0.47, 3.13, 1.89, 1.58, 0.86, 0.45, 0.74, 0.31, 3.53, 8.2]} \ No newline at end of file diff --git a/annotations_filtered/lQbw0_5O8CQ_filtered.json b/annotations_filtered/lQbw0_5O8CQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..740959594395b86e64e86806973153d4ebfcce77 --- /dev/null +++ b/annotations_filtered/lQbw0_5O8CQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.17], [1.0, 3.2], [4.0, 4.68], [6.0, 6.88], [8.0, 8.68], [9.0, 9.63], [10.0, 10.91], [12.0, 12.33], [15.0, 16.55], [18.0, 18.67], [22.0, 22.71], [27.0, 28.46], [35.0, 36.85], [39.0, 39.68], [43.0, 46.35], [47.0, 47.93], [49.0, 50.14], [52.0, 53.05], [57.0, 57.28], [58.0, 58.99], [65.0, 65.77], [76.0, 77.01], [81.0, 81.14], [82.0, 83.19], [97.0, 97.28], [98.0, 99.17], [101.0, 101.22], [102.0, 105.63], [108.0, 108.19], [110.0, 111.38], [113.0, 114.02], [116.0, 116.19], [118.0, 119.08], [119.0, 121.71], [123.0, 124.06], [127.0, 127.92], [129.0, 133.84], [135.0, 135.7], [136.0, 136.9], [138.0, 140.02], [141.0, 141.13]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 43.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.69, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.33, 0.0, 0.0, 0.0, 0.0, 0.0, 86.27, 0.0, 0.0, 50.66, 0.0, 0.0, 45.08, 0.0], "audiomae_on_audioset": [null, [["music", 36.7], ["beatboxing", 8.2], ["musical instrument", 7.7]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 84.23], ["telephone", 6.75], ["sidetone", 2.06]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 50.18], ["musical instrument", 5.66], ["theremin", 4.85]], null], "duration": [0.17, 2.2, 0.68, 0.88, 0.68, 0.63, 0.91, 0.33, 1.55, 0.67, 0.71, 1.46, 1.85, 0.68, 3.35, 0.93, 1.14, 1.05, 0.28, 0.99, 0.77, 1.01, 0.14, 1.19, 0.28, 1.17, 0.22, 3.63, 0.19, 1.38, 1.02, 0.19, 1.08, 2.71, 1.06, 0.92, 4.84, 0.7, 0.9, 2.02, 0.13]} \ No newline at end of file diff --git a/annotations_filtered/lQfG0D7wPKA_filtered.json b/annotations_filtered/lQfG0D7wPKA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c15d106792a8fc5aa7ba305db98c76ce7c1f1730 --- /dev/null +++ b/annotations_filtered/lQfG0D7wPKA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.37], [13.0, 13.29], [17.0, 16.75], [21.0, 21.74], [23.0, 25.57], [33.0, 33.32], [36.0, 36.22], [58.0, 58.09], [68.0, 67.88], [76.0, 77.65], [84.0, 84.55], [90.0, 90.09], [93.0, 94.78], [96.0, 96.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 76.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.37, 0.29, -0.25, 0.74, 2.57, 0.32, 0.22, 0.09, -0.12, 1.65, 0.55, 0.09, 1.78, 0.26]} \ No newline at end of file diff --git a/annotations_filtered/lQhQeus0ItY_filtered.json b/annotations_filtered/lQhQeus0ItY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..846217812d3fe1ca31dea12af69b788b9c2fcfb1 --- /dev/null +++ b/annotations_filtered/lQhQeus0ItY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.99], [5.0, 4.99], [6.0, 6.07], [7.0, 7.26], [10.0, 10.45], [11.0, 18.5], [19.0, 19.52], [21.0, 21.68], [25.0, 25.68], [27.0, 27.31], [30.0, 31.13], [35.0, 35.48], [37.0, 37.94], [38.0, 39.82], [44.0, 45.15], [45.0, 47.22], [52.0, 57.97], [58.0, 58.72], [62.0, 62.19], [65.0, 66.23], [67.0, 68.44], [70.0, 71.66], [72.0, 72.54], [74.0, 75.1], [78.0, 81.13], [83.0, 84.43], [86.0, 85.95], [86.0, 86.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 46.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.72, 38.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.91, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 74.34], ["fart", 5.47], ["beatboxing", 1.96]], null, null, null, null, null, null, null, null, null, [["speech", 83.12], ["dial tone", 5.48], ["busy signal", 3.38]], [["speech", 34.69], ["sidetone", 28.33], ["whale vocalization", 8.18]], null, null, null, null, null, null, null, [["speech", 28.08], ["grunt", 12.07], ["groan", 7.83]], null, null, null], "duration": [0.99, -0.01, 0.07, 0.26, 0.45, 7.5, 0.52, 0.68, 0.68, 0.31, 1.13, 0.48, 0.94, 1.82, 1.15, 2.22, 5.97, 0.72, 0.19, 1.23, 1.44, 1.66, 0.54, 1.1, 3.13, 1.43, -0.05, 0.34]} \ No newline at end of file diff --git a/annotations_filtered/lQoMIGl_NTU_filtered.json b/annotations_filtered/lQoMIGl_NTU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fdf3f0d20ea2c526ea9179f03decd252fc00c2f1 --- /dev/null +++ b/annotations_filtered/lQoMIGl_NTU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.74], [16.0, 18.39], [20.0, 22.11], [24.0, 24.76], [25.0, 26.18], [31.0, 31.89], [34.0, 33.84], [38.0, 50.92], [54.0, 54.36], [56.0, 56.13], [59.0, 60.76], [62.0, 61.94], [65.0, 65.94], [67.0, 67.69], [69.0, 69.16], [71.0, 71.07], [71.0, 71.52], [72.0, 72.17], [73.0, 73.79]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 38.7, 30.85, 0.0, 0.0, 0.0, 0.0, 34.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["cattle, bovinae", 31.27], ["whale vocalization", 26.87], ["moo", 17.51]], [["roaring cats (lions, tigers)", 30.5], ["roar", 15.0], ["wild animals", 13.36]], null, null, null, null, [["music", 85.05], ["synthesizer", 1.49], ["whale vocalization", 1.4]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.74, 2.39, 2.11, 0.76, 1.18, 0.89, -0.16, 12.92, 0.36, 0.13, 1.76, -0.06, 0.94, 0.69, 0.16, 0.07, 0.52, 0.17, 0.79]} \ No newline at end of file diff --git a/annotations_filtered/lQr3va8emXg_filtered.json b/annotations_filtered/lQr3va8emXg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b07720bd99df4593484210373115c6bccd7dcdcf --- /dev/null +++ b/annotations_filtered/lQr3va8emXg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[86.0, 130.44], [134.0, 136.95], [139.0, 205.9], [207.0, 207.52]], "keep_status": [false, true, false, false], "silence_prob": [0.0, 30.05, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 42.11], ["throbbing", 8.65], ["hum", 7.21]], null, null], "duration": [44.44, 2.95, 66.9, 0.52]} \ No newline at end of file diff --git a/annotations_filtered/lR6vy0i_rRU_filtered.json b/annotations_filtered/lR6vy0i_rRU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e52ebb2187e572402750d00fc2fcbf47e68b2085 --- /dev/null +++ b/annotations_filtered/lR6vy0i_rRU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 22.6], [23.0, 24.02], [25.0, 41.2], [42.0, 42.85], [44.0, 45.03]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [-0.4, 1.02, 16.2, 0.85, 1.03]} \ No newline at end of file diff --git a/annotations_filtered/lR8KTwcC8fc_filtered.json b/annotations_filtered/lR8KTwcC8fc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..10fb1751d309537ea6bf399ef9acdb6d283bc9a8 --- /dev/null +++ b/annotations_filtered/lR8KTwcC8fc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.64], [9.0, 9.86], [13.0, 13.81], [19.0, 19.28], [23.0, 24.04], [28.0, 28.83], [29.0, 30.65], [32.0, 32.46], [34.0, 34.8], [41.0, 41.62], [42.0, 43.01], [51.0, 51.38], [52.0, 52.95], [62.0, 62.75], [65.0, 64.94], [68.0, 69.58], [72.0, 78.56], [79.0, 92.7], [94.0, 97.29], [104.0, 106.08], [108.0, 108.41], [109.0, 110.52], [112.0, 112.48], [114.0, 114.27], [117.0, 117.09], [118.0, 126.0], [127.0, 132.81], [138.0, 140.17], [143.0, 143.75], [147.0, 149.94], [155.0, 156.32], [161.0, 162.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.2, 39.94, 43.15, 54.1, 0.0, 0.0, 0.0, 0.0, 0.0, 85.17, 75.39, 84.07, 0.0, 71.87, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 36.96], ["burst, pop", 17.38], ["explosion", 15.32]], [["telephone dialing, dtmf", 46.55], ["busy signal", 11.47], ["beep, bleep", 8.24]], [["music", 45.73], ["speech", 9.11], ["musical instrument", 1.99]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.64, 0.86, 0.81, 0.28, 1.04, 0.83, 1.65, 0.46, 0.8, 0.62, 1.01, 0.38, 0.95, 0.75, -0.06, 1.58, 6.56, 13.7, 3.29, 2.08, 0.41, 1.52, 0.48, 0.27, 0.09, 8.0, 5.81, 2.17, 0.75, 2.94, 1.32, 1.14]} \ No newline at end of file diff --git a/annotations_filtered/lRAsSTNZD8g_filtered.json b/annotations_filtered/lRAsSTNZD8g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c18d1d0316b2449241afa04524741cceeda7e1c1 --- /dev/null +++ b/annotations_filtered/lRAsSTNZD8g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.73], [5.0, 8.9], [10.0, 11.64], [13.0, 13.42], [15.0, 15.47], [18.0, 19.89], [21.0, 28.04], [29.0, 30.64], [32.0, 79.81], [82.0, 83.37], [84.0, 84.91], [86.0, 87.79], [88.0, 104.8], [109.0, 125.88], [131.0, 146.15], [150.0, 150.77], [155.0, 155.88], [163.0, 164.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 95.51, 0.0, 0.0, 0.0, 0.0, 86.45, 0.0, 0.0, 0.0, 0.0, 0.0, 33.45, 42.72, 43.48, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 24.93], ["music", 17.84], ["civil defense siren", 17.73]], [["whale vocalization", 51.99], ["music", 34.32], ["theremin", 4.96]], [["speech", 85.64], ["music", 3.28], ["sidetone", 2.42]], null, null, null], "duration": [0.73, 3.9, 1.64, 0.42, 0.47, 1.89, 7.04, 1.64, 47.81, 1.37, 0.91, 1.79, 16.8, 16.88, 15.15, 0.77, 0.88, 1.19]} \ No newline at end of file diff --git a/annotations_filtered/lRQXQXsXIm8_filtered.json b/annotations_filtered/lRQXQXsXIm8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..add3da405bf0c97e1d584acf356e75d804a245fc --- /dev/null +++ b/annotations_filtered/lRQXQXsXIm8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 28.63], [68.0, 69.67], [71.0, 72.79], [77.0, 77.43], [79.0, 80.13], [83.0, 84.08]], "keep_status": [true, false, false, false, false, false], "silence_prob": [34.83, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["honk", 15.78], ["livestock, farm animals, working animals", 15.33], ["goose", 12.29]], null, null, null, null, null], "duration": [2.63, 1.67, 1.79, 0.43, 1.13, 1.08]} \ No newline at end of file diff --git a/annotations_filtered/lRVUsY_rcCo_filtered.json b/annotations_filtered/lRVUsY_rcCo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..06e7bdc08a4d4103c8662daa605530c8abc318ff --- /dev/null +++ b/annotations_filtered/lRVUsY_rcCo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.17], [5.0, 5.26], [6.0, 7.11], [8.0, 9.12], [10.0, 11.4], [13.0, 17.02], [20.0, 22.4], [25.0, 32.02], [34.0, 34.75]], "keep_status": [false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 54.63, 55.89, 33.22, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["hum", 15.14], ["cattle, bovinae", 12.04], ["noise", 10.3]], null], "duration": [1.17, 0.26, 1.11, 1.12, 1.4, 4.02, 2.4, 7.02, 0.75]} \ No newline at end of file diff --git a/annotations_filtered/lRlgx_GFwyI_filtered.json b/annotations_filtered/lRlgx_GFwyI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/lRlgx_GFwyI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/lRpBlNgu8j4_filtered.json b/annotations_filtered/lRpBlNgu8j4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dbb545f65e0d5759b78caedf5c16212da749abb1 --- /dev/null +++ b/annotations_filtered/lRpBlNgu8j4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.64], [28.0, 28.38], [31.0, 32.05], [35.0, 35.34], [41.0, 42.21], [56.0, 68.1], [69.0, 69.67], [72.0, 73.41], [76.0, 75.69], [77.0, 78.31], [83.0, 82.86], [87.0, 87.67], [92.0, 92.38], [96.0, 96.85], [101.0, 102.15], [108.0, 109.27], [110.0, 110.81], [113.0, 114.27], [119.0, 119.84], [121.0, 122.08], [127.0, 127.77], [129.0, 130.11], [131.0, 166.43], [167.0, 167.68], [168.0, 179.78]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 44.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.45], "audiomae_on_audioset": [null, null, null, null, null, [["music", 33.15], ["musical instrument", 9.12], ["speech", 7.2]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 41.84], ["applause", 11.94], ["crowd", 11.12]]], "duration": [0.64, 0.38, 1.05, 0.34, 1.21, 12.1, 0.67, 1.41, -0.31, 1.31, -0.14, 0.67, 0.38, 0.85, 1.15, 1.27, 0.81, 1.27, 0.84, 1.08, 0.77, 1.11, 35.43, 0.68, 11.78]} \ No newline at end of file diff --git a/annotations_filtered/lRzsGDSofxo_filtered.json b/annotations_filtered/lRzsGDSofxo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b6b78402113ecea201d0651e4292e177f4369ae --- /dev/null +++ b/annotations_filtered/lRzsGDSofxo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 11.62], [12.0, 15.28], [16.0, 21.54], [31.0, 31.19], [32.0, 40.95], [42.0, 42.36], [43.0, 58.31], [62.0, 65.31], [72.0, 104.85], [107.0, 117.8], [120.0, 120.14], [124.0, 125.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [82.25, 65.09, 46.5, 0.0, 48.1, 0.0, 40.41, 54.76, 0.0, 63.64, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 76.64], ["musical instrument", 3.59], ["guitar", 2.93]], null, [["music", 75.7], ["musical instrument", 5.91], ["synthesizer", 4.28]], null, [["music", 72.62], ["speech", 8.86], ["skateboard", 2.3]], null, null, null, null, null], "duration": [6.62, 3.28, 5.54, 0.19, 8.95, 0.36, 15.31, 3.31, 32.85, 10.8, 0.14, 1.42]} \ No newline at end of file diff --git a/annotations_filtered/lS1KFyakAPE_filtered.json b/annotations_filtered/lS1KFyakAPE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ae4edaac7e924f5eb2d9c62c4e6d686890fa5b8 --- /dev/null +++ b/annotations_filtered/lS1KFyakAPE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.21], [20.0, 20.22], [21.0, 21.9], [23.0, 22.87], [23.0, 25.71], [39.0, 38.58], [39.0, 38.62], [40.0, 40.07], [41.0, 42.08], [61.0, 60.89], [62.0, 62.8], [64.0, 67.05], [68.0, 69.58], [72.0, 76.08], [78.0, 79.62], [81.0, 81.26], [85.0, 85.5], [95.0, 95.54], [96.0, 96.74], [100.0, 100.84], [103.0, 103.49], [104.0, 104.87], [109.0, 109.53], [111.0, 112.5]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 40.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.7, 0.0, 32.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 48.75], ["guitar", 9.65], ["musical instrument", 7.64]], null, null, null, null, null, null, [["speech", 83.59], ["beatboxing", 5.76], ["whack, thwack", 1.73]], null, [["speech", 72.6], ["bouncing", 6.54], ["ping", 3.78]], null, null, null, null, null, null, null, null, null, null], "duration": [0.21, 0.22, 0.9, -0.13, 2.71, -0.42, -0.38, 0.07, 1.08, -0.11, 0.8, 3.05, 1.58, 4.08, 1.62, 0.26, 0.5, 0.54, 0.74, 0.84, 0.49, 0.87, 0.53, 1.5]} \ No newline at end of file diff --git a/annotations_filtered/lS9V0oDrPfs_filtered.json b/annotations_filtered/lS9V0oDrPfs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/lS9V0oDrPfs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/lSTkEHpkMf8_filtered.json b/annotations_filtered/lSTkEHpkMf8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b2ad868a0151ec83055d05fa1a9cc7fbe4a8731 --- /dev/null +++ b/annotations_filtered/lSTkEHpkMf8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 12.39], [13.0, 14.45], [15.0, 16.44], [17.0, 18.67], [20.0, 24.6], [25.0, 26.54], [28.0, 30.06], [31.0, 32.59], [36.0, 37.49], [39.0, 41.4], [44.0, 45.67], [47.0, 49.38], [51.0, 53.06], [54.0, 57.01], [58.0, 60.34], [64.0, 65.77], [67.0, 68.94], [70.0, 72.35], [75.0, 76.33], [79.0, 80.45], [82.0, 84.64], [87.0, 88.74], [91.0, 91.81], [95.0, 95.44], [97.0, 100.97], [102.0, 104.33], [105.0, 108.85], [109.0, 117.21], [118.0, 121.44]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [49.04, 0.0, 0.0, 0.0, 39.43, 0.0, 57.09, 0.0, 0.0, 46.19, 0.0, 58.72, 46.79, 45.24, 47.01, 0.0, 0.0, 84.43, 0.0, 0.0, 71.0, 0.0, 0.0, 0.0, 87.19, 86.82, 54.5, 63.74, 53.72], "audiomae_on_audioset": [[["music", 56.38], ["theremin", 8.61], ["musical instrument", 5.29]], null, null, null, [["mains hum", 27.7], ["speech", 26.0], ["hum", 15.36]], null, null, null, null, [["mains hum", 54.89], ["hum", 24.01], ["noise", 5.07]], null, null, [["music", 59.0], ["theremin", 15.06], ["radio", 3.42]], [["mains hum", 32.94], ["speech", 21.54], ["hum", 14.1]], [["whale vocalization", 19.67], ["speech", 13.74], ["music", 12.13]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.39, 1.45, 1.44, 1.67, 4.6, 1.54, 2.06, 1.59, 1.49, 2.4, 1.67, 2.38, 2.06, 3.01, 2.34, 1.77, 1.94, 2.35, 1.33, 1.45, 2.64, 1.74, 0.81, 0.44, 3.97, 2.33, 3.85, 8.21, 3.44]} \ No newline at end of file diff --git a/annotations_filtered/lScMakd7h6w_filtered.json b/annotations_filtered/lScMakd7h6w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f616af182040d0881a9ce8d9bf8f35209e11c4d1 --- /dev/null +++ b/annotations_filtered/lScMakd7h6w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 14.99], [15.0, 19.52], [20.0, 23.21], [24.0, 30.43], [36.0, 41.05], [43.0, 44.49], [46.0, 48.39], [51.0, 52.32], [53.0, 52.52], [53.0, 56.59]], "keep_status": [false, true, false, false, true, false, true, false, false, false], "silence_prob": [51.07, 47.74, 51.55, 50.21, 30.18, 0.0, 30.51, 0.0, 0.0, 35.54], "audiomae_on_audioset": [null, [["speech", 24.68], ["hum", 23.98], ["mains hum", 15.5]], null, null, [["fly, housefly", 17.37], ["music", 15.88], ["didgeridoo", 11.52]], null, [["music", 33.16], ["fly, housefly", 15.73], ["static", 6.86]], null, null, [["speech", 71.07], ["music", 10.16], ["clang", 3.52]]], "duration": [7.99, 4.52, 3.21, 6.43, 5.05, 1.49, 2.39, 1.32, -0.48, 3.59]} \ No newline at end of file diff --git a/annotations_filtered/lSzT54HTpeY_filtered.json b/annotations_filtered/lSzT54HTpeY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1182c485707cc16b47432587d002c798d7782af0 --- /dev/null +++ b/annotations_filtered/lSzT54HTpeY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 129.25]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [126.25]} \ No newline at end of file diff --git a/annotations_filtered/lTWY11J9Z3o_filtered.json b/annotations_filtered/lTWY11J9Z3o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..503a2e8bedf6f616eba6082dbc30f4cc8bc707bf --- /dev/null +++ b/annotations_filtered/lTWY11J9Z3o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.58], [5.0, 4.85], [7.0, 7.48], [14.0, 17.73], [20.0, 26.37], [27.0, 28.41], [29.0, 29.0], [31.0, 31.56], [35.0, 40.68], [46.0, 47.02], [58.0, 58.55], [61.0, 61.42], [63.0, 68.1], [72.0, 72.33], [74.0, 74.9], [78.0, 79.59], [82.0, 86.85], [88.0, 88.42], [91.0, 91.67], [93.0, 93.93], [100.0, 103.47], [105.0, 105.9], [117.0, 117.22], [124.0, 124.24], [125.0, 150.99], [154.0, 157.11], [159.0, 159.06], [159.0, 160.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 94.22, 55.46, 0.0, 0.0, 0.0, 71.87, 0.0, 0.0, 0.0, 65.55, 0.0, 0.0, 0.0, 72.31, 0.0, 0.0, 0.0, 80.11, 0.0, 0.0, 0.0, 35.24, 55.46, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 34.71], ["hum", 14.09], ["mains hum", 11.1]], null, null, null], "duration": [0.58, -0.15, 0.48, 3.73, 6.37, 1.41, 0.0, 0.56, 5.68, 1.02, 0.55, 0.42, 5.1, 0.33, 0.9, 1.59, 4.85, 0.42, 0.67, 0.93, 3.47, 0.9, 0.22, 0.24, 25.99, 3.11, 0.06, 1.27]} \ No newline at end of file diff --git a/annotations_filtered/lTd2m2J2XmU_filtered.json b/annotations_filtered/lTd2m2J2XmU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c0236f4b260c413b7906fe120e895e1567df617 --- /dev/null +++ b/annotations_filtered/lTd2m2J2XmU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.33], [5.0, 10.23], [11.0, 11.7], [16.0, 18.84], [24.0, 23.95], [31.0, 31.45], [33.0, 33.98], [35.0, 36.69], [38.0, 43.88], [47.0, 109.75], [118.0, 130.38]], "keep_status": [false, true, false, true, false, false, false, false, true, false, true], "silence_prob": [0.0, 40.97, 0.0, 43.05, 0.0, 0.0, 0.0, 0.0, 33.07, 0.0, 35.25], "audiomae_on_audioset": [null, [["music", 41.56], ["speech", 10.55], ["synthesizer", 7.65]], null, [["music", 38.44], ["effects unit", 18.06], ["sidetone", 10.71]], null, null, null, null, [["speech", 49.22], ["music", 7.98], ["horse", 4.23]], null, [["hum", 42.91], ["mains hum", 13.24], ["throbbing", 8.77]]], "duration": [0.33, 5.23, 0.7, 2.84, -0.05, 0.45, 0.98, 1.69, 5.88, 62.75, 12.38]} \ No newline at end of file diff --git a/annotations_filtered/lTiCL83_dR4_filtered.json b/annotations_filtered/lTiCL83_dR4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e207062db9467a1a2d9d4b4e3138fe1912114bb --- /dev/null +++ b/annotations_filtered/lTiCL83_dR4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.0], [5.0, 5.59], [7.0, 17.2], [19.0, 19.92], [23.0, 36.9], [38.0, 42.23], [44.0, 44.0], [45.0, 47.73], [49.0, 63.61], [66.0, 66.99], [69.0, 92.16], [98.0, 97.65], [98.0, 98.73], [99.0, 100.63], [110.0, 112.29], [118.0, 124.43], [131.0, 131.57], [134.0, 134.6], [136.0, 140.83], [146.0, 147.24], [148.0, 148.66], [150.0, 150.96], [153.0, 166.95], [170.0, 170.46], [172.0, 173.94]], "keep_status": [false, false, false, false, true, true, false, true, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 39.33, 0.0, 32.74, 31.46, 0.0, 31.8, 33.85, 0.0, 31.49, 0.0, 0.0, 0.0, 99.99, 100.0, 0.0, 0.0, 78.21, 0.0, 0.0, 0.0, 97.73, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 67.09], ["synthesizer", 10.03], ["musical instrument", 4.13]], null, [["music", 16.24], ["hum", 13.09], ["noise", 11.62]], [["noise", 13.94], ["mains hum", 13.54], ["hum", 12.55]], null, [["noise", 26.49], ["synthesizer", 10.0], ["music", 7.95]], [["music", 58.71], ["synthesizer", 5.56], ["hum", 4.99]], null, [["music", 43.75], ["speech", 6.34], ["musical instrument", 6.17]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.0, 0.59, 10.2, 0.92, 13.9, 4.23, 0.0, 2.73, 14.61, 0.99, 23.16, -0.35, 0.73, 1.63, 2.29, 6.43, 0.57, 0.6, 4.83, 1.24, 0.66, 0.96, 13.95, 0.46, 1.94]} \ No newline at end of file diff --git a/annotations_filtered/lUQJN1xzKpc_filtered.json b/annotations_filtered/lUQJN1xzKpc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f2639401b977746761cbffe91540a3d11170b905 --- /dev/null +++ b/annotations_filtered/lUQJN1xzKpc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.03], [4.0, 5.63], [7.0, 9.04], [9.0, 30.48], [31.0, 30.52], [31.0, 31.53], [33.0, 33.45], [34.0, 34.84], [35.0, 35.43], [39.0, 40.1], [42.0, 68.62], [70.0, 74.51], [76.0, 78.11], [79.0, 81.41], [83.0, 88.91], [90.0, 90.32], [91.0, 94.8], [96.0, 97.8], [98.0, 100.74], [101.0, 104.7], [105.0, 134.1], [139.0, 140.17], [141.0, 144.75], [145.0, 152.79], [157.0, 158.06], [158.0, 161.16], [165.0, 168.24], [169.0, 169.72], [170.0, 172.5], [174.0, 176.07], [181.0, 182.22], [185.0, 187.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 89.9, 52.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.36, 71.57, 76.7, 68.15, 92.15, 0.0, 89.72, 0.0, 88.64, 55.04, 34.17, 0.0, 99.62, 79.59, 0.0, 85.9, 90.25, 0.0, 89.01, 79.41, 0.0, 98.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 79.8], ["scary music", 9.55], ["soundtrack music", 1.15]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.03, 1.63, 2.04, 21.48, -0.48, 0.53, 0.45, 0.84, 0.43, 1.1, 26.62, 4.51, 2.11, 2.41, 5.91, 0.32, 3.8, 1.8, 2.74, 3.7, 29.1, 1.17, 3.75, 7.79, 1.06, 3.16, 3.24, 0.72, 2.5, 2.07, 1.22, 2.95]} \ No newline at end of file diff --git a/annotations_filtered/lUglQukweZY_filtered.json b/annotations_filtered/lUglQukweZY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..520220ff88f2e8337f93952badac2da2108f319f --- /dev/null +++ b/annotations_filtered/lUglQukweZY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.54], [36.0, 38.31], [77.0, 77.63], [82.0, 83.67], [89.0, 89.72], [99.0, 112.94], [119.0, 119.08], [145.0, 146.58], [155.0, 155.93], [162.0, 162.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 70.02, 0.0, 0.0, 0.0, 37.42, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 80.32], ["reggae", 2.53], ["funk", 1.63]], null, null, null, null], "duration": [0.54, 2.31, 0.63, 1.67, 0.72, 13.94, 0.08, 1.58, 0.93, 0.06]} \ No newline at end of file diff --git a/annotations_filtered/lV2XAU1JzuI_filtered.json b/annotations_filtered/lV2XAU1JzuI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ea7f32a6a230266fe5bc841d92a8d2bc25bff6d --- /dev/null +++ b/annotations_filtered/lV2XAU1JzuI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.72], [21.0, 22.1], [27.0, 27.14], [35.0, 55.54], [59.0, 59.73], [62.0, 62.38], [64.0, 66.82], [70.0, 73.5], [74.0, 74.61], [75.0, 75.37], [75.0, 75.51], [78.0, 78.53], [81.0, 82.0], [84.0, 86.04], [87.0, 89.56]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 32.5, 0.0, 0.0, 35.26, 32.38, 0.0, 0.0, 0.0, 0.0, 0.0, 37.93, 31.31], "audiomae_on_audioset": [null, null, null, [["music", 30.92], ["trombone", 25.29], ["brass instrument", 24.18]], null, null, [["music", 29.7], ["saxophone", 9.94], ["speech", 7.46]], [["cattle, bovinae", 53.33], ["moo", 36.93], ["livestock, farm animals, working animals", 9.36]], null, null, null, null, null, [["music", 46.73], ["theremin", 4.96], ["hum", 4.77]], [["mantra", 39.25], ["music", 18.2], ["chant", 12.05]]], "duration": [0.72, 1.1, 0.14, 20.54, 0.73, 0.38, 2.82, 3.5, 0.61, 0.37, 0.51, 0.53, 1.0, 2.04, 2.56]} \ No newline at end of file diff --git a/annotations_filtered/lVMviKEztGw_filtered.json b/annotations_filtered/lVMviKEztGw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9e26a0ed8cad36aa92071f2961c58ab6b76c5933 --- /dev/null +++ b/annotations_filtered/lVMviKEztGw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.24], [7.0, 10.88], [12.0, 12.85], [14.0, 16.83], [18.0, 18.84], [20.0, 21.2], [23.0, 27.09], [27.0, 34.59], [36.0, 41.54], [42.0, 43.17], [45.0, 55.07], [56.0, 59.27], [64.0, 65.57], [66.0, 68.59], [70.0, 70.98], [73.0, 73.65], [74.0, 75.54], [81.0, 81.7], [82.0, 86.16], [87.0, 88.65], [90.0, 91.37], [93.0, 94.58], [98.0, 98.83], [100.0, 101.73], [103.0, 103.94], [106.0, 106.39], [109.0, 108.77], [116.0, 117.83], [119.0, 120.72], [122.0, 124.07]], "keep_status": [true, false, false, true, false, false, true, true, true, false, true, true, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [36.2, 33.67, 0.0, 37.74, 0.0, 0.0, 36.15, 37.49, 33.74, 0.0, 39.85, 46.75, 0.0, 40.9, 0.0, 0.0, 0.0, 0.0, 36.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.55], "audiomae_on_audioset": [[["music", 25.06], ["hum", 20.85], ["speech", 11.72]], [["music", 68.99], ["theremin", 6.19], ["whale vocalization", 3.01]], null, [["speech", 26.9], ["civil defense siren", 21.79], ["music", 7.85]], null, null, [["whale vocalization", 27.06], ["music", 19.16], ["theremin", 16.2]], [["speech", 36.56], ["music", 15.31], ["hum", 13.91]], [["mains hum", 31.09], ["hum", 14.63], ["speech", 13.89]], null, [["noise", 37.44], ["music", 19.19], ["speech", 13.01]], [["whale vocalization", 24.51], ["radio", 14.06], ["music", 10.41]], null, [["music", 24.69], ["speech", 19.6], ["sidetone", 7.77]], null, null, null, null, [["whale vocalization", 28.88], ["speech", 19.49], ["music", 17.58]], null, null, null, null, null, null, null, null, null, null, null], "duration": [3.24, 3.88, 0.85, 2.83, 0.84, 1.2, 4.09, 7.59, 5.54, 1.17, 10.07, 3.27, 1.57, 2.59, 0.98, 0.65, 1.54, 0.7, 4.16, 1.65, 1.37, 1.58, 0.83, 1.73, 0.94, 0.39, -0.23, 1.83, 1.72, 2.07]} \ No newline at end of file diff --git a/annotations_filtered/lVSMG8FTnpw_filtered.json b/annotations_filtered/lVSMG8FTnpw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bed8cdcf03b97584287883f774df9e8ab085d8ab --- /dev/null +++ b/annotations_filtered/lVSMG8FTnpw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.11], [12.0, 12.66], [13.0, 20.24], [20.0, 21.14], [21.0, 25.66], [31.0, 36.19], [40.0, 50.89], [51.0, 133.71], [134.0, 133.88], [134.0, 153.82]], "keep_status": [true, false, false, false, false, true, false, false, false, true], "silence_prob": [37.33, 0.0, 42.74, 0.0, 39.38, 31.55, 42.67, 0.0, 0.0, 36.98], "audiomae_on_audioset": [[["music", 50.68], ["ambient music", 10.03], ["scary music", 6.46]], null, [["music", 57.43], ["didgeridoo", 17.68], ["hum", 2.71]], null, [["music", 40.39], ["theremin", 30.15], ["synthesizer", 7.47]], [["music", 50.76], ["theremin", 8.31], ["musical instrument", 3.82]], [["civil defense siren", 61.35], ["siren", 30.46], ["music", 4.02]], null, null, [["music", 49.09], ["theremin", 8.6], ["didgeridoo", 6.23]]], "duration": [2.11, 0.66, 7.24, 1.14, 4.66, 5.19, 10.89, 82.71, -0.12, 19.82]} \ No newline at end of file diff --git a/annotations_filtered/lVg2pm0YdQ0_filtered.json b/annotations_filtered/lVg2pm0YdQ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9d45d38b745b95171bb3fb970d83abfd31b6f31 --- /dev/null +++ b/annotations_filtered/lVg2pm0YdQ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.52], [22.0, 22.05], [42.0, 42.33], [44.0, 44.49], [46.0, 46.72], [51.0, 51.17], [80.0, 79.84], [82.0, 82.07], [86.0, 86.39], [90.0, 90.15], [92.0, 94.56], [95.0, 95.01], [95.0, 95.59], [97.0, 97.82], [98.0, 99.5], [100.0, 100.57], [107.0, 109.14], [110.0, 110.49], [135.0, 135.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.99, 0.0, 0.0, 0.0, 0.0, 0.0, 34.11, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 46.65], ["musical instrument", 23.25], ["guitar", 9.65]], null, null, null, null, null, [["music", 78.03], ["musical instrument", 6.12], ["piano", 2.55]], null, null], "duration": [0.52, 0.05, 0.33, 0.49, 0.72, 0.17, -0.16, 0.07, 0.39, 0.15, 2.56, 0.01, 0.59, 0.82, 1.5, 0.57, 2.14, 0.49, 0.16]} \ No newline at end of file diff --git a/annotations_filtered/lVmwqKY9BX0_filtered.json b/annotations_filtered/lVmwqKY9BX0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..64045924f3226a73cdcf49ec3c480478f58a2686 --- /dev/null +++ b/annotations_filtered/lVmwqKY9BX0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.46], [9.0, 12.75], [14.0, 14.44], [15.0, 19.99], [23.0, 23.11], [26.0, 25.93], [28.0, 27.9], [36.0, 36.02], [37.0, 38.3], [40.0, 39.6], [42.0, 44.93], [45.0, 47.98], [49.0, 49.96], [53.0, 53.62], [70.0, 71.29], [79.0, 79.61], [80.0, 84.82], [86.0, 88.25], [89.0, 90.63], [92.0, 106.81], [108.0, 110.32], [111.0, 114.3], [117.0, 117.51], [120.0, 120.06], [121.0, 124.12], [124.0, 130.28], [131.0, 132.78], [134.0, 134.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [99.9, 99.88, 0.0, 80.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 52.1, 0.0, 0.0, 0.0, 0.0, 35.51, 99.96, 0.0, 92.64, 82.25, 89.36, 0.0, 0.0, 90.43, 47.94, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 30.42], ["hum", 17.51], ["mains hum", 14.88]], null, null, null, null, null, null, null, null, [["speech", 26.77], ["music", 23.94], ["synthesizer", 14.37]], null, null], "duration": [4.46, 3.75, 0.44, 4.99, 0.11, -0.07, -0.1, 0.02, 1.3, -0.4, 2.93, 2.98, 0.96, 0.62, 1.29, 0.61, 4.82, 2.25, 1.63, 14.81, 2.32, 3.3, 0.51, 0.06, 3.12, 6.28, 1.78, 0.69]} \ No newline at end of file diff --git a/annotations_filtered/lVsH8dttw4I_filtered.json b/annotations_filtered/lVsH8dttw4I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3f4bec30ec5d1f41d14d0d0ae84bd8511d923945 --- /dev/null +++ b/annotations_filtered/lVsH8dttw4I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.75], [7.0, 7.79], [12.0, 18.91], [21.0, 22.92], [46.0, 46.97], [51.0, 50.73], [51.0, 52.08], [52.0, 52.84], [53.0, 62.26], [68.0, 68.15], [97.0, 97.58], [100.0, 102.88], [103.0, 103.33], [104.0, 104.8], [110.0, 111.18], [112.0, 112.21], [115.0, 115.82], [117.0, 117.17], [118.0, 118.57], [120.0, 120.33], [123.0, 124.02], [125.0, 125.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 29.93, 0.0, 0.0, 0.0, 0.0, 0.0, 53.78, 0.0, 0.0, 29.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 72.3], ["theremin", 6.07], ["radio", 3.44]], null, null, null, null, null, null, null, null, [["speech", 15.82], ["noise", 14.05], ["boing", 12.4]], null, null, null, null, null, null, null, null, null, null], "duration": [-0.25, 0.79, 6.91, 1.92, 0.97, -0.27, 1.08, 0.84, 9.26, 0.15, 0.58, 2.88, 0.33, 0.8, 1.18, 0.21, 0.82, 0.17, 0.57, 0.33, 1.02, 0.78]} \ No newline at end of file diff --git a/annotations_filtered/lW1vzy6psfE_filtered.json b/annotations_filtered/lW1vzy6psfE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/lW1vzy6psfE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/lW2JBJSaXUI_filtered.json b/annotations_filtered/lW2JBJSaXUI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..79539fa454452382558a7c069fa257aa120e923f --- /dev/null +++ b/annotations_filtered/lW2JBJSaXUI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.54], [10.0, 13.56], [18.0, 18.57], [24.0, 34.97], [39.0, 41.84], [43.0, 43.16], [43.0, 43.95], [44.0, 44.78], [49.0, 56.59], [62.0, 62.29], [65.0, 65.99], [69.0, 70.07], [78.0, 78.98]], "keep_status": [false, true, false, true, true, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 30.1, 0.0, 31.31, 29.45, 0.0, 0.0, 0.0, 31.76, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 10.92], ["groan", 8.81], ["whale vocalization", 7.84]], null, [["speech", 51.13], ["whale vocalization", 8.92], ["music", 4.86]], [["whale vocalization", 48.86], ["speech", 9.14], ["music", 6.45]], null, null, null, [["speech", 25.44], ["foghorn", 19.89], ["music", 13.66]], null, null, null, null], "duration": [0.54, 3.56, 0.57, 10.97, 2.84, 0.16, 0.95, 0.78, 7.59, 0.29, 0.99, 1.07, 0.98]} \ No newline at end of file diff --git a/annotations_filtered/lWZU3pPZWig_filtered.json b/annotations_filtered/lWZU3pPZWig_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4aa6956ceac89d141f7308193ecf11fa2a3005f3 --- /dev/null +++ b/annotations_filtered/lWZU3pPZWig_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.22], [10.0, 15.13], [17.0, 23.58], [30.0, 31.02], [40.0, 41.45], [66.0, 66.51], [73.0, 73.48], [77.0, 77.41], [80.0, 80.82], [82.0, 82.98], [85.0, 85.04], [92.0, 92.45], [96.0, 96.18], [97.0, 97.93], [100.0, 102.79], [111.0, 112.67], [114.0, 114.62], [115.0, 117.54], [120.0, 124.56]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, true], "silence_prob": [0.0, 34.42, 37.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.4, 0.0, 0.0, 40.75, 40.45], "audiomae_on_audioset": [null, [["livestock, farm animals, working animals", 23.5], ["music", 20.51], ["moo", 8.59]], [["music", 44.33], ["whale vocalization", 8.19], ["musical instrument", 4.22]], null, null, null, null, null, null, null, null, null, null, null, [["music", 40.22], ["mains hum", 5.56], ["hum", 5.52]], null, null, [["mains hum", 29.68], ["hum", 24.84], ["speech", 9.55]], [["hum", 25.15], ["throbbing", 21.68], ["music", 20.52]]], "duration": [1.22, 5.13, 6.58, 1.02, 1.45, 0.51, 0.48, 0.41, 0.82, 0.98, 0.04, 0.45, 0.18, 0.93, 2.79, 1.67, 0.62, 2.54, 4.56]} \ No newline at end of file diff --git a/annotations_filtered/lWqHayjaOxo_filtered.json b/annotations_filtered/lWqHayjaOxo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e544687f3571f17f8f92cc42d9eda50c95f138c0 --- /dev/null +++ b/annotations_filtered/lWqHayjaOxo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.94], [17.0, 17.83], [20.0, 20.33], [28.0, 29.79], [34.0, 35.01], [38.0, 42.06], [46.0, 46.16], [47.0, 49.37]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 37.61, 0.0, 92.15], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 89.14], ["telephone", 3.42], ["music", 2.23]], null, null], "duration": [0.94, 0.83, 0.33, 1.79, 1.01, 4.06, 0.16, 2.37]} \ No newline at end of file diff --git a/annotations_filtered/lX4H0NmDMck_filtered.json b/annotations_filtered/lX4H0NmDMck_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a345a9226c6dfd34dfa953ecb16b524054580f9a --- /dev/null +++ b/annotations_filtered/lX4H0NmDMck_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.64], [3.0, 4.94], [5.0, 4.97], [11.0, 10.77], [14.0, 21.24], [32.0, 34.08], [40.0, 53.89], [75.0, 74.85], [79.0, 79.71], [103.0, 110.78], [121.0, 121.81], [127.0, 131.57], [140.0, 148.2], [150.0, 157.77], [167.0, 167.16], [173.0, 173.26], [175.0, 175.14], [176.0, 176.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 29.79, 30.24, 30.28, 0.0, 0.0, 29.69, 0.0, 30.14, 30.03, 29.83, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 70.57], ["house music", 2.24], ["rattle", 1.8]], [["music", 75.01], ["afrobeat", 2.25], ["music of africa", 1.77]], [["music", 81.44], ["carnatic music", 1.82], ["reggae", 1.45]], null, null, [["music", 66.02], ["dubstep", 4.62], ["singing", 4.12]], null, [["music", 52.58], ["reggae", 12.63], ["a capella", 8.16]], [["music", 64.79], ["carnatic music", 9.9], ["musical instrument", 3.59]], [["music", 84.8], ["musical instrument", 2.25], ["carnatic music", 1.58]], null, null, null, null], "duration": [-0.36, 1.94, -0.03, -0.23, 7.24, 2.08, 13.89, -0.15, 0.71, 7.78, 0.81, 4.57, 8.2, 7.77, 0.16, 0.26, 0.14, 0.98]} \ No newline at end of file diff --git a/annotations_filtered/lXS7GWgCBWM_filtered.json b/annotations_filtered/lXS7GWgCBWM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b29dbc23e014a25db8295229d6b2e4f242343890 --- /dev/null +++ b/annotations_filtered/lXS7GWgCBWM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.96], [10.0, 13.44], [15.0, 15.48], [16.0, 22.65], [23.0, 24.71], [28.0, 29.29], [30.0, 30.97], [39.0, 39.04], [41.0, 41.62], [45.0, 46.95], [58.0, 59.51], [62.0, 63.48], [67.0, 67.93], [69.0, 71.31], [74.0, 73.75], [75.0, 75.91], [80.0, 80.57], [81.0, 82.7], [86.0, 86.51], [87.0, 88.43], [89.0, 93.99], [95.0, 151.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.05, 0.0, 60.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.78, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.96, 3.44, 0.48, 6.65, 1.71, 1.29, 0.97, 0.04, 0.62, 1.95, 1.51, 1.48, 0.93, 2.31, -0.25, 0.91, 0.57, 1.7, 0.51, 1.43, 4.99, 56.8]} \ No newline at end of file diff --git a/annotations_filtered/lXtrwkdSkow_filtered.json b/annotations_filtered/lXtrwkdSkow_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e102ccfa18d1410700d4a2ff75c72e97ed055fc6 --- /dev/null +++ b/annotations_filtered/lXtrwkdSkow_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.32], [42.0, 46.21], [54.0, 55.24], [58.0, 59.24], [73.0, 73.08], [96.0, 98.9], [100.0, 100.13], [102.0, 103.13], [109.0, 109.14]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 40.57, 0.0, 0.0, 0.0, 51.02, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 53.96], ["music", 15.48], ["drum machine", 4.18]], null, null, null, null, null, null, null], "duration": [1.32, 4.21, 1.24, 1.24, 0.08, 2.9, 0.13, 1.13, 0.14]} \ No newline at end of file diff --git a/annotations_filtered/lXy9Lp8bu98_filtered.json b/annotations_filtered/lXy9Lp8bu98_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..920ccb8d6e0374bd38594b9661e1c5b41100d6fe --- /dev/null +++ b/annotations_filtered/lXy9Lp8bu98_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.96], [5.0, 7.42], [9.0, 9.39], [11.0, 14.37], [15.0, 14.79], [16.0, 15.82], [29.0, 29.32], [37.0, 37.4], [39.0, 40.17], [41.0, 41.96], [44.0, 44.74], [46.0, 47.98], [49.0, 50.19], [55.0, 55.21], [57.0, 58.21], [76.0, 76.67], [78.0, 78.31], [80.0, 81.03], [91.0, 92.1], [105.0, 106.14], [107.0, 107.4], [113.0, 113.88], [132.0, 134.38], [137.0, 137.54], [142.0, 145.83], [149.0, 154.85], [157.0, 157.3], [158.0, 158.95], [166.0, 167.24], [173.0, 173.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, false, false, false], "silence_prob": [0.0, 93.29, 0.0, 96.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.28, 0.0, 34.64, 29.84, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["vehicle", 32.28], ["speech", 23.15], ["skidding", 14.57]], null, [["moo", 14.6], ["livestock, farm animals, working animals", 11.33], ["cattle, bovinae", 9.37]], [["speech", 14.66], ["tuning fork", 13.49], ["ping", 6.3]], null, null, null, null], "duration": [0.96, 2.42, 0.39, 3.37, -0.21, -0.18, 0.32, 0.4, 1.17, 0.96, 0.74, 1.98, 1.19, 0.21, 1.21, 0.67, 0.31, 1.03, 1.1, 1.14, 0.4, 0.88, 2.38, 0.54, 3.83, 5.85, 0.3, 0.95, 1.24, 0.03]} \ No newline at end of file diff --git a/annotations_filtered/lYCq6x3AHYw_filtered.json b/annotations_filtered/lYCq6x3AHYw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b64fd6ffa6f8cc3747e71bb8792b17441172d98f --- /dev/null +++ b/annotations_filtered/lYCq6x3AHYw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 26.08], [26.0, 55.8], [58.0, 62.5], [63.0, 65.55], [67.0, 72.71], [75.0, 117.1], [120.0, 120.36], [126.0, 129.27], [139.0, 139.78], [141.0, 142.32], [147.0, 147.58], [149.0, 162.26], [163.0, 164.47]], "keep_status": [true, false, true, false, true, false, false, true, false, false, false, true, false], "silence_prob": [32.92, 32.43, 34.44, 35.42, 33.51, 0.0, 0.0, 34.57, 0.0, 0.0, 0.0, 37.89, 0.0], "audiomae_on_audioset": [[["music", 26.98], ["bow-wow", 20.12], ["livestock, farm animals, working animals", 6.77]], [["music", 74.67], ["musical instrument", 1.85], ["speech", 1.79]], [["music", 54.19], ["synthesizer", 5.59], ["speech", 5.28]], [["music", 71.58], ["synthesizer", 4.61], ["drum machine", 3.58]], [["cattle, bovinae", 30.76], ["moo", 23.25], ["music", 15.22]], null, null, [["crushing", 39.79], ["whack, thwack", 23.85], ["boing", 3.6]], null, null, null, [["music", 38.22], ["speech", 15.1], ["hum", 9.24]], null], "duration": [23.08, 29.8, 4.5, 2.55, 5.71, 42.1, 0.36, 3.27, 0.78, 1.32, 0.58, 13.26, 1.47]} \ No newline at end of file diff --git a/annotations_filtered/lYEy4it6m3Y_filtered.json b/annotations_filtered/lYEy4it6m3Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e2484540b254266384f2c1942b5065e823dc9df0 --- /dev/null +++ b/annotations_filtered/lYEy4it6m3Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 27.33], [29.0, 30.03], [30.0, 30.43], [31.0, 31.75], [32.0, 32.12], [32.0, 47.46], [50.0, 50.94], [53.0, 54.45], [57.0, 57.72], [60.0, 63.61], [64.0, 76.2], [78.0, 83.1], [84.0, 92.64], [93.0, 98.51], [100.0, 101.17], [101.0, 102.84]], "keep_status": [false, false, false, false, false, true, false, false, false, true, true, true, false, true, false, false], "silence_prob": [87.55, 0.0, 0.0, 0.0, 0.0, 49.82, 0.0, 0.0, 0.0, 40.31, 37.9, 40.14, 39.99, 38.09, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 33.98], ["hum", 12.85], ["speech", 6.23]], null, null, null, [["music", 53.3], ["musical instrument", 6.21], ["guitar", 3.71]], [["music", 55.31], ["mantra", 8.41], ["electronic music", 3.96]], [["music", 39.57], ["busy signal", 11.51], ["speech", 7.38]], [["music", 42.57], ["mains hum", 15.87], ["hum", 13.37]], [["speech", 28.28], ["noise", 23.55], ["hum", 11.04]], null, null], "duration": [15.33, 1.03, 0.43, 0.75, 0.12, 15.46, 0.94, 1.45, 0.72, 3.61, 12.2, 5.1, 8.64, 5.51, 1.17, 1.84]} \ No newline at end of file diff --git a/annotations_filtered/lYGDkN8xPt8_filtered.json b/annotations_filtered/lYGDkN8xPt8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..329930694eac17d7767a64c7852f6e25d353d139 --- /dev/null +++ b/annotations_filtered/lYGDkN8xPt8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 44.14], [45.0, 44.95], [47.0, 62.46], [64.0, 65.6], [74.0, 74.22], [85.0, 85.35], [88.0, 88.69], [93.0, 93.63], [96.0, 106.56]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [40.77, 0.0, 64.41, 0.0, 0.0, 0.0, 0.0, 0.0, 59.42], "audiomae_on_audioset": [[["music", 72.33], ["musical instrument", 5.32], ["speech", 3.08]], null, null, null, null, null, null, null, null], "duration": [20.14, -0.05, 15.46, 1.6, 0.22, 0.35, 0.69, 0.63, 10.56]} \ No newline at end of file diff --git a/annotations_filtered/lYxVM8oNxRM_filtered.json b/annotations_filtered/lYxVM8oNxRM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d5f0dba04fefc9eb99fc1716793e58b17e242306 --- /dev/null +++ b/annotations_filtered/lYxVM8oNxRM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 26.28], [29.0, 34.28], [36.0, 76.03], [76.0, 87.0], [89.0, 89.85], [91.0, 92.77], [95.0, 98.95], [100.0, 102.64], [104.0, 108.78], [113.0, 114.99], [116.0, 116.73], [119.0, 119.84]], "keep_status": [true, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [32.28, 31.76, 0.0, 44.07, 0.0, 0.0, 70.3, 83.52, 91.98, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 24.55], ["speech", 22.91], ["eruption", 13.98]], [["throbbing", 30.96], ["music", 22.53], ["hum", 11.0]], null, [["music", 23.77], ["throbbing", 22.52], ["hum", 16.11]], null, null, null, null, null, null, null, null], "duration": [3.28, 5.28, 40.03, 11.0, 0.85, 1.77, 3.95, 2.64, 4.78, 1.99, 0.73, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/lZ4ouD3RVKU_filtered.json b/annotations_filtered/lZ4ouD3RVKU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..996061a8996064e40625bc108eb50def9af0cb4f --- /dev/null +++ b/annotations_filtered/lZ4ouD3RVKU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 5.09], [13.0, 14.42], [16.0, 16.38], [21.0, 21.54], [25.0, 25.96], [35.0, 36.68], [40.0, 42.63], [54.0, 54.23], [55.0, 55.9], [58.0, 59.17], [61.0, 61.53], [62.0, 64.77], [66.0, 67.29], [69.0, 71.51], [73.0, 75.56], [77.0, 78.07], [81.0, 85.08], [90.0, 92.58], [94.0, 95.71], [99.0, 99.96], [100.0, 104.84], [106.0, 105.95], [106.0, 126.1], [128.0, 129.49], [130.0, 132.17], [133.0, 140.37], [142.0, 144.15]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [47.2, 0.0, 0.0, 0.0, 0.0, 0.0, 80.11, 0.0, 0.0, 0.0, 0.0, 64.52, 0.0, 89.36, 71.29, 0.0, 59.68, 43.58, 0.0, 0.0, 38.42, 0.0, 45.43, 0.0, 88.64, 50.31, 57.56], "audiomae_on_audioset": [[["hum", 23.33], ["eruption", 16.62], ["noise", 6.8]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["theremin", 70.41], ["music", 24.76], ["musical instrument", 0.45]], null, null, [["theremin", 83.02], ["music", 12.61], ["musical instrument", 0.78]], null, [["theremin", 44.39], ["music", 36.93], ["musical instrument", 2.89]], null, null, null, null], "duration": [5.09, 1.42, 0.38, 0.54, 0.96, 1.68, 2.63, 0.23, 0.9, 1.17, 0.53, 2.77, 1.29, 2.51, 2.56, 1.07, 4.08, 2.58, 1.71, 0.96, 4.84, -0.05, 20.1, 1.49, 2.17, 7.37, 2.15]} \ No newline at end of file diff --git a/annotations_filtered/lZ885HzflVc_filtered.json b/annotations_filtered/lZ885HzflVc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..196ec3b878a99c6253b8277f74ab5575b1bf88e5 --- /dev/null +++ b/annotations_filtered/lZ885HzflVc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.32], [8.0, 8.16], [9.0, 11.06], [13.0, 13.61], [17.0, 16.87], [24.0, 24.27], [28.0, 29.1], [32.0, 33.18], [46.0, 45.76], [52.0, 53.15], [55.0, 55.68], [59.0, 59.14], [60.0, 64.56], [67.0, 67.76], [71.0, 71.59], [76.0, 83.51], [85.0, 85.28], [87.0, 87.98], [93.0, 93.39], [94.0, 94.69], [95.0, 95.69], [97.0, 97.8], [101.0, 101.58], [104.0, 104.41], [106.0, 107.59], [110.0, 111.16], [123.0, 124.43], [126.0, 127.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 53.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.59, 0.0, 0.0, 85.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.32, 0.16, 2.06, 0.61, -0.13, 0.27, 1.1, 1.18, -0.24, 1.15, 0.68, 0.14, 4.56, 0.76, 0.59, 7.51, 0.28, 0.98, 0.39, 0.69, 0.69, 0.8, 0.58, 0.41, 1.59, 1.16, 1.43, 1.57]} \ No newline at end of file diff --git a/annotations_filtered/lZQF83kf-a4_filtered.json b/annotations_filtered/lZQF83kf-a4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..89c86f4fc6bc7c41f19fb107fca1b8f3db691efc --- /dev/null +++ b/annotations_filtered/lZQF83kf-a4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 25.3], [31.0, 31.01], [33.0, 33.57], [34.0, 98.46]], "keep_status": [true, false, false, false], "silence_prob": [41.68, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 55.91], ["fly, housefly", 5.41], ["vehicle", 4.2]], null, null, null], "duration": [19.3, 0.01, 0.57, 64.46]} \ No newline at end of file diff --git a/annotations_filtered/lZ_r2Q0FQ1A_filtered.json b/annotations_filtered/lZ_r2Q0FQ1A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c1614c302e232fbb289441db9ff745873ab2b63a --- /dev/null +++ b/annotations_filtered/lZ_r2Q0FQ1A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 34.94], [35.0, 43.43], [56.0, 77.38], [78.0, 79.2], [80.0, 80.99], [86.0, 86.48], [97.0, 131.04], [133.0, 141.84]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 38.23, 35.1, 0.0, 0.0, 0.0, 0.0, 32.61], "audiomae_on_audioset": [null, [["music", 32.05], ["hum", 31.42], ["ambient music", 15.51]], [["hum", 40.91], ["mains hum", 18.79], ["music", 17.67]], null, null, null, null, [["music", 76.46], ["mantra", 5.09], ["chant", 3.59]]], "duration": [-0.06, 8.43, 21.38, 1.2, 0.99, 0.48, 34.04, 8.84]} \ No newline at end of file diff --git a/annotations_filtered/l_7z4h0soHg_filtered.json b/annotations_filtered/l_7z4h0soHg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/l_7z4h0soHg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/l_a2GN0Ix4o_filtered.json b/annotations_filtered/l_a2GN0Ix4o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2d0165685020f50d2ddee682dc8af69c67ee94d3 --- /dev/null +++ b/annotations_filtered/l_a2GN0Ix4o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.55], [15.0, 14.66], [17.0, 17.05], [20.0, 19.97], [24.0, 24.83], [27.0, 30.16], [31.0, 34.21], [38.0, 38.5], [39.0, 40.02], [44.0, 46.18], [50.0, 50.77], [52.0, 53.28], [59.0, 59.49], [64.0, 64.49], [70.0, 70.26], [71.0, 73.26], [77.0, 79.27], [81.0, 81.28], [88.0, 89.18], [95.0, 95.42], [99.0, 99.74], [102.0, 102.74], [103.0, 103.65], [106.0, 106.56], [107.0, 108.35], [109.0, 110.22], [114.0, 114.62], [117.0, 117.95], [118.0, 118.91], [120.0, 120.83], [124.0, 124.68], [126.0, 126.25]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 55.46, 32.05, 0.0, 0.0, 67.38, 0.0, 0.0, 0.0, 0.0, 0.0, 73.06, 38.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["whale vocalization", 43.6], ["cattle, bovinae", 7.31], ["moo", 5.51]], null, null, null, null, null, null, null, null, null, [["speech", 33.52], ["boing", 24.68], ["music", 7.26]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.55, -0.34, 0.05, -0.03, 0.83, 3.16, 3.21, 0.5, 1.02, 2.18, 0.77, 1.28, 0.49, 0.49, 0.26, 2.26, 2.27, 0.28, 1.18, 0.42, 0.74, 0.74, 0.65, 0.56, 1.35, 1.22, 0.62, 0.95, 0.91, 0.83, 0.68, 0.25]} \ No newline at end of file diff --git a/annotations_filtered/lb6nAmbkk9Y_filtered.json b/annotations_filtered/lb6nAmbkk9Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..20bc857a34dad0428de6902a4c96497271f178f9 --- /dev/null +++ b/annotations_filtered/lb6nAmbkk9Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.56], [4.0, 4.24], [5.0, 5.76], [7.0, 8.92], [9.0, 9.86], [10.0, 10.74], [14.0, 16.34], [23.0, 23.73], [24.0, 25.29], [28.0, 28.26], [46.0, 47.24], [53.0, 54.72], [56.0, 56.03], [59.0, 61.16], [62.0, 63.29], [65.0, 65.18], [73.0, 74.31], [78.0, 78.76], [79.0, 80.65], [83.0, 84.59], [90.0, 91.4], [95.0, 96.9], [98.0, 98.04], [100.0, 102.37], [104.0, 104.46], [125.0, 127.4], [137.0, 139.24], [142.0, 142.86], [144.0, 145.77], [147.0, 147.51], [156.0, 157.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.56, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.56, 0.24, 0.76, 1.92, 0.86, 0.74, 2.34, 0.73, 1.29, 0.26, 1.24, 1.72, 0.03, 2.16, 1.29, 0.18, 1.31, 0.76, 1.65, 1.59, 1.4, 1.9, 0.04, 2.37, 0.46, 2.4, 2.24, 0.86, 1.77, 0.51, 1.23]} \ No newline at end of file diff --git a/annotations_filtered/lbIbVWmpcCg_filtered.json b/annotations_filtered/lbIbVWmpcCg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b4fe40e9b12a41dd4cad6bb190e7af1394e6d3cf --- /dev/null +++ b/annotations_filtered/lbIbVWmpcCg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.05], [13.0, 13.53], [34.0, 34.64], [44.0, 44.79], [46.0, 46.25], [49.0, 49.33], [49.0, 49.37], [53.0, 54.58], [55.0, 54.65], [63.0, 63.58], [78.0, 78.39], [94.0, 95.08], [96.0, 98.96], [111.0, 111.6], [114.0, 114.72], [126.0, 127.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.75, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["bee, wasp, etc.", 46.06], ["fly, housefly", 16.28], ["insect", 10.2]], null, null, null], "duration": [1.05, 0.53, 0.64, 0.79, 0.25, 0.33, 0.37, 1.58, -0.35, 0.58, 0.39, 1.08, 2.96, 0.6, 0.72, 1.72]} \ No newline at end of file diff --git a/annotations_filtered/lbdeAhpIPhE_filtered.json b/annotations_filtered/lbdeAhpIPhE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f244baf00c66736720c1fe5d584a12d33098a272 --- /dev/null +++ b/annotations_filtered/lbdeAhpIPhE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.29], [18.0, 19.23], [24.0, 26.13], [28.0, 28.48], [32.0, 32.22], [33.0, 33.86], [36.0, 37.07], [40.0, 40.41], [42.0, 48.49], [51.0, 51.04], [54.0, 55.24], [57.0, 57.13], [61.0, 61.33], [62.0, 62.34], [64.0, 65.82], [66.0, 72.28], [73.0, 77.7], [81.0, 82.04], [84.0, 84.27], [85.0, 89.4], [90.0, 92.3], [94.0, 94.53], [96.0, 97.65], [99.0, 98.95], [99.0, 99.5], [100.0, 103.81], [104.0, 106.37], [108.0, 125.64], [128.0, 130.6], [136.0, 136.88], [137.0, 138.52], [140.0, 142.43], [145.0, 144.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 40.12, 0.0, 0.0, 0.0, 0.0, 0.0, 32.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.91, 41.52, 0.0, 0.0, 35.11, 32.33, 0.0, 0.0, 0.0, 0.0, 36.18, 32.82, 31.58, 56.4, 0.0, 0.0, 39.72, 0.0], "audiomae_on_audioset": [null, null, [["music", 71.0], ["thunk", 3.5], ["drum", 2.98]], null, null, null, null, null, [["music", 85.16], ["speech", 3.45], ["electronic music", 0.8]], null, null, null, null, null, null, [["music", 37.71], ["boing", 25.64], ["speech", 10.64]], [["music", 54.15], ["speech", 16.68], ["synthesizer", 4.33]], null, null, [["music", 62.5], ["noise", 3.6], ["speech", 2.95]], [["music", 41.41], ["trombone", 16.7], ["didgeridoo", 16.24]], null, null, null, null, [["music", 59.55], ["theremin", 8.15], ["musical instrument", 5.08]], [["music", 53.0], ["didgeridoo", 33.09], ["musical instrument", 2.84]], [["music", 64.51], ["buzz", 4.13], ["sheep", 3.91]], null, null, null, [["music", 44.49], ["animal", 9.76], ["ice cream truck, ice cream van", 5.58]], null], "duration": [0.29, 1.23, 2.13, 0.48, 0.22, 0.86, 1.07, 0.41, 6.49, 0.04, 1.24, 0.13, 0.33, 0.34, 1.82, 6.28, 4.7, 1.04, 0.27, 4.4, 2.3, 0.53, 1.65, -0.05, 0.5, 3.81, 2.37, 17.64, 2.6, 0.88, 1.52, 2.43, -0.05]} \ No newline at end of file diff --git a/annotations_filtered/lbiymQJsC8M_filtered.json b/annotations_filtered/lbiymQJsC8M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..61e46e3af109536bc3e5260a684af6a5132831f5 --- /dev/null +++ b/annotations_filtered/lbiymQJsC8M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.05], [8.0, 14.3], [15.0, 22.0], [22.0, 24.98], [27.0, 27.65], [28.0, 30.72], [33.0, 33.42], [44.0, 43.8], [50.0, 51.27], [56.0, 58.01], [59.0, 60.25], [63.0, 63.83], [66.0, 68.35], [69.0, 70.61]], "keep_status": [false, false, true, true, false, false, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 32.95, 31.99, 30.95, 0.0, 30.27, 0.0, 0.0, 0.0, 36.99, 0.0, 0.0, 46.83, 0.0], "audiomae_on_audioset": [null, [["electric shaver, electric razor", 49.45], ["speech", 25.81], ["mains hum", 8.01]], [["speech", 23.16], ["sidetone", 19.64], ["electric shaver, electric razor", 12.21]], [["livestock, farm animals, working animals", 22.22], ["fly, housefly", 13.31], ["moo", 12.8]], null, [["moo", 45.69], ["livestock, farm animals, working animals", 29.35], ["cattle, bovinae", 22.32]], null, null, null, [["speech", 39.01], ["music", 5.0], ["inside, small room", 4.83]], null, null, [["whale vocalization", 30.31], ["music", 10.42], ["echo", 4.99]], null], "duration": [1.05, 6.3, 7.0, 2.98, 0.65, 2.72, 0.42, -0.2, 1.27, 2.01, 1.25, 0.83, 2.35, 1.61]} \ No newline at end of file diff --git a/annotations_filtered/lbqDuUjm4aU_filtered.json b/annotations_filtered/lbqDuUjm4aU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4aa8a53316378b2443b96cc74723015af9621e1b --- /dev/null +++ b/annotations_filtered/lbqDuUjm4aU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.75], [7.0, 8.99], [12.0, 13.9], [18.0, 20.41], [23.0, 23.85], [27.0, 27.89], [30.0, 31.19], [33.0, 35.24], [37.0, 38.75], [42.0, 42.26], [45.0, 46.67], [49.0, 51.21], [58.0, 58.51], [61.0, 61.42], [62.0, 63.44], [70.0, 71.32], [73.0, 74.71], [80.0, 80.82], [83.0, 84.59], [90.0, 91.37], [93.0, 93.45], [97.0, 97.12], [115.0, 120.04], [121.0, 122.67], [123.0, 125.51], [126.0, 127.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.19, 0.0, 56.78, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.75, 1.99, 1.9, 2.41, 0.85, 0.89, 1.19, 2.24, 1.75, 0.26, 1.67, 2.21, 0.51, 0.42, 1.44, 1.32, 1.71, 0.82, 1.59, 1.37, 0.45, 0.12, 5.04, 1.67, 2.51, 1.65]} \ No newline at end of file diff --git a/annotations_filtered/lc0UIhNuudQ_filtered.json b/annotations_filtered/lc0UIhNuudQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d78f06653dd70904aa4d5f037f444931ed970d0 --- /dev/null +++ b/annotations_filtered/lc0UIhNuudQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.71], [9.0, 9.93], [13.0, 14.45], [16.0, 15.77], [17.0, 19.41], [24.0, 34.89], [35.0, 36.63], [41.0, 43.87], [45.0, 46.45], [47.0, 48.88], [50.0, 51.16], [54.0, 53.67], [59.0, 59.31], [74.0, 87.03], [88.0, 89.83], [92.0, 92.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [53.34, 0.0, 0.0, 0.0, 53.53, 64.07, 0.0, 65.55, 0.0, 0.0, 0.0, 0.0, 0.0, 30.16, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 47.65], ["speech", 17.84], ["didgeridoo", 16.78]], null, null], "duration": [4.71, 0.93, 1.45, -0.23, 2.41, 10.89, 1.63, 2.87, 1.45, 1.88, 1.16, -0.33, 0.31, 13.03, 1.83, 0.04]} \ No newline at end of file diff --git a/annotations_filtered/lcIuJs1vHrg_filtered.json b/annotations_filtered/lcIuJs1vHrg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d41b2f5bd0c7fb7446e0829b74ae3e9aa19e1bbf --- /dev/null +++ b/annotations_filtered/lcIuJs1vHrg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.47], [3.0, 3.54], [4.0, 5.04], [8.0, 7.62], [8.0, 13.04], [14.0, 16.88], [19.0, 20.28], [20.0, 38.04], [38.0, 38.84], [41.0, 45.98], [47.0, 48.93], [49.0, 50.16], [56.0, 74.09], [74.0, 74.75], [75.0, 75.78], [80.0, 80.25], [81.0, 84.43], [87.0, 109.44], [120.0, 138.37], [141.0, 141.56], [143.0, 144.56], [147.0, 169.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 98.19, 0.0, 98.86, 0.0, 0.0, 98.93, 0.0, 0.0, 0.0, 99.31, 79.76, 97.54, 0.0, 0.0, 58.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.47, 0.54, 1.04, -0.38, 5.04, 2.88, 1.28, 18.04, 0.84, 4.98, 1.93, 1.16, 18.09, 0.75, 0.78, 0.25, 3.43, 22.44, 18.37, 0.56, 1.56, 22.13]} \ No newline at end of file diff --git a/annotations_filtered/ld9ehvuVu-8_filtered.json b/annotations_filtered/ld9ehvuVu-8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..25cb4160d828e51a1de8fe4ebddc6f3bdea81829 --- /dev/null +++ b/annotations_filtered/ld9ehvuVu-8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.23], [12.0, 12.34], [15.0, 15.74], [16.0, 16.8], [18.0, 17.98], [18.0, 18.01], [19.0, 20.93], [23.0, 23.8], [26.0, 26.45], [33.0, 33.67], [36.0, 36.56], [38.0, 37.98], [42.0, 43.23], [55.0, 56.42], [70.0, 71.32], [71.0, 71.79], [78.0, 80.08], [81.0, 82.31], [84.0, 84.62], [87.0, 87.74], [90.0, 90.9], [91.0, 92.21], [95.0, 95.27], [95.0, 95.4], [96.0, 98.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.53], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.23, 0.34, 0.74, 0.8, -0.02, 0.01, 1.93, 0.8, 0.45, 0.67, 0.56, -0.02, 1.23, 1.42, 1.32, 0.79, 2.08, 1.31, 0.62, 0.74, 0.9, 1.21, 0.27, 0.4, 2.2]} \ No newline at end of file diff --git a/annotations_filtered/le6AAhqa_8U_filtered.json b/annotations_filtered/le6AAhqa_8U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..16a2997c636889d1b5f95dc326835774161bce8c --- /dev/null +++ b/annotations_filtered/le6AAhqa_8U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.85], [3.0, 3.1], [8.0, 8.04], [9.0, 9.9], [16.0, 16.51], [17.0, 18.01], [18.0, 19.26], [22.0, 22.91], [25.0, 25.35], [26.0, 26.7], [31.0, 31.53], [33.0, 34.05], [37.0, 37.54], [39.0, 39.93], [45.0, 45.06], [49.0, 49.64], [51.0, 51.31], [61.0, 61.1], [64.0, 64.27], [68.0, 68.52], [71.0, 71.93], [75.0, 76.81], [78.0, 79.41], [80.0, 82.65], [85.0, 85.35], [89.0, 89.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.84, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.15, 0.1, 0.04, 0.9, 0.51, 1.01, 1.26, 0.91, 0.35, 0.7, 0.53, 1.05, 0.54, 0.93, 0.06, 0.64, 0.31, 0.1, 0.27, 0.52, 0.93, 1.81, 1.41, 2.65, 0.35, 0.99]} \ No newline at end of file diff --git a/annotations_filtered/leQiIU7fzPs_filtered.json b/annotations_filtered/leQiIU7fzPs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7c7de4f1ee9487cd25d528d0ed2210204664dc05 --- /dev/null +++ b/annotations_filtered/leQiIU7fzPs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 30.97], [34.0, 43.26]], "keep_status": [true, true], "silence_prob": [32.7, 31.15], "audiomae_on_audioset": [[["music", 18.66], ["vehicle", 11.45], ["outside, rural or natural", 4.32]], [["music", 31.21], ["breaking", 16.8], ["brass instrument", 5.49]]], "duration": [12.97, 9.26]} \ No newline at end of file diff --git a/annotations_filtered/leSpIIaEblk_filtered.json b/annotations_filtered/leSpIIaEblk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..648b4539942f96866db262885c00adaf12822ef7 --- /dev/null +++ b/annotations_filtered/leSpIIaEblk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 16.01], [19.0, 41.17], [45.0, 81.01], [82.0, 82.56], [87.0, 97.24], [100.0, 102.19], [103.0, 127.18]], "keep_status": [false, false, false, false, false, false, true], "silence_prob": [29.92, 29.69, 0.0, 0.0, 31.04, 30.62, 39.52], "audiomae_on_audioset": [[["music", 42.55], ["sidetone", 28.89], ["throbbing", 6.1]], [["music", 63.48], ["throbbing", 22.71], ["hum", 3.52]], null, null, [["throbbing", 30.08], ["music", 24.51], ["speech", 22.82]], [["music", 46.12], ["breaking", 20.6], ["boom", 6.48]], [["music", 45.8], ["throbbing", 14.93], ["electronic music", 6.43]]], "duration": [4.01, 22.17, 36.01, 0.56, 10.24, 2.19, 24.18]} \ No newline at end of file diff --git a/annotations_filtered/lf3MqrE07I4_filtered.json b/annotations_filtered/lf3MqrE07I4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8054a445f97b117a894c145f9edfeb131f3fd5d9 --- /dev/null +++ b/annotations_filtered/lf3MqrE07I4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 38.75], [41.0, 107.38], [110.0, 110.46], [119.0, 119.31], [124.0, 127.75], [129.0, 133.03], [135.0, 137.02], [138.0, 139.72], [142.0, 152.44], [153.0, 172.12], [172.0, 174.99], [177.0, 177.48]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [31.85, 0.0, 0.0, 0.0, 91.98, 96.66, 99.62, 0.0, 36.15, 31.72, 42.62, 0.0], "audiomae_on_audioset": [[["music", 48.29], ["synthesizer", 15.98], ["throbbing", 10.64]], null, null, null, null, null, null, null, [["music", 60.02], ["sound effect", 4.77], ["synthesizer", 3.59]], [["music", 60.42], ["buzz", 10.6], ["sound effect", 3.64]], [["sine wave", 24.84], ["beep, bleep", 16.75], ["music", 12.15]], null], "duration": [21.75, 66.38, 0.46, 0.31, 3.75, 4.03, 2.02, 1.72, 10.44, 19.12, 2.99, 0.48]} \ No newline at end of file diff --git a/annotations_filtered/lfJ7WzyoZH8_filtered.json b/annotations_filtered/lfJ7WzyoZH8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c9002b49fe6a2a5ba71c94a02ce059c55e2eb6c6 --- /dev/null +++ b/annotations_filtered/lfJ7WzyoZH8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 13.29]], "keep_status": [false], "silence_prob": [38.68], "audiomae_on_audioset": [[["music", 58.49], ["musical instrument", 8.84], ["didgeridoo", 5.99]]], "duration": [4.29]} \ No newline at end of file diff --git a/annotations_filtered/lfKcANi5Zrk_filtered.json b/annotations_filtered/lfKcANi5Zrk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c990a1e6aca30e56ecf2b5a9c32c1e101cb06875 --- /dev/null +++ b/annotations_filtered/lfKcANi5Zrk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.31], [13.0, 13.29], [14.0, 14.27], [14.0, 20.17], [22.0, 23.38], [24.0, 25.19], [30.0, 30.82], [32.0, 34.74], [36.0, 36.42], [37.0, 38.72], [40.0, 41.37], [43.0, 44.02], [45.0, 46.67], [47.0, 49.38], [50.0, 52.24], [54.0, 60.45], [62.0, 63.1], [65.0, 66.34], [67.0, 68.94], [70.0, 71.47], [73.0, 78.38], [80.0, 80.23], [82.0, 86.39], [89.0, 89.7], [91.0, 96.21], [99.0, 99.67], [104.0, 106.25], [109.0, 113.48], [115.0, 115.26], [122.0, 122.99], [125.0, 128.7], [129.0, 128.76], [129.0, 129.15], [129.0, 132.75], [133.0, 133.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 88.46, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.76, 99.1, 100.0, 0.0, 0.0, 0.0, 0.0, 52.27, 0.0, 69.34, 0.0, 79.76, 0.0, 100.0, 97.33, 0.0, 0.0, 89.54, 0.0, 0.0, 68.15, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.31, 0.29, 0.27, 6.17, 1.38, 1.19, 0.82, 2.74, 0.42, 1.72, 1.37, 1.02, 1.67, 2.38, 2.24, 6.45, 1.1, 1.34, 1.94, 1.47, 5.38, 0.23, 4.39, 0.7, 5.21, 0.67, 2.25, 4.48, 0.26, 0.99, 3.7, -0.24, 0.15, 3.75, 0.83]} \ No newline at end of file diff --git a/annotations_filtered/lfObLA5H4Rg_filtered.json b/annotations_filtered/lfObLA5H4Rg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4b1be62eae7a5c8ae8d5aac69ac54ccf880096de --- /dev/null +++ b/annotations_filtered/lfObLA5H4Rg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.33], [5.0, 43.63], [44.0, 45.55], [52.0, 54.18], [55.0, 146.01], [147.0, 148.0]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 33.53, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 56.33], ["mains hum", 9.22], ["hum", 7.71]], null, null], "duration": [0.33, 38.63, 1.55, 2.18, 91.01, 1.0]} \ No newline at end of file diff --git a/annotations_filtered/lfUlATBIer8_filtered.json b/annotations_filtered/lfUlATBIer8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..869e16fad0aba3a7730a8fb89e907dc402ffca62 --- /dev/null +++ b/annotations_filtered/lfUlATBIer8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 27.28], [29.0, 30.55], [34.0, 36.05], [39.0, 43.44], [47.0, 49.55], [51.0, 52.08], [52.0, 56.17], [63.0, 62.94], [68.0, 70.5], [72.0, 72.57], [90.0, 90.1], [121.0, 121.85], [125.0, 125.02], [126.0, 126.71]], "keep_status": [false, false, true, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [37.35, 0.0, 40.9, 32.24, 33.16, 0.0, 39.12, 0.0, 68.93, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 64.49], ["synthesizer", 9.82], ["throbbing", 4.34]], null, [["hum", 25.98], ["music", 24.98], ["mains hum", 14.48]], [["music", 41.23], ["throbbing", 18.37], ["hum", 17.23]], [["music", 83.6], ["video game music", 1.88], ["soundtrack music", 1.09]], null, [["music", 50.98], ["speech", 11.12], ["musical instrument", 4.93]], null, null, null, null, null, null, null], "duration": [24.28, 1.55, 2.05, 4.44, 2.55, 1.08, 4.17, -0.06, 2.5, 0.57, 0.1, 0.85, 0.02, 0.71]} \ No newline at end of file diff --git a/annotations_filtered/lfXtePMdNMk_filtered.json b/annotations_filtered/lfXtePMdNMk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..08f89c090ae332d62f4fa65e4736cae572861409 --- /dev/null +++ b/annotations_filtered/lfXtePMdNMk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 33.02], [33.0, 78.92], [81.0, 108.72], [110.0, 110.42], [111.0, 111.43], [112.0, 112.83], [114.0, 124.95]], "keep_status": [false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 31.05, 0.0, 0.0, 0.0, 37.43], "audiomae_on_audioset": [null, null, [["music", 50.77], ["speech", 19.81], ["musical instrument", 2.84]], null, null, null, [["speech", 42.5], ["hum", 13.12], ["breaking", 7.86]]], "duration": [1.02, 45.92, 27.72, 0.42, 0.43, 0.83, 10.95]} \ No newline at end of file diff --git a/annotations_filtered/lfeYgfKa2cY_filtered.json b/annotations_filtered/lfeYgfKa2cY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/lfeYgfKa2cY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/lfrC_mA6o8o_filtered.json b/annotations_filtered/lfrC_mA6o8o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b952da18e8fd53c5eb8ff3d3831bea544e70dd3 --- /dev/null +++ b/annotations_filtered/lfrC_mA6o8o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 9.07], [15.0, 16.38], [24.0, 24.44], [25.0, 25.14], [31.0, 31.33], [36.0, 36.68], [37.0, 37.67], [42.0, 42.6], [53.0, 53.05], [78.0, 78.44], [92.0, 97.87], [115.0, 116.75], [120.0, 126.76], [138.0, 148.74], [150.0, 160.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, true, true, true], "silence_prob": [89.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.93, 0.0, 38.2, 34.56, 37.44], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 22.06], ["cowbell", 20.49], ["moo", 14.37]], null, [["speech", 57.05], ["music", 6.08], ["fart", 4.89]], [["speech", 42.34], ["boing", 10.79], ["radio", 6.24]], [["speech", 25.02], ["moo", 5.34], ["cattle, bovinae", 4.76]]], "duration": [8.07, 1.38, 0.44, 0.14, 0.33, 0.68, 0.67, 0.6, 0.05, 0.44, 5.87, 1.75, 6.76, 10.74, 10.37]} \ No newline at end of file diff --git a/annotations_filtered/lgRkMyW_J5U_filtered.json b/annotations_filtered/lgRkMyW_J5U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..658d8fdbf5f73bef2b5de63d53989e2b09670f03 --- /dev/null +++ b/annotations_filtered/lgRkMyW_J5U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.79], [7.0, 11.33], [18.0, 22.08], [27.0, 29.39], [33.0, 33.03], [35.0, 36.61], [38.0, 40.09], [42.0, 43.92], [47.0, 47.68], [56.0, 56.79], [60.0, 60.84], [73.0, 75.44], [82.0, 93.5], [94.0, 95.35], [97.0, 98.74], [102.0, 105.87], [106.0, 107.67], [111.0, 114.99], [116.0, 116.77]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 40.09, 78.38, 57.32, 0.0, 0.0, 47.01, 0.0, 0.0, 0.0, 0.0, 41.6, 32.75, 0.0, 0.0, 32.58, 0.0, 35.84, 0.0], "audiomae_on_audioset": [null, [["music", 26.39], ["humming", 10.41], ["effects unit", 6.75]], null, null, null, null, [["music", 61.36], ["mantra", 12.78], ["carnatic music", 3.17]], null, null, null, null, [["music", 50.55], ["theremin", 24.99], ["musical instrument", 2.93]], [["music", 77.31], ["throbbing", 2.46], ["electronic music", 2.32]], null, null, [["music", 72.41], ["didgeridoo", 4.03], ["electronic music", 1.7]], null, [["mantra", 32.51], ["music", 30.24], ["chant", 9.76]], null], "duration": [-0.21, 4.33, 4.08, 2.39, 0.03, 1.61, 2.09, 1.92, 0.68, 0.79, 0.84, 2.44, 11.5, 1.35, 1.74, 3.87, 1.67, 3.99, 0.77]} \ No newline at end of file diff --git a/annotations_filtered/lh3qxTgaa1Y_filtered.json b/annotations_filtered/lh3qxTgaa1Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b189efe57b5779d438c392c53f6f492aeba0ea12 --- /dev/null +++ b/annotations_filtered/lh3qxTgaa1Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.75], [8.0, 25.98], [27.0, 27.89], [31.0, 30.86], [32.0, 33.32], [40.0, 40.1], [40.0, 40.98], [41.0, 42.43], [46.0, 49.2], [51.0, 52.03], [55.0, 55.17], [56.0, 57.23], [58.0, 58.65], [60.0, 64.25], [68.0, 69.06], [71.0, 72.15], [75.0, 74.93], [81.0, 82.59], [83.0, 83.88], [87.0, 87.07], [91.0, 95.47], [96.0, 96.31], [98.0, 98.47], [99.0, 107.0], [114.0, 119.23], [120.0, 120.19], [123.0, 124.44], [125.0, 125.52], [130.0, 130.64], [132.0, 142.45]], "keep_status": [false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 44.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.74, 0.0, 0.0, 0.0, 0.0, 41.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.72, 0.0, 0.0, 33.17, 31.95, 0.0, 0.0, 0.0, 0.0, 30.02], "audiomae_on_audioset": [null, [["speech", 36.49], ["music", 24.18], ["radio", 9.01]], null, null, null, null, null, null, [["fart", 24.07], ["music", 13.99], ["beatboxing", 3.44]], null, null, null, null, [["music", 69.31], ["musical instrument", 5.88], ["synthesizer", 3.39]], null, null, null, null, null, null, [["music", 62.0], ["musical instrument", 5.17], ["synthesizer", 4.15]], null, null, [["didgeridoo", 38.52], ["music", 31.33], ["theremin", 8.17]], [["music", 41.21], ["didgeridoo", 17.49], ["theremin", 11.82]], null, null, null, null, [["music", 46.4], ["groan", 8.99], ["echo", 5.69]]], "duration": [0.75, 17.98, 0.89, -0.14, 1.32, 0.1, 0.98, 1.43, 3.2, 1.03, 0.17, 1.23, 0.65, 4.25, 1.06, 1.15, -0.07, 1.59, 0.88, 0.07, 4.47, 0.31, 0.47, 8.0, 5.23, 0.19, 1.44, 0.52, 0.64, 10.45]} \ No newline at end of file diff --git a/annotations_filtered/lh5IiK9eQhA_filtered.json b/annotations_filtered/lh5IiK9eQhA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..106a57553fbbc3b3430826e1055aba0cd48c2d97 --- /dev/null +++ b/annotations_filtered/lh5IiK9eQhA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.01], [19.0, 30.89], [34.0, 33.81], [38.0, 45.69], [47.0, 50.58], [55.0, 59.43], [61.0, 61.75], [62.0, 63.27], [65.0, 73.13], [74.0, 77.68], [80.0, 81.16], [86.0, 89.4], [92.0, 93.04], [95.0, 105.17], [106.0, 107.13], [108.0, 119.77], [122.0, 124.48]], "keep_status": [false, true, false, true, true, true, false, false, true, true, false, true, false, true, false, false, true], "silence_prob": [0.0, 29.91, 0.0, 30.14, 29.87, 30.57, 0.0, 0.0, 29.95, 29.87, 0.0, 30.08, 0.0, 29.64, 0.0, 29.84, 30.6], "audiomae_on_audioset": [null, [["music", 56.88], ["throbbing", 7.79], ["speech", 4.92]], null, [["music", 60.22], ["electronic music", 4.03], ["cacophony", 3.88]], [["music", 56.94], ["electronic music", 9.51], ["throbbing", 3.36]], [["speech", 28.5], ["music", 10.41], ["rumble", 5.85]], null, null, [["vehicle", 19.85], ["music", 17.45], ["car", 16.87]], [["speech", 46.34], ["music", 8.17], ["sound effect", 7.91]], null, [["whale vocalization", 47.55], ["cattle, bovinae", 11.31], ["livestock, farm animals, working animals", 10.41]], null, [["music", 46.63], ["didgeridoo", 7.7], ["electronic music", 5.88]], null, [["music", 45.26], ["throbbing", 22.28], ["hum", 8.01]], [["car", 21.69], ["music", 15.7], ["vehicle", 15.26]]], "duration": [0.01, 11.89, -0.19, 7.69, 3.58, 4.43, 0.75, 1.27, 8.13, 3.68, 1.16, 3.4, 1.04, 10.17, 1.13, 11.77, 2.48]} \ No newline at end of file diff --git a/annotations_filtered/lh6Y9EU0wPQ_filtered.json b/annotations_filtered/lh6Y9EU0wPQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8c7eac1fedb0a8406df073511ee37ce31487ba44 --- /dev/null +++ b/annotations_filtered/lh6Y9EU0wPQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.72], [10.0, 11.04], [12.0, 13.81], [15.0, 21.14], [22.0, 23.97], [25.0, 26.2], [27.0, 30.35], [34.0, 34.86], [36.0, 40.8], [43.0, 43.24], [44.0, 55.68], [56.0, 56.83], [58.0, 58.14], [60.0, 64.42], [65.0, 67.29], [69.0, 70.04], [72.0, 73.21], [75.0, 77.79], [78.0, 79.07], [80.0, 85.6], [92.0, 91.86], [93.0, 97.07], [97.0, 98.88], [100.0, 105.98]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [94.07, 0.0, 0.0, 86.27, 0.0, 0.0, 58.64, 0.0, 34.28, 0.0, 43.56, 0.0, 0.0, 50.11, 67.89, 0.0, 0.0, 37.71, 0.0, 48.39, 0.0, 40.11, 0.0, 49.09], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 26.81], ["mosquito", 14.78], ["animal", 11.86]], null, [["speech", 23.49], ["music", 16.93], ["electric shaver, electric razor", 12.56]], null, null, null, null, null, null, [["music", 77.86], ["piano", 3.72], ["keyboard (musical)", 2.43]], null, [["music", 35.14], ["guitar", 9.78], ["effects unit", 7.87]], null, [["speech", 38.85], ["music", 9.75], ["musical instrument", 2.9]], null, [["music", 44.76], ["speech", 20.83], ["musical instrument", 7.76]]], "duration": [2.72, 1.04, 1.81, 6.14, 1.97, 1.2, 3.35, 0.86, 4.8, 0.24, 11.68, 0.83, 0.14, 4.42, 2.29, 1.04, 1.21, 2.79, 1.07, 5.6, -0.14, 4.07, 1.88, 5.98]} \ No newline at end of file diff --git a/annotations_filtered/lh9z3hPGqgM_filtered.json b/annotations_filtered/lh9z3hPGqgM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d715030ddfb9f4b04704f647f203a1ef53f8a355 --- /dev/null +++ b/annotations_filtered/lh9z3hPGqgM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[61.0, 64.77], [68.0, 69.25], [72.0, 72.17], [77.0, 78.38], [80.0, 83.12], [84.0, 128.76]], "keep_status": [false, false, false, false, false, false], "silence_prob": [51.44, 0.0, 0.0, 0.0, 74.44, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [3.77, 1.25, 0.17, 1.38, 3.12, 44.76]} \ No newline at end of file diff --git a/annotations_filtered/lhAQ43EIZ-g_filtered.json b/annotations_filtered/lhAQ43EIZ-g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ee09cd2eb45eacf5975815b2a9dd61dacca93a4 --- /dev/null +++ b/annotations_filtered/lhAQ43EIZ-g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.48], [5.0, 5.93], [10.0, 19.25], [19.0, 65.26], [68.0, 82.16], [85.0, 98.69], [101.0, 106.51], [111.0, 111.43], [112.0, 116.04], [117.0, 119.45], [120.0, 121.53], [124.0, 125.51], [126.0, 129.69], [130.0, 130.32], [135.0, 136.32], [138.0, 148.26], [151.0, 150.96], [152.0, 154.65], [155.0, 156.09], [160.0, 160.02], [160.0, 162.87], [163.0, 163.76], [164.0, 164.44], [164.0, 164.57], [165.0, 165.11], [175.0, 175.64], [177.0, 177.94], [179.0, 181.13], [184.0, 187.19], [196.0, 223.4], [227.0, 227.38], [229.0, 230.18]], "keep_status": [false, false, true, false, true, false, true, false, true, true, false, false, true, false, false, true, false, true, false, false, true, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 30.72, 0.0, 29.64, 31.08, 32.43, 0.0, 43.45, 41.64, 0.0, 0.0, 37.41, 0.0, 0.0, 30.65, 0.0, 36.35, 0.0, 0.0, 37.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.05, 32.1, 38.16, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 47.24], ["groan", 9.47], ["hum", 5.85]], null, [["music", 52.21], ["cacophony", 4.27], ["smash, crash", 3.25]], [["music", 52.59], ["didgeridoo", 13.37], ["throbbing", 4.37]], [["music", 40.5], ["throbbing", 8.44], ["hum", 4.72]], null, [["music", 54.84], ["speech", 6.96], ["synthesizer", 6.65]], [["music", 33.93], ["speech", 29.31], ["foghorn", 6.08]], null, null, [["speech", 49.17], ["music", 14.87], ["crow", 4.57]], null, null, [["music", 27.01], ["speech", 20.16], ["didgeridoo", 14.49]], null, [["fly, housefly", 29.05], ["speech", 16.79], ["insect", 15.02]], null, null, [["whale vocalization", 29.17], ["mains hum", 7.14], ["animal", 6.05]], null, null, null, null, null, null, [["fly, housefly", 14.55], ["whale vocalization", 7.61], ["hum", 5.98]], [["livestock, farm animals, working animals", 15.16], ["cattle, bovinae", 12.73], ["music", 11.31]], [["music", 60.18], ["speech", 22.27], ["musical instrument", 1.9]], null, null], "duration": [0.48, 0.93, 9.25, 46.26, 14.16, 13.69, 5.51, 0.43, 4.04, 2.45, 1.53, 1.51, 3.69, 0.32, 1.32, 10.26, -0.04, 2.65, 1.09, 0.02, 2.87, 0.76, 0.44, 0.57, 0.11, 0.64, 0.94, 2.13, 3.19, 27.4, 0.38, 1.18]} \ No newline at end of file diff --git a/annotations_filtered/lhGtoYnSdl8_filtered.json b/annotations_filtered/lhGtoYnSdl8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba17bc40570c8a594e37cd2897296e096b554b9f --- /dev/null +++ b/annotations_filtered/lhGtoYnSdl8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.35], [2.0, 1.75], [6.0, 7.57], [8.0, 9.48], [11.0, 18.87], [26.0, 25.73], [27.0, 29.03], [31.0, 30.92], [32.0, 34.33], [35.0, 39.68], [41.0, 63.76], [65.0, 72.06], [74.0, 74.76], [78.0, 79.2], [79.0, 81.3], [82.0, 82.43], [86.0, 87.42], [88.0, 91.29], [96.0, 96.75], [97.0, 98.05], [100.0, 99.81], [101.0, 101.58], [102.0, 101.88]], "keep_status": [false, false, false, false, true, false, false, false, true, true, false, true, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 38.31, 0.0, 64.18, 0.0, 30.38, 31.48, 30.16, 36.6, 0.0, 0.0, 41.05, 0.0, 0.0, 80.29, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 43.59], ["synthesizer", 15.55], ["ambient music", 7.65]], null, null, null, [["music", 43.16], ["gong", 7.04], ["sound effect", 5.71]], [["music", 41.46], ["synthesizer", 16.3], ["musical instrument", 5.92]], [["music", 57.02], ["theremin", 10.18], ["synthesizer", 7.89]], [["speech", 36.63], ["music", 16.38], ["sidetone", 6.06]], null, null, [["speech", 35.8], ["music", 7.38], ["sidetone", 7.16]], null, null, null, null, null, null, null, null], "duration": [0.35, -0.25, 1.57, 1.48, 7.87, -0.27, 2.03, -0.08, 2.33, 4.68, 22.76, 7.06, 0.76, 1.2, 2.3, 0.43, 1.42, 3.29, 0.75, 1.05, -0.19, 0.58, -0.12]} \ No newline at end of file diff --git a/annotations_filtered/lhHv2EyaaNc_filtered.json b/annotations_filtered/lhHv2EyaaNc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..907877036ef2c2f715d4ac5b1cba16de365d29ea --- /dev/null +++ b/annotations_filtered/lhHv2EyaaNc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.09], [6.0, 6.25], [7.0, 7.97], [11.0, 12.07], [25.0, 26.45], [29.0, 30.72], [33.0, 34.59], [43.0, 44.15], [53.0, 53.3]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [43.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["boing", 38.5], ["speech", 28.6], ["moo", 3.61]], null, null, null, null, null, null, null, null], "duration": [2.09, 0.25, 0.97, 1.07, 1.45, 1.72, 1.59, 1.15, 0.3]} \ No newline at end of file diff --git a/annotations_filtered/lhbHTjMLN5c_filtered.json b/annotations_filtered/lhbHTjMLN5c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8f272e4084c7055ad8050d0d735c0841db5d9d0e --- /dev/null +++ b/annotations_filtered/lhbHTjMLN5c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 10.77], [22.0, 22.82], [25.0, 25.96], [32.0, 33.08], [34.0, 34.13], [36.0, 37.71], [39.0, 39.55], [42.0, 42.67], [46.0, 47.76], [51.0, 51.22], [51.0, 51.97], [54.0, 54.92], [57.0, 59.17], [61.0, 62.68], [63.0, 64.79], [67.0, 83.1], [93.0, 95.84], [105.0, 105.93], [107.0, 115.48], [116.0, 118.17], [119.0, 135.68], [136.0, 165.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, true, true], "silence_prob": [35.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.71, 0.0, 0.0, 48.69, 56.7, 0.0, 38.22, 53.53, 35.39, 31.33], "audiomae_on_audioset": [[["fart", 84.23], ["music", 4.73], ["speech", 3.45]], null, null, null, null, null, null, null, null, null, null, null, [["fart", 69.45], ["speech", 15.4], ["inside, small room", 0.89]], null, null, [["speech", 25.65], ["bee, wasp, etc.", 15.04], ["fly, housefly", 11.3]], null, null, [["speech", 36.94], ["noise", 8.85], ["frog", 5.63]], null, [["music", 22.38], ["hum", 21.79], ["throbbing", 15.6]], [["music", 23.91], ["buzz", 18.92], ["breaking", 10.01]]], "duration": [7.77, 0.82, 0.96, 1.08, 0.13, 1.71, 0.55, 0.67, 1.76, 0.22, 0.97, 0.92, 2.17, 1.68, 1.79, 16.1, 2.84, 0.93, 8.48, 2.17, 16.68, 29.05]} \ No newline at end of file diff --git a/annotations_filtered/lhsWHmJiaXE_filtered.json b/annotations_filtered/lhsWHmJiaXE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1746ea0a7b1b37527807e504bca8bb386d40d266 --- /dev/null +++ b/annotations_filtered/lhsWHmJiaXE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.73], [5.0, 6.1], [9.0, 9.73], [11.0, 11.4], [13.0, 13.74], [15.0, 15.43], [17.0, 17.09], [20.0, 20.9], [22.0, 24.8], [26.0, 26.94], [29.0, 29.15], [30.0, 30.33], [31.0, 31.97], [33.0, 33.49], [35.0, 34.99], [36.0, 37.12], [39.0, 39.65], [46.0, 46.82], [47.0, 49.42], [51.0, 51.63], [54.0, 56.83], [63.0, 63.46], [69.0, 70.02], [74.0, 74.83], [77.0, 76.96], [78.0, 79.0], [79.0, 80.37], [81.0, 81.45], [84.0, 84.28], [96.0, 96.85], [98.0, 98.02], [101.0, 110.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [75.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.61, 0.0, 38.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.4], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 30.87], ["music", 18.17], ["rumble", 12.49]], null, [["music", 55.98], ["soundtrack music", 12.25], ["synthesizer", 3.33]], null, null, null, null, null, null, null, null, null, null, [["hum", 54.04], ["mains hum", 16.81], ["music", 5.55]]], "duration": [2.73, 1.1, 0.73, 0.4, 0.74, 0.43, 0.09, 0.9, 2.8, 0.94, 0.15, 0.33, 0.97, 0.49, -0.01, 1.12, 0.65, 0.82, 2.42, 0.63, 2.83, 0.46, 1.02, 0.83, -0.04, 1.0, 1.37, 0.45, 0.28, 0.85, 0.02, 9.44]} \ No newline at end of file diff --git a/annotations_filtered/li2zByHeanQ_filtered.json b/annotations_filtered/li2zByHeanQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a865f23c55681b1d2548255d6c69750b56085e97 --- /dev/null +++ b/annotations_filtered/li2zByHeanQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 42.09], [47.0, 51.56], [53.0, 54.4], [55.0, 62.38], [64.0, 66.19], [71.0, 75.29]], "keep_status": [true, true, false, false, true, false], "silence_prob": [31.42, 45.36, 0.0, 45.43, 45.36, 44.78], "audiomae_on_audioset": [[["music", 46.89], ["smash, crash", 12.36], ["throbbing", 9.15]], [["hum", 25.45], ["throbbing", 17.35], ["mains hum", 15.34]], null, [["mains hum", 39.12], ["hum", 33.44], ["throbbing", 9.54]], [["music", 37.88], ["hum", 10.38], ["mains hum", 6.62]], [["music", 54.84], ["throbbing", 11.1], ["electronic music", 5.27]]], "duration": [7.09, 4.56, 1.4, 7.38, 2.19, 4.29]} \ No newline at end of file diff --git a/annotations_filtered/liK550asDSw_filtered.json b/annotations_filtered/liK550asDSw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf7bb2f00ec3643ff81cc9de26d64474ef2081c5 --- /dev/null +++ b/annotations_filtered/liK550asDSw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.37], [12.0, 12.5], [13.0, 14.18], [15.0, 15.7], [16.0, 16.82], [17.0, 17.54], [19.0, 19.97], [21.0, 22.13], [23.0, 23.89], [24.0, 24.88], [26.0, 25.95], [27.0, 27.24], [30.0, 30.65], [32.0, 33.02], [36.0, 36.95], [37.0, 39.82], [41.0, 42.04], [43.0, 59.71], [61.0, 64.83], [68.0, 68.93], [70.0, 70.43], [73.0, 73.57], [74.0, 74.53], [78.0, 78.38], [81.0, 82.8], [84.0, 88.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.93, 0.0, 87.92, 98.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.37, 0.5, 1.18, 0.7, 0.82, 0.54, 0.97, 1.13, 0.89, 0.88, -0.05, 0.24, 0.65, 1.02, 0.95, 2.82, 1.04, 16.71, 3.83, 0.93, 0.43, 0.57, 0.53, 0.38, 1.8, 4.16]} \ No newline at end of file diff --git a/annotations_filtered/lixII1thTO4_filtered.json b/annotations_filtered/lixII1thTO4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..06c1e4beb0be01cbdf85910d4eea3995cb17d5e7 --- /dev/null +++ b/annotations_filtered/lixII1thTO4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 35.4], [38.0, 38.26], [40.0, 41.64], [46.0, 46.31], [52.0, 69.25], [72.0, 71.98], [74.0, 76.08], [87.0, 91.61], [93.0, 92.87], [96.0, 99.27], [106.0, 111.13]], "keep_status": [false, false, false, false, true, false, true, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.04, 0.0, 29.73, 39.05, 0.0, 30.28, 31.22], "audiomae_on_audioset": [null, null, null, null, [["music", 27.42], ["livestock, farm animals, working animals", 14.98], ["animal", 9.31]], null, [["vehicle", 24.03], ["moo", 7.92], ["car", 6.91]], [["music", 59.78], ["musical instrument", 8.27], ["plucked string instrument", 2.63]], null, [["music", 20.73], ["moo", 18.72], ["cattle, bovinae", 13.52]], [["music", 49.2], ["theremin", 4.71], ["speech", 3.48]]], "duration": [0.4, 0.26, 1.64, 0.31, 17.25, -0.02, 2.08, 4.61, -0.13, 3.27, 5.13]} \ No newline at end of file diff --git a/annotations_filtered/lj59KyjwK3c_filtered.json b/annotations_filtered/lj59KyjwK3c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/lj59KyjwK3c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/ljAdSzBv0ug_filtered.json b/annotations_filtered/ljAdSzBv0ug_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7afe786723cf195246f4a689d86215ca682e1b2a --- /dev/null +++ b/annotations_filtered/ljAdSzBv0ug_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.56], [6.0, 7.13], [12.0, 12.85], [14.0, 15.89], [16.0, 20.04], [21.0, 27.84], [31.0, 31.62], [35.0, 36.21], [38.0, 38.62], [41.0, 42.47], [43.0, 44.66], [48.0, 48.63], [58.0, 60.07], [62.0, 61.96], [62.0, 65.8], [66.0, 65.87], [81.0, 81.55], [86.0, 86.63], [87.0, 87.67], [90.0, 92.55], [94.0, 96.3], [97.0, 97.8], [99.0, 99.74], [103.0, 103.2], [104.0, 104.99], [106.0, 106.41], [112.0, 113.78], [116.0, 118.81], [119.0, 121.73], [122.0, 121.76], [122.0, 121.8], [122.0, 121.83], [122.0, 121.86], [122.0, 122.23], [122.0, 124.33], [125.0, 133.64], [136.0, 137.64], [138.0, 139.21], [141.0, 142.08], [146.0, 157.38], [164.0, 165.59], [169.0, 169.57], [175.0, 176.4], [177.0, 178.09], [181.0, 181.04]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 35.35, 35.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.86, 0.0, 34.96, 0.0, 0.0, 0.0, 0.0, 47.08, 71.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.47, 57.89, 0.0, 0.0, 0.0, 0.0, 0.0, 43.1, 51.55, 0.0, 0.0, 0.0, 32.01, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 60.58], ["music", 12.33], ["noise", 2.4]], [["speech", 25.28], ["clip-clop", 19.0], ["horse", 11.28]], null, null, null, null, null, null, [["hum", 35.15], ["music", 18.81], ["throbbing", 18.41]], null, [["music", 54.24], ["didgeridoo", 12.7], ["speech", 7.6]], null, null, null, null, [["animal", 16.48], ["music", 14.75], ["dog", 6.63]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 40.77], ["music", 29.91], ["inside, small room", 4.03]], null, null, null, null, [["music", 52.85], ["speech", 22.8], ["hum", 4.32]], null, null, null, null, null], "duration": [0.56, 1.13, 0.85, 1.89, 4.04, 6.84, 0.62, 1.21, 0.62, 1.47, 1.66, 0.63, 2.07, -0.04, 3.8, -0.13, 0.55, 0.63, 0.67, 2.55, 2.3, 0.8, 0.74, 0.2, 0.99, 0.41, 1.78, 2.81, 2.73, -0.24, -0.2, -0.17, -0.14, 0.23, 2.33, 8.64, 1.64, 1.21, 1.08, 11.38, 1.59, 0.57, 1.4, 1.09, 0.04]} \ No newline at end of file diff --git a/annotations_filtered/ljK_2ZT44jA_filtered.json b/annotations_filtered/ljK_2ZT44jA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..69e0ed6711516a8a6449bb45c8efcc41d1305a38 --- /dev/null +++ b/annotations_filtered/ljK_2ZT44jA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.55], [23.0, 24.12], [28.0, 28.26], [33.0, 34.62], [73.0, 95.77]], "keep_status": [false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 34.57], "audiomae_on_audioset": [null, null, null, null, [["music", 59.84], ["music of latin america", 5.86], ["brass instrument", 4.2]]], "duration": [0.55, 1.12, 0.26, 1.62, 22.77]} \ No newline at end of file diff --git a/annotations_filtered/ljMuEDlInLo_filtered.json b/annotations_filtered/ljMuEDlInLo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eea80e80ddbde93355d7ff0b3d53b2d760f5faec --- /dev/null +++ b/annotations_filtered/ljMuEDlInLo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.42], [17.0, 17.91], [22.0, 22.72], [25.0, 27.06], [35.0, 35.61], [36.0, 36.48], [39.0, 39.21], [43.0, 46.45], [50.0, 51.81], [58.0, 58.67], [64.0, 64.66], [67.0, 67.74]], "keep_status": [true, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [33.01, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 31.83, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["baby laughter", 18.67], ["echo", 14.09], ["chuckle, chortle", 12.45]], null, null, null, null, null, null, [["laughter", 34.3], ["snicker", 14.92], ["baby laughter", 11.89]], null, null, null, null], "duration": [2.42, 0.91, 0.72, 2.06, 0.61, 0.48, 0.21, 3.45, 1.81, 0.67, 0.66, 0.74]} \ No newline at end of file diff --git a/annotations_filtered/ljdH53Ro0xQ_filtered.json b/annotations_filtered/ljdH53Ro0xQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a773d25a712e4ff49353851ed475c8381c3a937e --- /dev/null +++ b/annotations_filtered/ljdH53Ro0xQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.55], [13.0, 15.82], [16.0, 17.25], [20.0, 22.55], [28.0, 37.07], [39.0, 41.52], [45.0, 47.01], [48.0, 51.11], [52.0, 53.94], [55.0, 56.62], [59.0, 60.83], [64.0, 66.5], [68.0, 69.87], [72.0, 75.07], [78.0, 81.5], [84.0, 87.07], [88.0, 89.73], [91.0, 92.62], [95.0, 96.53], [98.0, 98.76], [100.0, 105.92], [106.0, 106.83], [108.0, 109.8], [112.0, 121.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.62, 59.59, 0.0, 98.1, 65.67, 99.78, 98.36, 87.55, 0.0, 0.0, 0.0, 92.48, 0.0, 98.36, 59.42, 99.73, 0.0, 0.0, 0.0, 0.0, 99.05, 0.0, 0.0, 98.93], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.55, 2.82, 1.25, 2.55, 9.07, 2.52, 2.01, 3.11, 1.94, 1.62, 1.83, 2.5, 1.87, 3.07, 3.5, 3.07, 1.73, 1.62, 1.53, 0.76, 5.92, 0.83, 1.8, 9.66]} \ No newline at end of file diff --git a/annotations_filtered/ljzkCBZuHM4_filtered.json b/annotations_filtered/ljzkCBZuHM4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e2411bea7ad04f5250aa6d6d97e44b98bdb78d36 --- /dev/null +++ b/annotations_filtered/ljzkCBZuHM4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.96], [7.0, 7.7], [8.0, 8.8], [10.0, 11.57], [19.0, 20.12], [21.0, 23.04], [25.0, 25.22], [30.0, 32.22], [33.0, 34.01], [35.0, 36.1], [37.0, 37.88], [46.0, 47.02], [48.0, 48.84], [52.0, 55.12], [57.0, 60.88], [62.0, 63.22], [64.0, 65.2], [71.0, 71.07], [78.0, 78.0], [111.0, 114.47], [115.0, 116.94]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 43.38, 0.0, 35.42, 0.0, 0.0, 0.0, 0.0, 0.0, 36.25, 47.86, 0.0, 0.0, 0.0, 0.0, 74.76, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 54.68], ["sidetone", 5.24], ["radio", 3.51]], null, [["boing", 71.26], ["breaking", 4.31], ["speech", 3.36]], null, null, null, null, null, [["animal", 14.05], ["music", 10.75], ["dog", 8.44]], [["speech", 40.52], ["fly, housefly", 10.98], ["sidetone", 6.69]], null, null, null, null, null, null], "duration": [0.96, 0.7, 0.8, 1.57, 1.12, 2.04, 0.22, 2.22, 1.01, 1.1, 0.88, 1.02, 0.84, 3.12, 3.88, 1.22, 1.2, 0.07, 0.0, 3.47, 1.94]} \ No newline at end of file diff --git a/annotations_filtered/lk1As4QnaCc_filtered.json b/annotations_filtered/lk1As4QnaCc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..83761a0bfa35daee04d65a3cab29de900f6ebbcf --- /dev/null +++ b/annotations_filtered/lk1As4QnaCc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 25.39], [26.0, 26.84], [28.0, 29.91]], "keep_status": [false, false, false], "silence_prob": [71.43, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [5.39, 0.84, 1.91]} \ No newline at end of file diff --git a/annotations_filtered/lkMilWJJR_U_filtered.json b/annotations_filtered/lkMilWJJR_U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b8ced2257f4c1c65bc3fbb33e9d1856683088da --- /dev/null +++ b/annotations_filtered/lkMilWJJR_U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.31], [5.0, 5.88], [6.0, 9.93], [11.0, 15.35], [16.0, 19.74], [21.0, 22.28], [26.0, 27.03], [29.0, 30.87], [33.0, 33.17], [35.0, 62.06], [63.0, 70.28], [74.0, 83.96], [84.0, 84.0], [84.0, 84.13], [84.0, 84.2], [84.0, 86.07], [88.0, 91.52], [93.0, 96.06], [98.0, 101.14]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 94.95, 99.65, 98.99, 0.0, 0.0, 0.0, 0.0, 33.36, 31.57, 58.98, 0.0, 0.0, 0.0, 43.69, 84.98, 92.15, 97.73], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["fly, housefly", 21.22], ["music", 13.6], ["insect", 12.41]], [["music", 31.45], ["hum", 30.65], ["throbbing", 17.81]], null, null, null, null, [["music", 37.83], ["speech", 17.78], ["hum", 9.69]], null, null, null], "duration": [1.31, 0.88, 3.93, 4.35, 3.74, 1.28, 1.03, 1.87, 0.17, 27.06, 7.28, 9.96, 0.0, 0.13, 0.2, 2.07, 3.52, 3.06, 3.14]} \ No newline at end of file diff --git a/annotations_filtered/lkT9aqC6Tqw_filtered.json b/annotations_filtered/lkT9aqC6Tqw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3a28353378e1ce186c54e65c6ac8cddf44ec62ec --- /dev/null +++ b/annotations_filtered/lkT9aqC6Tqw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 58.35], [66.0, 67.36], [69.0, 69.06]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [37.35, 1.36, 0.06]} \ No newline at end of file diff --git a/annotations_filtered/lkoWhWGcVR4_filtered.json b/annotations_filtered/lkoWhWGcVR4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc6a3177fed57b41b5b286aafc4fed28eef5b709 --- /dev/null +++ b/annotations_filtered/lkoWhWGcVR4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.63], [8.0, 9.22], [11.0, 12.23], [14.0, 15.08], [18.0, 19.79], [20.0, 20.98], [23.0, 23.67], [24.0, 24.39], [26.0, 30.27], [34.0, 34.55], [37.0, 38.06], [47.0, 47.63], [50.0, 64.56], [69.0, 69.45], [72.0, 72.23], [73.0, 74.6], [75.0, 76.89], [80.0, 94.74], [97.0, 100.01], [102.0, 102.88], [109.0, 109.53], [110.0, 110.64], [116.0, 116.85], [122.0, 122.69], [128.0, 133.19], [135.0, 135.18], [136.0, 137.74], [140.0, 141.17], [144.0, 145.83], [147.0, 147.88], [149.0, 149.42], [153.0, 158.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.8, 0.0, 0.0, 0.0, 52.8, 0.0, 0.0, 0.0, 0.0, 72.75, 99.4, 0.0, 0.0, 0.0, 0.0, 0.0, 99.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.38], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 38.08], ["clip-clop", 10.82], ["horse", 9.25]]], "duration": [0.63, 1.22, 1.23, 1.08, 1.79, 0.98, 0.67, 0.39, 4.27, 0.55, 1.06, 0.63, 14.56, 0.45, 0.23, 1.6, 1.89, 14.74, 3.01, 0.88, 0.53, 0.64, 0.85, 0.69, 5.19, 0.18, 1.74, 1.17, 1.83, 0.88, 0.42, 5.84]} \ No newline at end of file diff --git a/annotations_filtered/lkq-Fd9TU8k_filtered.json b/annotations_filtered/lkq-Fd9TU8k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95038593654b19565c5f7453a2b8618c91559548 --- /dev/null +++ b/annotations_filtered/lkq-Fd9TU8k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.85], [11.0, 19.9], [21.0, 21.76], [22.0, 22.86], [23.0, 24.16], [26.0, 28.0], [31.0, 31.04], [32.0, 33.15], [35.0, 35.77], [36.0, 36.95], [42.0, 41.77], [42.0, 41.96], [43.0, 43.41], [44.0, 44.25], [47.0, 47.38], [49.0, 50.43], [55.0, 55.41], [60.0, 60.52], [78.0, 82.39], [100.0, 99.99], [109.0, 109.75], [110.0, 113.44], [115.0, 115.55], [117.0, 117.44], [118.0, 119.1], [127.0, 128.14], [149.0, 150.43], [153.0, 154.08], [155.0, 155.12], [157.0, 162.09], [167.0, 167.07], [178.0, 178.23], [179.0, 180.2], [195.0, 196.55], [199.0, 198.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 98.27, 0.0, 0.0, 0.0, 78.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.1, 0.0, 0.0, 49.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.91, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["crushing", 91.75], ["throbbing", 0.83], ["hum", 0.66]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.85, 8.9, 0.76, 0.86, 1.16, 2.0, 0.04, 1.15, 0.77, 0.95, -0.23, -0.04, 0.41, 0.25, 0.38, 1.43, 0.41, 0.52, 4.39, -0.01, 0.75, 3.44, 0.55, 0.44, 1.1, 1.14, 1.43, 1.08, 0.12, 5.09, 0.07, 0.23, 1.2, 1.55, -0.05]} \ No newline at end of file diff --git a/annotations_filtered/ll5qiWa6YDk_filtered.json b/annotations_filtered/ll5qiWa6YDk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60f7a820a03d5592854744dc76edeb94f03776fa --- /dev/null +++ b/annotations_filtered/ll5qiWa6YDk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 27.24], [28.0, 30.1], [35.0, 36.59], [37.0, 51.09], [51.0, 59.54], [62.0, 63.64], [65.0, 67.09], [68.0, 69.74], [73.0, 74.65], [77.0, 78.49], [80.0, 81.31], [85.0, 110.66]], "keep_status": [false, true, false, true, false, false, true, false, false, false, false, true], "silence_prob": [33.16, 34.04, 0.0, 30.5, 30.08, 0.0, 35.91, 0.0, 0.0, 0.0, 0.0, 30.15], "audiomae_on_audioset": [[["whale vocalization", 53.11], ["mains hum", 15.59], ["hum", 14.6]], [["whale vocalization", 16.97], ["music", 16.15], ["speech", 15.6]], null, [["music", 28.75], ["hum", 27.45], ["mains hum", 10.2]], [["music", 60.31], ["theremin", 13.07], ["musical instrument", 9.11]], null, [["music", 29.44], ["hum", 16.39], ["mains hum", 11.7]], null, null, null, null, [["speech", 44.76], ["music", 16.79], ["hum", 8.36]]], "duration": [2.24, 2.1, 1.59, 14.09, 8.54, 1.64, 2.09, 1.74, 1.65, 1.49, 1.31, 25.66]} \ No newline at end of file diff --git a/annotations_filtered/llTSaDl6Pcg_filtered.json b/annotations_filtered/llTSaDl6Pcg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b7898b3e5aef9e9fa96b3d04b700f88fc6874c98 --- /dev/null +++ b/annotations_filtered/llTSaDl6Pcg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.19], [6.0, 6.98], [8.0, 10.76], [19.0, 18.77], [19.0, 22.18], [22.0, 22.27], [22.0, 30.65], [31.0, 32.22], [33.0, 34.82], [37.0, 41.72], [44.0, 45.06], [49.0, 50.99], [53.0, 54.24], [56.0, 58.6], [66.0, 67.22], [74.0, 74.53], [76.0, 77.67], [79.0, 81.16], [83.0, 94.96], [95.0, 96.94], [100.0, 101.66], [103.0, 104.7], [107.0, 108.45], [110.0, 112.41], [115.0, 117.53], [119.0, 122.34], [123.0, 125.49], [127.0, 135.7], [137.0, 137.73], [139.0, 143.78], [145.0, 146.64], [150.0, 151.33], [152.0, 154.89], [156.0, 157.2], [158.0, 159.7], [161.0, 165.59], [166.0, 171.48], [177.0, 178.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.97, 0.0, 52.1, 0.0, 80.11, 0.0, 0.0, 99.62, 0.0, 0.0, 0.0, 78.55, 0.0, 0.0, 0.0, 99.62, 81.0, 0.0, 0.0, 0.0, 0.0, 99.85, 99.98, 99.93, 86.45, 72.75, 0.0, 53.22, 0.0, 0.0, 73.36, 0.0, 0.0, 98.36, 72.46, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.19, 0.98, 2.76, -0.23, 3.18, 0.27, 8.65, 1.22, 1.82, 4.72, 1.06, 1.99, 1.24, 2.6, 1.22, 0.53, 1.67, 2.16, 11.96, 1.94, 1.66, 1.7, 1.45, 2.41, 2.53, 3.34, 2.49, 8.7, 0.73, 4.78, 1.64, 1.33, 2.89, 1.2, 1.7, 4.59, 5.48, 1.88]} \ No newline at end of file diff --git a/annotations_filtered/lllLnc58CoI_filtered.json b/annotations_filtered/lllLnc58CoI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f3a42c19a9d53d41016d0bd0d4f6a4d691ddf16f --- /dev/null +++ b/annotations_filtered/lllLnc58CoI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[67.0, 80.32], [81.0, 103.15], [105.0, 105.38], [108.0, 108.6], [110.0, 112.29], [113.0, 115.15], [116.0, 117.26]], "keep_status": [false, true, false, false, false, false, false], "silence_prob": [92.97, 47.82, 0.0, 0.0, 49.4, 99.8, 0.0], "audiomae_on_audioset": [null, [["speech", 19.81], ["hum", 18.34], ["mains hum", 9.28]], null, null, [["speech", 78.62], ["sidetone", 4.83], ["radio", 1.61]], null, null], "duration": [13.32, 22.15, 0.38, 0.6, 2.29, 2.15, 1.26]} \ No newline at end of file diff --git a/annotations_filtered/llzXzUe2KAk_filtered.json b/annotations_filtered/llzXzUe2KAk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d1bb8b35bc74b5aeaf142449d450bb884f7a77c --- /dev/null +++ b/annotations_filtered/llzXzUe2KAk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 20.24], [22.0, 39.53], [41.0, 71.14], [76.0, 85.24], [87.0, 97.39], [102.0, 146.2], [149.0, 163.86], [166.0, 167.76], [169.0, 176.55]], "keep_status": [true, true, false, true, false, false, true, false, true], "silence_prob": [33.35, 36.62, 0.0, 33.63, 50.91, 0.0, 32.74, 0.0, 31.98], "audiomae_on_audioset": [[["music", 40.19], ["throbbing", 12.45], ["hum", 8.39]], [["hum", 41.06], ["throbbing", 14.74], ["mains hum", 8.38]], null, [["throbbing", 22.05], ["hum", 20.33], ["music", 18.69]], null, null, [["music", 42.53], ["throbbing", 9.28], ["cacophony", 8.55]], null, [["hum", 26.62], ["throbbing", 21.53], ["mains hum", 16.86]]], "duration": [5.24, 17.53, 30.14, 9.24, 10.39, 44.2, 14.86, 1.76, 7.55]} \ No newline at end of file diff --git a/annotations_filtered/lmDII7sMIF8_filtered.json b/annotations_filtered/lmDII7sMIF8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa13e0af91f7f0059b88147088db76789c3b0b26 --- /dev/null +++ b/annotations_filtered/lmDII7sMIF8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 35.16], [42.0, 42.6], [47.0, 47.66], [56.0, 56.13], [60.0, 61.25], [63.0, 63.34], [68.0, 68.27], [71.0, 71.09], [74.0, 74.75], [76.0, 76.96], [79.0, 79.3], [82.0, 82.49], [87.0, 87.02], [87.0, 88.6], [90.0, 90.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.16, 0.6, 0.66, 0.13, 1.25, 0.34, 0.27, 0.09, 0.75, 0.96, 0.3, 0.49, 0.02, 1.6, 0.1]} \ No newline at end of file diff --git a/annotations_filtered/lmlX39gM9-c_filtered.json b/annotations_filtered/lmlX39gM9-c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58a8f0c9cf65dc581ddd80681a6e2ec4784eef3a --- /dev/null +++ b/annotations_filtered/lmlX39gM9-c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.81], [8.0, 9.49], [12.0, 13.24], [15.0, 15.18], [16.0, 18.12], [19.0, 20.43], [22.0, 31.78], [35.0, 43.19], [44.0, 46.09], [48.0, 48.34], [52.0, 56.88], [60.0, 68.81], [69.0, 68.94], [69.0, 70.65], [74.0, 75.83], [77.0, 102.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 54.63, 0.0, 35.2, 64.63, 64.63, 0.0, 57.97, 45.36, 0.0, 0.0, 0.0, 64.97], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 38.73], ["hum", 25.78], ["throbbing", 16.5]], null, null, null, null, [["speech", 52.02], ["music", 17.17], ["hum", 5.2]], null, null, null, null], "duration": [0.81, 1.49, 1.24, 0.18, 2.12, 1.43, 9.78, 8.19, 2.09, 0.34, 4.88, 8.81, -0.06, 1.65, 1.83, 25.2]} \ No newline at end of file diff --git a/annotations_filtered/lnPDc4XE77w_filtered.json b/annotations_filtered/lnPDc4XE77w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb1b217136dc421a5d094a8022506a05178c8283 --- /dev/null +++ b/annotations_filtered/lnPDc4XE77w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.43], [1.0, 5.61], [6.0, 7.42], [11.0, 16.63], [18.0, 20.36], [21.0, 23.25], [27.0, 31.06], [32.0, 32.73], [36.0, 38.62], [39.0, 38.87], [40.0, 40.61], [42.0, 49.38], [51.0, 51.9], [54.0, 54.01], [56.0, 70.24], [71.0, 72.0], [76.0, 76.49], [82.0, 83.03], [85.0, 89.82], [94.0, 109.92], [114.0, 117.07], [119.0, 120.16], [120.0, 127.13], [132.0, 134.52], [135.0, 144.53], [146.0, 146.57], [150.0, 167.95], [170.0, 171.69], [172.0, 172.57], [176.0, 192.62], [199.0, 201.8]], "keep_status": [false, false, false, true, false, false, false, false, true, false, false, true, false, false, true, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, true], "silence_prob": [0.0, 30.91, 0.0, 37.23, 59.42, 84.43, 55.81, 0.0, 37.04, 0.0, 0.0, 36.35, 0.0, 0.0, 34.39, 0.0, 0.0, 0.0, 30.78, 30.86, 33.06, 0.0, 33.14, 30.87, 30.8, 0.0, 29.66, 0.0, 0.0, 29.86, 31.48], "audiomae_on_audioset": [null, [["music", 71.77], ["speech", 7.04], ["didgeridoo", 3.57]], null, [["music", 33.82], ["didgeridoo", 31.01], ["speech", 2.92]], null, null, null, null, [["music", 35.45], ["speech", 17.27], ["noise", 8.94]], null, null, [["music", 30.37], ["livestock, farm animals, working animals", 21.03], ["cattle, bovinae", 7.53]], null, null, [["music", 21.84], ["sound effect", 6.88], ["hum", 6.75]], null, null, null, [["music", 52.88], ["whack, thwack", 17.42], ["smash, crash", 3.16]], [["music", 49.31], ["breaking", 24.55], ["speech", 14.13]], [["music", 72.43], ["boing", 5.73], ["didgeridoo", 2.64]], null, [["music", 65.63], ["speech", 7.7], ["smash, crash", 5.06]], [["clang", 36.17], ["speech", 16.58], ["ding", 10.47]], [["music", 39.33], ["speech", 38.53], ["quack", 3.39]], null, [["cattle, bovinae", 14.9], ["moo", 13.78], ["livestock, farm animals, working animals", 13.49]], null, null, [["whale vocalization", 81.73], ["music", 3.16], ["vehicle", 1.95]], [["speech", 18.66], ["beatboxing", 13.5], ["music", 10.29]]], "duration": [1.43, 4.61, 1.42, 5.63, 2.36, 2.25, 4.06, 0.73, 2.62, -0.13, 0.61, 7.38, 0.9, 0.01, 14.24, 1.0, 0.49, 1.03, 4.82, 15.92, 3.07, 1.16, 7.13, 2.52, 9.53, 0.57, 17.95, 1.69, 0.57, 16.62, 2.8]} \ No newline at end of file diff --git a/annotations_filtered/lnQRXfjI664_filtered.json b/annotations_filtered/lnQRXfjI664_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..238068aedbd892e7b08405a52c9bd39287c3fc58 --- /dev/null +++ b/annotations_filtered/lnQRXfjI664_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.75], [6.0, 7.05], [19.0, 20.34], [22.0, 30.92], [31.0, 32.43], [33.0, 34.18], [35.0, 37.52], [38.0, 39.33], [40.0, 41.07], [42.0, 45.66], [48.0, 50.67], [52.0, 53.3], [54.0, 55.9], [57.0, 56.93], [57.0, 60.24], [61.0, 78.17], [82.0, 82.75], [83.0, 88.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 50.31, 0.0, 0.0, 62.07, 0.0, 0.0, 57.48, 51.44, 0.0, 0.0, 0.0, 51.82, 41.98, 0.0, 31.34], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 62.0], ["musical instrument", 7.73], ["wind instrument, woodwind instrument", 5.32]], null, [["music", 45.66], ["speech", 12.55], ["synthesizer", 4.19]]], "duration": [0.75, 1.05, 1.34, 8.92, 1.43, 1.18, 2.52, 1.33, 1.07, 3.66, 2.67, 1.3, 1.9, -0.07, 3.24, 17.17, 0.75, 5.99]} \ No newline at end of file diff --git a/annotations_filtered/lnYzb6P_1Wg_filtered.json b/annotations_filtered/lnYzb6P_1Wg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e7a8ba2b9830625e6171138c7b8fa2adcb9cac3a --- /dev/null +++ b/annotations_filtered/lnYzb6P_1Wg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [1.0, 2.96], [5.0, 36.59], [38.0, 91.64]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [0.5, 1.96, 31.59, 53.64]} \ No newline at end of file diff --git a/annotations_filtered/lnf-VO8gIGg_filtered.json b/annotations_filtered/lnf-VO8gIGg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..545fe4cc9e3bf3fc6bb77c3968451e1db7feb695 --- /dev/null +++ b/annotations_filtered/lnf-VO8gIGg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.55], [1.0, 0.58], [1.0, 0.65], [1.0, 0.78], [1.0, 0.9], [1.0, 1.0], [9.0, 9.93], [13.0, 14.88], [17.0, 18.12], [25.0, 30.15], [35.0, 37.67], [48.0, 48.57], [49.0, 54.21], [58.0, 66.97], [74.0, 79.73], [82.0, 83.19], [84.0, 87.44], [89.0, 89.67], [91.0, 93.09], [94.0, 105.11], [108.0, 116.97], [120.0, 125.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.9, 94.22, 0.0, 48.06, 85.54, 94.95, 0.0, 94.37, 0.0, 97.92, 37.16, 50.81, 36.81], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 28.96], ["speech", 25.52], ["hum", 8.56]], null, null, null, null, null, null, [["music", 25.36], ["fly, housefly", 15.13], ["didgeridoo", 10.71]], null, [["speech", 36.27], ["hum", 14.74], ["music", 9.04]]], "duration": [-0.45, -0.42, -0.35, -0.22, -0.1, 0.0, 0.93, 1.88, 1.12, 5.15, 2.67, 0.57, 5.21, 8.97, 5.73, 1.19, 3.44, 0.67, 2.09, 11.11, 8.97, 5.39]} \ No newline at end of file diff --git a/annotations_filtered/lnfpTgAQ0Ys_filtered.json b/annotations_filtered/lnfpTgAQ0Ys_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef525b23219d13c63457607962566ad649491e6c --- /dev/null +++ b/annotations_filtered/lnfpTgAQ0Ys_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 9.83], [14.0, 18.13], [19.0, 23.99], [25.0, 28.51], [29.0, 34.08], [35.0, 42.55], [44.0, 45.05], [46.0, 46.47], [48.0, 50.08], [53.0, 54.73], [56.0, 60.17], [62.0, 64.66], [66.0, 66.8], [67.0, 69.48], [75.0, 75.49], [77.0, 79.44], [80.0, 81.82], [82.0, 83.2], [84.0, 84.94], [88.0, 88.43], [90.0, 95.76], [102.0, 102.54], [104.0, 105.27], [108.0, 108.3], [113.0, 114.66], [116.0, 119.97], [121.0, 122.42], [124.0, 126.12], [128.0, 129.19], [133.0, 133.24], [140.0, 142.62], [146.0, 152.52], [154.0, 155.22], [156.0, 159.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.92, 72.9, 99.56, 100.0, 96.89, 92.64, 0.0, 0.0, 74.44, 0.0, 89.54, 90.78, 0.0, 99.65, 0.0, 99.85, 0.0, 0.0, 0.0, 0.0, 99.9, 0.0, 0.0, 0.0, 0.0, 99.95, 0.0, 91.13, 0.0, 0.0, 99.84, 99.26, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.83, 4.13, 4.99, 3.51, 5.08, 7.55, 1.05, 0.47, 2.08, 1.73, 4.17, 2.66, 0.8, 2.48, 0.49, 2.44, 1.82, 1.2, 0.94, 0.43, 5.76, 0.54, 1.27, 0.3, 1.66, 3.97, 1.42, 2.12, 1.19, 0.24, 2.62, 6.52, 1.22, 3.88]} \ No newline at end of file diff --git a/annotations_filtered/lniVpfK5SW8_filtered.json b/annotations_filtered/lniVpfK5SW8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..efe0965fc8af44dd9e9f86521abdfb8a018ac46b --- /dev/null +++ b/annotations_filtered/lniVpfK5SW8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 32.85], [34.0, 34.48], [43.0, 75.14], [76.0, 75.88], [76.0, 140.68], [142.0, 146.18], [148.0, 147.73]], "keep_status": [true, false, false, false, false, false, false], "silence_prob": [29.25, 0.0, 0.0, 0.0, 0.0, 32.39, 0.0], "audiomae_on_audioset": [[["electric shaver, electric razor", 15.45], ["didgeridoo", 13.84], ["speech", 13.24]], null, null, null, null, [["music", 50.14], ["throbbing", 20.72], ["hum", 4.49]], null], "duration": [13.85, 0.48, 32.14, -0.12, 64.68, 4.18, -0.27]} \ No newline at end of file diff --git a/annotations_filtered/loVYzYPJBTE_filtered.json b/annotations_filtered/loVYzYPJBTE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e8be61fddb5e716a46fd6e43fe3407649d1a33b3 --- /dev/null +++ b/annotations_filtered/loVYzYPJBTE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.72], [6.0, 5.75], [13.0, 13.27], [19.0, 18.93], [20.0, 21.24], [22.0, 23.21], [24.0, 25.1], [30.0, 49.5], [53.0, 53.6], [54.0, 61.72], [64.0, 64.37], [68.0, 76.01], [78.0, 96.15], [102.0, 109.66], [110.0, 113.9], [122.0, 129.07], [131.0, 134.25]], "keep_status": [false, false, false, false, false, false, false, true, false, true, false, true, false, true, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.33, 0.0, 32.28, 0.0, 31.44, 31.18, 31.38, 31.74, 31.42, 32.04], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 43.62], ["moo", 6.13], ["cattle, bovinae", 6.05]], null, [["music", 54.19], ["crowd", 4.19], ["electronic music", 3.02]], null, [["music", 28.75], ["cattle, bovinae", 9.99], ["moo", 9.28]], [["music", 67.51], ["vehicle", 3.95], ["motorcycle", 3.72]], [["music", 58.43], ["speech", 3.78], ["throbbing", 3.05]], [["music", 45.16], ["speech", 18.77], ["sidetone", 13.28]], [["music", 32.82], ["speech", 18.31], ["livestock, farm animals, working animals", 2.44]], [["music", 52.48], ["rock and roll", 7.31], ["cacophony", 3.78]]], "duration": [0.72, -0.25, 0.27, -0.07, 1.24, 1.21, 1.1, 19.5, 0.6, 7.72, 0.37, 8.01, 18.15, 7.66, 3.9, 7.07, 3.25]} \ No newline at end of file diff --git a/annotations_filtered/lot6apnbKk4_filtered.json b/annotations_filtered/lot6apnbKk4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1c9195cef32940ed1c4032985858ad2ef36dea7 --- /dev/null +++ b/annotations_filtered/lot6apnbKk4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.82], [28.0, 28.02], [31.0, 31.09], [33.0, 38.57], [40.0, 45.86], [48.0, 48.36], [55.0, 55.54], [62.0, 71.49], [76.0, 84.1], [89.0, 96.77], [98.0, 105.56], [111.0, 118.27], [158.0, 158.5], [162.0, 162.23], [164.0, 166.19]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 34.81, 37.59, 0.0, 0.0, 35.08, 37.83, 38.19, 43.05, 38.71, 0.0, 0.0, 59.07], "audiomae_on_audioset": [null, null, null, [["mains hum", 30.3], ["music", 22.5], ["hum", 19.47]], [["music", 54.79], ["speech", 24.7], ["foghorn", 3.16]], null, null, [["music", 72.77], ["musical instrument", 12.42], ["classical music", 2.43]], [["music", 31.79], ["speech", 29.7], ["hum", 4.22]], [["hum", 29.76], ["speech", 21.84], ["music", 19.11]], [["music", 33.11], ["hum", 25.95], ["mains hum", 9.24]], [["music", 46.57], ["speech", 19.61], ["outside, rural or natural", 5.68]], null, null, null], "duration": [0.82, 0.02, 0.09, 5.57, 5.86, 0.36, 0.54, 9.49, 8.1, 7.77, 7.56, 7.27, 0.5, 0.23, 2.19]} \ No newline at end of file diff --git a/annotations_filtered/louBM-Mix7s_filtered.json b/annotations_filtered/louBM-Mix7s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0433a7ae98867035ccf727ec0222f5ae2a9e4eef --- /dev/null +++ b/annotations_filtered/louBM-Mix7s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 18.87], [20.0, 21.51], [23.0, 24.49], [25.0, 32.63], [34.0, 34.45], [35.0, 35.24], [36.0, 36.8], [38.0, 38.6], [39.0, 40.24], [41.0, 43.06], [45.0, 46.53], [49.0, 49.5], [50.0, 50.3], [51.0, 60.66], [61.0, 61.96], [65.0, 65.1], [66.0, 65.72], [74.0, 73.82], [74.0, 74.73], [75.0, 79.03], [79.0, 79.69], [81.0, 80.79], [81.0, 80.84], [85.0, 85.95], [87.0, 87.25], [90.0, 90.75], [91.0, 91.86], [93.0, 93.41], [95.0, 95.05], [97.0, 97.44], [99.0, 99.47], [101.0, 101.9], [103.0, 105.46], [106.0, 106.03], [106.0, 107.03], [107.0, 107.86], [110.0, 110.03], [111.0, 111.33], [112.0, 112.85], [115.0, 115.89], [117.0, 120.18], [121.0, 121.31], [122.0, 123.04], [124.0, 125.54], [128.0, 129.14], [130.0, 131.25]], "keep_status": [true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [39.35, 0.0, 0.0, 32.14, 0.0, 0.0, 0.0, 0.0, 0.0, 95.09, 0.0, 0.0, 0.0, 37.97, 0.0, 0.0, 0.0, 0.0, 0.0, 32.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.54, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 31.85], ["speech", 23.27], ["radio", 12.16]], null, null, [["didgeridoo", 21.74], ["speech", 16.48], ["music", 12.97]], null, null, null, null, null, null, null, null, null, [["speech", 75.4], ["radio", 6.6], ["telephone", 4.2]], null, null, null, null, null, [["animal", 28.5], ["speech", 24.88], ["domestic animals, pets", 3.36]], null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 19.97], ["moo", 15.26], ["radio", 10.87]], null, null, null, null, null, null, null, [["music", 56.73], ["musical instrument", 13.87], ["synthesizer", 8.62]], null, null, null, null, null], "duration": [4.87, 1.51, 1.49, 7.63, 0.45, 0.24, 0.8, 0.6, 1.24, 2.06, 1.53, 0.5, 0.3, 9.66, 0.96, 0.1, -0.28, -0.18, 0.73, 4.03, 0.69, -0.21, -0.16, 0.95, 0.25, 0.75, 0.86, 0.41, 0.05, 0.44, 0.47, 0.9, 2.46, 0.03, 1.03, 0.86, 0.03, 0.33, 0.85, 0.89, 3.18, 0.31, 1.04, 1.54, 1.14, 1.25]} \ No newline at end of file diff --git a/annotations_filtered/lp0FOpFdWi8_filtered.json b/annotations_filtered/lp0FOpFdWi8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5f1844f901160c17ddf89d5f63deafc7186a3a8 --- /dev/null +++ b/annotations_filtered/lp0FOpFdWi8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.87], [14.0, 15.43], [18.0, 20.39], [22.0, 22.49], [23.0, 23.5], [25.0, 27.78], [29.0, 30.7], [35.0, 37.98], [39.0, 40.83], [41.0, 45.6], [46.0, 46.21], [49.0, 55.56], [60.0, 60.22], [68.0, 70.97], [75.0, 77.14], [78.0, 81.51], [83.0, 83.57], [85.0, 85.19], [91.0, 92.38], [95.0, 95.72], [97.0, 99.3], [100.0, 101.12], [102.0, 105.76], [106.0, 110.12], [111.0, 111.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.85, 0.0, 99.91, 0.0, 0.0, 100.0, 0.0, 89.19, 0.0, 98.01, 0.0, 95.37, 0.0, 99.44, 99.68, 97.92, 0.0, 0.0, 0.0, 0.0, 98.01, 0.0, 99.05, 83.16, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.87, 1.43, 2.39, 0.49, 0.5, 2.78, 1.7, 2.98, 1.83, 4.6, 0.21, 6.56, 0.22, 2.97, 2.14, 3.51, 0.57, 0.19, 1.38, 0.72, 2.3, 1.12, 3.76, 4.12, 0.94]} \ No newline at end of file diff --git a/annotations_filtered/lp1s4-tc2U0_filtered.json b/annotations_filtered/lp1s4-tc2U0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8367f17b85b9586d250ba7366ff90d3a9b9b7830 --- /dev/null +++ b/annotations_filtered/lp1s4-tc2U0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.67], [11.0, 12.38], [16.0, 18.3], [19.0, 55.95], [58.0, 66.82], [69.0, 141.81], [143.0, 160.47], [166.0, 184.89], [190.0, 216.4]], "keep_status": [false, false, true, false, false, false, true, false, false], "silence_prob": [30.21, 0.0, 30.27, 0.0, 30.65, 0.0, 30.08, 29.93, 31.64], "audiomae_on_audioset": [[["hum", 39.92], ["mains hum", 25.51], ["throbbing", 16.7]], null, [["music", 45.35], ["musical instrument", 6.68], ["thunk", 6.52]], null, [["music", 52.67], ["speech", 21.18], ["synthesizer", 7.76]], null, [["music", 51.42], ["speech", 9.2], ["synthesizer", 4.85]], [["music", 61.9], ["throbbing", 13.68], ["hum", 8.94]], [["hum", 33.6], ["music", 27.8], ["throbbing", 22.84]]], "duration": [4.67, 1.38, 2.3, 36.95, 8.82, 72.81, 17.47, 18.89, 26.4]} \ No newline at end of file diff --git a/annotations_filtered/lpod4qQzO7Q_filtered.json b/annotations_filtered/lpod4qQzO7Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ae15b605d58341bbeb7c79e955bc9f73cad6872 --- /dev/null +++ b/annotations_filtered/lpod4qQzO7Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 29.05], [33.0, 33.89], [36.0, 40.64]], "keep_status": [false, false, false], "silence_prob": [31.03, 0.0, 28.85], "audiomae_on_audioset": [[["music", 62.34], ["theremin", 5.55], ["speech", 5.14]], null, [["music", 36.58], ["mains hum", 28.2], ["hum", 9.61]]], "duration": [2.05, 0.89, 4.64]} \ No newline at end of file diff --git a/annotations_filtered/lpwrDEfCESg_filtered.json b/annotations_filtered/lpwrDEfCESg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b3335891237f995541638ccee712d441350cf563 --- /dev/null +++ b/annotations_filtered/lpwrDEfCESg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.67], [13.0, 12.97], [15.0, 15.35], [28.0, 29.42], [30.0, 50.67], [54.0, 59.93], [61.0, 61.13], [62.0, 63.14], [65.0, 72.45], [74.0, 77.13], [80.0, 80.74], [82.0, 84.5], [94.0, 95.42], [96.0, 97.33], [100.0, 100.62], [103.0, 104.84], [106.0, 108.03], [112.0, 115.32]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 33.06, 30.72, 0.0, 0.0, 43.35, 61.87, 0.0, 32.6, 0.0, 0.0, 0.0, 0.0, 60.89, 29.59], "audiomae_on_audioset": [null, null, null, null, [["speech", 29.65], ["music", 25.17], ["theremin", 24.12]], [["livestock, farm animals, working animals", 33.85], ["music", 13.51], ["animal", 13.01]], null, null, [["mains hum", 31.65], ["hum", 30.42], ["music", 12.82]], null, null, [["livestock, farm animals, working animals", 13.53], ["animal", 11.59], ["speech", 10.37]], null, null, null, null, null, [["speech", 22.51], ["cattle, bovinae", 7.4], ["fly, housefly", 7.23]]], "duration": [0.67, -0.03, 0.35, 1.42, 20.67, 5.93, 0.13, 1.14, 7.45, 3.13, 0.74, 2.5, 1.42, 1.33, 0.62, 1.84, 2.03, 3.32]} \ No newline at end of file diff --git a/annotations_filtered/lpyg94OzHK0_filtered.json b/annotations_filtered/lpyg94OzHK0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7484ef154c60cb5a1c0bb0577aed089481a38a29 --- /dev/null +++ b/annotations_filtered/lpyg94OzHK0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.8], [5.0, 10.79], [12.0, 12.23], [13.0, 14.17], [16.0, 17.91], [18.0, 18.0], [20.0, 20.8], [23.0, 23.94], [26.0, 27.3], [30.0, 30.91], [34.0, 34.67], [37.0, 38.48], [41.0, 42.67], [45.0, 46.84], [49.0, 50.5], [53.0, 54.26], [57.0, 57.81], [60.0, 61.38], [64.0, 64.84], [72.0, 76.69], [78.0, 82.51], [84.0, 87.25], [88.0, 88.65], [89.0, 93.28], [93.0, 95.22], [98.0, 98.61], [101.0, 101.83], [107.0, 124.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, true], "silence_prob": [0.0, 32.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.59, 99.1, 90.43, 0.0, 34.31, 49.87, 0.0, 0.0, 30.56], "audiomae_on_audioset": [null, [["speech", 71.92], ["sidetone", 4.77], ["noise", 4.71]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fart", 42.74], ["fly, housefly", 4.84], ["noise", 3.54]], [["music", 25.09], ["speech", 9.8], ["beatboxing", 8.74]], null, null, [["speech", 16.46], ["cacophony", 12.28], ["noise", 8.37]]], "duration": [0.8, 5.79, 0.23, 1.17, 1.91, 0.0, 0.8, 0.94, 1.3, 0.91, 0.67, 1.48, 1.67, 1.84, 1.5, 1.26, 0.81, 1.38, 0.84, 4.69, 4.51, 3.25, 0.65, 4.28, 2.22, 0.61, 0.83, 17.12]} \ No newline at end of file diff --git a/annotations_filtered/lqdyZpgCnXQ_filtered.json b/annotations_filtered/lqdyZpgCnXQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c92bb7c14446d1ce605c98de6a6801d0b163091 --- /dev/null +++ b/annotations_filtered/lqdyZpgCnXQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.0], [5.0, 5.56], [12.0, 13.19], [16.0, 16.63], [17.0, 16.66], [18.0, 19.53], [54.0, 54.48], [59.0, 59.51]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [1.0, 0.56, 1.19, 0.63, -0.34, 1.53, 0.48, 0.51]} \ No newline at end of file diff --git a/annotations_filtered/lqnKLTA2GVE_filtered.json b/annotations_filtered/lqnKLTA2GVE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..153ed7709e8a8a041394dabdb6736a06cd8281dc --- /dev/null +++ b/annotations_filtered/lqnKLTA2GVE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 45.23], [47.0, 48.46], [53.0, 53.79], [55.0, 67.73], [69.0, 70.02], [73.0, 148.96]], "keep_status": [false, false, false, true, false, false], "silence_prob": [58.64, 0.0, 0.0, 31.75, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 48.09], ["hum", 9.83], ["explosion", 6.36]], null, null], "duration": [9.23, 1.46, 0.79, 12.73, 1.02, 75.96]} \ No newline at end of file diff --git a/annotations_filtered/lr7pyggTmmY_filtered.json b/annotations_filtered/lr7pyggTmmY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..21ce3ba4353ac7bd245fd500f44dfd996d46ceeb --- /dev/null +++ b/annotations_filtered/lr7pyggTmmY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.32], [7.0, 7.23], [11.0, 14.15], [19.0, 19.82], [22.0, 23.09], [30.0, 31.36], [35.0, 35.7], [38.0, 38.01], [53.0, 54.94], [63.0, 66.31], [67.0, 67.9], [77.0, 78.11], [81.0, 88.48], [89.0, 90.51], [93.0, 98.51], [100.0, 100.82], [112.0, 121.37], [123.0, 137.37], [139.0, 141.3], [144.0, 149.64], [152.0, 153.22], [154.0, 156.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [99.71, 0.0, 99.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.82, 0.0, 0.0, 89.54, 0.0, 36.44, 0.0, 62.37, 46.4, 88.83, 33.04, 0.0, 33.49], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 45.73], ["beatboxing", 35.33], ["music", 2.72]], null, null, [["music", 40.49], ["insect", 7.25], ["singing bowl", 5.7]], null, [["music", 13.83], ["mains hum", 9.9], ["noise", 6.25]], null, [["throbbing", 29.31], ["music", 27.97], ["hum", 27.82]]], "duration": [2.32, 0.23, 3.15, 0.82, 1.09, 1.36, 0.7, 0.01, 1.94, 3.31, 0.9, 1.11, 7.48, 1.51, 5.51, 0.82, 9.37, 14.37, 2.3, 5.64, 1.22, 2.49]} \ No newline at end of file diff --git a/annotations_filtered/lrGIfJdbUHY_filtered.json b/annotations_filtered/lrGIfJdbUHY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e12b83194bff8466e34c6ecec0123709c6ffd58 --- /dev/null +++ b/annotations_filtered/lrGIfJdbUHY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.12], [10.0, 26.37], [27.0, 28.04], [32.0, 39.92], [41.0, 41.03], [42.0, 44.1], [45.0, 46.43], [49.0, 50.52], [54.0, 56.47], [66.0, 77.06], [78.0, 83.76], [84.0, 95.81], [97.0, 97.41], [98.0, 99.49], [107.0, 134.45]], "keep_status": [false, true, false, true, false, true, false, false, true, false, true, false, false, false, true], "silence_prob": [0.0, 31.68, 0.0, 31.22, 0.0, 32.66, 0.0, 0.0, 30.36, 33.89, 33.0, 31.06, 0.0, 0.0, 31.77], "audiomae_on_audioset": [null, [["music", 39.37], ["mosquito", 10.37], ["buzz", 7.89]], null, [["groan", 18.01], ["speech", 16.0], ["music", 10.05]], null, [["music", 51.45], ["speech", 11.16], ["radio", 7.24]], null, null, [["whale vocalization", 17.28], ["grunt", 10.36], ["music", 5.71]], [["whack, thwack", 33.93], ["music", 28.32], ["speech", 9.32]], [["music", 35.48], ["speech", 8.25], ["boing", 7.48]], [["speech", 61.92], ["music", 12.55], ["hum", 2.99]], null, null, [["mains hum", 22.33], ["music", 19.15], ["hum", 17.68]]], "duration": [1.12, 16.37, 1.04, 7.92, 0.03, 2.1, 1.43, 1.52, 2.47, 11.06, 5.76, 11.81, 0.41, 1.49, 27.45]} \ No newline at end of file diff --git a/annotations_filtered/lrhNPS4nbmQ_filtered.json b/annotations_filtered/lrhNPS4nbmQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..19402ea9c5a2cb41866fc478f5e3d11ec0a89339 --- /dev/null +++ b/annotations_filtered/lrhNPS4nbmQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.23], [5.0, 5.68], [8.0, 9.78], [11.0, 12.6], [18.0, 18.27], [20.0, 19.8], [21.0, 21.78], [24.0, 24.88], [26.0, 26.87], [28.0, 28.97], [31.0, 31.73], [48.0, 48.76], [61.0, 88.45], [90.0, 90.8], [92.0, 92.55], [94.0, 94.58], [96.0, 96.99], [99.0, 99.3], [102.0, 102.41], [105.0, 106.29], [108.0, 108.13], [114.0, 114.91], [119.0, 119.43], [122.0, 122.52], [123.0, 123.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 47.53], ["throbbing", 17.98], ["gong", 11.05]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.23, 0.68, 1.78, 1.6, 0.27, -0.2, 0.78, 0.88, 0.87, 0.97, 0.73, 0.76, 27.45, 0.8, 0.55, 0.58, 0.99, 0.3, 0.41, 1.29, 0.13, 0.91, 0.43, 0.52, 0.9]} \ No newline at end of file diff --git a/annotations_filtered/lsa5PDPgJmI_filtered.json b/annotations_filtered/lsa5PDPgJmI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e1ce03d5b9b2cb1f3f89c63df1675b497866560 --- /dev/null +++ b/annotations_filtered/lsa5PDPgJmI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.26], [6.0, 8.85], [10.0, 11.8], [13.0, 14.57], [26.0, 26.0], [33.0, 33.24], [34.0, 34.45], [36.0, 38.28], [40.0, 62.82]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.9, 0.0, 0.0, 0.0, 0.0, 0.0, 78.55, 35.54], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 61.53], ["throbbing", 19.75], ["hum", 8.28]]], "duration": [1.26, 2.85, 1.8, 1.57, 0.0, 0.24, 0.45, 2.28, 22.82]} \ No newline at end of file diff --git a/annotations_filtered/lscdNc0qTnI_filtered.json b/annotations_filtered/lscdNc0qTnI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e0b82cdebd7123d7d2360490013463563bfe1f5 --- /dev/null +++ b/annotations_filtered/lscdNc0qTnI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 18.5], [24.0, 37.12], [38.0, 40.53], [42.0, 42.63], [43.0, 81.84], [89.0, 91.25], [100.0, 101.82], [104.0, 105.9], [111.0, 112.83], [121.0, 122.69], [125.0, 126.87], [128.0, 129.36]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [49.92, 47.39, 51.34, 0.0, 0.0, 67.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 47.98], ["hum", 11.17], ["mains hum", 7.09]], [["music", 34.67], ["speech", 12.98], ["hum", 5.61]], null, null, null, null, null, null, null, null, null, null], "duration": [8.5, 13.12, 2.53, 0.63, 38.84, 2.25, 1.82, 1.9, 1.83, 1.69, 1.87, 1.36]} \ No newline at end of file diff --git a/annotations_filtered/lsmWjQdGHMI_filtered.json b/annotations_filtered/lsmWjQdGHMI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc75117444146fcdf36798292532199121d91715 --- /dev/null +++ b/annotations_filtered/lsmWjQdGHMI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.16], [12.0, 12.8], [14.0, 15.63], [20.0, 21.0], [23.0, 22.76], [23.0, 23.45], [26.0, 26.91], [29.0, 30.06], [35.0, 36.26], [37.0, 37.42], [38.0, 38.33], [40.0, 41.96], [44.0, 44.85], [48.0, 48.88], [51.0, 52.2], [55.0, 56.34], [57.0, 57.23], [60.0, 60.44], [62.0, 63.63], [65.0, 65.47], [66.0, 68.32], [72.0, 79.51], [81.0, 82.83], [84.0, 85.58], [87.0, 88.7], [91.0, 91.69], [94.0, 95.23], [96.0, 96.97], [98.0, 98.07], [99.0, 100.09], [101.0, 107.15], [108.0, 108.28], [109.0, 109.81], [112.0, 114.35], [119.0, 120.82], [121.0, 123.43], [124.0, 148.09], [149.0, 158.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.2, 59.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.78, 0.0, 0.0, 66.63, 0.0, 73.67, 68.67, 76.86], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 37.41], ["singing bowl", 8.06], ["wind instrument, woodwind instrument", 3.68]], null, null, null, null, null, null, null], "duration": [0.16, 0.8, 1.63, 1.0, -0.24, 0.45, 0.91, 1.06, 1.26, 0.42, 0.33, 1.96, 0.85, 0.88, 1.2, 1.34, 0.23, 0.44, 1.63, 0.47, 2.32, 7.51, 1.83, 1.58, 1.7, 0.69, 1.23, 0.97, 0.07, 1.09, 6.15, 0.28, 0.81, 2.35, 1.82, 2.43, 24.09, 9.79]} \ No newline at end of file diff --git a/annotations_filtered/lssQ4w2V4XM_filtered.json b/annotations_filtered/lssQ4w2V4XM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed741694a1fd17d89cc9e8929f24a435fe916fc8 --- /dev/null +++ b/annotations_filtered/lssQ4w2V4XM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.76], [11.0, 13.26], [26.0, 33.99], [37.0, 37.29], [38.0, 40.22], [42.0, 41.77], [42.0, 42.09], [42.0, 42.48], [42.0, 52.64], [68.0, 71.52], [82.0, 92.79], [97.0, 110.3], [115.0, 135.8], [137.0, 137.1]], "keep_status": [false, true, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 37.83, 32.02, 0.0, 32.88, 0.0, 0.0, 0.0, 31.92, 28.59, 30.35, 29.22, 29.39, 0.0], "audiomae_on_audioset": [null, [["hum", 23.53], ["mains hum", 17.34], ["music", 14.97]], [["music", 64.05], ["noise", 5.08], ["synthesizer", 3.5]], null, [["chant", 37.24], ["music", 32.1], ["choir", 7.28]], null, null, null, [["beatboxing", 75.94], ["vocal music", 13.56], ["music", 6.44]], [["music", 61.77], ["didgeridoo", 2.63], ["synthetic singing", 2.46]], [["music", 87.8], ["electronic music", 2.72], ["didgeridoo", 2.52]], [["music", 86.33], ["electronic music", 1.61], ["buzz", 0.88]], [["music", 55.93], ["beatboxing", 7.77], ["didgeridoo", 6.89]], null], "duration": [0.76, 2.26, 7.99, 0.29, 2.22, -0.23, 0.09, 0.48, 10.64, 3.52, 10.79, 13.3, 20.8, 0.1]} \ No newline at end of file diff --git a/annotations_filtered/lsxZwAnu8LQ_filtered.json b/annotations_filtered/lsxZwAnu8LQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2081a1b3db7aabd37e81543a50704b7abc68167a --- /dev/null +++ b/annotations_filtered/lsxZwAnu8LQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 14.23], [15.0, 15.69], [17.0, 23.41], [33.0, 33.12], [41.0, 41.93], [52.0, 51.93], [61.0, 64.08], [67.0, 79.02], [80.0, 97.17], [97.0, 97.75], [103.0, 121.91], [122.0, 122.86], [124.0, 124.43]], "keep_status": [false, false, true, false, false, false, false, true, false, false, true, false, false], "silence_prob": [65.09, 0.0, 33.59, 0.0, 0.0, 0.0, 99.91, 46.86, 69.61, 0.0, 36.95, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 25.5], ["whack, thwack", 10.01], ["explosion", 6.91]], null, null, null, null, [["explosion", 12.9], ["burst, pop", 10.96], ["firecracker", 10.3]], null, null, [["music", 23.35], ["hum", 15.2], ["didgeridoo", 14.05]], null, null], "duration": [3.23, 0.69, 6.41, 0.12, 0.93, -0.07, 3.08, 12.02, 17.17, 0.75, 18.91, 0.86, 0.43]} \ No newline at end of file diff --git a/annotations_filtered/lt3h5Ez9t4g_filtered.json b/annotations_filtered/lt3h5Ez9t4g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ed92b66e887e915090218c2c272e3a936366085 --- /dev/null +++ b/annotations_filtered/lt3h5Ez9t4g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.78], [9.0, 8.78], [28.0, 29.39], [32.0, 33.59], [35.0, 36.09], [41.0, 41.37], [45.0, 46.79], [58.0, 60.76], [73.0, 74.87], [77.0, 77.25], [80.0, 80.59], [84.0, 84.48], [87.0, 87.45], [89.0, 90.19], [93.0, 93.61], [95.0, 95.55], [98.0, 100.09], [102.0, 104.84], [106.0, 106.17], [109.0, 113.59], [114.0, 114.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.23, 38.22, 0.0, 40.64, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["boing", 42.36], ["speech", 8.92], ["sound effect", 7.0]], null, [["music", 33.43], ["bleat", 22.82], ["sheep", 12.06]], null], "duration": [1.78, -0.22, 1.39, 1.59, 1.09, 0.37, 1.79, 2.76, 1.87, 0.25, 0.59, 0.48, 0.45, 1.19, 0.61, 0.55, 2.09, 2.84, 0.17, 4.59, 0.91]} \ No newline at end of file diff --git a/annotations_filtered/ltY3ZLA6dA8_filtered.json b/annotations_filtered/ltY3ZLA6dA8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7611ad235c2326e405a2b86e6b38550deaad6a9d --- /dev/null +++ b/annotations_filtered/ltY3ZLA6dA8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 29.56], [31.0, 31.28], [40.0, 42.31], [43.0, 49.42], [57.0, 57.25], [58.0, 66.77], [69.0, 68.88], [69.0, 72.1], [73.0, 73.85], [75.0, 86.66], [89.0, 89.02], [93.0, 96.77], [100.0, 108.35], [111.0, 111.92], [119.0, 122.07]], "keep_status": [true, false, false, true, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [34.0, 0.0, 69.61, 38.45, 0.0, 36.75, 0.0, 52.62, 0.0, 36.06, 0.0, 41.1, 35.3, 0.0, 35.62], "audiomae_on_audioset": [[["music", 29.82], ["throbbing", 22.06], ["hum", 13.1]], null, null, [["hum", 32.96], ["music", 24.57], ["mains hum", 9.85]], null, [["music", 49.43], ["speech", 26.35], ["boing", 2.95]], null, null, null, [["music", 72.03], ["throbbing", 5.07], ["sitar", 3.98]], null, [["music", 55.05], ["musical instrument", 9.04], ["guitar", 7.41]], [["music", 31.68], ["throbbing", 15.04], ["hum", 8.19]], null, [["music", 47.53], ["didgeridoo", 16.72], ["speech", 14.75]]], "duration": [21.56, 0.28, 2.31, 6.42, 0.25, 8.77, -0.12, 3.1, 0.85, 11.66, 0.02, 3.77, 8.35, 0.92, 3.07]} \ No newline at end of file diff --git a/annotations_filtered/ltmHZiXkb9c_filtered.json b/annotations_filtered/ltmHZiXkb9c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/ltmHZiXkb9c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/ltwRv-C1EFQ_filtered.json b/annotations_filtered/ltwRv-C1EFQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..90107dce722390dced485a12f4f2f3e9936ee6c1 --- /dev/null +++ b/annotations_filtered/ltwRv-C1EFQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.83], [7.0, 9.26], [12.0, 19.48], [21.0, 21.71], [24.0, 25.93], [29.0, 30.38], [34.0, 34.82], [38.0, 40.09], [41.0, 42.08], [47.0, 49.18], [53.0, 53.42], [54.0, 56.84], [58.0, 60.17], [62.0, 63.95]], "keep_status": [false, true, true, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 34.02, 36.29, 0.0, 0.0, 0.0, 0.0, 37.33, 0.0, 90.43, 0.0, 88.83, 59.42, 0.0], "audiomae_on_audioset": [null, [["speech", 44.47], ["sidetone", 7.04], ["radio", 6.75]], [["cattle, bovinae", 17.04], ["speech", 12.27], ["whack, thwack", 11.34]], null, null, null, null, [["sidetone", 30.88], ["speech", 15.89], ["chirp tone", 9.37]], null, null, null, null, null, null], "duration": [0.83, 2.26, 7.48, 0.71, 1.93, 1.38, 0.82, 2.09, 1.08, 2.18, 0.42, 2.84, 2.17, 1.95]} \ No newline at end of file diff --git a/annotations_filtered/lu2-RuTwlto_filtered.json b/annotations_filtered/lu2-RuTwlto_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f58a33fbe7516e9ab61cdeedeabf58d2ff9272d --- /dev/null +++ b/annotations_filtered/lu2-RuTwlto_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 45.0], [60.0, 62.36], [79.0, 79.12], [79.0, 79.15], [81.0, 82.73], [88.0, 92.53], [94.0, 94.63], [95.0, 98.05], [98.0, 99.57], [100.0, 100.74], [102.0, 102.56], [103.0, 104.23], [106.0, 116.48], [119.0, 124.7], [130.0, 133.71], [151.0, 151.02], [169.0, 169.6]], "keep_status": [true, true, false, false, false, true, false, true, false, false, false, false, true, true, true, false, false], "silence_prob": [31.68, 30.55, 0.0, 0.0, 0.0, 31.84, 0.0, 31.66, 0.0, 0.0, 0.0, 0.0, 31.82, 31.84, 32.27, 0.0, 0.0], "audiomae_on_audioset": [[["music", 39.2], ["speech", 5.89], ["boing", 5.84]], [["speech", 39.17], ["music", 21.44], ["cacophony", 4.93]], null, null, null, [["speech", 51.05], ["music", 9.01], ["basketball bounce", 5.98]], null, [["music", 22.34], ["throbbing", 11.66], ["smash, crash", 7.92]], null, null, null, null, [["music", 26.54], ["speech", 13.2], ["buzz", 9.81]], [["sidetone", 28.91], ["speech", 25.05], ["music", 13.89]], [["music", 18.07], ["civil defense siren", 16.11], ["theremin", 9.24]], null, null], "duration": [20.0, 2.36, 0.12, 0.15, 1.73, 4.53, 0.63, 3.05, 1.57, 0.74, 0.56, 1.23, 10.48, 5.7, 3.71, 0.02, 0.6]} \ No newline at end of file diff --git a/annotations_filtered/lu9yr0xefYQ_filtered.json b/annotations_filtered/lu9yr0xefYQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d83e4147934601e9f61aa923b80c951c61d38eec --- /dev/null +++ b/annotations_filtered/lu9yr0xefYQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.03], [8.0, 10.07], [19.0, 19.3], [20.0, 22.65], [24.0, 26.81], [27.0, 31.46], [32.0, 34.91], [36.0, 39.51], [43.0, 43.23], [46.0, 51.87], [52.0, 51.95], [52.0, 53.47], [54.0, 55.63], [57.0, 57.48], [58.0, 59.73], [61.0, 62.16], [63.0, 63.27], [64.0, 63.98], [80.0, 80.94], [85.0, 86.05], [87.0, 87.51], [92.0, 92.65], [96.0, 96.69], [102.0, 104.53], [106.0, 106.81], [108.0, 108.11], [114.0, 114.78]], "keep_status": [false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 41.32, 0.0, 68.41, 49.59, 34.7, 44.78, 60.42, 0.0, 65.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.47, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 50.92], ["radio", 18.79], ["music", 10.77]], null, null, [["speech", 65.63], ["radio", 13.44], ["noise", 4.19]], [["speech", 40.82], ["music", 15.84], ["theremin", 10.72]], [["speech", 28.33], ["siren", 12.23], ["pulse", 8.21]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.03, 2.07, 0.3, 2.65, 2.81, 4.46, 2.91, 3.51, 0.23, 5.87, -0.05, 1.47, 1.63, 0.48, 1.73, 1.16, 0.27, -0.02, 0.94, 1.05, 0.51, 0.65, 0.69, 2.53, 0.81, 0.11, 0.78]} \ No newline at end of file diff --git a/annotations_filtered/luF2eyiYlyE_filtered.json b/annotations_filtered/luF2eyiYlyE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..76852dd699186b0d3ce167d6a9aaa870f938029b --- /dev/null +++ b/annotations_filtered/luF2eyiYlyE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.97], [7.0, 7.1], [8.0, 8.41], [13.0, 13.34], [15.0, 15.16], [17.0, 18.4], [20.0, 21.64], [22.0, 22.52], [23.0, 23.21], [24.0, 24.16], [34.0, 38.62], [40.0, 40.49], [41.0, 53.08], [58.0, 57.84], [58.0, 58.55], [60.0, 60.17], [62.0, 62.33], [67.0, 67.34], [68.0, 68.55], [91.0, 92.69], [106.0, 106.71], [116.0, 116.87], [120.0, 120.38], [122.0, 121.78], [122.0, 123.01], [147.0, 150.15], [151.0, 151.26], [154.0, 154.25], [156.0, 156.68], [159.0, 159.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.47, 0.0, 34.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.74, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 40.51], ["brass instrument", 8.58], ["speech", 7.49]], null, [["music", 31.13], ["theremin", 23.8], ["speech", 14.83]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 45.2], ["theremin", 13.29], ["musical instrument", 6.13]], null, null, null, null], "duration": [-0.03, 0.1, 0.41, 0.34, 0.16, 1.4, 1.64, 0.52, 0.21, 0.16, 4.62, 0.49, 12.08, -0.16, 0.55, 0.17, 0.33, 0.34, 0.55, 1.69, 0.71, 0.87, 0.38, -0.22, 1.01, 3.15, 0.26, 0.25, 0.68, 0.26]} \ No newline at end of file diff --git a/annotations_filtered/lufECeWtN34_filtered.json b/annotations_filtered/lufECeWtN34_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e9190e5f85f96bef8dd0ce661fbc00a3020b590 --- /dev/null +++ b/annotations_filtered/lufECeWtN34_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.86], [7.0, 80.42], [82.0, 110.37]], "keep_status": [false, false, true], "silence_prob": [0.0, 0.0, 30.58], "audiomae_on_audioset": [null, null, [["music", 47.93], ["hum", 6.19], ["sound effect", 4.44]]], "duration": [0.86, 73.42, 28.37]} \ No newline at end of file diff --git a/annotations_filtered/luhE1BFZN9U_filtered.json b/annotations_filtered/luhE1BFZN9U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02d0473d895d4e335f8cdec37bc57464deb65f48 --- /dev/null +++ b/annotations_filtered/luhE1BFZN9U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 16.71], [17.0, 18.94], [21.0, 22.69], [23.0, 24.92], [26.0, 27.78], [29.0, 32.05], [33.0, 35.88], [36.0, 39.26], [40.0, 45.67], [47.0, 48.54], [50.0, 53.54], [54.0, 78.66], [79.0, 85.78], [86.0, 113.64], [114.0, 121.29], [122.0, 122.45]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, true, true, false, false], "silence_prob": [72.9, 0.0, 0.0, 0.0, 0.0, 99.87, 69.34, 72.46, 44.04, 0.0, 97.11, 30.37, 30.9, 33.72, 84.62, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 28.02], ["frog", 23.56], ["croak", 11.95]], null, null, [["speech", 42.33], ["sine wave", 28.55], ["sidetone", 6.74]], [["speech", 30.86], ["heart sounds, heartbeat", 12.0], ["throbbing", 6.15]], [["whack, thwack", 32.06], ["speech", 12.35], ["hum", 7.11]], null, null], "duration": [14.71, 1.94, 1.69, 1.92, 1.78, 3.05, 2.88, 3.26, 5.67, 1.54, 3.54, 24.66, 6.78, 27.64, 7.29, 0.45]} \ No newline at end of file diff --git a/annotations_filtered/luuYRrPaEpM_filtered.json b/annotations_filtered/luuYRrPaEpM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d89525cb853f6c84f50f64bf99c3c1edea84f95 --- /dev/null +++ b/annotations_filtered/luuYRrPaEpM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 25.81], [27.0, 27.11], [31.0, 32.53], [33.0, 42.67], [43.0, 65.62], [68.0, 76.44], [77.0, 83.94], [85.0, 119.69], [121.0, 122.1], [124.0, 124.78], [126.0, 146.87], [152.0, 153.45]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [52.92, 0.0, 0.0, 34.44, 32.18, 64.86, 36.49, 0.0, 0.0, 0.0, 32.89, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 30.48], ["throbbing", 23.89], ["hum", 18.24]], [["music", 35.58], ["speech", 28.19], ["vehicle", 7.8]], null, [["speech", 51.04], ["sine wave", 9.86], ["music", 8.79]], null, null, null, [["hum", 40.28], ["mains hum", 20.96], ["noise", 10.06]], null], "duration": [17.81, 0.11, 1.53, 9.67, 22.62, 8.44, 6.94, 34.69, 1.1, 0.78, 20.87, 1.45]} \ No newline at end of file diff --git a/annotations_filtered/luylsO8UlhE_filtered.json b/annotations_filtered/luylsO8UlhE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..37de0203050377d63fc4e2c35e3d6a87a50f68f8 --- /dev/null +++ b/annotations_filtered/luylsO8UlhE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.19], [21.0, 23.77], [26.0, 26.38], [28.0, 28.14], [29.0, 31.51], [34.0, 34.35], [38.0, 38.79], [46.0, 45.64], [46.0, 57.45], [59.0, 61.77], [62.0, 64.72], [65.0, 67.19], [68.0, 69.55], [71.0, 75.03], [76.0, 81.31], [85.0, 86.21], [88.0, 88.67], [91.0, 91.86], [95.0, 95.5], [96.0, 96.63], [99.0, 99.62], [102.0, 102.03], [110.0, 110.93], [112.0, 112.62], [120.0, 121.71], [123.0, 124.48], [125.0, 127.01], [130.0, 131.21], [132.0, 133.79], [137.0, 139.24], [140.0, 141.3], [142.0, 143.24], [144.0, 144.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 68.15, 0.0, 0.0, 87.37, 0.0, 0.0, 0.0, 99.78, 99.97, 96.42, 95.09, 0.0, 85.9, 99.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.35, 0.0, 0.0, 94.81, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.19, 2.77, 0.38, 0.14, 2.51, 0.35, 0.79, -0.36, 11.45, 2.77, 2.72, 2.19, 1.55, 4.03, 5.31, 1.21, 0.67, 0.86, 0.5, 0.63, 0.62, 0.03, 0.93, 0.62, 1.71, 1.48, 2.01, 1.21, 1.79, 2.24, 1.3, 1.24, 0.83]} \ No newline at end of file diff --git a/annotations_filtered/lv_LfXcjWew_filtered.json b/annotations_filtered/lv_LfXcjWew_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..839f021f2ebda29bd826145fb5cdca52094563d3 --- /dev/null +++ b/annotations_filtered/lv_LfXcjWew_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.69], [4.0, 5.44], [7.0, 8.53], [10.0, 19.92], [22.0, 25.88], [30.0, 33.45], [35.0, 40.83], [45.0, 60.78], [66.0, 105.48], [106.0, 107.81], [109.0, 110.64], [111.0, 114.89]], "keep_status": [false, false, false, true, true, true, true, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 34.16, 46.57, 43.0, 30.1, 31.2, 0.0, 0.0, 0.0, 40.92], "audiomae_on_audioset": [null, null, null, [["white noise", 10.78], ["buzz", 10.74], ["hum", 10.04]], [["throbbing", 32.44], ["hum", 25.83], ["mains hum", 8.54]], [["eruption", 18.02], ["hum", 9.49], ["speech", 7.57]], [["hum", 26.9], ["mains hum", 15.4], ["throbbing", 10.51]], [["hum", 7.99], ["music", 7.08], ["speech", 5.1]], null, null, null, [["speech", 11.98], ["hum", 9.63], ["music", 9.55]]], "duration": [0.69, 1.44, 1.53, 9.92, 3.88, 3.45, 5.83, 15.78, 39.48, 1.81, 1.64, 3.89]} \ No newline at end of file diff --git a/annotations_filtered/lwfuUyTMpVY_filtered.json b/annotations_filtered/lwfuUyTMpVY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca934fa10fd0cf88862487e35687e48d2f254481 --- /dev/null +++ b/annotations_filtered/lwfuUyTMpVY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.24], [8.0, 9.09], [9.0, 10.79], [11.0, 12.46], [14.0, 15.08], [17.0, 22.27], [23.0, 23.72], [34.0, 34.33], [35.0, 34.87], [36.0, 36.68], [42.0, 43.19], [45.0, 50.67], [51.0, 52.73], [55.0, 54.9], [59.0, 60.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 92.97, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.24, 1.09, 1.79, 1.46, 1.08, 5.27, 0.72, 0.33, -0.13, 0.68, 1.19, 5.67, 1.73, -0.1, 1.32]} \ No newline at end of file diff --git a/annotations_filtered/lwhQK2kDfBM_filtered.json b/annotations_filtered/lwhQK2kDfBM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97fb58e43c4068ce80871c2f57aae043e74d865f --- /dev/null +++ b/annotations_filtered/lwhQK2kDfBM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.08], [22.0, 22.74], [24.0, 24.92], [50.0, 50.53], [55.0, 55.32], [63.0, 63.12], [65.0, 72.57], [74.0, 74.53], [75.0, 77.16], [78.0, 81.23], [88.0, 98.76], [106.0, 106.57], [108.0, 118.17], [125.0, 127.89], [130.0, 131.13]], "keep_status": [false, false, false, false, false, false, true, false, true, true, true, false, true, true, false], "silence_prob": [42.74, 0.0, 0.0, 0.0, 0.0, 0.0, 41.05, 0.0, 37.04, 30.81, 30.21, 0.0, 29.9, 31.92, 0.0], "audiomae_on_audioset": [[["music", 35.36], ["speech", 34.54], ["didgeridoo", 4.3]], null, null, null, null, null, [["music", 27.61], ["speech", 15.56], ["crushing", 11.7]], null, [["music", 41.5], ["livestock, farm animals, working animals", 8.58], ["moo", 6.47]], [["music", 36.83], ["throbbing", 13.6], ["hum", 12.28]], [["music", 28.07], ["sidetone", 20.41], ["speech", 14.59]], null, [["music", 24.04], ["hum", 18.88], ["mains hum", 15.49]], [["music", 47.22], ["guitar", 7.73], ["speech", 6.41]], null], "duration": [2.08, 0.74, 0.92, 0.53, 0.32, 0.12, 7.57, 0.53, 2.16, 3.23, 10.76, 0.57, 10.17, 2.89, 1.13]} \ No newline at end of file diff --git a/annotations_filtered/lwkdeQQiCms_filtered.json b/annotations_filtered/lwkdeQQiCms_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d62e56376dcd29da285e11d4ee169c1003acaff --- /dev/null +++ b/annotations_filtered/lwkdeQQiCms_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.04], [9.0, 10.08], [12.0, 12.55], [14.0, 14.47], [16.0, 17.34], [18.0, 19.04], [21.0, 22.45], [25.0, 26.91], [28.0, 28.66], [34.0, 39.39], [44.0, 44.52], [46.0, 46.82], [50.0, 52.59], [68.0, 68.01], [82.0, 82.48], [84.0, 84.27], [101.0, 102.15], [106.0, 106.29], [110.0, 111.01], [112.0, 112.48], [118.0, 117.98], [120.0, 123.28], [124.0, 124.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 97.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.04, 1.08, 0.55, 0.47, 1.34, 1.04, 1.45, 1.91, 0.66, 5.39, 0.52, 0.82, 2.59, 0.01, 0.48, 0.27, 1.15, 0.29, 1.01, 0.48, -0.02, 3.28, 0.5]} \ No newline at end of file diff --git a/annotations_filtered/lwo1GnbKOW8_filtered.json b/annotations_filtered/lwo1GnbKOW8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..536acba99628a2f68e401679d46b92d012d24e47 --- /dev/null +++ b/annotations_filtered/lwo1GnbKOW8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 9.88], [13.0, 13.68], [15.0, 15.11], [16.0, 16.71], [19.0, 19.4], [21.0, 21.76], [23.0, 23.45], [24.0, 24.06], [25.0, 26.22], [32.0, 32.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [-0.12, 0.68, 0.11, 0.71, 0.4, 0.76, 0.45, 0.06, 1.22, 0.78]} \ No newline at end of file diff --git a/annotations_filtered/lwruhQqFttU_filtered.json b/annotations_filtered/lwruhQqFttU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..308446a7d5509ae70f256b5fc478eb5e80495c93 --- /dev/null +++ b/annotations_filtered/lwruhQqFttU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.75], [19.0, 21.24], [22.0, 45.2], [46.0, 49.62], [54.0, 54.33], [56.0, 62.51], [64.0, 68.57], [70.0, 72.79], [74.0, 74.26], [75.0, 77.33], [84.0, 119.91], [123.0, 123.4]], "keep_status": [false, false, false, false, false, true, true, false, false, true, false, false], "silence_prob": [0.0, 32.72, 75.55, 36.31, 0.0, 33.58, 31.15, 33.12, 0.0, 35.74, 0.0, 0.0], "audiomae_on_audioset": [null, [["theremin", 77.68], ["music", 14.39], ["musical instrument", 1.42]], null, [["hum", 51.85], ["throbbing", 11.02], ["music", 8.39]], null, [["speech", 42.26], ["gong", 8.21], ["chirp tone", 7.5]], [["music", 35.08], ["chirp tone", 15.94], ["electronic music", 8.47]], [["throbbing", 38.17], ["hum", 30.07], ["mains hum", 5.73]], null, [["music", 14.87], ["effects unit", 10.07], ["distortion", 5.69]], null, null], "duration": [0.75, 2.24, 23.2, 3.62, 0.33, 6.51, 4.57, 2.79, 0.26, 2.33, 35.91, 0.4]} \ No newline at end of file diff --git a/annotations_filtered/lxKvt5Z9Bok_filtered.json b/annotations_filtered/lxKvt5Z9Bok_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1517d9b0ed47f67e817e099f2c1fa74cd07b2b3e --- /dev/null +++ b/annotations_filtered/lxKvt5Z9Bok_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[136.0, 138.92], [141.0, 144.05]], "keep_status": [false, false], "silence_prob": [31.12, 31.98], "audiomae_on_audioset": [[["music", 49.83], ["musical instrument", 13.57], ["synthesizer", 10.94]], [["music", 55.63], ["hum", 13.74], ["synthesizer", 4.34]]], "duration": [2.92, 3.05]} \ No newline at end of file diff --git a/annotations_filtered/lxOV0MYBpeI_filtered.json b/annotations_filtered/lxOV0MYBpeI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..44178fd55fdcbaf33feab0aaef81ec926e675d7d --- /dev/null +++ b/annotations_filtered/lxOV0MYBpeI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 19.2], [21.0, 21.37], [23.0, 23.35], [30.0, 35.41], [37.0, 38.03], [39.0, 39.6], [40.0, 40.54], [44.0, 44.29], [45.0, 45.2], [45.0, 46.58], [48.0, 49.1], [50.0, 50.38], [51.0, 51.7], [53.0, 55.14], [58.0, 58.24], [66.0, 65.79], [67.0, 67.68], [72.0, 72.47], [73.0, 73.6], [75.0, 75.0], [77.0, 77.36], [87.0, 87.44], [89.0, 89.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [35.72, 0.0, 0.0, 35.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 53.5], ["didgeridoo", 13.34], ["speech", 11.7]], null, null, [["music", 45.25], ["didgeridoo", 24.8], ["speech", 12.46]], null, null, null, null, null, null, null, null, null, [["speech", 27.49], ["music", 19.52], ["fart", 8.47]], null, null, null, null, null, null, null, null, null], "duration": [2.2, 0.37, 0.35, 5.41, 1.03, 0.6, 0.54, 0.29, 0.2, 1.58, 1.1, 0.38, 0.7, 2.14, 0.24, -0.21, 0.68, 0.47, 0.6, 0.0, 0.36, 0.44, 0.23]} \ No newline at end of file diff --git a/annotations_filtered/lxQj06LN31A_filtered.json b/annotations_filtered/lxQj06LN31A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8bedfb93b3d15565289be22812fb6aab222840e8 --- /dev/null +++ b/annotations_filtered/lxQj06LN31A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.4], [8.0, 8.29]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [1.4, 0.29]} \ No newline at end of file diff --git a/annotations_filtered/lxlwKE2-3fg_filtered.json b/annotations_filtered/lxlwKE2-3fg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4bf80349ea0c2934f2b054014d9f96b1186aae91 --- /dev/null +++ b/annotations_filtered/lxlwKE2-3fg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 9.22], [10.0, 14.15], [21.0, 21.98], [22.0, 23.79], [24.0, 24.36], [29.0, 30.48], [33.0, 36.05], [36.0, 49.25], [56.0, 57.27], [61.0, 60.76], [61.0, 64.29], [65.0, 67.37], [72.0, 72.5], [80.0, 86.1], [87.0, 86.81], [87.0, 87.52], [88.0, 88.94], [91.0, 90.91], [103.0, 103.23], [121.0, 121.22], [122.0, 122.61], [126.0, 127.11], [129.0, 130.44], [138.0, 139.62], [141.0, 142.28]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [42.26, 100.0, 0.0, 0.0, 0.0, 0.0, 97.33, 98.1, 0.0, 0.0, 65.44, 71.72, 0.0, 83.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 25.95], ["animal", 14.14], ["fart", 7.65]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.22, 4.15, 0.98, 1.79, 0.36, 1.48, 3.05, 13.25, 1.27, -0.24, 3.29, 2.37, 0.5, 6.1, -0.19, 0.52, 0.94, -0.09, 0.23, 0.22, 0.61, 1.11, 1.44, 1.62, 1.28]} \ No newline at end of file diff --git a/annotations_filtered/lyM65FpQLlM_filtered.json b/annotations_filtered/lyM65FpQLlM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9abf89c0bcbf9866e5c5fcc22faf546136efba9 --- /dev/null +++ b/annotations_filtered/lyM65FpQLlM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.49], [5.0, 6.22], [8.0, 7.94], [13.0, 14.76], [16.0, 20.68], [21.0, 23.85], [25.0, 28.58], [30.0, 32.88], [35.0, 35.58], [37.0, 37.4], [40.0, 42.18], [45.0, 77.57], [80.0, 91.05], [96.0, 107.45], [110.0, 125.41], [126.0, 128.24], [129.0, 129.98], [134.0, 134.57], [136.0, 136.27], [137.0, 137.42], [138.0, 140.61], [141.0, 149.94], [152.0, 163.24], [168.0, 171.49], [172.0, 172.66], [173.0, 181.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 98.44, 78.04, 99.16, 86.27, 0.0, 0.0, 70.44, 0.0, 34.6, 32.13, 30.49, 79.94, 0.0, 0.0, 0.0, 0.0, 42.15, 68.02, 54.43, 54.63, 0.0, 64.63], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.36], ["ambient music", 29.84], ["synthesizer", 5.99]], [["music", 58.48], ["theremin", 8.7], ["ambient music", 6.87]], [["music", 47.92], ["speech", 9.81], ["mains hum", 8.98]], null, null, null, null, null, [["music", 61.61], ["effects unit", 10.54], ["synthesizer", 3.49]], null, null, null, null, null], "duration": [0.49, 1.22, -0.06, 1.76, 4.68, 2.85, 3.58, 2.88, 0.58, 0.4, 2.18, 32.57, 11.05, 11.45, 15.41, 2.24, 0.98, 0.57, 0.27, 0.42, 2.61, 8.94, 11.24, 3.49, 0.66, 8.53]} \ No newline at end of file diff --git a/annotations_filtered/lyQ1m8xbJW0_filtered.json b/annotations_filtered/lyQ1m8xbJW0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a581744d5384ac6f7ac6482760da5aa1c4a0c8bb --- /dev/null +++ b/annotations_filtered/lyQ1m8xbJW0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 13.81], [20.0, 19.7], [20.0, 20.07], [24.0, 24.66], [25.0, 25.52], [28.0, 28.71], [33.0, 33.32], [46.0, 46.16], [49.0, 49.72], [66.0, 66.34], [67.0, 68.23], [72.0, 71.91], [73.0, 73.33], [77.0, 109.16], [112.0, 128.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.46], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 66.63], ["boing", 8.06], ["speech", 2.26]]], "duration": [-0.19, -0.3, 0.07, 0.66, 0.52, 0.71, 0.32, 0.16, 0.72, 0.34, 1.23, -0.09, 0.33, 32.16, 16.14]} \ No newline at end of file diff --git a/annotations_filtered/lyd4tC8LH1s_filtered.json b/annotations_filtered/lyd4tC8LH1s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f3fb4bc6099d0ad066ece7f729649187f16183cf --- /dev/null +++ b/annotations_filtered/lyd4tC8LH1s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.3], [7.0, 21.98], [23.0, 22.99], [24.0, 32.29], [35.0, 52.61], [54.0, 57.32], [58.0, 57.94], [69.0, 69.03], [70.0, 73.77], [75.0, 78.27], [78.0, 78.41], [78.0, 78.92], [87.0, 87.98], [89.0, 107.08], [112.0, 116.33], [118.0, 118.35]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, false, true, true, false], "silence_prob": [0.0, 30.75, 0.0, 30.85, 31.02, 89.9, 0.0, 0.0, 30.97, 32.28, 0.0, 0.0, 0.0, 36.0, 33.77, 0.0], "audiomae_on_audioset": [null, [["speech", 59.56], ["beatboxing", 17.26], ["didgeridoo", 5.96]], null, [["fart", 48.01], ["speech", 19.38], ["whack, thwack", 8.39]], [["speech", 57.36], ["whack, thwack", 12.23], ["music", 4.98]], null, null, null, [["breaking", 21.08], ["smash, crash", 17.8], ["speech", 9.76]], [["speech", 33.14], ["boing", 27.27], ["music", 9.56]], null, null, null, [["ding", 14.64], ["speech", 12.63], ["animal", 8.53]], [["beatboxing", 32.25], ["speech", 24.09], ["music", 13.37]], null], "duration": [0.3, 14.98, -0.01, 8.29, 17.61, 3.32, -0.06, 0.03, 3.77, 3.27, 0.41, 0.92, 0.98, 18.08, 4.33, 0.35]} \ No newline at end of file diff --git a/annotations_filtered/lyu3QUjAFtw_filtered.json b/annotations_filtered/lyu3QUjAFtw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c54fa0f2d4a6efdd5659aade0400dc8ddc923901 --- /dev/null +++ b/annotations_filtered/lyu3QUjAFtw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.52], [30.0, 34.45], [36.0, 37.89], [44.0, 44.19], [45.0, 46.74], [49.0, 49.94], [55.0, 59.27], [68.0, 71.52], [86.0, 87.07], [97.0, 101.11], [104.0, 105.0], [108.0, 109.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 43.98, 0.0, 0.0, 0.0, 0.0, 41.5, 60.23, 0.0, 54.17, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 57.93], ["theremin", 7.72], ["chant", 6.01]], null, null, null, null, [["music", 63.51], ["theremin", 5.16], ["chant", 4.89]], null, null, null, null, null], "duration": [0.52, 4.45, 1.89, 0.19, 1.74, 0.94, 4.27, 3.52, 1.07, 4.11, 1.0, 1.22]} \ No newline at end of file diff --git a/annotations_filtered/lyuwBW9lNa8_filtered.json b/annotations_filtered/lyuwBW9lNa8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec6e56ae4f2078816faa22a3bd0879f7f52ae34d --- /dev/null +++ b/annotations_filtered/lyuwBW9lNa8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 56.69], [58.0, 60.96], [62.0, 67.02], [68.0, 74.01], [77.0, 78.33], [83.0, 86.95], [88.0, 93.88], [95.0, 95.61], [96.0, 98.46], [99.0, 100.31], [102.0, 109.44], [110.0, 109.68], [110.0, 109.71], [110.0, 118.02], [119.0, 130.1], [130.0, 132.54]], "keep_status": [false, false, true, false, false, false, true, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 52.16, 48.74, 55.53, 0.0, 69.47, 42.88, 0.0, 37.62, 0.0, 29.21, 0.0, 0.0, 32.76, 96.89, 98.1], "audiomae_on_audioset": [null, null, [["music", 49.55], ["singing bowl", 10.95], ["ambient music", 4.29]], null, null, null, [["music", 47.68], ["synthesizer", 5.48], ["musical instrument", 3.89]], null, [["music", 64.62], ["guitar", 11.84], ["effects unit", 8.16]], null, [["music", 37.41], ["effects unit", 8.42], ["reverberation", 7.38]], null, null, [["neigh, whinny", 59.2], ["horse", 13.02], ["animal", 4.94]], null, null], "duration": [55.69, 2.96, 5.02, 6.01, 1.33, 3.95, 5.88, 0.61, 2.46, 1.31, 7.44, -0.32, -0.29, 8.02, 11.1, 2.54]} \ No newline at end of file diff --git a/annotations_filtered/lyvAjZw6O_Q_filtered.json b/annotations_filtered/lyvAjZw6O_Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9dcdb290d01ef74b576d2ded650424e49712bc3f --- /dev/null +++ b/annotations_filtered/lyvAjZw6O_Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.57], [6.0, 7.65], [17.0, 18.03], [21.0, 22.06], [26.0, 27.14], [29.0, 29.83], [31.0, 32.95], [39.0, 39.53], [42.0, 42.57], [46.0, 46.84], [52.0, 52.12], [53.0, 53.7], [55.0, 55.81], [58.0, 60.39], [61.0, 62.4], [63.0, 64.08], [68.0, 68.94], [79.0, 81.5], [85.0, 85.77], [88.0, 88.79], [107.0, 107.91], [114.0, 114.51], [117.0, 117.53], [121.0, 121.68], [123.0, 123.99], [126.0, 129.86], [130.0, 131.41], [134.0, 135.58], [141.0, 141.93], [144.0, 144.53], [146.0, 147.16], [150.0, 151.77], [153.0, 154.28], [155.0, 160.71], [162.0, 162.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.0, 0.0, 0.0, 0.0, 99.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.57, 1.65, 1.03, 1.06, 1.14, 0.83, 1.95, 0.53, 0.57, 0.84, 0.12, 0.7, 0.81, 2.39, 1.4, 1.08, 0.94, 2.5, 0.77, 0.79, 0.91, 0.51, 0.53, 0.68, 0.99, 3.86, 1.41, 1.58, 0.93, 0.53, 1.16, 1.77, 1.28, 5.71, 0.97]} \ No newline at end of file diff --git a/annotations_filtered/lz98akbX_NE_filtered.json b/annotations_filtered/lz98akbX_NE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13a8cd681423f61f9befff951f9b4c2a060ca85b --- /dev/null +++ b/annotations_filtered/lz98akbX_NE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 14.13], [15.0, 105.73], [109.0, 108.87], [110.0, 123.09], [124.0, 129.24], [136.0, 136.58], [138.0, 140.41], [142.0, 142.84], [143.0, 148.27], [153.0, 153.64], [156.0, 156.12], [158.0, 158.18], [160.0, 175.93], [178.0, 180.98]], "keep_status": [false, false, false, true, false, false, false, false, true, false, false, false, true, false], "silence_prob": [91.64, 0.0, 0.0, 29.37, 51.55, 0.0, 88.46, 0.0, 35.79, 0.0, 0.0, 0.0, 38.72, 73.82], "audiomae_on_audioset": [null, null, null, [["echo", 47.53], ["whale vocalization", 12.16], ["speech", 7.15]], null, null, null, null, [["noise", 19.25], ["radio", 12.87], ["buzz", 6.14]], null, null, null, [["gurgling", 18.71], ["squish", 9.55], ["music", 9.32]], null], "duration": [7.13, 90.73, -0.13, 13.09, 5.24, 0.58, 2.41, 0.84, 5.27, 0.64, 0.12, 0.18, 15.93, 2.98]} \ No newline at end of file diff --git a/annotations_filtered/lzJV7k-LiC4_filtered.json b/annotations_filtered/lzJV7k-LiC4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1de9428acb7b78f858750a44cff3c9a892bb11e0 --- /dev/null +++ b/annotations_filtered/lzJV7k-LiC4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.63], [1.0, 0.75], [7.0, 10.71], [11.0, 13.85], [22.0, 29.88], [31.0, 32.51], [35.0, 36.31], [37.0, 37.3], [38.0, 49.62], [54.0, 55.48], [58.0, 58.72], [61.0, 65.18], [68.0, 70.5], [74.0, 77.65], [81.0, 83.56], [89.0, 90.41], [93.0, 93.88], [98.0, 104.38], [106.0, 113.53], [116.0, 143.23], [148.0, 154.68]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 52.62, 55.18, 32.07, 0.0, 0.0, 0.0, 92.97, 0.0, 0.0, 79.76, 53.4, 49.45, 69.88, 0.0, 0.0, 32.68, 31.63, 31.07, 30.91], "audiomae_on_audioset": [null, null, null, null, [["boing", 27.29], ["speech", 19.04], ["whack, thwack", 10.15]], null, null, null, null, null, null, null, null, [["music", 60.86], ["lullaby", 4.02], ["musical instrument", 3.83]], null, null, null, [["music", 71.18], ["synthesizer", 2.38], ["singing", 2.04]], [["music", 68.38], ["singing", 2.87], ["throbbing", 2.0]], [["music", 71.19], ["singing", 3.92], ["pop music", 2.94]], [["speech", 37.48], ["music", 23.49], ["fart", 6.01]]], "duration": [-0.37, -0.25, 3.71, 2.85, 7.88, 1.51, 1.31, 0.3, 11.62, 1.48, 0.72, 4.18, 2.5, 3.65, 2.56, 1.41, 0.88, 6.38, 7.53, 27.23, 6.68]} \ No newline at end of file diff --git a/annotations_filtered/lzo2hgdDUDw_filtered.json b/annotations_filtered/lzo2hgdDUDw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..be46567604352748e8eba3524a4d2299a7a9f3a5 --- /dev/null +++ b/annotations_filtered/lzo2hgdDUDw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.21], [10.0, 14.15], [19.0, 35.4], [38.0, 38.69], [39.0, 39.6], [40.0, 45.0], [47.0, 67.78], [71.0, 91.83]], "keep_status": [false, true, true, false, false, false, true, false], "silence_prob": [0.0, 48.91, 42.0, 0.0, 0.0, 59.51, 36.45, 38.66], "audiomae_on_audioset": [null, [["fly, housefly", 21.48], ["speech", 16.96], ["insect", 10.99]], [["speech", 32.72], ["buzz", 14.25], ["fly, housefly", 6.07]], null, null, null, [["speech", 30.11], ["fly, housefly", 17.37], ["insect", 11.65]], [["music", 64.57], ["didgeridoo", 13.46], ["speech", 3.5]]], "duration": [1.21, 4.15, 16.4, 0.69, 0.6, 5.0, 20.78, 20.83]} \ No newline at end of file diff --git a/annotations_filtered/m-1vkYcqRRw_filtered.json b/annotations_filtered/m-1vkYcqRRw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4b9d4245630fc9714b91883b8c00bcd40643682d --- /dev/null +++ b/annotations_filtered/m-1vkYcqRRw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.06], [21.0, 29.2], [31.0, 33.05], [36.0, 41.23], [50.0, 50.9], [52.0, 53.4], [58.0, 58.95], [61.0, 68.84], [72.0, 72.39], [73.0, 73.31], [74.0, 89.67], [93.0, 100.16], [102.0, 105.12], [106.0, 107.03], [108.0, 114.1], [115.0, 124.09], [125.0, 128.12]], "keep_status": [false, true, true, true, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 36.38, 43.48, 47.98, 0.0, 0.0, 0.0, 40.01, 0.0, 0.0, 51.12, 39.07, 84.8, 0.0, 71.14, 71.72, 91.3], "audiomae_on_audioset": [null, [["vehicle", 12.93], ["music", 12.35], ["hum", 8.38]], [["hum", 23.2], ["mains hum", 20.6], ["pulse", 6.22]], [["music", 36.26], ["noise", 12.25], ["hum", 6.68]], null, null, null, [["sidetone", 76.22], ["speech", 7.52], ["radio", 2.76]], null, null, null, [["fly, housefly", 12.14], ["electric shaver, electric razor", 11.88], ["music", 11.38]], null, null, null, null, null], "duration": [0.06, 8.2, 2.05, 5.23, 0.9, 1.4, 0.95, 7.84, 0.39, 0.31, 15.67, 7.16, 3.12, 1.03, 6.1, 9.09, 3.12]} \ No newline at end of file diff --git a/annotations_filtered/m-2WmcLl_PQ_filtered.json b/annotations_filtered/m-2WmcLl_PQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa9c363c2742ff788a0c09592a8f54bbef84cd97 --- /dev/null +++ b/annotations_filtered/m-2WmcLl_PQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.9], [4.0, 4.28], [6.0, 6.99], [10.0, 11.28], [12.0, 55.76], [58.0, 89.61], [92.0, 138.32], [140.0, 179.36], [180.0, 179.98]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.9, 0.28, 0.99, 1.28, 43.76, 31.61, 46.32, 39.36, -0.02]} \ No newline at end of file diff --git a/annotations_filtered/m-3Ohq-bVFA_filtered.json b/annotations_filtered/m-3Ohq-bVFA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f622398d75c5cf1f38eaf2ec077484ebd21fde12 --- /dev/null +++ b/annotations_filtered/m-3Ohq-bVFA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.49], [14.0, 15.8], [19.0, 20.61], [21.0, 23.28], [25.0, 26.42], [30.0, 30.99], [33.0, 33.84], [35.0, 36.09], [38.0, 39.55], [41.0, 42.38], [44.0, 45.2], [48.0, 49.05], [51.0, 54.45], [55.0, 57.2], [58.0, 59.29], [61.0, 61.16], [63.0, 62.85], [75.0, 79.83], [90.0, 91.2], [92.0, 94.02], [95.0, 96.25], [97.0, 100.21], [102.0, 102.19], [105.0, 106.62]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [31.73, 0.0, 0.0, 34.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.35, 31.11, 0.0, 0.0, 0.0, 35.37, 0.0, 31.81, 0.0, 83.52, 0.0, 0.0], "audiomae_on_audioset": [[["music", 57.9], ["electronic music", 10.75], ["speech", 7.83]], null, null, [["music", 48.57], ["speech", 14.65], ["electronic music", 3.62]], null, null, null, null, null, null, null, null, [["music", 50.72], ["ambient music", 9.9], ["electronic music", 9.71]], [["music", 51.38], ["hum", 14.83], ["sonar", 6.87]], null, null, null, [["music", 54.78], ["telephone bell ringing", 15.38], ["telephone", 11.98]], null, [["gong", 35.51], ["music", 17.23], ["musical instrument", 9.99]], null, null, null, null], "duration": [2.49, 1.8, 1.61, 2.28, 1.42, 0.99, 0.84, 1.09, 1.55, 1.38, 1.2, 1.05, 3.45, 2.2, 1.29, 0.16, -0.15, 4.83, 1.2, 2.02, 1.25, 3.21, 0.19, 1.62]} \ No newline at end of file diff --git a/annotations_filtered/m-ETkZmPNiM_filtered.json b/annotations_filtered/m-ETkZmPNiM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..870861f1971ed86c643857470c2f5f50662c60dc --- /dev/null +++ b/annotations_filtered/m-ETkZmPNiM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.86], [18.0, 18.6], [24.0, 24.07], [33.0, 33.67], [36.0, 36.44], [40.0, 42.89], [43.0, 44.34], [47.0, 47.93], [48.0, 48.9], [50.0, 50.77], [53.0, 59.81], [64.0, 64.35], [65.0, 65.94], [68.0, 71.32], [73.0, 93.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.88, 0.0, 0.0, 0.0, 0.0, 99.71, 0.0, 0.0, 100.0, 51.34], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.86, 0.6, 0.07, 0.67, 0.44, 2.89, 1.34, 0.93, 0.9, 0.77, 6.81, 0.35, 0.94, 3.32, 20.23]} \ No newline at end of file diff --git a/annotations_filtered/m-L3k3ElIQE_filtered.json b/annotations_filtered/m-L3k3ElIQE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..275a324f794abbacdeccf33770ef94949fb880c7 --- /dev/null +++ b/annotations_filtered/m-L3k3ElIQE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.32], [9.0, 10.98], [16.0, 16.43], [20.0, 20.34], [31.0, 31.78], [34.0, 33.99], [37.0, 37.96], [41.0, 41.82], [46.0, 46.08], [47.0, 47.16], [51.0, 50.99], [66.0, 67.66], [70.0, 71.49], [75.0, 75.71], [81.0, 84.65], [86.0, 87.08], [89.0, 89.41], [91.0, 91.03], [91.0, 102.22], [104.0, 105.65], [115.0, 116.75], [119.0, 121.69], [131.0, 132.95], [139.0, 140.75], [142.0, 143.23], [145.0, 145.74], [148.0, 149.72], [158.0, 157.99], [159.0, 160.79], [164.0, 165.75], [168.0, 168.98], [170.0, 171.36], [172.0, 172.81], [180.0, 180.49], [190.0, 191.81]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.72, 0.0, 0.0, 0.0, 38.1, 0.0, 0.0, 79.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 68.47], ["sidetone", 10.06], ["sine wave", 2.32]], null, null, null, [["hum", 43.08], ["mains hum", 25.94], ["speech", 13.45]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.32, 1.98, 0.43, 0.34, 0.78, -0.01, 0.96, 0.82, 0.08, 0.16, -0.01, 1.66, 1.49, 0.71, 3.65, 1.08, 0.41, 0.03, 11.22, 1.65, 1.75, 2.69, 1.95, 1.75, 1.23, 0.74, 1.72, -0.01, 1.79, 1.75, 0.98, 1.36, 0.81, 0.49, 1.81]} \ No newline at end of file diff --git a/annotations_filtered/m-OaVzrf_vc_filtered.json b/annotations_filtered/m-OaVzrf_vc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c888a40ee30afb85c19fab9f9b840898a947e7f --- /dev/null +++ b/annotations_filtered/m-OaVzrf_vc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.6], [6.0, 6.88], [11.0, 13.12], [15.0, 15.7], [22.0, 23.41], [25.0, 26.6], [29.0, 30.16], [34.0, 37.56], [51.0, 52.54], [53.0, 55.32], [59.0, 66.16], [70.0, 72.18], [74.0, 78.24], [79.0, 79.84], [81.0, 81.77], [84.0, 84.42], [87.0, 91.27], [92.0, 95.28], [97.0, 97.24], [98.0, 97.98], [102.0, 102.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 100.0, 96.89, 100.0, 0.0, 0.0, 0.0, 99.62, 72.46, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.6, 0.88, 2.12, 0.7, 1.41, 1.6, 1.16, 3.56, 1.54, 2.32, 7.16, 2.18, 4.24, 0.84, 0.77, 0.42, 4.27, 3.28, 0.24, -0.02, 0.47]} \ No newline at end of file diff --git a/annotations_filtered/m-PsCZ_57MY_filtered.json b/annotations_filtered/m-PsCZ_57MY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c6d28ad14484d731ed290d7d669a6417d858c3ff --- /dev/null +++ b/annotations_filtered/m-PsCZ_57MY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.59], [5.0, 6.84], [8.0, 13.56], [15.0, 15.57], [16.0, 17.46], [18.0, 19.14], [27.0, 28.14], [33.0, 34.35], [36.0, 36.21], [37.0, 38.47], [39.0, 40.05], [41.0, 43.11], [44.0, 45.5], [49.0, 54.6], [55.0, 59.36], [61.0, 60.93], [62.0, 62.72], [67.0, 67.22], [68.0, 76.27], [77.0, 78.31], [84.0, 85.02], [92.0, 98.69], [103.0, 104.35], [108.0, 109.29], [112.0, 111.99], [118.0, 117.78], [125.0, 127.14], [128.0, 128.92], [130.0, 130.3], [133.0, 138.0], [141.0, 160.14], [164.0, 173.2], [175.0, 175.0]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, true, false, true, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 29.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.09, 0.0, 29.32, 29.74, 0.0, 0.0, 0.0, 28.97, 0.0, 0.0, 29.77, 0.0, 0.0, 0.0, 0.0, 30.42, 0.0, 0.0, 29.75, 28.39, 29.02, 0.0], "audiomae_on_audioset": [null, null, [["music", 51.86], ["hum", 7.53], ["synthesizer", 7.02]], null, null, null, null, null, null, null, null, [["whoosh, swoosh, swish", 18.02], ["rumble", 14.96], ["whack, thwack", 14.12]], null, [["mains hum", 25.35], ["music", 16.09], ["hum", 15.37]], [["rumble", 14.62], ["hum", 9.17], ["mains hum", 8.6]], null, null, null, [["speech", 66.48], ["hum", 10.55], ["mains hum", 4.29]], null, null, [["music", 54.46], ["whale vocalization", 14.94], ["stomach rumble", 7.78]], null, null, null, null, [["frog", 18.78], ["throbbing", 13.77], ["croak", 13.07]], null, null, [["music", 49.56], ["speech", 20.01], ["throbbing", 2.22]], [["speech", 27.03], ["rumble", 19.25], ["music", 12.91]], [["music", 42.43], ["hum", 22.61], ["mains hum", 8.98]], null], "duration": [0.59, 1.84, 5.56, 0.57, 1.46, 1.14, 1.14, 1.35, 0.21, 1.47, 1.05, 2.11, 1.5, 5.6, 4.36, -0.07, 0.72, 0.22, 8.27, 1.31, 1.02, 6.69, 1.35, 1.29, -0.01, -0.22, 2.14, 0.92, 0.3, 5.0, 19.14, 9.2, 0.0]} \ No newline at end of file diff --git a/annotations_filtered/m-YWYdwcexU_filtered.json b/annotations_filtered/m-YWYdwcexU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a013d87c6b3de4894a86d698a3a13debcfd36b3 --- /dev/null +++ b/annotations_filtered/m-YWYdwcexU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.91], [21.0, 25.76], [27.0, 28.05], [29.0, 30.82], [32.0, 34.53], [35.0, 36.32], [37.0, 38.04], [39.0, 39.78], [46.0, 48.84], [50.0, 50.43], [52.0, 53.86], [60.0, 61.23], [64.0, 64.37], [71.0, 71.04], [74.0, 75.3], [76.0, 77.48], [121.0, 121.15], [122.0, 122.69], [126.0, 127.82]], "keep_status": [false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 44.32, 0.0, 0.0, 33.32, 0.0, 0.0, 0.0, 45.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 39.89], ["mains hum", 30.44], ["music", 6.99]], null, null, [["sidetone", 38.89], ["speech", 15.41], ["whale vocalization", 4.86]], null, null, null, [["fly, housefly", 16.55], ["music", 14.98], ["insect", 13.8]], null, null, null, null, null, null, null, null, null, null], "duration": [0.91, 4.76, 1.05, 1.82, 2.53, 1.32, 1.04, 0.78, 2.84, 0.43, 1.86, 1.23, 0.37, 0.04, 1.3, 1.48, 0.15, 0.69, 1.82]} \ No newline at end of file diff --git a/annotations_filtered/m03MTJCH0Ns_filtered.json b/annotations_filtered/m03MTJCH0Ns_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fdc4a89929d50a9b493e00bbeac057b07625b8cd --- /dev/null +++ b/annotations_filtered/m03MTJCH0Ns_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.75], [25.0, 25.46], [29.0, 30.27], [35.0, 40.76], [43.0, 43.36], [52.0, 53.03]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 98.8, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.75, 0.46, 1.27, 5.76, 0.36, 1.03]} \ No newline at end of file diff --git a/annotations_filtered/m0DbfOnOBQo_filtered.json b/annotations_filtered/m0DbfOnOBQo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..423c7726876ef6434971b68fc9219f5e5512c1c5 --- /dev/null +++ b/annotations_filtered/m0DbfOnOBQo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 27.3], [28.0, 48.03], [48.0, 89.45], [90.0, 90.09], [91.0, 100.48], [102.0, 105.0], [106.0, 147.11], [148.0, 151.12], [155.0, 161.59], [163.0, 163.58], [164.0, 175.0], [179.0, 180.5], [182.0, 182.51], [183.0, 183.57], [187.0, 189.19]], "keep_status": [false, true, false, false, false, true, false, true, true, false, true, false, false, false, true], "silence_prob": [100.0, 30.48, 0.0, 0.0, 29.39, 35.11, 0.0, 35.87, 35.2, 0.0, 30.79, 0.0, 0.0, 0.0, 32.7], "audiomae_on_audioset": [null, [["speech", 26.76], ["fly, housefly", 13.96], ["music", 11.18]], null, null, [["music", 67.6], ["whack, thwack", 4.18], ["sound effect", 3.09]], [["creak", 41.38], ["music", 13.57], ["hum", 7.6]], null, [["speech", 54.76], ["livestock, farm animals, working animals", 8.77], ["roaring cats (lions, tigers)", 5.46]], [["music", 19.95], ["animal", 19.28], ["wild animals", 7.54]], null, [["music", 22.72], ["animal", 19.01], ["hum", 13.3]], null, null, null, [["music", 36.37], ["speech", 12.12], ["hum", 10.85]]], "duration": [4.3, 20.03, 41.45, 0.09, 9.48, 3.0, 41.11, 3.12, 6.59, 0.58, 11.0, 1.5, 0.51, 0.57, 2.19]} \ No newline at end of file diff --git a/annotations_filtered/m0XrO4YJyeI_filtered.json b/annotations_filtered/m0XrO4YJyeI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f87c945b44cff4ce434fea30693f229c34d26b70 --- /dev/null +++ b/annotations_filtered/m0XrO4YJyeI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.71], [10.0, 11.91], [13.0, 15.04], [20.0, 20.6], [30.0, 30.57], [32.0, 32.34], [33.0, 33.76], [39.0, 39.85], [48.0, 53.57], [56.0, 64.62], [69.0, 68.81], [69.0, 74.04], [78.0, 81.21], [93.0, 95.12], [107.0, 114.44], [115.0, 116.73], [124.0, 124.55]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 36.2, 0.0, 0.0, 0.0, 0.0, 0.0, 45.18, 33.42, 0.0, 40.29, 44.78, 71.14, 34.52, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 63.52], ["speech", 11.62], ["throbbing", 2.82]], null, null, null, null, null, [["singing bowl", 14.62], ["arrow", 13.62], ["music", 9.13]], [["music", 59.08], ["speech", 14.57], ["throbbing", 3.72]], null, [["music", 28.06], ["boing", 17.9], ["mosquito", 3.76]], [["speech", 31.18], ["music", 21.88], ["grunt", 1.91]], null, [["music", 60.38], ["chant", 8.85], ["effects unit", 3.3]], null, null], "duration": [0.71, 1.91, 2.04, 0.6, 0.57, 0.34, 0.76, 0.85, 5.57, 8.62, -0.19, 5.04, 3.21, 2.12, 7.44, 1.73, 0.55]} \ No newline at end of file diff --git a/annotations_filtered/m0etOugqkPU_filtered.json b/annotations_filtered/m0etOugqkPU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..99f31956df5cab3263c42640bd8cf9e3773feb97 --- /dev/null +++ b/annotations_filtered/m0etOugqkPU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.65], [15.0, 16.02], [25.0, 40.64], [58.0, 66.5], [68.0, 68.71], [70.0, 77.89], [80.0, 83.37], [90.0, 98.98], [117.0, 118.59], [123.0, 127.04], [127.0, 128.58], [135.0, 138.97], [143.0, 148.54], [149.0, 155.55], [157.0, 159.0], [167.0, 168.0]], "keep_status": [false, false, false, true, false, false, true, true, false, false, false, true, true, false, true, false], "silence_prob": [0.0, 0.0, 29.87, 30.45, 0.0, 31.57, 31.03, 31.92, 0.0, 34.49, 0.0, 36.25, 33.45, 30.73, 31.25, 0.0], "audiomae_on_audioset": [null, null, [["music", 81.99], ["didgeridoo", 1.89], ["carnatic music", 1.52]], [["speech", 25.6], ["music", 22.64], ["mosquito", 5.51]], null, [["speech", 55.38], ["hum", 9.58], ["music", 9.37]], [["music", 52.4], ["speech", 11.99], ["electronic music", 2.68]], [["fly, housefly", 21.8], ["music", 11.27], ["livestock, farm animals, working animals", 10.15]], null, [["music", 38.56], ["speech", 30.61], ["musical instrument", 2.6]], null, [["music", 38.67], ["speech", 15.64], ["hum", 3.91]], [["music", 56.4], ["didgeridoo", 5.35], ["drum and bass", 4.78]], [["music", 77.63], ["hum", 3.55], ["electronic music", 2.71]], [["music", 46.3], ["speech", 14.24], ["boing", 3.74]], null], "duration": [-0.35, 1.02, 15.64, 8.5, 0.71, 7.89, 3.37, 8.98, 1.59, 4.04, 1.58, 3.97, 5.54, 6.55, 2.0, 1.0]} \ No newline at end of file diff --git a/annotations_filtered/m0z6-iFR-S8_filtered.json b/annotations_filtered/m0z6-iFR-S8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc3ccd48b67e82c2cef773f2827a08a9fa65346d --- /dev/null +++ b/annotations_filtered/m0z6-iFR-S8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.81], [19.0, 19.82], [45.0, 45.82], [50.0, 50.48], [52.0, 52.73], [67.0, 67.53], [73.0, 74.29], [83.0, 83.17], [85.0, 86.02], [88.0, 88.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.81, 0.82, 0.82, 0.48, 0.73, 0.53, 1.29, 0.17, 1.02, 0.65]} \ No newline at end of file diff --git a/annotations_filtered/m1JgMM8b9_w_filtered.json b/annotations_filtered/m1JgMM8b9_w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e52913a84901615120cb277b4e6405dadf1bf5a8 --- /dev/null +++ b/annotations_filtered/m1JgMM8b9_w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 26.37], [29.0, 29.98], [30.0, 32.43], [33.0, 36.44], [38.0, 39.23], [42.0, 43.21], [49.0, 49.17], [50.0, 50.85], [56.0, 59.48], [61.0, 61.86], [64.0, 67.93], [70.0, 81.26], [82.0, 83.74], [85.0, 89.67], [91.0, 93.55], [95.0, 96.16], [98.0, 100.52], [102.0, 102.86], [104.0, 105.43], [106.0, 108.4], [110.0, 110.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 52.68, 70.72, 0.0, 0.0, 0.0, 0.0, 77.36, 0.0, 86.27, 39.34, 0.0, 56.4, 94.52, 0.0, 82.07, 0.0, 0.0, 66.27, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 81.77], ["hum", 2.4], ["musical instrument", 1.96]], null, null, null, null, null, null, null, null, null], "duration": [0.37, 0.98, 2.43, 3.44, 1.23, 1.21, 0.17, 0.85, 3.48, 0.86, 3.93, 11.26, 1.74, 4.67, 2.55, 1.16, 2.52, 0.86, 1.43, 2.4, 0.86]} \ No newline at end of file diff --git a/annotations_filtered/m1p-vJzqPKw_filtered.json b/annotations_filtered/m1p-vJzqPKw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ffb64ae10b36f2d88ea5f0f072974228d8934914 --- /dev/null +++ b/annotations_filtered/m1p-vJzqPKw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.11], [17.0, 16.65], [17.0, 17.0], [18.0, 57.89], [60.0, 59.95], [61.0, 76.49], [80.0, 86.36], [88.0, 158.35]], "keep_status": [false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 41.4, 30.77, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 53.99], ["mains hum", 12.26], ["speech", 12.12]], [["speech", 37.07], ["explosion", 12.25], ["rumble", 10.12]], null], "duration": [1.11, -0.35, 0.0, 39.89, -0.05, 15.49, 6.36, 70.35]} \ No newline at end of file diff --git a/annotations_filtered/m1t9QOSYqYM_filtered.json b/annotations_filtered/m1t9QOSYqYM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..346caa2a6561e14ef914cde34ddfea33b9fbf4e2 --- /dev/null +++ b/annotations_filtered/m1t9QOSYqYM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 14.99], [16.0, 16.78], [18.0, 18.54], [21.0, 22.01], [28.0, 28.61], [31.0, 32.41], [33.0, 42.94], [44.0, 44.58], [52.0, 52.41], [55.0, 55.59], [59.0, 58.97], [60.0, 70.11], [72.0, 85.94], [89.0, 91.49], [93.0, 93.16], [94.0, 94.73], [96.0, 97.28], [99.0, 99.81], [101.0, 101.34], [104.0, 103.99], [105.0, 106.64], [110.0, 111.43], [112.0, 111.77], [112.0, 117.91], [119.0, 121.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [33.51, 0.0, 0.0, 0.0, 0.0, 0.0, 56.63, 0.0, 0.0, 0.0, 0.0, 33.72, 95.09, 97.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.62, 43.64], "audiomae_on_audioset": [[["speech", 80.1], ["synthesizer", 2.74], ["thunk", 2.06]], null, null, null, null, null, null, null, null, null, null, [["speech", 80.88], ["whack, thwack", 2.53], ["hum", 1.41]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 88.11], ["inside, small room", 2.66], ["inside, large room or hall", 1.47]], [["fly, housefly", 5.3], ["animal", 4.61], ["frog", 4.38]]], "duration": [5.99, 0.78, 0.54, 1.01, 0.61, 1.41, 9.94, 0.58, 0.41, 0.59, -0.03, 10.11, 13.94, 2.49, 0.16, 0.73, 1.28, 0.81, 0.34, -0.01, 1.64, 1.43, -0.23, 5.91, 2.2]} \ No newline at end of file diff --git a/annotations_filtered/m2REqMDEXNU_filtered.json b/annotations_filtered/m2REqMDEXNU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..87ee84aaabaf9b0fb2147a9bf792c278430c59ad --- /dev/null +++ b/annotations_filtered/m2REqMDEXNU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 12.45], [14.0, 16.26], [17.0, 17.46], [19.0, 28.58], [30.0, 31.83], [33.0, 34.23], [35.0, 35.9], [39.0, 39.24], [42.0, 42.15], [45.0, 49.11], [50.0, 53.05], [55.0, 57.54], [60.0, 70.48], [73.0, 76.79], [80.0, 80.2], [82.0, 83.79], [86.0, 86.7], [87.0, 91.25], [94.0, 94.73], [99.0, 100.13], [101.0, 102.44], [110.0, 113.39], [117.0, 117.32], [120.0, 120.04], [127.0, 128.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [88.83, 65.09, 0.0, 89.54, 0.0, 0.0, 0.0, 0.0, 0.0, 82.25, 97.43, 96.77, 62.27, 100.0, 0.0, 0.0, 0.0, 99.94, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [11.45, 2.26, 0.46, 9.58, 1.83, 1.23, 0.9, 0.24, 0.15, 4.11, 3.05, 2.54, 10.48, 3.79, 0.2, 1.79, 0.7, 4.25, 0.73, 1.13, 1.44, 3.39, 0.32, 0.04, 1.51]} \ No newline at end of file diff --git a/annotations_filtered/m2cUbp6Vkfs_filtered.json b/annotations_filtered/m2cUbp6Vkfs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..61a66372793f6680982e73ced7638fcae88bcd8b --- /dev/null +++ b/annotations_filtered/m2cUbp6Vkfs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 17.37], [19.0, 18.71], [19.0, 25.07], [32.0, 32.16], [33.0, 43.93], [47.0, 59.59], [60.0, 61.64], [64.0, 84.67], [92.0, 98.04], [98.0, 104.23], [116.0, 148.1], [172.0, 172.88]], "keep_status": [false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [32.51, 0.0, 32.93, 0.0, 32.93, 33.38, 0.0, 32.86, 32.67, 33.1, 0.0, 0.0], "audiomae_on_audioset": [[["music", 68.92], ["musical instrument", 8.12], ["synthesizer", 4.06]], null, [["music", 59.2], ["trombone", 13.41], ["musical instrument", 3.79]], null, [["music", 79.1], ["trombone", 7.86], ["musical instrument", 2.97]], [["music", 66.46], ["musical instrument", 8.16], ["trombone", 3.7]], null, [["vehicle", 13.26], ["car", 10.39], ["race car, auto racing", 9.77]], [["music", 64.6], ["musical instrument", 6.1], ["effects unit", 5.97]], [["music", 42.05], ["musical instrument", 10.69], ["didgeridoo", 8.85]], null, null], "duration": [6.37, -0.29, 6.07, 0.16, 10.93, 12.59, 1.64, 20.67, 6.04, 6.23, 32.1, 0.88]} \ No newline at end of file diff --git a/annotations_filtered/m2giPgQXSn4_filtered.json b/annotations_filtered/m2giPgQXSn4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ee4dcf33bb86445fbaaf49ed754112eb4fb24d83 --- /dev/null +++ b/annotations_filtered/m2giPgQXSn4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.75], [8.0, 8.6], [16.0, 16.73], [20.0, 21.32], [23.0, 23.41], [25.0, 26.54], [30.0, 33.62], [37.0, 38.77], [42.0, 43.17], [45.0, 45.25], [48.0, 47.63], [48.0, 49.03], [55.0, 54.84], [62.0, 62.38], [66.0, 67.02], [78.0, 77.97], [79.0, 79.61], [84.0, 85.11], [91.0, 91.22], [93.0, 93.53], [104.0, 104.57], [115.0, 115.21], [121.0, 121.29], [128.0, 128.44], [130.0, 130.35], [131.0, 131.92], [132.0, 132.87], [135.0, 135.63], [139.0, 139.01], [142.0, 142.62], [145.0, 147.02], [148.0, 149.79], [154.0, 155.17], [157.0, 162.35], [164.0, 166.51], [168.0, 170.02]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.6, 0.0, 0.0, 34.59, 31.53, 31.19], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 50.36], ["synthesizer", 6.55], ["radio", 5.75]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 48.39], ["whale vocalization", 34.61], ["speech", 6.61]], [["music", 30.98], ["percussion", 8.46], ["speech", 7.21]], [["sidetone", 65.52], ["speech", 20.38], ["radio", 2.97]]], "duration": [-0.25, 0.6, 0.73, 1.32, 0.41, 1.54, 3.62, 1.77, 1.17, 0.25, -0.37, 1.03, -0.16, 0.38, 1.02, -0.03, 0.61, 1.11, 0.22, 0.53, 0.57, 0.21, 0.29, 0.44, 0.35, 0.92, 0.87, 0.63, 0.01, 0.62, 2.02, 1.79, 1.17, 5.35, 2.51, 2.02]} \ No newline at end of file diff --git a/annotations_filtered/m2tk7RatWsk_filtered.json b/annotations_filtered/m2tk7RatWsk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4983cc731a5a5639596ea0bd7e95b6772f895b67 --- /dev/null +++ b/annotations_filtered/m2tk7RatWsk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 14.12], [15.0, 17.98], [19.0, 19.23], [20.0, 64.25], [68.0, 76.91], [78.0, 92.72], [99.0, 112.7], [115.0, 118.94]], "keep_status": [false, false, false, false, true, false, true, true], "silence_prob": [40.09, 52.39, 0.0, 0.0, 46.97, 61.57, 30.27, 33.92], "audiomae_on_audioset": [[["hum", 49.05], ["mains hum", 22.73], ["music", 12.74]], null, null, null, [["hum", 20.94], ["mains hum", 20.15], ["rumble", 15.72]], null, [["hum", 18.17], ["speech", 10.66], ["mains hum", 9.7]], [["music", 28.05], ["throbbing", 12.93], ["hum", 11.46]]], "duration": [7.12, 2.98, 0.23, 44.25, 8.91, 14.72, 13.7, 3.94]} \ No newline at end of file diff --git a/annotations_filtered/m31MSgGEIAk_filtered.json b/annotations_filtered/m31MSgGEIAk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b9439042b286d30162c845456c8825c53846c31b --- /dev/null +++ b/annotations_filtered/m31MSgGEIAk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.32], [34.0, 34.82], [36.0, 37.81], [39.0, 42.42], [43.0, 44.49], [51.0, 55.21], [55.0, 68.79], [73.0, 84.16], [88.0, 89.8], [103.0, 109.63], [114.0, 128.01], [129.0, 129.76], [131.0, 131.52], [136.0, 136.29], [139.0, 138.96], [141.0, 142.18], [144.0, 145.84], [147.0, 148.37], [150.0, 150.67], [151.0, 152.93], [154.0, 154.94], [156.0, 161.45], [162.0, 162.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 39.25, 0.0, 50.76, 65.32, 37.26, 0.0, 88.83, 67.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.82, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 54.62], ["sidetone", 15.81], ["radio", 3.64]], null, null, null, [["speech", 63.7], ["cough", 21.33], ["whack, thwack", 2.69]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 82.33], ["sidetone", 8.58], ["busy signal", 3.03]], null], "duration": [0.32, 0.82, 1.81, 3.42, 1.49, 4.21, 13.79, 11.16, 1.8, 6.63, 14.01, 0.76, 0.52, 0.29, -0.04, 1.18, 1.84, 1.37, 0.67, 1.93, 0.94, 5.45, 0.43]} \ No newline at end of file diff --git a/annotations_filtered/m3262E3sfb8_filtered.json b/annotations_filtered/m3262E3sfb8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..053288880568f5034ea7ca1497d7a6d4ccb82536 --- /dev/null +++ b/annotations_filtered/m3262E3sfb8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 49.33], [51.0, 59.58], [64.0, 65.65]], "keep_status": [false, true, false], "silence_prob": [0.0, 33.33, 0.0], "audiomae_on_audioset": [null, [["music", 46.31], ["animal", 4.84], ["livestock, farm animals, working animals", 3.75]], null], "duration": [34.33, 8.58, 1.65]} \ No newline at end of file diff --git a/annotations_filtered/m3QyTiNVwWA_filtered.json b/annotations_filtered/m3QyTiNVwWA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ba5306aae48dc69d0ca3aff8ff518fdaf91da13 --- /dev/null +++ b/annotations_filtered/m3QyTiNVwWA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.95], [6.0, 6.69], [8.0, 10.54], [11.0, 18.13], [23.0, 31.36], [34.0, 37.52], [40.0, 40.2], [46.0, 57.13], [58.0, 65.43], [67.0, 67.49], [70.0, 79.39]], "keep_status": [false, false, true, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 42.06, 34.96, 34.36, 43.61, 0.0, 32.78, 32.92, 0.0, 30.53], "audiomae_on_audioset": [null, null, [["hum", 19.81], ["music", 17.19], ["mains hum", 14.76]], [["chant", 33.88], ["music", 24.64], ["mantra", 15.32]], [["music", 33.2], ["chant", 20.95], ["carnatic music", 4.26]], [["whale vocalization", 66.91], ["music", 11.22], ["hum", 3.03]], null, [["music", 53.36], ["hum", 17.4], ["mains hum", 8.64]], [["mains hum", 40.7], ["hum", 21.24], ["speech", 10.96]], null, [["speech", 29.61], ["fly, housefly", 10.51], ["hum", 6.95]]], "duration": [1.95, 0.69, 2.54, 7.13, 8.36, 3.52, 0.2, 11.13, 7.43, 0.49, 9.39]} \ No newline at end of file diff --git a/annotations_filtered/m3TAK8ty_cg_filtered.json b/annotations_filtered/m3TAK8ty_cg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..125318f97ec485881b0cdb18267a6e64475d5073 --- /dev/null +++ b/annotations_filtered/m3TAK8ty_cg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 32.29], [63.0, 64.89], [70.0, 81.21]], "keep_status": [false, false, true], "silence_prob": [0.0, 0.0, 28.62], "audiomae_on_audioset": [null, null, [["buzz", 27.45], ["music", 20.19], ["speech", 11.32]]], "duration": [32.29, 1.89, 11.21]} \ No newline at end of file diff --git a/annotations_filtered/m3XsVwEuULw_filtered.json b/annotations_filtered/m3XsVwEuULw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..734f137bd569b1163e98b7043163cff096d77669 --- /dev/null +++ b/annotations_filtered/m3XsVwEuULw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.37], [12.0, 13.1], [14.0, 22.52], [27.0, 30.01], [35.0, 44.95], [48.0, 64.83], [65.0, 70.01], [71.0, 71.96], [73.0, 73.03], [73.0, 78.75], [85.0, 87.93], [88.0, 106.64], [108.0, 114.39], [118.0, 120.09], [121.0, 134.32], [138.0, 138.21], [139.0, 142.48], [145.0, 147.63]], "keep_status": [false, false, false, true, true, false, true, false, false, true, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 35.89, 42.13, 39.08, 34.08, 36.31, 0.0, 0.0, 35.5, 36.41, 36.02, 35.87, 35.36, 54.63, 0.0, 100.0, 100.0], "audiomae_on_audioset": [null, null, [["music", 51.58], ["drum and bass", 13.63], ["speech", 9.2]], [["music", 44.63], ["speech", 9.61], ["drum machine", 4.85]], [["music", 57.85], ["didgeridoo", 8.1], ["musical instrument", 3.98]], [["music", 57.99], ["buzz", 12.16], ["didgeridoo", 5.44]], [["sidetone", 32.78], ["music", 19.94], ["hum", 11.06]], null, null, [["music", 37.13], ["speech", 15.12], ["boing", 14.17]], [["music", 74.33], ["cacophony", 4.47], ["speech", 3.27]], [["music", 58.01], ["boing", 27.32], ["didgeridoo", 1.69]], [["music", 42.06], ["sidetone", 12.8], ["speech", 12.57]], [["music", 54.63], ["speech", 12.05], ["throbbing", 5.31]], null, null, null, null], "duration": [0.37, 1.1, 8.52, 3.01, 9.95, 16.83, 5.01, 0.96, 0.03, 5.75, 2.93, 18.64, 6.39, 2.09, 13.32, 0.21, 3.48, 2.63]} \ No newline at end of file diff --git a/annotations_filtered/m3qnMx_kA2A_filtered.json b/annotations_filtered/m3qnMx_kA2A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f69ab121120dd15584280e8e3cf77ec49eb0186 --- /dev/null +++ b/annotations_filtered/m3qnMx_kA2A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.13], [7.0, 10.32], [17.0, 17.83], [19.0, 19.57], [26.0, 27.5], [30.0, 30.5], [32.0, 34.64], [36.0, 38.25], [39.0, 40.42], [53.0, 52.81], [61.0, 61.67], [62.0, 62.61], [64.0, 63.85], [66.0, 70.95], [76.0, 79.52], [81.0, 86.63], [90.0, 90.95], [91.0, 93.36], [94.0, 97.06], [102.0, 102.09], [103.0, 103.74], [104.0, 107.86], [114.0, 127.8], [128.0, 128.73], [132.0, 132.87], [133.0, 137.37]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, false, false, true, false, false, false, true, true, false, false, false, false, false, false, true], "silence_prob": [59.24, 58.89, 0.0, 0.0, 0.0, 0.0, 42.91, 48.48, 0.0, 0.0, 0.0, 0.0, 0.0, 40.68, 50.31, 36.99, 0.0, 36.04, 40.33, 0.0, 0.0, 35.1, 34.67, 0.0, 0.0, 34.01], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 16.39], ["music", 11.23], ["throbbing", 10.57]], [["speech", 37.44], ["frog", 14.95], ["music", 12.23]], null, null, null, null, null, [["music", 26.1], ["speech", 16.62], ["throbbing", 5.28]], null, [["mains hum", 34.8], ["hum", 29.58], ["music", 8.5]], null, [["speech", 56.6], ["fly, housefly", 3.32], ["field recording", 3.11]], [["speech", 15.42], ["music", 15.14], ["gong", 13.25]], null, null, [["music", 45.14], ["speech", 30.01], ["mains hum", 2.22]], [["hum", 31.12], ["music", 28.11], ["throbbing", 18.88]], null, null, [["speech", 30.51], ["music", 28.05], ["mains hum", 7.81]]], "duration": [4.13, 3.32, 0.83, 0.57, 1.5, 0.5, 2.64, 2.25, 1.42, -0.19, 0.67, 0.61, -0.15, 4.95, 3.52, 5.63, 0.95, 2.36, 3.06, 0.09, 0.74, 3.86, 13.8, 0.73, 0.87, 4.37]} \ No newline at end of file diff --git a/annotations_filtered/m3s7ZwpFCsc_filtered.json b/annotations_filtered/m3s7ZwpFCsc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7dfae7a467e9fcec73e2da10e0aa243675d3a440 --- /dev/null +++ b/annotations_filtered/m3s7ZwpFCsc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.83], [8.0, 8.31], [9.0, 13.88], [21.0, 28.54], [30.0, 31.01], [31.0, 32.76], [33.0, 34.37], [34.0, 34.96], [40.0, 40.1], [43.0, 43.85], [46.0, 46.68], [47.0, 54.36], [58.0, 58.43], [72.0, 72.81], [74.0, 76.1], [83.0, 83.47], [87.0, 88.21], [91.0, 94.95], [97.0, 98.07], [99.0, 99.82], [100.0, 101.48], [102.0, 103.11], [104.0, 107.3], [109.0, 109.71], [111.0, 123.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 87.55, 96.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.25, 0.0, 0.0, 67.51, 0.0, 0.0, 97.64, 0.0, 0.0, 0.0, 0.0, 92.31, 0.0, 91.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.83, 0.31, 4.88, 7.54, 1.01, 1.76, 1.37, 0.96, 0.1, 0.85, 0.68, 7.36, 0.43, 0.81, 2.1, 0.47, 1.21, 3.95, 1.07, 0.82, 1.48, 1.11, 3.3, 0.71, 12.2]} \ No newline at end of file diff --git a/annotations_filtered/m43-bLl6ZwI_filtered.json b/annotations_filtered/m43-bLl6ZwI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ae46fa6805fdf7d267d6a33f04e7249d17d5afa --- /dev/null +++ b/annotations_filtered/m43-bLl6ZwI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 25.73], [28.0, 62.92], [64.0, 68.98]], "keep_status": [false, false, false], "silence_prob": [29.59, 0.0, 29.66], "audiomae_on_audioset": [[["hum", 49.53], ["mains hum", 37.73], ["throbbing", 3.04]], null, [["speech", 59.43], ["throbbing", 7.17], ["music", 6.39]]], "duration": [10.73, 34.92, 4.98]} \ No newline at end of file diff --git a/annotations_filtered/m49ub45c8AI_filtered.json b/annotations_filtered/m49ub45c8AI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a718d4dc0d1693e1502f4b059b1af754c42dffb9 --- /dev/null +++ b/annotations_filtered/m49ub45c8AI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[84.0, 108.85], [110.0, 127.21], [129.0, 129.2], [139.0, 142.2]], "keep_status": [true, true, false, false], "silence_prob": [32.22, 28.85, 0.0, 33.97], "audiomae_on_audioset": [[["quack", 20.46], ["duck", 13.62], ["sonar", 10.72]], [["machine gun", 21.54], ["speech", 16.54], ["boom", 11.63]], null, [["whale vocalization", 51.06], ["speech", 35.95], ["music", 1.27]]], "duration": [24.85, 17.21, 0.2, 3.2]} \ No newline at end of file diff --git a/annotations_filtered/m4SWkyqSFxM_filtered.json b/annotations_filtered/m4SWkyqSFxM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..abc770eb1f76ffeb02f678e54031be72e16cf707 --- /dev/null +++ b/annotations_filtered/m4SWkyqSFxM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.25], [4.0, 4.62], [7.0, 8.53], [19.0, 20.6], [23.0, 23.45], [40.0, 40.36], [46.0, 47.07], [49.0, 49.15]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.25, 0.62, 1.53, 1.6, 0.45, 0.36, 1.07, 0.15]} \ No newline at end of file diff --git a/annotations_filtered/m4VP7c5UCdE_filtered.json b/annotations_filtered/m4VP7c5UCdE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e2c774c42fb5f2ba4c352e6081c5c3625fd1d49f --- /dev/null +++ b/annotations_filtered/m4VP7c5UCdE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 24.21], [24.0, 46.53], [48.0, 48.07]], "keep_status": [false, false, false], "silence_prob": [31.52, 33.16, 0.0], "audiomae_on_audioset": [[["fart", 69.67], ["whale vocalization", 13.59], ["music", 4.03]], [["fart", 37.02], ["whale vocalization", 29.16], ["stomach rumble", 12.67]], null], "duration": [6.21, 22.53, 0.07]} \ No newline at end of file diff --git a/annotations_filtered/m4a6jkZiOkM_filtered.json b/annotations_filtered/m4a6jkZiOkM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..511ad1f8cd81d6979752f6c497a3642c24369ebc --- /dev/null +++ b/annotations_filtered/m4a6jkZiOkM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.27], [13.0, 14.35], [15.0, 16.82], [18.0, 18.42], [19.0, 20.63], [23.0, 24.07], [25.0, 26.86], [32.0, 33.47], [38.0, 41.66], [44.0, 45.66], [46.0, 48.79], [50.0, 51.85], [53.0, 66.06], [67.0, 70.23], [71.0, 72.69], [74.0, 85.6], [87.0, 89.8], [93.0, 95.81], [97.0, 98.76], [102.0, 104.33], [110.0, 111.28], [112.0, 113.66], [115.0, 116.88], [118.0, 120.78], [122.0, 137.34], [138.0, 140.22], [141.0, 144.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.92, 0.0, 99.76, 0.0, 99.99, 99.36, 0.0, 99.65, 99.91, 99.95, 0.0, 99.1, 0.0, 0.0, 0.0, 96.42, 71.43, 98.93, 87.92], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.27, 1.35, 1.82, 0.42, 1.63, 1.07, 1.86, 1.47, 3.66, 1.66, 2.79, 1.85, 13.06, 3.23, 1.69, 11.6, 2.8, 2.81, 1.76, 2.33, 1.28, 1.66, 1.88, 2.78, 15.34, 2.22, 3.49]} \ No newline at end of file diff --git a/annotations_filtered/m5-bSlttk18_filtered.json b/annotations_filtered/m5-bSlttk18_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9788c47931e8cad141e313d4f104b79491e6b165 --- /dev/null +++ b/annotations_filtered/m5-bSlttk18_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.46], [8.0, 8.34], [11.0, 11.13], [15.0, 15.25], [20.0, 20.19], [39.0, 38.82], [41.0, 42.53], [44.0, 45.06], [47.0, 47.22], [51.0, 52.24], [56.0, 55.95], [58.0, 59.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.46, 0.34, 0.13, 0.25, 0.19, -0.18, 1.53, 1.06, 0.22, 1.24, -0.05, 1.43]} \ No newline at end of file diff --git a/annotations_filtered/m5Qi_YVxd5M_filtered.json b/annotations_filtered/m5Qi_YVxd5M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09448e8259650ae51d3da7d18d970fa680e1fdad --- /dev/null +++ b/annotations_filtered/m5Qi_YVxd5M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.23], [5.0, 5.61], [13.0, 13.49], [16.0, 16.38], [18.0, 18.52], [19.0, 21.83], [24.0, 24.66], [26.0, 26.82], [28.0, 30.79], [37.0, 37.49], [39.0, 40.14], [45.0, 48.47], [49.0, 51.81], [53.0, 54.28], [55.0, 56.66], [58.0, 58.83], [59.0, 59.71], [64.0, 64.22], [66.0, 66.58], [72.0, 73.65], [74.0, 75.34], [77.0, 77.58], [79.0, 79.05], [83.0, 83.22], [83.0, 87.2], [93.0, 93.09], [95.0, 94.73], [97.0, 97.17], [98.0, 99.84], [100.0, 101.28], [102.0, 104.94], [106.0, 106.76], [109.0, 111.54], [113.0, 117.58], [119.0, 127.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 91.81, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.98, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 70.16, 44.07], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 45.06], ["music", 12.86], ["didgeridoo", 5.5]], null, null, null, null, null, null, null, null, null, [["hum", 20.63], ["mains hum", 13.35], ["chirp tone", 7.52]]], "duration": [0.23, 0.61, 0.49, 0.38, 0.52, 2.83, 0.66, 0.82, 2.79, 0.49, 1.14, 3.47, 2.81, 1.28, 1.66, 0.83, 0.71, 0.22, 0.58, 1.65, 1.34, 0.58, 0.05, 0.22, 4.2, 0.09, -0.27, 0.17, 1.84, 1.28, 2.94, 0.76, 2.54, 4.58, 8.28]} \ No newline at end of file diff --git a/annotations_filtered/m5bPIty4Dww_filtered.json b/annotations_filtered/m5bPIty4Dww_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..893fd01b9df771782cb8193f914bac222ff6fa0f --- /dev/null +++ b/annotations_filtered/m5bPIty4Dww_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.71], [11.0, 13.9], [15.0, 16.23], [20.0, 20.31], [21.0, 22.38], [23.0, 25.74], [29.0, 31.24], [32.0, 33.44], [34.0, 34.57], [37.0, 38.45], [41.0, 42.87], [45.0, 45.91], [49.0, 49.1], [52.0, 54.28], [55.0, 60.1], [65.0, 67.14], [69.0, 69.55], [74.0, 74.88], [77.0, 79.27], [80.0, 79.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 55.96, 0.0, 0.0, 0.0, 99.16, 99.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.32, 99.59, 99.93, 0.0, 0.0, 30.03, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["whack, thwack", 48.06], ["sneeze", 7.74], ["speech", 4.71]], null], "duration": [1.71, 2.9, 1.23, 0.31, 1.38, 2.74, 2.24, 1.44, 0.57, 1.45, 1.87, 0.91, 0.1, 2.28, 5.1, 2.14, 0.55, 0.88, 2.27, -0.05]} \ No newline at end of file diff --git a/annotations_filtered/m5n7XpAv46A_filtered.json b/annotations_filtered/m5n7XpAv46A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..80b5c9cf51108a962b6a89901ec3208345fa8270 --- /dev/null +++ b/annotations_filtered/m5n7XpAv46A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.87], [9.0, 9.58], [12.0, 13.24], [18.0, 18.86], [20.0, 19.94], [21.0, 22.52], [26.0, 27.13], [28.0, 27.82], [32.0, 32.97], [37.0, 49.57], [51.0, 51.76]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.33, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["sidetone", 44.24], ["speech", 14.41], ["busy signal", 4.68]], null], "duration": [0.87, 0.58, 1.24, 0.86, -0.06, 1.52, 1.13, -0.18, 0.97, 12.57, 0.76]} \ No newline at end of file diff --git a/annotations_filtered/m5p1wM1ZHQ0_filtered.json b/annotations_filtered/m5p1wM1ZHQ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0aa08d19830fc1b7e8db911645a738ff919a6ce8 --- /dev/null +++ b/annotations_filtered/m5p1wM1ZHQ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[65.0, 90.49], [91.0, 96.69], [98.0, 99.35], [100.0, 100.65]], "keep_status": [false, false, false, false], "silence_prob": [33.17, 50.61, 0.0, 0.0], "audiomae_on_audioset": [[["music", 31.73], ["hum", 21.37], ["mains hum", 17.53]], null, null, null], "duration": [25.49, 5.69, 1.35, 0.65]} \ No newline at end of file diff --git a/annotations_filtered/m5rfQ59cc0o_filtered.json b/annotations_filtered/m5rfQ59cc0o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43e2cdd8a7655e6cfe434abbe24764037f8b53de --- /dev/null +++ b/annotations_filtered/m5rfQ59cc0o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.45], [6.0, 7.03], [8.0, 16.61], [19.0, 19.84], [20.0, 26.91], [30.0, 40.49], [41.0, 41.66], [43.0, 63.58], [64.0, 64.45], [65.0, 65.55], [66.0, 68.3], [71.0, 71.69], [73.0, 73.3], [79.0, 80.81], [88.0, 89.07], [97.0, 97.8]], "keep_status": [false, false, true, false, false, false, false, true, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 35.03, 0.0, 35.03, 35.0, 0.0, 33.59, 0.0, 0.0, 34.39, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 39.68], ["fart", 8.62], ["animal", 2.89]], null, [["speech", 51.9], ["fly, housefly", 10.89], ["insect", 7.42]], [["speech", 84.49], ["music", 3.96], ["animal", 1.64]], null, [["music", 53.36], ["throbbing", 7.58], ["didgeridoo", 4.18]], null, null, [["music", 43.74], ["musical instrument", 9.17], ["plucked string instrument", 7.24]], null, null, null, null, null], "duration": [0.45, 1.03, 8.61, 0.84, 6.91, 10.49, 0.66, 20.58, 0.45, 0.55, 2.3, 0.69, 0.3, 1.81, 1.07, 0.8]} \ No newline at end of file diff --git a/annotations_filtered/m6eVFDJA9EM_filtered.json b/annotations_filtered/m6eVFDJA9EM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7c1e421f2a1ddb59aec64f65b8e4605a18ba3505 --- /dev/null +++ b/annotations_filtered/m6eVFDJA9EM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 16.75], [17.0, 17.64], [18.0, 18.13], [44.0, 44.95], [50.0, 50.28], [54.0, 55.07], [56.0, 56.62], [58.0, 65.96], [66.0, 67.31], [77.0, 86.22], [88.0, 90.12], [91.0, 91.37], [95.0, 96.57], [99.0, 100.18], [105.0, 108.03], [109.0, 115.01], [116.0, 119.33], [122.0, 130.92], [132.0, 132.88], [135.0, 136.19], [138.0, 139.87], [141.0, 142.84], [144.0, 144.81], [146.0, 146.65], [149.0, 149.01], [153.0, 154.04], [155.0, 154.9], [157.0, 162.75], [166.0, 170.04], [174.0, 175.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.13, 0.0, 58.05, 82.97, 0.0, 0.0, 0.0, 67.13, 52.51, 46.09, 65.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.18, 90.78, 0.0], "audiomae_on_audioset": [[["music", 50.3], ["speech", 27.62], ["burst, pop", 2.76]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 37.5], ["mains hum", 29.91], ["speech", 11.86]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.75, 0.64, 0.13, 0.95, 0.28, 1.07, 0.62, 7.96, 1.31, 9.22, 2.12, 0.37, 1.57, 1.18, 3.03, 6.01, 3.33, 8.92, 0.88, 1.19, 1.87, 1.84, 0.81, 0.65, 0.01, 1.04, -0.1, 5.75, 4.04, 1.26]} \ No newline at end of file diff --git a/annotations_filtered/m6kFCNsnQpQ_filtered.json b/annotations_filtered/m6kFCNsnQpQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3e8a849391b33fd5139a9ec56a50255e16cec8d --- /dev/null +++ b/annotations_filtered/m6kFCNsnQpQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.37], [9.0, 10.35], [11.0, 13.8], [16.0, 17.78], [19.0, 23.92], [26.0, 26.1], [28.0, 28.88], [30.0, 32.14], [33.0, 34.05], [35.0, 35.11], [35.0, 36.21], [37.0, 48.19], [49.0, 50.21], [51.0, 51.97], [55.0, 56.08], [57.0, 57.27], [58.0, 59.63], [61.0, 62.94], [65.0, 65.38], [67.0, 67.83], [69.0, 69.11], [69.0, 69.21], [74.0, 75.42], [79.0, 85.06], [86.0, 87.79], [89.0, 91.52], [95.0, 100.7], [102.0, 120.23], [122.0, 132.92], [133.0, 134.64], [136.0, 136.43], [137.0, 137.57], [138.0, 139.08], [143.0, 143.13], [145.0, 149.94], [153.0, 167.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 54.56, 0.0, 99.97, 0.0, 0.0, 95.91, 0.0, 0.0, 0.0, 42.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.81, 0.0, 99.97, 34.43, 45.59, 32.62, 0.0, 0.0, 0.0, 0.0, 0.0, 30.01, 32.33], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["telephone bell ringing", 68.27], ["telephone", 16.97], ["ringtone", 3.16]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 67.49], ["speech", 23.32], ["radio", 5.16]], [["speech", 66.52], ["sidetone", 14.26], ["stomach rumble", 4.68]], [["music", 54.58], ["speech", 15.05], ["musical instrument", 7.93]], null, null, null, null, null, [["carnatic music", 24.84], ["music", 13.58], ["roar", 9.12]], [["speech", 11.65], ["grunt", 9.83], ["livestock, farm animals, working animals", 7.36]]], "duration": [0.37, 1.35, 2.8, 1.78, 4.92, 0.1, 0.88, 2.14, 1.05, 0.11, 1.21, 11.19, 1.21, 0.97, 1.08, 0.27, 1.63, 1.94, 0.38, 0.83, 0.11, 0.21, 1.42, 6.06, 1.79, 2.52, 5.7, 18.23, 10.92, 1.64, 0.43, 0.57, 1.08, 0.13, 4.94, 14.14]} \ No newline at end of file diff --git a/annotations_filtered/m6ux3-Z03B4_filtered.json b/annotations_filtered/m6ux3-Z03B4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f8ae55510015b46323698435f88d4e30d5eee56 --- /dev/null +++ b/annotations_filtered/m6ux3-Z03B4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.31], [16.0, 17.42], [18.0, 23.53], [24.0, 27.62], [35.0, 35.67], [42.0, 42.47], [44.0, 45.25], [46.0, 46.06], [46.0, 46.95], [47.0, 55.24], [56.0, 57.62], [58.0, 60.13], [63.0, 63.48], [67.0, 70.06], [70.0, 71.78], [72.0, 85.89], [86.0, 88.13]], "keep_status": [false, false, true, true, false, false, false, false, false, false, false, true, false, true, false, true, true], "silence_prob": [0.0, 0.0, 39.88, 42.51, 0.0, 0.0, 0.0, 0.0, 0.0, 38.42, 0.0, 38.83, 0.0, 40.61, 0.0, 37.0, 41.52], "audiomae_on_audioset": [null, null, [["whale vocalization", 37.08], ["throbbing", 15.32], ["hum", 13.18]], [["thunk", 6.03], ["whack, thwack", 3.97], ["crushing", 3.83]], null, null, null, null, null, [["speech", 56.49], ["crack", 16.48], ["crushing", 9.76]], null, [["speech", 43.72], ["sidetone", 9.27], ["music", 8.15]], null, [["music", 13.35], ["hum", 11.16], ["sonar", 8.77]], null, [["crushing", 28.72], ["speech", 12.2], ["music", 9.61]], [["sidetone", 24.94], ["speech", 19.71], ["chirp tone", 6.87]]], "duration": [1.31, 1.42, 5.53, 3.62, 0.67, 0.47, 1.25, 0.06, 0.95, 8.24, 1.62, 2.13, 0.48, 3.06, 1.78, 13.89, 2.13]} \ No newline at end of file diff --git a/annotations_filtered/m7HLqZP-l7E_filtered.json b/annotations_filtered/m7HLqZP-l7E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c9eaaf742755227a0dea99caa3167fe7c684e967 --- /dev/null +++ b/annotations_filtered/m7HLqZP-l7E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.79], [27.0, 27.08], [29.0, 29.44], [32.0, 33.96], [36.0, 36.58], [39.0, 39.21], [42.0, 44.17], [44.0, 46.09], [48.0, 48.83], [49.0, 48.93], [49.0, 48.96], [51.0, 51.29], [52.0, 72.79], [75.0, 93.63], [98.0, 97.77], [104.0, 103.91], [110.0, 123.67], [126.0, 126.64], [128.0, 137.03], [142.0, 170.97], [176.0, 178.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.39, 66.51, 0.0, 0.0, 0.0, 0.0, 29.62, 31.22, 0.0, 0.0, 30.85, 0.0, 29.45, 30.16, 32.23], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 62.74], ["speech", 20.14], ["musical instrument", 2.67]], [["music", 88.72], ["throbbing", 1.82], ["synthesizer", 1.52]], null, null, [["music", 38.25], ["hum", 21.72], ["throbbing", 18.93]], null, [["cattle, bovinae", 33.89], ["music", 23.22], ["livestock, farm animals, working animals", 17.66]], [["music", 59.81], ["speech", 11.22], ["boing", 4.64]], [["music", 45.33], ["theremin", 18.19], ["musical instrument", 8.55]]], "duration": [0.79, 0.08, 0.44, 1.96, 0.58, 0.21, 2.17, 2.09, 0.83, -0.07, -0.04, 0.29, 20.79, 18.63, -0.23, -0.09, 13.67, 0.64, 9.03, 28.97, 2.66]} \ No newline at end of file diff --git a/annotations_filtered/m7_LwdyNsIQ_filtered.json b/annotations_filtered/m7_LwdyNsIQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13914c02c796c5e287166eb4387386f2b9d41a06 --- /dev/null +++ b/annotations_filtered/m7_LwdyNsIQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.47], [5.0, 13.66], [15.0, 21.05], [22.0, 27.01], [27.0, 33.99], [35.0, 35.48], [37.0, 43.8], [45.0, 50.43], [51.0, 53.7], [55.0, 54.84], [57.0, 57.87], [58.0, 61.7], [64.0, 66.14], [69.0, 70.48], [71.0, 71.56], [72.0, 72.81], [76.0, 78.19], [80.0, 82.63], [84.0, 90.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 100.0, 99.91, 91.47, 0.0, 66.88, 94.81, 99.4, 0.0, 0.0, 99.21, 94.07, 0.0, 0.0, 0.0, 98.59, 99.26, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.47, 8.66, 6.05, 5.01, 6.99, 0.48, 6.8, 5.43, 2.7, -0.16, 0.87, 3.7, 2.14, 1.48, 0.56, 0.81, 2.19, 2.63, 6.32]} \ No newline at end of file diff --git a/annotations_filtered/m7mbDPykHoc_filtered.json b/annotations_filtered/m7mbDPykHoc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c8ffe97bdaf5814bbb6ec4a4d6ecef2a774194c9 --- /dev/null +++ b/annotations_filtered/m7mbDPykHoc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.42], [11.0, 11.77], [13.0, 13.54], [17.0, 17.64], [18.0, 18.35], [19.0, 19.2], [20.0, 20.04], [21.0, 21.66], [24.0, 25.05], [25.0, 26.33], [28.0, 30.48], [31.0, 32.36], [35.0, 36.02], [38.0, 40.47], [42.0, 42.09], [44.0, 45.59], [47.0, 47.33], [51.0, 51.95], [53.0, 53.52], [54.0, 55.29], [56.0, 57.06], [58.0, 58.9], [60.0, 60.71], [62.0, 62.28], [63.0, 63.76], [67.0, 68.76], [70.0, 71.73], [75.0, 75.96], [76.0, 76.45], [78.0, 77.97], [78.0, 78.61], [80.0, 80.89], [81.0, 81.51], [83.0, 84.15], [85.0, 86.48], [87.0, 89.16], [89.0, 90.39], [91.0, 91.18], [93.0, 95.72], [96.0, 97.92], [102.0, 102.9], [109.0, 109.7], [110.0, 110.69], [114.0, 114.96], [121.0, 121.41], [122.0, 122.49], [123.0, 123.57], [132.0, 132.14], [135.0, 135.04], [136.0, 136.8], [139.0, 139.92], [141.0, 141.34], [142.0, 143.6], [146.0, 146.52], [147.0, 150.53], [151.0, 153.08], [155.0, 155.43], [157.0, 157.05], [159.0, 159.78], [165.0, 166.01], [167.0, 169.6], [172.0, 173.03], [175.0, 175.47], [177.0, 177.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.32, 0.0, 0.0, 45.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.36, 0.0, 0.0, 97.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.6, 96.42, 0.0, 0.0, 0.0, 0.0, 65.2, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["whale vocalization", 71.98], ["frog", 4.6], ["sheep", 2.77]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 37.34], ["sidetone", 12.67], ["hum", 8.49]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.42, 0.77, 0.54, 0.64, 0.35, 0.2, 0.04, 0.66, 1.05, 1.33, 2.48, 1.36, 1.02, 2.47, 0.09, 1.59, 0.33, 0.95, 0.52, 1.29, 1.06, 0.9, 0.71, 0.28, 0.76, 1.76, 1.73, 0.96, 0.45, -0.03, 0.61, 0.89, 0.51, 1.15, 1.48, 2.16, 1.39, 0.18, 2.72, 1.92, 0.9, 0.7, 0.69, 0.96, 0.41, 0.49, 0.57, 0.14, 0.04, 0.8, 0.92, 0.34, 1.6, 0.52, 3.53, 2.08, 0.43, 0.05, 0.78, 1.01, 2.6, 1.03, 0.47, 0.75]} \ No newline at end of file diff --git a/annotations_filtered/m7xTE3rvkDk_filtered.json b/annotations_filtered/m7xTE3rvkDk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..106f4e2095268a4f0ffd6ac354ae181586b9522a --- /dev/null +++ b/annotations_filtered/m7xTE3rvkDk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 9.12], [9.0, 9.17], [10.0, 11.52], [18.0, 17.85], [19.0, 33.78], [34.0, 34.91], [36.0, 44.9], [48.0, 50.73], [52.0, 56.83], [61.0, 69.94], [71.0, 74.16], [77.0, 88.87], [90.0, 90.12], [91.0, 97.28], [98.0, 125.9], [127.0, 127.62], [129.0, 129.84], [132.0, 132.93], [135.0, 137.22], [138.0, 139.29], [140.0, 148.78], [149.0, 150.9], [154.0, 160.3], [165.0, 182.76], [187.0, 187.1], [188.0, 191.05], [194.0, 196.67]], "keep_status": [true, false, false, false, false, false, false, true, true, true, true, false, false, false, false, false, false, false, true, false, false, false, true, false, false, true, false], "silence_prob": [40.62, 0.0, 0.0, 0.0, 32.74, 0.0, 31.84, 32.43, 34.18, 31.69, 32.36, 35.05, 0.0, 34.72, 38.67, 0.0, 0.0, 0.0, 33.62, 0.0, 32.32, 0.0, 42.74, 31.16, 0.0, 30.66, 52.56], "audiomae_on_audioset": [[["music", 34.63], ["speech", 14.0], ["throbbing", 9.35]], null, null, null, [["music", 67.82], ["boing", 13.0], ["clang", 2.77]], null, [["music", 66.18], ["throbbing", 8.88], ["hum", 5.9]], [["speech", 44.51], ["artillery fire", 8.36], ["explosion", 4.1]], [["mains hum", 29.46], ["hum", 21.7], ["music", 18.38]], [["music", 30.83], ["speech", 27.99], ["didgeridoo", 7.27]], [["music", 43.38], ["hum", 8.71], ["throbbing", 7.24]], [["music", 67.76], ["throbbing", 5.69], ["hum", 5.03]], null, [["music", 70.39], ["throbbing", 8.8], ["electronic music", 2.57]], [["music", 60.44], ["hum", 6.12], ["throbbing", 5.82]], null, null, null, [["music", 40.24], ["whack, thwack", 7.52], ["throbbing", 7.11]], null, [["music", 42.34], ["speech", 41.59], ["throbbing", 1.51]], null, [["fly, housefly", 29.61], ["music", 13.02], ["mosquito", 11.99]], [["throbbing", 62.62], ["music", 16.92], ["hum", 10.54]], null, [["noise", 26.13], ["throbbing", 16.75], ["hum", 14.05]], null], "duration": [6.12, 0.17, 1.52, -0.15, 14.78, 0.91, 8.9, 2.73, 4.83, 8.94, 3.16, 11.87, 0.12, 6.28, 27.9, 0.62, 0.84, 0.93, 2.22, 1.29, 8.78, 1.9, 6.3, 17.76, 0.1, 3.05, 2.67]} \ No newline at end of file diff --git a/annotations_filtered/m7xTvb-FAhQ_filtered.json b/annotations_filtered/m7xTvb-FAhQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5c21e507d59f2a9cd8d713a296c83eb6df035e2 --- /dev/null +++ b/annotations_filtered/m7xTvb-FAhQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.25], [4.0, 12.36], [13.0, 13.32], [16.0, 16.55], [18.0, 18.93], [20.0, 21.07], [23.0, 22.96], [24.0, 24.24], [25.0, 24.9], [26.0, 27.18], [28.0, 27.95], [28.0, 28.44], [29.0, 29.56], [31.0, 31.08], [36.0, 38.35], [39.0, 40.07], [42.0, 42.21], [44.0, 44.51], [46.0, 46.55], [49.0, 50.68], [52.0, 54.9], [58.0, 59.71], [60.0, 61.72], [63.0, 63.56], [64.0, 64.84], [66.0, 66.9], [67.0, 68.45], [71.0, 73.08], [75.0, 75.09], [76.0, 76.87], [78.0, 78.71], [80.0, 82.22], [97.0, 97.97], [105.0, 106.79], [108.0, 108.77], [114.0, 114.42], [117.0, 127.89], [136.0, 137.46], [160.0, 161.96], [169.0, 187.61], [190.0, 190.73], [193.0, 193.18], [193.0, 196.45], [225.0, 225.32], [233.0, 240.78], [244.0, 244.0], [248.0, 251.29], [253.0, 253.79], [257.0, 257.32], [260.0, 262.01], [263.0, 265.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 97.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.82, 0.0, 0.0, 0.0, 0.0, 0.0, 97.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.9, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 41.34, 0.0, 0.0, 36.15, 0.0, 0.0, 71.57, 0.0, 34.6, 0.0, 100.0, 0.0, 0.0, 99.76, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 78.82], ["theremin", 3.73], ["musical instrument", 2.26]], null, null, [["music", 81.17], ["theremin", 2.66], ["musical instrument", 2.21]], null, null, null, null, [["music", 71.39], ["theremin", 10.8], ["singing", 3.13]], null, null, null, null, null, null], "duration": [1.25, 8.36, 0.32, 0.55, 0.93, 1.07, -0.04, 0.24, -0.1, 1.18, -0.05, 0.44, 0.56, 0.08, 2.35, 1.07, 0.21, 0.51, 0.55, 1.68, 2.9, 1.71, 1.72, 0.56, 0.84, 0.9, 1.45, 2.08, 0.09, 0.87, 0.71, 2.22, 0.97, 1.79, 0.77, 0.42, 10.89, 1.46, 1.96, 18.61, 0.73, 0.18, 3.45, 0.32, 7.78, 0.0, 3.29, 0.79, 0.32, 2.01, 2.55]} \ No newline at end of file diff --git a/annotations_filtered/m8-_aJ1BiFE_filtered.json b/annotations_filtered/m8-_aJ1BiFE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e80d38180ec70a8417b95a0a0e0d8c67f961b26e --- /dev/null +++ b/annotations_filtered/m8-_aJ1BiFE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 10.91], [22.0, 22.22]], "keep_status": [true, false], "silence_prob": [30.51, 0.0], "audiomae_on_audioset": [[["speech", 29.36], ["music", 21.54], ["civil defense siren", 9.49]], null], "duration": [5.91, 0.22]} \ No newline at end of file diff --git a/annotations_filtered/m89SmMCynWM_filtered.json b/annotations_filtered/m89SmMCynWM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..14c61bed160e880c172d26171addee58868fa903 --- /dev/null +++ b/annotations_filtered/m89SmMCynWM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 9.91], [11.0, 12.87], [17.0, 18.49], [21.0, 26.06], [28.0, 35.11], [36.0, 39.63], [44.0, 44.17], [47.0, 47.95], [50.0, 50.65], [58.0, 64.17], [65.0, 68.03], [68.0, 68.12], [68.0, 69.52], [74.0, 74.14], [74.0, 74.68], [77.0, 77.65], [79.0, 79.15], [81.0, 81.43], [90.0, 90.73], [93.0, 93.8], [97.0, 97.55], [98.0, 98.76], [102.0, 103.1], [109.0, 114.81], [116.0, 120.85], [123.0, 123.84], [125.0, 125.37], [131.0, 131.13], [134.0, 133.91], [134.0, 135.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [74.92, 0.0, 0.0, 64.63, 68.67, 73.36, 0.0, 0.0, 0.0, 87.92, 82.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.25, 98.1, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.91, 1.87, 1.49, 5.06, 7.11, 3.63, 0.17, 0.95, 0.65, 6.17, 3.03, 0.12, 1.52, 0.14, 0.68, 0.65, 0.15, 0.43, 0.73, 0.8, 0.55, 0.76, 1.1, 5.81, 4.85, 0.84, 0.37, 0.13, -0.09, 1.53]} \ No newline at end of file diff --git a/annotations_filtered/m8Jm9_iR6cg_filtered.json b/annotations_filtered/m8Jm9_iR6cg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d297cdc1b94777a3bbb6a93f18c358ee2e9094a --- /dev/null +++ b/annotations_filtered/m8Jm9_iR6cg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 35.9], [37.0, 37.59], [39.0, 42.01], [43.0, 51.16], [52.0, 103.22], [104.0, 105.75], [107.0, 107.99], [109.0, 112.31], [114.0, 114.62], [117.0, 117.48], [119.0, 121.34], [122.0, 124.63], [127.0, 130.33]], "keep_status": [false, false, false, false, false, false, false, true, false, false, true, true, true], "silence_prob": [0.0, 0.0, 62.47, 43.2, 0.0, 0.0, 0.0, 29.48, 0.0, 0.0, 47.27, 31.46, 31.15], "audiomae_on_audioset": [null, null, null, [["music", 73.7], ["ambient music", 7.83], ["synthesizer", 3.19]], null, null, null, [["sound effect", 14.18], ["speech", 12.96], ["whack, thwack", 11.63]], null, null, [["hum", 17.85], ["mains hum", 16.74], ["fly, housefly", 5.56]], [["music", 33.32], ["hum", 12.94], ["speech", 6.28]], [["speech", 38.37], ["music", 22.18], ["sidetone", 7.84]]], "duration": [33.9, 0.59, 3.01, 8.16, 51.22, 1.75, 0.99, 3.31, 0.62, 0.48, 2.34, 2.63, 3.33]} \ No newline at end of file diff --git a/annotations_filtered/m8LWjDS3IkQ_filtered.json b/annotations_filtered/m8LWjDS3IkQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e4c76d91007b5f1fb776379b0a65e8f6e594474 --- /dev/null +++ b/annotations_filtered/m8LWjDS3IkQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.08], [4.0, 8.68], [10.0, 11.47], [15.0, 17.2], [18.0, 19.57], [21.0, 21.27], [22.0, 22.57], [23.0, 24.24], [26.0, 27.19], [27.0, 29.19], [30.0, 32.36], [34.0, 71.95], [72.0, 72.05], [72.0, 72.44], [73.0, 98.51], [103.0, 106.81], [107.0, 123.57], [126.0, 127.7], [128.0, 157.86], [158.0, 158.62], [160.0, 161.03]], "keep_status": [true, true, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [39.3, 33.64, 0.0, 45.24, 0.0, 0.0, 0.0, 0.0, 0.0, 42.17, 50.46, 0.0, 0.0, 0.0, 32.6, 30.48, 29.79, 0.0, 30.09, 0.0, 0.0], "audiomae_on_audioset": [[["fly, housefly", 27.25], ["music", 19.89], ["mosquito", 14.46]], [["fly, housefly", 17.81], ["mosquito", 12.81], ["whack, thwack", 12.62]], null, [["music", 28.16], ["speech", 9.23], ["didgeridoo", 6.21]], null, null, null, null, null, [["mains hum", 26.94], ["hum", 17.44], ["speech", 14.2]], null, null, null, null, [["fart", 67.13], ["music", 22.23], ["cello", 1.15]], [["moo", 34.39], ["cattle, bovinae", 31.1], ["livestock, farm animals, working animals", 30.95]], [["music", 60.94], ["musical instrument", 10.4], ["didgeridoo", 6.45]], null, [["music", 27.81], ["groan", 16.6], ["cattle, bovinae", 8.24]], null, null], "duration": [2.08, 4.68, 1.47, 2.2, 1.57, 0.27, 0.57, 1.24, 1.19, 2.19, 2.36, 37.95, 0.05, 0.44, 25.51, 3.81, 16.57, 1.7, 29.86, 0.62, 1.03]} \ No newline at end of file diff --git a/annotations_filtered/m8Mc-38C88g_filtered.json b/annotations_filtered/m8Mc-38C88g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..00c052efe3ff896ba955de2e32d6e93a51c95f2e --- /dev/null +++ b/annotations_filtered/m8Mc-38C88g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.91], [5.0, 6.81], [8.0, 8.73], [10.0, 11.96], [12.0, 13.12], [17.0, 17.25], [22.0, 23.46], [34.0, 35.83], [40.0, 41.27], [43.0, 43.44], [46.0, 46.77], [47.0, 48.78], [53.0, 53.97], [58.0, 58.8], [61.0, 61.84], [64.0, 64.29], [65.0, 65.13], [77.0, 77.92], [85.0, 85.99], [88.0, 92.1], [95.0, 95.94], [96.0, 108.58], [110.0, 120.34], [121.0, 122.32], [123.0, 127.97], [133.0, 133.79], [135.0, 137.69], [145.0, 145.76], [150.0, 149.94], [150.0, 151.33], [152.0, 159.02], [161.0, 162.13], [164.0, 170.41], [171.0, 173.64], [174.0, 176.28], [177.0, 178.48], [181.0, 182.97], [185.0, 186.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.36, 0.0, 99.65, 99.96, 0.0, 93.45, 0.0, 99.96, 0.0, 0.0, 0.0, 99.96, 0.0, 99.88, 89.19, 99.05, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.91, 1.81, 0.73, 1.96, 1.12, 0.25, 1.46, 1.83, 1.27, 0.44, 0.77, 1.78, 0.97, 0.8, 0.84, 0.29, 0.13, 0.92, 0.99, 4.1, 0.94, 12.58, 10.34, 1.32, 4.97, 0.79, 2.69, 0.76, -0.06, 1.33, 7.02, 1.13, 6.41, 2.64, 2.28, 1.48, 1.97, 1.27]} \ No newline at end of file diff --git a/annotations_filtered/m8lzyaMZ-mA_filtered.json b/annotations_filtered/m8lzyaMZ-mA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3561340430fe47999607095a646cc8047760abc4 --- /dev/null +++ b/annotations_filtered/m8lzyaMZ-mA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.08], [3.0, 3.37], [5.0, 5.59], [7.0, 8.95], [11.0, 11.13], [15.0, 15.38], [17.0, 17.66], [21.0, 21.61], [29.0, 29.51], [37.0, 37.44], [41.0, 41.23], [44.0, 44.32], [58.0, 58.33], [61.0, 61.53], [65.0, 65.2], [67.0, 66.78], [68.0, 68.27], [70.0, 70.17], [70.0, 72.1], [91.0, 91.84], [98.0, 98.81], [106.0, 106.34], [114.0, 114.42], [131.0, 131.04], [134.0, 134.0], [136.0, 135.8], [151.0, 151.9], [154.0, 154.87], [168.0, 168.52], [173.0, 172.98], [174.0, 174.51], [176.0, 175.88], [207.0, 206.96], [212.0, 212.21], [213.0, 213.48], [215.0, 214.89], [217.0, 217.71], [222.0, 222.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.08, 0.37, 0.59, 1.95, 0.13, 0.38, 0.66, 0.61, 0.51, 0.44, 0.23, 0.32, 0.33, 0.53, 0.2, -0.22, 0.27, 0.17, 2.1, 0.84, 0.81, 0.34, 0.42, 0.04, 0.0, -0.2, 0.9, 0.87, 0.52, -0.02, 0.51, -0.12, -0.04, 0.21, 0.48, -0.11, 0.71, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/m946LkLieG8_filtered.json b/annotations_filtered/m946LkLieG8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..488b15a2a124bb544613745fbe2072ce34626903 --- /dev/null +++ b/annotations_filtered/m946LkLieG8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[45.0, 45.69], [49.0, 64.42], [65.0, 66.31], [68.0, 68.54], [69.0, 70.44], [71.0, 72.01], [77.0, 78.06], [89.0, 89.04], [104.0, 105.14], [107.0, 110.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.73], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.69, 15.42, 1.31, 0.54, 1.44, 1.01, 1.06, 0.04, 1.14, 3.66]} \ No newline at end of file diff --git a/annotations_filtered/m9Gg_VQP2zw_filtered.json b/annotations_filtered/m9Gg_VQP2zw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84e899885390c659d2cebeec058752403fee049d --- /dev/null +++ b/annotations_filtered/m9Gg_VQP2zw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 25.81], [27.0, 27.19], [29.0, 29.86], [31.0, 33.35], [40.0, 41.37], [45.0, 46.16], [48.0, 48.56], [52.0, 52.44], [54.0, 62.13], [62.0, 102.49], [110.0, 111.38], [115.0, 119.57], [120.0, 126.67], [137.0, 140.05], [140.0, 148.2], [154.0, 157.38], [162.0, 162.24], [162.0, 172.49], [173.0, 172.94]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, true, false, false, false], "silence_prob": [30.79, 0.0, 0.0, 66.39, 0.0, 0.0, 0.0, 0.0, 30.93, 0.0, 0.0, 30.77, 30.49, 31.98, 34.55, 38.08, 0.0, 32.61, 0.0], "audiomae_on_audioset": [[["music", 45.65], ["boing", 16.82], ["speech", 13.45]], null, null, null, null, null, null, null, [["music", 50.05], ["sampler", 9.88], ["electronic music", 4.94]], null, null, [["music", 59.16], ["musical instrument", 7.25], ["synthesizer", 5.69]], [["music", 79.94], ["hum", 4.69], ["grunt", 2.72]], [["speech", 39.19], ["music", 18.63], ["synthesizer", 5.1]], [["speech", 45.29], ["music", 15.86], ["explosion", 11.17]], [["speech", 29.82], ["music", 27.74], ["bleat", 4.05]], null, [["fly, housefly", 45.02], ["insect", 16.7], ["speech", 11.24]], null], "duration": [13.81, 0.19, 0.86, 2.35, 1.37, 1.16, 0.56, 0.44, 8.13, 40.49, 1.38, 4.57, 6.67, 3.05, 8.2, 3.38, 0.24, 10.49, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/m9PEvezB8Nc_filtered.json b/annotations_filtered/m9PEvezB8Nc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d201d7ae34e44ef331308e4f69544716f6e30713 --- /dev/null +++ b/annotations_filtered/m9PEvezB8Nc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.02], [13.0, 20.93], [30.0, 31.43], [36.0, 36.93], [38.0, 41.76], [44.0, 64.59], [65.0, 77.92], [78.0, 80.94], [81.0, 93.68], [94.0, 98.37], [100.0, 100.47], [103.0, 102.91], [107.0, 110.0]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, true], "silence_prob": [0.0, 99.95, 0.0, 0.0, 100.0, 83.16, 38.37, 40.57, 49.45, 86.27, 0.0, 0.0, 39.37], "audiomae_on_audioset": [null, null, null, null, null, null, [["hum", 51.48], ["mains hum", 21.8], ["music", 7.02]], [["hum", 27.22], ["mains hum", 17.96], ["animal", 17.72]], [["speech", 48.71], ["buzz", 11.77], ["hum", 11.32]], null, null, null, [["speech", 29.43], ["burst, pop", 8.26], ["whack, thwack", 7.75]]], "duration": [0.02, 7.93, 1.43, 0.93, 3.76, 20.59, 12.92, 2.94, 12.68, 4.37, 0.47, -0.09, 3.0]} \ No newline at end of file diff --git a/annotations_filtered/m9Wh66FXZJQ_filtered.json b/annotations_filtered/m9Wh66FXZJQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..506e444896f9764d02f418cf5141a13fd56ceb01 --- /dev/null +++ b/annotations_filtered/m9Wh66FXZJQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.37], [6.0, 6.51], [17.0, 16.98], [20.0, 23.4], [25.0, 28.88], [30.0, 29.94], [31.0, 31.63], [33.0, 33.35], [38.0, 39.01], [40.0, 40.14], [45.0, 44.96], [46.0, 46.48], [47.0, 47.82], [48.0, 49.64], [57.0, 58.58], [68.0, 68.71], [75.0, 75.34], [79.0, 79.51], [81.0, 81.46], [85.0, 85.58], [106.0, 106.62]], "keep_status": [false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 34.48, 42.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["shofar", 12.63], ["wind instrument, woodwind instrument", 10.56], ["vehicle horn, car horn, honking", 9.05]], [["clip-clop", 20.3], ["hum", 17.5], ["horse", 13.6]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.37, 0.51, -0.02, 3.4, 3.88, -0.06, 0.63, 0.35, 1.01, 0.14, -0.04, 0.48, 0.82, 1.64, 1.58, 0.71, 0.34, 0.51, 0.46, 0.58, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/m9aEg5dlFOI_filtered.json b/annotations_filtered/m9aEg5dlFOI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f4955a5bbc919cc4ec10ba29f8f27f31e969d9c9 --- /dev/null +++ b/annotations_filtered/m9aEg5dlFOI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[50.0, 49.81], [50.0, 53.6], [60.0, 65.3], [67.0, 67.66], [70.0, 70.53], [71.0, 71.15], [74.0, 76.79], [79.0, 78.9], [84.0, 85.58], [87.0, 88.33], [89.0, 90.17], [93.0, 95.25], [97.0, 98.93], [100.0, 101.83], [141.0, 141.1], [153.0, 153.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 61.08, 77.2, 0.0, 0.0, 0.0, 93.91, 0.0, 0.0, 0.0, 0.0, 54.5, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.19, 3.6, 5.3, 0.66, 0.53, 0.15, 2.79, -0.1, 1.58, 1.33, 1.17, 2.25, 1.93, 1.83, 0.1, 0.22]} \ No newline at end of file diff --git a/annotations_filtered/m9rBv4Dn3Bk_filtered.json b/annotations_filtered/m9rBv4Dn3Bk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84f39a8dc46e6760540aaf0414efa7e3252995b2 --- /dev/null +++ b/annotations_filtered/m9rBv4Dn3Bk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 20.76], [24.0, 26.99], [30.0, 31.04], [32.0, 33.1], [34.0, 35.41], [36.0, 36.61], [37.0, 37.81], [38.0, 39.82], [48.0, 47.88], [51.0, 52.39], [53.0, 55.71], [72.0, 73.08], [81.0, 80.91], [83.0, 83.29], [87.0, 89.14], [90.0, 91.49], [92.0, 93.68], [95.0, 95.91], [97.0, 98.44], [100.0, 102.44], [104.0, 104.94], [106.0, 118.61], [120.0, 120.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [35.24, 37.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.37, 0.0, 0.0, 0.0, 39.27, 0.0, 0.0, 0.0, 0.0, 43.25, 0.0, 31.02, 0.0], "audiomae_on_audioset": [[["music", 65.82], ["throbbing", 11.2], ["hum", 5.19]], [["music", 58.17], ["speech", 8.88], ["musical instrument", 6.26]], null, null, null, null, null, null, null, null, [["speech", 12.78], ["throbbing", 11.05], ["hum", 9.05]], null, null, null, [["music", 74.7], ["musical instrument", 2.37], ["breaking", 1.64]], null, null, null, null, [["music", 36.05], ["speech", 26.12], ["musical instrument", 3.48]], null, [["music", 50.56], ["speech", 3.64], ["buzz", 3.28]], null], "duration": [15.76, 2.99, 1.04, 1.1, 1.41, 0.61, 0.81, 1.82, -0.12, 1.39, 2.71, 1.08, -0.09, 0.29, 2.14, 1.49, 1.68, 0.91, 1.44, 2.44, 0.94, 12.61, 0.07]} \ No newline at end of file diff --git a/annotations_filtered/mA1FWjriD60_filtered.json b/annotations_filtered/mA1FWjriD60_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e99b2af18d19a65e3207584627a443381da20ffc --- /dev/null +++ b/annotations_filtered/mA1FWjriD60_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.72], [14.0, 15.53], [19.0, 23.79], [27.0, 29.84], [72.0, 74.24], [81.0, 81.58], [89.0, 89.4], [103.0, 104.36], [126.0, 127.21], [128.0, 134.79], [136.0, 137.51], [153.0, 152.98], [168.0, 178.44], [179.0, 178.7]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 32.16, 35.29, 31.4, 0.0, 0.0, 0.0, 0.0, 32.08, 0.0, 0.0, 30.05, 0.0], "audiomae_on_audioset": [null, null, [["music", 66.96], ["swing music", 15.32], ["music of latin america", 2.23]], [["music", 56.93], ["carnatic music", 7.56], ["musical instrument", 6.15]], [["music", 26.3], ["speech", 20.92], ["trombone", 20.35]], null, null, null, null, [["music", 61.75], ["speech", 8.95], ["singing", 4.94]], null, null, [["music", 84.82], ["swing music", 3.12], ["music of latin america", 1.33]], null], "duration": [1.72, 1.53, 4.79, 2.84, 2.24, 0.58, 0.4, 1.36, 1.21, 6.79, 1.51, -0.02, 10.44, -0.3]} \ No newline at end of file diff --git a/annotations_filtered/mAB-hSPmzjk_filtered.json b/annotations_filtered/mAB-hSPmzjk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..066bb53794fb4ac910b9fe9e9f31fcfc5fa77ece --- /dev/null +++ b/annotations_filtered/mAB-hSPmzjk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 25.84], [29.0, 32.31], [34.0, 37.84], [39.0, 39.93], [42.0, 54.41], [56.0, 60.54], [61.0, 80.37]], "keep_status": [true, true, true, false, false, false, false], "silence_prob": [30.84, 31.76, 30.27, 0.0, 30.37, 30.92, 31.55], "audiomae_on_audioset": [[["hum", 28.51], ["music", 21.67], ["musical instrument", 8.35]], [["music", 46.87], ["hum", 7.8], ["musical instrument", 4.93]], [["hum", 30.94], ["music", 22.78], ["mains hum", 11.04]], null, [["music", 51.94], ["synthesizer", 14.32], ["musical instrument", 8.32]], [["hum", 56.47], ["mains hum", 25.3], ["throbbing", 7.64]], [["music", 44.22], ["hum", 23.36], ["throbbing", 5.88]]], "duration": [5.84, 3.31, 3.84, 0.93, 12.41, 4.54, 19.37]} \ No newline at end of file diff --git a/annotations_filtered/mAD2gJTRSbI_filtered.json b/annotations_filtered/mAD2gJTRSbI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73f773ba462a087616f76b5c52644cc3382917aa --- /dev/null +++ b/annotations_filtered/mAD2gJTRSbI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.19], [6.0, 6.2], [7.0, 8.55], [15.0, 15.53], [18.0, 19.11], [31.0, 30.96], [33.0, 35.38], [37.0, 104.65], [109.0, 110.47], [119.0, 119.01], [119.0, 119.06], [119.0, 119.28], [126.0, 126.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.19, 0.2, 1.55, 0.53, 1.11, -0.04, 2.38, 67.65, 1.47, 0.01, 0.06, 0.28, 0.0]} \ No newline at end of file diff --git a/annotations_filtered/mAeceNqeNtQ_filtered.json b/annotations_filtered/mAeceNqeNtQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6df4c152aaf851d65ad6c5437352d7c3d87dcb1 --- /dev/null +++ b/annotations_filtered/mAeceNqeNtQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.16], [5.0, 27.33], [34.0, 51.06], [56.0, 69.01], [71.0, 75.36], [82.0, 93.36]], "keep_status": [true, true, true, true, true, false], "silence_prob": [40.24, 34.55, 30.36, 33.42, 37.36, 32.67], "audiomae_on_audioset": [[["music", 29.84], ["didgeridoo", 24.76], ["fly, housefly", 6.19]], [["music", 35.59], ["hum", 11.67], ["speech", 10.83]], [["music", 30.73], ["speech", 18.39], ["sidetone", 16.17]], [["music", 37.49], ["didgeridoo", 10.89], ["effects unit", 7.27]], [["music", 51.6], ["musical instrument", 5.25], ["brass instrument", 3.64]], [["music", 51.93], ["theremin", 15.88], ["effects unit", 5.05]]], "duration": [2.16, 22.33, 17.06, 13.01, 4.36, 11.36]} \ No newline at end of file diff --git a/annotations_filtered/mAs4z9GV84Q_filtered.json b/annotations_filtered/mAs4z9GV84Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13e431a02c5bd4dcb31380b918697c50f35d1f29 --- /dev/null +++ b/annotations_filtered/mAs4z9GV84Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.73], [14.0, 15.04], [17.0, 18.67], [20.0, 20.12], [21.0, 21.68], [23.0, 24.83], [26.0, 27.35], [28.0, 28.73], [30.0, 32.54], [34.0, 35.07], [36.0, 37.86], [40.0, 41.0], [43.0, 44.09], [45.0, 46.35], [52.0, 52.93], [58.0, 59.41], [67.0, 70.53], [72.0, 74.58], [82.0, 83.4], [84.0, 85.4]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.23, 54.04, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["hum", 29.4], ["music", 22.95], ["throbbing", 8.74]], null, null, null, null, null, null, null, [["hum", 45.86], ["mains hum", 14.72], ["throbbing", 11.92]], null, null, null], "duration": [0.73, 1.04, 1.67, 0.12, 0.68, 1.83, 1.35, 0.73, 2.54, 1.07, 1.86, 1.0, 1.09, 1.35, 0.93, 1.41, 3.53, 2.58, 1.4, 1.4]} \ No newline at end of file diff --git a/annotations_filtered/mAtmopQxu0o_filtered.json b/annotations_filtered/mAtmopQxu0o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bdc071ebeb99cd99b2ac50f5d52c9be6e5a621de --- /dev/null +++ b/annotations_filtered/mAtmopQxu0o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 40.54], [41.0, 44.12], [44.0, 46.79], [48.0, 50.28], [51.0, 54.28], [55.0, 59.04], [60.0, 61.74], [63.0, 64.5], [66.0, 68.42], [70.0, 71.49], [72.0, 74.21], [77.0, 77.67], [80.0, 81.04], [82.0, 82.95], [83.0, 86.9], [88.0, 89.9], [91.0, 91.07], [92.0, 92.38], [93.0, 93.48], [95.0, 96.55], [98.0, 102.41], [103.0, 104.65], [107.0, 107.76], [109.0, 110.13], [111.0, 111.94], [112.0, 113.68], [115.0, 116.45], [118.0, 119.15], [120.0, 120.85], [121.0, 121.83], [122.0, 123.08], [124.0, 125.04], [127.0, 131.06], [133.0, 134.62], [137.0, 137.24], [139.0, 140.24], [141.0, 141.64], [144.0, 145.74], [146.0, 146.92], [155.0, 155.24], [156.0, 158.33], [160.0, 161.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [95.09, 99.8, 91.81, 93.45, 96.54, 98.66, 0.0, 0.0, 99.4, 0.0, 99.05, 0.0, 0.0, 0.0, 99.05, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.71, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [10.54, 3.12, 2.79, 2.28, 3.28, 4.04, 1.74, 1.5, 2.42, 1.49, 2.21, 0.67, 1.04, 0.95, 3.9, 1.9, 0.07, 0.38, 0.48, 1.55, 4.41, 1.65, 0.76, 1.13, 0.94, 1.68, 1.45, 1.15, 0.85, 0.83, 1.08, 1.04, 4.06, 1.62, 0.24, 1.24, 0.64, 1.74, 0.92, 0.24, 2.33, 1.96]} \ No newline at end of file diff --git a/annotations_filtered/mBUdGRqiIR4_filtered.json b/annotations_filtered/mBUdGRqiIR4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..19262877b2e76ce1dfbbdf2ba62b292e2347c917 --- /dev/null +++ b/annotations_filtered/mBUdGRqiIR4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.75], [10.0, 65.94], [67.0, 77.67], [80.0, 81.8], [83.0, 84.79], [87.0, 87.22], [87.0, 87.3], [89.0, 91.86], [94.0, 141.88]], "keep_status": [false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 48.78, 0.0, 0.0, 0.0, 0.0, 41.26, 0.0], "audiomae_on_audioset": [null, null, [["music", 35.46], ["hum", 21.23], ["throbbing", 15.7]], null, null, null, null, [["music", 42.02], ["throbbing", 18.68], ["hum", 8.9]], null], "duration": [0.75, 55.94, 10.67, 1.8, 1.79, 0.22, 0.3, 2.86, 47.88]} \ No newline at end of file diff --git a/annotations_filtered/mBiT0g4TIYc_filtered.json b/annotations_filtered/mBiT0g4TIYc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..be1c32d52f387ddc392a51636900e874f8692bbc --- /dev/null +++ b/annotations_filtered/mBiT0g4TIYc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.24], [3.0, 2.96], [5.0, 5.46], [6.0, 13.36], [16.0, 15.79], [16.0, 16.63], [19.0, 19.68], [21.0, 21.46], [22.0, 22.03], [25.0, 26.0], [28.0, 28.21], [30.0, 36.39], [38.0, 38.94], [45.0, 45.12], [49.0, 51.66], [61.0, 73.13], [75.0, 82.65], [92.0, 93.48], [95.0, 101.01], [102.0, 102.64], [104.0, 137.54], [140.0, 143.24], [143.0, 143.73], [146.0, 147.53]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 36.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.77, 0.0, 0.0, 29.95, 29.65, 29.05, 0.0, 29.74, 0.0, 0.0, 33.48, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 26.49], ["speech", 15.68], ["mains hum", 11.2]], null, null, null, null, null, null, null, null, null, null, [["speech", 47.13], ["music", 17.81], ["didgeridoo", 2.9]], [["music", 88.27], ["musical instrument", 3.5], ["piano", 0.88]], [["music", 61.22], ["musical instrument", 5.27], ["clarinet", 3.86]], null, [["music", 56.73], ["musical instrument", 9.87], ["brass instrument", 4.36]], null, null, [["throbbing", 45.81], ["music", 18.3], ["heart sounds, heartbeat", 8.36]], null, null], "duration": [0.24, -0.04, 0.46, 7.36, -0.21, 0.63, 0.68, 0.46, 0.03, 1.0, 0.21, 6.39, 0.94, 0.12, 2.66, 12.13, 7.65, 1.48, 6.01, 0.64, 33.54, 3.24, 0.73, 1.53]} \ No newline at end of file diff --git a/annotations_filtered/mCSno4xODKY_filtered.json b/annotations_filtered/mCSno4xODKY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5238c634b4b0756e9df0616b281d1398f22dba47 --- /dev/null +++ b/annotations_filtered/mCSno4xODKY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.55], [20.0, 20.22], [21.0, 22.72], [25.0, 24.66], [25.0, 27.73], [31.0, 31.67], [33.0, 36.86], [50.0, 65.2], [70.0, 82.83], [83.0, 84.75]], "keep_status": [false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 74.44, 0.0, 57.56, 32.21, 58.38, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["throbbing", 26.77], ["hum", 25.4], ["mains hum", 14.93]], null, null], "duration": [0.55, 0.22, 1.72, -0.34, 2.73, 0.67, 3.86, 15.2, 12.83, 1.75]} \ No newline at end of file diff --git a/annotations_filtered/mCVwWrfOT3s_filtered.json b/annotations_filtered/mCVwWrfOT3s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..df8f41c9af11dd2eabf7d8a715bf0a4b8719780f --- /dev/null +++ b/annotations_filtered/mCVwWrfOT3s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.32], [11.0, 12.58], [15.0, 16.8], [19.0, 22.52], [24.0, 26.77], [29.0, 29.78], [32.0, 33.34], [34.0, 36.07], [38.0, 38.31], [42.0, 43.56], [46.0, 47.63], [49.0, 57.15], [58.0, 62.07], [63.0, 65.77], [67.0, 70.73], [71.0, 76.45], [78.0, 79.24], [81.0, 88.89], [89.0, 95.2], [96.0, 98.25], [100.0, 102.42], [103.0, 108.53], [111.0, 114.98], [116.0, 121.24], [122.0, 121.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 54.5, 47.43, 0.0, 0.0, 37.83, 0.0, 0.0, 0.0, 99.05, 99.8, 97.92, 99.26, 83.7, 0.0, 85.9, 33.35, 59.59, 60.05, 38.82, 42.91, 39.47, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 65.8], ["hum", 4.78], ["mains hum", 3.07]], null, null, [["sidetone", 42.4], ["radio", 24.06], ["speech", 16.76]], null, null, null, null, null, null, null, null, null, null, [["whale vocalization", 39.42], ["music", 25.71], ["theremin", 7.77]], null, null, [["cowbell", 53.71], ["livestock, farm animals, working animals", 12.01], ["sidetone", 3.49]], [["music", 45.31], ["musical instrument", 10.56], ["marimba, xylophone", 3.55]], [["music", 52.58], ["theremin", 8.75], ["ambient music", 5.72]], null], "duration": [0.32, 1.58, 1.8, 3.52, 2.77, 0.78, 1.34, 2.07, 0.31, 1.56, 1.63, 8.15, 4.07, 2.77, 3.73, 5.45, 1.24, 7.89, 6.2, 2.25, 2.42, 5.53, 3.98, 5.24, -0.05]} \ No newline at end of file diff --git a/annotations_filtered/mCbY7cAv7r8_filtered.json b/annotations_filtered/mCbY7cAv7r8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a2658c1dfee5fad85f6250dffdef27f586cde0d --- /dev/null +++ b/annotations_filtered/mCbY7cAv7r8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 24.14], [40.0, 40.53], [42.0, 42.8], [61.0, 64.67], [66.0, 66.38], [69.0, 69.06], [92.0, 92.31], [103.0, 103.45], [104.0, 104.9], [112.0, 112.06], [120.0, 168.29], [168.0, 168.4], [168.0, 168.51], [169.0, 168.79], [169.0, 169.91], [170.0, 171.39], [174.0, 173.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 99.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.14, 0.53, 0.8, 3.67, 0.38, 0.06, 0.31, 0.45, 0.9, 0.06, 48.29, 0.4, 0.51, -0.21, 0.91, 1.39, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/mCdbIDiib5U_filtered.json b/annotations_filtered/mCdbIDiib5U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a91b950d84984d50cae3b686ab496bfec88fa22 --- /dev/null +++ b/annotations_filtered/mCdbIDiib5U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.12]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [1.12]} \ No newline at end of file diff --git a/annotations_filtered/mCfKPXX19Gw_filtered.json b/annotations_filtered/mCfKPXX19Gw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0fd8b642ed2e12c3f931d4bcb09d2966b1ba527 --- /dev/null +++ b/annotations_filtered/mCfKPXX19Gw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 30.06], [33.0, 80.65], [85.0, 106.19], [108.0, 152.63], [154.0, 153.94]], "keep_status": [false, false, true, false, false], "silence_prob": [30.6, 0.0, 33.53, 0.0, 0.0], "audiomae_on_audioset": [[["music", 45.41], ["buzzer", 16.18], ["alarm", 11.94]], null, [["music", 47.73], ["hum", 12.14], ["rumble", 9.2]], null, null], "duration": [19.06, 47.65, 21.19, 44.63, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/mCsu9hGvNEc_filtered.json b/annotations_filtered/mCsu9hGvNEc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..79b0af36476acf461497fec8a278ae9f6614a7c9 --- /dev/null +++ b/annotations_filtered/mCsu9hGvNEc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.26], [5.0, 5.29], [8.0, 8.53], [10.0, 11.92], [15.0, 15.52], [16.0, 17.31], [17.0, 18.57], [20.0, 20.46], [28.0, 28.65], [31.0, 30.69], [33.0, 33.12], [36.0, 37.54], [40.0, 40.54], [43.0, 44.15], [50.0, 50.03], [58.0, 68.86], [69.0, 71.68], [73.0, 81.09], [89.0, 89.55], [107.0, 107.96], [109.0, 109.78], [118.0, 121.61], [124.0, 126.72], [127.0, 126.79], [127.0, 150.48], [151.0, 158.84], [164.0, 168.76], [169.0, 177.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 100.0, 94.22, 0.0, 0.0, 0.0, 99.98, 99.98, 0.0, 99.73, 97.83, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.26, 0.29, 0.53, 1.92, 0.52, 1.31, 1.57, 0.46, 0.65, -0.31, 0.12, 1.54, 0.54, 1.15, 0.03, 10.86, 2.68, 8.09, 0.55, 0.96, 0.78, 3.61, 2.72, -0.21, 23.48, 7.84, 4.76, 8.92]} \ No newline at end of file diff --git a/annotations_filtered/mCu3uKNGuZw_filtered.json b/annotations_filtered/mCu3uKNGuZw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ee4ce9e3994fe545042e67a27eaec55eeb797f1b --- /dev/null +++ b/annotations_filtered/mCu3uKNGuZw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[50.0, 51.19], [52.0, 62.01], [62.0, 62.97], [66.0, 65.7], [67.0, 89.51], [90.0, 103.89], [110.0, 118.66]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 28.99, 0.0, 0.0, 29.06, 29.46, 29.17], "audiomae_on_audioset": [null, [["music", 68.75], ["didgeridoo", 5.78], ["musical instrument", 2.7]], null, null, [["music", 80.41], ["boing", 2.52], ["didgeridoo", 2.35]], [["music", 76.26], ["musical instrument", 4.86], ["accordion", 2.86]], [["music", 70.83], ["speech", 4.17], ["musical instrument", 2.87]]], "duration": [1.19, 10.01, 0.97, -0.3, 22.51, 13.89, 8.66]} \ No newline at end of file diff --git a/annotations_filtered/mD7NPkG9kwg_filtered.json b/annotations_filtered/mD7NPkG9kwg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dd99a1e9a6aae7805ac32acbc1d1617e1fb76d7d --- /dev/null +++ b/annotations_filtered/mD7NPkG9kwg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.85], [15.0, 15.48], [37.0, 37.69], [46.0, 46.55], [52.0, 53.42], [54.0, 58.95], [61.0, 62.36], [77.0, 77.62], [81.0, 81.72], [91.0, 91.49], [93.0, 93.68], [102.0, 102.17], [103.0, 103.4], [111.0, 111.94], [118.0, 119.18], [120.0, 121.86], [124.0, 126.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 68.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.94], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.15, 0.48, 0.69, 0.55, 1.42, 4.95, 1.36, 0.62, 0.72, 0.49, 0.68, 0.17, 0.4, 0.94, 1.18, 1.86, 2.98]} \ No newline at end of file diff --git a/annotations_filtered/mD83kao4Q60_filtered.json b/annotations_filtered/mD83kao4Q60_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0fa2dc07c869498d1196460741be4a8c803aa813 --- /dev/null +++ b/annotations_filtered/mD83kao4Q60_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.19], [10.0, 10.0], [10.0, 11.7], [18.0, 19.4], [20.0, 20.56], [22.0, 22.06], [31.0, 31.97], [33.0, 34.03], [36.0, 36.64], [41.0, 41.07], [71.0, 71.59], [72.0, 75.78], [82.0, 84.08], [86.0, 87.2], [88.0, 88.59], [90.0, 95.52], [96.0, 95.55], [96.0, 95.66], [96.0, 96.03], [99.0, 101.01], [101.0, 103.4], [106.0, 109.43], [110.0, 115.28], [117.0, 117.1], [121.0, 121.91], [123.0, 123.77], [126.0, 128.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.27, 99.82, 0.0, 0.0, 89.36, 0.0, 0.0, 0.0, 77.7, 99.99, 71.0, 98.99, 0.0, 0.0, 0.0, 36.75], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 25.65], ["speech", 24.48], ["musical instrument", 8.62]]], "duration": [1.19, 0.0, 1.7, 1.4, 0.56, 0.06, 0.97, 1.03, 0.64, 0.07, 0.59, 3.78, 2.08, 1.2, 0.59, 5.52, -0.45, -0.34, 0.03, 2.01, 2.4, 3.43, 5.28, 0.1, 0.91, 0.77, 2.28]} \ No newline at end of file diff --git a/annotations_filtered/mDI2nymYW1M_filtered.json b/annotations_filtered/mDI2nymYW1M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..53c6fd92db0869e7129a9b222fada5ea1a0d6ffa --- /dev/null +++ b/annotations_filtered/mDI2nymYW1M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.52], [5.0, 7.48], [10.0, 10.62], [12.0, 11.85], [34.0, 35.43]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 32.4, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 42.21], ["aircraft", 17.26], ["fixed-wing aircraft, airplane", 13.88]], null, null, null], "duration": [0.52, 2.48, 0.62, -0.15, 1.43]} \ No newline at end of file diff --git a/annotations_filtered/mDLS12_a-fk_filtered.json b/annotations_filtered/mDLS12_a-fk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13fa6998b15a4b97c2553436753917e2bd35c972 --- /dev/null +++ b/annotations_filtered/mDLS12_a-fk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.29], [5.0, 4.9], [6.0, 10.35], [14.0, 18.91], [22.0, 26.69], [30.0, 34.62], [37.0, 52.27], [54.0, 86.91], [89.0, 92.97], [94.0, 95.5], [97.0, 99.89], [102.0, 103.2], [105.0, 106.47], [108.0, 108.77], [111.0, 111.97], [113.0, 113.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 93.76, 87.55, 90.6, 95.23, 93.45, 0.0, 84.43, 0.0, 99.56, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.29, -0.1, 4.35, 4.91, 4.69, 4.62, 15.27, 32.91, 3.97, 1.5, 2.89, 1.2, 1.47, 0.77, 0.97, 0.04]} \ No newline at end of file diff --git a/annotations_filtered/mDUSjBiHYeY_filtered.json b/annotations_filtered/mDUSjBiHYeY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9057fa210e7f0667bac14acdc12fc5ea1f86e59a --- /dev/null +++ b/annotations_filtered/mDUSjBiHYeY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.22], [2.0, 10.47], [19.0, 19.9], [21.0, 20.98], [22.0, 22.32], [23.0, 24.06], [29.0, 39.72], [42.0, 68.23], [70.0, 73.23], [74.0, 77.28], [78.0, 79.54], [80.0, 87.45], [88.0, 89.09], [90.0, 92.6], [96.0, 100.25], [104.0, 104.36], [107.0, 119.08], [120.0, 123.04], [124.0, 125.1], [126.0, 127.68]], "keep_status": [false, true, false, false, false, false, false, true, false, false, false, true, false, false, true, false, true, false, false, false], "silence_prob": [0.0, 31.17, 0.0, 0.0, 0.0, 0.0, 34.08, 42.74, 78.21, 80.82, 0.0, 35.66, 0.0, 33.93, 36.81, 0.0, 31.75, 93.29, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 50.48], ["groan", 14.68], ["speech", 2.91]], null, null, null, null, [["music", 60.57], ["screaming", 26.02], ["wail, moan", 5.81]], [["hum", 27.61], ["throbbing", 12.84], ["mains hum", 10.23]], null, null, null, [["speech", 34.0], ["fly, housefly", 12.94], ["noise", 8.95]], null, [["speech", 37.34], ["wail, moan", 28.63], ["boing", 10.09]], [["music", 52.59], ["musical instrument", 5.5], ["speech", 3.87]], null, [["music", 44.95], ["theremin", 15.46], ["speech", 2.84]], null, null, null], "duration": [0.22, 8.47, 0.9, -0.02, 0.32, 1.06, 10.72, 26.23, 3.23, 3.28, 1.54, 7.45, 1.09, 2.6, 4.25, 0.36, 12.08, 3.04, 1.1, 1.68]} \ No newline at end of file diff --git a/annotations_filtered/mEiLmu1IF5E_filtered.json b/annotations_filtered/mEiLmu1IF5E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..750cce1570876665ce586d11d25eb8dce7302055 --- /dev/null +++ b/annotations_filtered/mEiLmu1IF5E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.52], [4.0, 6.4], [7.0, 10.42], [12.0, 44.12], [45.0, 46.6], [48.0, 48.15], [52.0, 52.71], [59.0, 58.85], [67.0, 67.73], [71.0, 71.91], [74.0, 101.6], [102.0, 103.44], [104.0, 105.75], [107.0, 107.15], [108.0, 110.96], [112.0, 112.45], [113.0, 114.34], [115.0, 115.37], [116.0, 116.28], [117.0, 117.66], [123.0, 123.21], [133.0, 134.23], [135.0, 136.7], [137.0, 138.48], [143.0, 142.62], [147.0, 147.58], [149.0, 149.61], [153.0, 153.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 50.41, 32.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.14, 0.0, 0.0, 0.0, 93.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["hum", 41.68], ["throbbing", 19.05], ["mains hum", 15.74]], null, null, null, null, null, null, null, [["music", 58.46], ["electronic music", 5.88], ["throbbing", 5.73]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.52, 2.4, 3.42, 32.12, 1.6, 0.15, 0.71, -0.15, 0.73, 0.91, 27.6, 1.44, 1.75, 0.15, 2.96, 0.45, 1.34, 0.37, 0.28, 0.66, 0.21, 1.23, 1.7, 1.48, -0.38, 0.58, 0.61, 0.33]} \ No newline at end of file diff --git a/annotations_filtered/mExTnHwAcYY_filtered.json b/annotations_filtered/mExTnHwAcYY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b4197a8f89b3ed95e7567ed6568c7bb7cc2e3a96 --- /dev/null +++ b/annotations_filtered/mExTnHwAcYY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 11.45], [12.0, 13.47], [17.0, 23.25], [25.0, 25.35], [27.0, 27.14], [30.0, 29.93], [46.0, 51.02], [52.0, 54.04], [54.0, 56.54], [58.0, 58.46], [59.0, 67.74], [69.0, 69.15], [69.0, 74.24], [76.0, 77.9], [80.0, 80.76], [85.0, 88.05], [89.0, 93.01], [94.0, 99.03], [103.0, 104.04], [104.0, 105.11], [107.0, 107.43], [108.0, 108.92], [111.0, 116.82], [119.0, 124.36], [126.0, 127.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [94.66, 0.0, 84.43, 0.0, 0.0, 0.0, 100.0, 100.0, 99.4, 0.0, 99.68, 0.0, 97.33, 0.0, 0.0, 99.82, 87.37, 98.27, 0.0, 0.0, 0.0, 0.0, 89.19, 95.37, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.45, 1.47, 6.25, 0.35, 0.14, -0.07, 5.02, 2.04, 2.54, 0.46, 8.74, 0.15, 5.24, 1.9, 0.76, 3.05, 4.01, 5.03, 1.04, 1.11, 0.43, 0.92, 5.82, 5.36, 1.06]} \ No newline at end of file diff --git a/annotations_filtered/mEzXLJL48nA_filtered.json b/annotations_filtered/mEzXLJL48nA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..439471e5881de31e8a80be65bd47efa21084ebba --- /dev/null +++ b/annotations_filtered/mEzXLJL48nA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 45.99], [49.0, 49.65], [51.0, 51.81], [53.0, 55.39], [58.0, 65.5], [66.0, 67.36], [68.0, 74.19], [83.0, 87.54], [90.0, 90.07], [94.0, 96.33], [101.0, 101.63], [102.0, 104.43], [109.0, 129.19], [130.0, 131.23], [134.0, 134.96]], "keep_status": [true, false, false, false, true, false, false, true, false, true, false, true, false, false, false], "silence_prob": [32.38, 0.0, 0.0, 31.39, 31.08, 0.0, 33.52, 29.98, 0.0, 32.77, 0.0, 36.15, 30.98, 0.0, 0.0], "audiomae_on_audioset": [[["music", 40.01], ["hum", 13.9], ["throbbing", 8.58]], null, null, [["music", 63.81], ["cattle, bovinae", 3.38], ["livestock, farm animals, working animals", 3.29]], [["music", 33.28], ["speech", 13.45], ["explosion", 5.78]], null, [["music", 45.01], ["speech", 25.28], ["throbbing", 7.2]], [["music", 35.45], ["hum", 16.72], ["throbbing", 11.77]], null, [["music", 62.94], ["speech", 2.9], ["musical instrument", 2.65]], null, [["fart", 46.98], ["music", 17.53], ["mains hum", 4.69]], [["music", 47.74], ["throbbing", 17.57], ["hum", 12.37]], null, null], "duration": [14.99, 0.65, 0.81, 2.39, 7.5, 1.36, 6.19, 4.54, 0.07, 2.33, 0.63, 2.43, 20.19, 1.23, 0.96]} \ No newline at end of file diff --git a/annotations_filtered/mFA9-zsFtt8_filtered.json b/annotations_filtered/mFA9-zsFtt8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..54eaa71e9ac978df423d7687032a7664f6478d90 --- /dev/null +++ b/annotations_filtered/mFA9-zsFtt8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 29.24], [32.0, 33.49], [36.0, 36.04], [37.0, 38.13], [39.0, 44.41], [46.0, 47.17], [50.0, 50.3], [65.0, 65.7], [68.0, 68.67], [69.0, 72.23], [73.0, 74.09], [78.0, 80.49], [84.0, 89.21], [91.0, 91.71], [95.0, 96.79], [104.0, 104.53], [112.0, 112.29], [116.0, 116.26], [117.0, 118.67], [120.0, 120.63], [121.0, 122.34], [125.0, 125.25], [126.0, 126.05], [126.0, 126.2], [130.0, 130.65], [133.0, 133.64], [140.0, 142.69], [145.0, 146.04], [146.0, 146.97], [149.0, 149.69], [150.0, 162.3], [170.0, 170.11], [171.0, 172.39], [178.0, 182.36], [189.0, 194.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false], "silence_prob": [73.97, 0.0, 0.0, 0.0, 60.98, 0.0, 0.0, 0.0, 0.0, 44.15, 0.0, 43.56, 44.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.89, 0.0, 0.0, 0.0, 35.49, 0.0, 0.0, 36.35, 37.35], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 57.64], ["hum", 9.42], ["music", 9.02]], null, [["speech", 53.74], ["hum", 9.11], ["music", 4.8]], [["sidetone", 50.39], ["speech", 15.87], ["music", 8.02]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 48.15], ["throbbing", 5.21], ["hum", 4.17]], null, null, null, [["music", 52.64], ["trance music", 7.31], ["techno", 6.6]], null, null, [["music", 51.53], ["electronic music", 10.27], ["techno", 9.04]], [["music", 65.4], ["electronic music", 5.69], ["techno", 4.65]]], "duration": [8.24, 1.49, 0.04, 1.13, 5.41, 1.17, 0.3, 0.7, 0.67, 3.23, 1.09, 2.49, 5.21, 0.71, 1.79, 0.53, 0.29, 0.26, 1.67, 0.63, 1.34, 0.25, 0.05, 0.2, 0.65, 0.64, 2.69, 1.04, 0.97, 0.69, 12.3, 0.11, 1.39, 4.36, 5.26]} \ No newline at end of file diff --git a/annotations_filtered/mFBIlYRQBLI_filtered.json b/annotations_filtered/mFBIlYRQBLI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af23542241aef1aee54d1cf77f03994affc1cd20 --- /dev/null +++ b/annotations_filtered/mFBIlYRQBLI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.84], [14.0, 18.99], [19.0, 21.96], [23.0, 26.27], [29.0, 32.34], [33.0, 36.85], [38.0, 39.75], [42.0, 42.99], [45.0, 63.71], [66.0, 69.06], [73.0, 74.49], [75.0, 81.43], [82.0, 86.51], [89.0, 91.89], [92.0, 108.63], [110.0, 110.93], [113.0, 116.87], [119.0, 128.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.97, 100.0, 96.54, 100.0, 100.0, 100.0, 0.0, 0.0, 100.0, 100.0, 0.0, 90.25, 97.43, 100.0, 100.0, 0.0, 100.0, 98.59], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.84, 4.99, 2.96, 3.27, 3.34, 3.85, 1.75, 0.99, 18.71, 3.06, 1.49, 6.43, 4.51, 2.89, 16.63, 0.93, 3.87, 9.92]} \ No newline at end of file diff --git a/annotations_filtered/mFH_r2w28rM_filtered.json b/annotations_filtered/mFH_r2w28rM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c2f47a4926bfc154b42530d439d5064eddb98ee --- /dev/null +++ b/annotations_filtered/mFH_r2w28rM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.19], [0.0, 0.43], [6.0, 5.85], [8.0, 8.7], [13.0, 15.9], [25.0, 25.15], [26.0, 26.37], [32.0, 32.31], [36.0, 36.21], [38.0, 39.14], [40.0, 40.47], [44.0, 44.47], [51.0, 52.54], [65.0, 74.85], [75.0, 79.24], [80.0, 81.77], [90.0, 89.83], [94.0, 94.29], [95.0, 94.91], [101.0, 103.22], [105.0, 105.44], [106.0, 107.55], [116.0, 117.56], [119.0, 119.23], [121.0, 121.98], [131.0, 130.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.97, 85.35, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.19, 0.43, -0.15, 0.7, 2.9, 0.15, 0.37, 0.31, 0.21, 1.14, 0.47, 0.47, 1.54, 9.85, 4.24, 1.77, -0.17, 0.29, -0.09, 2.22, 0.44, 1.55, 1.56, 0.23, 0.98, -0.26]} \ No newline at end of file diff --git a/annotations_filtered/mFXxro8aD3A_filtered.json b/annotations_filtered/mFXxro8aD3A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f89b1d8192df9f92c9ecab6a47a31b022c2eeb82 --- /dev/null +++ b/annotations_filtered/mFXxro8aD3A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.68], [11.0, 11.15], [12.0, 12.82], [19.0, 19.03], [26.0, 26.62]], "keep_status": [false, false, false, false, false], "silence_prob": [29.13, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 59.22], ["speech", 24.05], ["musical instrument", 5.47]], null, null, null, null], "duration": [3.68, 0.15, 0.82, 0.03, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/mFcz_U62r6s_filtered.json b/annotations_filtered/mFcz_U62r6s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58fa3c35d4147549de40be9f018ff0645c6a556e --- /dev/null +++ b/annotations_filtered/mFcz_U62r6s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 16.19], [17.0, 24.02], [32.0, 34.97], [39.0, 43.19], [44.0, 55.32]], "keep_status": [false, true, true, true, true], "silence_prob": [50.76, 44.75, 38.5, 33.77, 37.85], "audiomae_on_audioset": [null, [["music", 53.63], ["hum", 6.61], ["speech", 4.51]], [["speech", 46.36], ["hum", 6.78], ["vehicle", 2.57]], [["music", 15.37], ["speech", 13.84], ["hum", 11.35]], [["speech", 50.76], ["breaking", 6.93], ["hum", 5.99]]], "duration": [15.19, 7.02, 2.97, 4.19, 11.32]} \ No newline at end of file diff --git a/annotations_filtered/mFglGV3n5SM_filtered.json b/annotations_filtered/mFglGV3n5SM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/mFglGV3n5SM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/mFj1lf3ECK8_filtered.json b/annotations_filtered/mFj1lf3ECK8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d303a3ac339a3747d272cb06857f317a70f76b1 --- /dev/null +++ b/annotations_filtered/mFj1lf3ECK8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 43.71], [45.0, 47.28], [48.0, 48.59], [50.0, 51.81], [59.0, 59.48], [64.0, 64.2], [66.0, 66.58], [70.0, 82.88], [84.0, 83.91], [88.0, 88.45], [97.0, 97.66], [100.0, 105.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [59.68, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.36, 0.0, 0.0, 0.0, 70.02], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [26.71, 2.28, 0.59, 1.81, 0.48, 0.2, 0.58, 12.88, -0.09, 0.45, 0.66, 5.06]} \ No newline at end of file diff --git a/annotations_filtered/mFkxrTfAkq8_filtered.json b/annotations_filtered/mFkxrTfAkq8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a99ddbeb4c83caa78897f34b932fcf6f5456facf --- /dev/null +++ b/annotations_filtered/mFkxrTfAkq8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 24.58], [27.0, 32.59], [35.0, 40.44], [41.0, 49.67], [54.0, 64.81], [69.0, 79.96], [83.0, 90.0], [92.0, 139.16], [146.0, 155.19], [159.0, 161.79]], "keep_status": [false, true, true, false, true, true, true, false, false, false], "silence_prob": [33.53, 32.23, 32.17, 35.03, 32.4, 31.7, 33.08, 0.0, 56.7, 58.81], "audiomae_on_audioset": [[["speech", 43.91], ["sidetone", 14.27], ["buzz", 13.53]], [["speech", 52.77], ["sidetone", 12.62], ["music", 3.71]], [["music", 50.35], ["speech", 14.16], ["groan", 5.24]], [["music", 81.6], ["theremin", 5.64], ["musical instrument", 2.58]], [["speech", 23.62], ["sidetone", 20.17], ["hum", 15.64]], [["speech", 19.26], ["buzz", 9.06], ["grunt", 8.55]], [["music", 43.62], ["groan", 12.93], ["speech", 6.4]], null, null, null], "duration": [15.58, 5.59, 5.44, 8.67, 10.81, 10.96, 7.0, 47.16, 9.19, 2.79]} \ No newline at end of file diff --git a/annotations_filtered/mFl8nzZuExE_filtered.json b/annotations_filtered/mFl8nzZuExE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf9d9438c77bd3fb2773443df32d4bc22be10daf --- /dev/null +++ b/annotations_filtered/mFl8nzZuExE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.21], [8.0, 10.99], [25.0, 25.59], [29.0, 29.71], [38.0, 37.61], [41.0, 41.93], [44.0, 44.36], [51.0, 51.19], [53.0, 52.66], [53.0, 53.65], [60.0, 61.45], [66.0, 89.26], [90.0, 91.2], [96.0, 96.85], [101.0, 102.76], [110.0, 110.86], [112.0, 113.12], [124.0, 125.0], [136.0, 135.68], [149.0, 149.59], [152.0, 153.01], [170.0, 169.69], [176.0, 176.59], [177.0, 180.06], [184.0, 184.18], [187.0, 187.69], [192.0, 197.29], [197.0, 197.45], [198.0, 198.73], [199.0, 202.15], [210.0, 210.61]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 33.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.2, 0.0, 0.0, 33.89, 0.0, 0.0, 43.0, 0.0], "audiomae_on_audioset": [null, [["thunk", 28.02], ["breaking", 24.32], ["creak", 14.07]], null, null, null, null, null, null, null, null, null, [["music", 72.01], ["breaking", 8.72], ["hum", 2.59]], null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 56.04], ["moo", 22.61], ["livestock, farm animals, working animals", 18.35]], null, null, [["music", 17.42], ["moo", 6.52], ["crowd", 6.49]], null, null, [["music", 60.77], ["speech", 10.0], ["electronic music", 2.52]], null], "duration": [0.21, 2.99, 0.59, 0.71, -0.39, 0.93, 0.36, 0.19, -0.34, 0.65, 1.45, 23.26, 1.2, 0.85, 1.76, 0.86, 1.12, 1.0, -0.32, 0.59, 1.01, -0.31, 0.59, 3.06, 0.18, 0.69, 5.29, 0.45, 0.73, 3.15, 0.61]} \ No newline at end of file diff --git a/annotations_filtered/mFoZz6PG72k_filtered.json b/annotations_filtered/mFoZz6PG72k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba42f78480b11067a934fde945decda15af09e1f --- /dev/null +++ b/annotations_filtered/mFoZz6PG72k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.99], [5.0, 5.91], [7.0, 7.69], [8.0, 9.09], [13.0, 13.36], [16.0, 16.63], [19.0, 20.33], [26.0, 26.23], [27.0, 27.75], [31.0, 32.88], [34.0, 34.21], [37.0, 37.3], [40.0, 40.96], [43.0, 44.76], [47.0, 48.52], [50.0, 51.38], [52.0, 56.2], [57.0, 57.64], [59.0, 60.2], [61.0, 61.15], [64.0, 65.38], [67.0, 66.85], [69.0, 69.16], [70.0, 70.71], [74.0, 74.83], [78.0, 79.15], [80.0, 85.75], [89.0, 90.37], [96.0, 97.75], [99.0, 99.15], [101.0, 101.28], [102.0, 102.9], [104.0, 109.21], [113.0, 112.78], [113.0, 112.82], [113.0, 117.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.43, 0.0, 0.0, 0.0, 0.0, 0.0, 32.92, 0.0, 0.0, 29.42], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 49.06], ["throbbing", 18.58], ["mains hum", 13.01]], null, null, [["music", 51.86], ["throbbing", 15.13], ["hum", 12.82]]], "duration": [-0.01, 0.91, 0.69, 1.09, 0.36, 0.63, 1.33, 0.23, 0.75, 1.88, 0.21, 0.3, 0.96, 1.76, 1.52, 1.38, 4.2, 0.64, 1.2, 0.15, 1.38, -0.15, 0.16, 0.71, 0.83, 1.15, 5.75, 1.37, 1.75, 0.15, 0.28, 0.9, 5.21, -0.22, -0.18, 4.12]} \ No newline at end of file diff --git a/annotations_filtered/mFwAm6oIPtk_filtered.json b/annotations_filtered/mFwAm6oIPtk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e519b94da5281b794e5313f769e151a789522424 --- /dev/null +++ b/annotations_filtered/mFwAm6oIPtk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.41], [16.0, 16.26], [19.0, 22.03], [35.0, 36.24], [42.0, 41.93], [45.0, 46.09], [50.0, 50.73], [51.0, 52.96], [53.0, 54.18], [54.0, 55.14], [56.0, 59.53], [62.0, 63.85], [67.0, 68.39], [71.0, 72.72], [76.0, 77.23], [86.0, 87.45], [88.0, 88.55], [89.0, 98.19], [100.0, 100.48], [102.0, 104.94], [110.0, 113.21], [114.0, 120.26], [122.0, 130.08], [131.0, 131.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.4, 0.0, 91.81, 50.71, 46.94, 60.42, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 67.88], ["musical instrument", 4.35], ["wind instrument, woodwind instrument", 3.89]], null, null, null, [["music", 68.44], ["theremin", 3.05], ["livestock, farm animals, working animals", 2.12]], null, null], "duration": [0.41, 0.26, 3.03, 1.24, -0.07, 1.09, 0.73, 1.96, 1.18, 1.14, 3.53, 1.85, 1.39, 1.72, 1.23, 1.45, 0.55, 9.19, 0.48, 2.94, 3.21, 6.26, 8.08, 0.77]} \ No newline at end of file diff --git a/annotations_filtered/mG1vn39lP3M_filtered.json b/annotations_filtered/mG1vn39lP3M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..be8d6e973561536d930e1599963b29c944854abf --- /dev/null +++ b/annotations_filtered/mG1vn39lP3M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [6.0, 18.67], [19.0, 18.94], [19.0, 19.87], [22.0, 24.95], [27.0, 62.16], [64.0, 71.9], [74.0, 93.46], [97.0, 97.61], [100.0, 101.68], [103.0, 110.61], [117.0, 118.35], [122.0, 126.27], [126.0, 126.3], [126.0, 126.33]], "keep_status": [false, true, false, false, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 29.76, 0.0, 0.0, 29.42, 0.0, 29.75, 30.2, 0.0, 0.0, 30.12, 0.0, 29.72, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 28.26], ["hum", 14.2], ["throbbing", 10.03]], null, null, [["speech", 29.34], ["music", 14.12], ["mains hum", 11.65]], null, [["speech", 26.4], ["vehicle", 20.17], ["car", 6.47]], [["music", 32.29], ["throbbing", 22.48], ["hum", 16.56]], null, null, [["speech", 56.2], ["music", 15.47], ["vehicle", 2.07]], null, [["music", 44.75], ["speech", 27.01], ["explosion", 3.11]], null, null], "duration": [0.5, 12.67, -0.06, 0.87, 2.95, 35.16, 7.9, 19.46, 0.61, 1.68, 7.61, 1.35, 4.27, 0.3, 0.33]} \ No newline at end of file diff --git a/annotations_filtered/mGA_uH0-n28_filtered.json b/annotations_filtered/mGA_uH0-n28_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e31029a26d67ef97396059b783d0e6f6ca6fdd58 --- /dev/null +++ b/annotations_filtered/mGA_uH0-n28_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.42], [12.0, 12.5], [14.0, 13.71], [20.0, 21.0], [29.0, 30.48], [45.0, 44.66], [45.0, 47.33], [49.0, 56.67], [70.0, 73.67], [78.0, 78.51], [79.0, 90.14], [92.0, 92.87]], "keep_status": [false, false, false, false, false, false, true, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.64, 30.5, 32.88, 0.0, 33.13, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 38.81], ["speech", 10.37], ["gong", 5.16]], [["theremin", 28.89], ["music", 26.1], ["harp", 3.44]], [["speech", 34.7], ["sidetone", 20.86], ["hum", 11.84]], null, [["music", 51.15], ["mains hum", 13.22], ["hum", 10.81]], null], "duration": [1.42, 0.5, -0.29, 1.0, 1.48, -0.34, 2.33, 7.67, 3.67, 0.51, 11.14, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/mGAaR9KKszs_filtered.json b/annotations_filtered/mGAaR9KKszs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bfb8a6ad29b5a239518d1ec7c71bef5ff0663b3f --- /dev/null +++ b/annotations_filtered/mGAaR9KKszs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 26.92], [28.0, 28.75], [48.0, 49.49], [50.0, 50.38], [52.0, 53.2], [64.0, 67.44], [68.0, 68.01], [70.0, 70.95], [74.0, 74.28], [76.0, 77.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 34.93, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 47.77], ["music", 26.17], ["thunk", 3.98]], null, null, null, null], "duration": [-0.08, 0.75, 1.49, 0.38, 1.2, 3.44, 0.01, 0.95, 0.28, 1.01]} \ No newline at end of file diff --git a/annotations_filtered/mGLXbK2XWMY_filtered.json b/annotations_filtered/mGLXbK2XWMY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7300e700fbc88a0346fcefeb057fc20831073ad6 --- /dev/null +++ b/annotations_filtered/mGLXbK2XWMY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 40.9]], "keep_status": [true], "silence_prob": [41.16], "audiomae_on_audioset": [[["music", 36.76], ["hum", 9.92], ["mains hum", 6.65]]], "duration": [24.9]} \ No newline at end of file diff --git a/annotations_filtered/mG_G5waoSeo_filtered.json b/annotations_filtered/mG_G5waoSeo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..25fbaf6d375db6a8452cfd072d4c6e7224c21211 --- /dev/null +++ b/annotations_filtered/mG_G5waoSeo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.56], [8.0, 12.78], [14.0, 14.71], [20.0, 21.27], [24.0, 24.85], [27.0, 27.9], [30.0, 30.84], [45.0, 46.99], [48.0, 54.7], [56.0, 56.57], [57.0, 60.56], [61.0, 66.92], [69.0, 84.27], [87.0, 87.72], [89.0, 100.6], [104.0, 113.98], [116.0, 115.87], [117.0, 126.57], [135.0, 136.58], [156.0, 171.46]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 95.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.84, 0.0, 32.34, 30.83, 28.38, 0.0, 28.25, 28.16, 0.0, 28.23, 0.0, 28.55], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 17.77], ["hum", 14.41], ["firecracker", 8.12]], null, [["fly, housefly", 13.34], ["whack, thwack", 12.49], ["groan", 11.56]], [["speech", 40.07], ["cattle, bovinae", 5.57], ["hubbub, speech noise, speech babble", 4.23]], [["music", 61.26], ["speech", 24.92], ["hum", 2.04]], null, [["music", 92.15], ["electronic music", 1.53], ["speech", 1.4]], [["music", 65.6], ["speech", 7.71], ["throbbing", 3.98]], null, [["music", 70.14], ["cattle, bovinae", 5.48], ["moo", 4.48]], null, [["music", 61.21], ["sidetone", 15.7], ["speech", 5.71]]], "duration": [0.56, 4.78, 0.71, 1.27, 0.85, 0.9, 0.84, 1.99, 6.7, 0.57, 3.56, 5.92, 15.27, 0.72, 11.6, 9.98, -0.13, 9.57, 1.58, 15.46]} \ No newline at end of file diff --git a/annotations_filtered/mGf4oL6RLGs_filtered.json b/annotations_filtered/mGf4oL6RLGs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..67939c976ee9b458e87e75cb201bf21075321f2d --- /dev/null +++ b/annotations_filtered/mGf4oL6RLGs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 17.58], [18.0, 32.07], [35.0, 37.12], [38.0, 41.52], [42.0, 42.79], [45.0, 45.03], [47.0, 47.39], [48.0, 48.59], [49.0, 50.6], [54.0, 54.57], [55.0, 55.36], [65.0, 66.33], [67.0, 67.46], [68.0, 68.71], [71.0, 74.49], [76.0, 75.84], [85.0, 93.06], [95.0, 95.76], [96.0, 96.75], [99.0, 101.01], [107.0, 107.01], [109.0, 111.27], [113.0, 113.19], [114.0, 114.54], [118.0, 120.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.99, 76.04, 93.91, 99.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.05, 0.0, 97.92, 0.0, 0.0, 92.64, 0.0, 80.11, 0.0, 0.0, 55.25], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.58, 14.07, 2.12, 3.52, 0.79, 0.03, 0.39, 0.59, 1.6, 0.57, 0.36, 1.33, 0.46, 0.71, 3.49, -0.16, 8.06, 0.76, 0.75, 2.01, 0.01, 2.27, 0.19, 0.54, 2.92]} \ No newline at end of file diff --git a/annotations_filtered/mGq0iyW-f7A_filtered.json b/annotations_filtered/mGq0iyW-f7A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7837740211be9180f8ea3db3da4954a88f7ed98e --- /dev/null +++ b/annotations_filtered/mGq0iyW-f7A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 18.54], [20.0, 27.48], [36.0, 39.09], [44.0, 55.97], [58.0, 58.21], [58.0, 58.24], [59.0, 58.99], [61.0, 61.67], [63.0, 64.72], [75.0, 75.24], [76.0, 76.06], [77.0, 77.43], [78.0, 78.48], [87.0, 87.18], [88.0, 88.79], [92.0, 92.01], [106.0, 108.03], [109.0, 109.27], [120.0, 126.15], [137.0, 138.13], [140.0, 155.51], [157.0, 161.15], [164.0, 167.12], [169.0, 169.87]], "keep_status": [true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [41.87, 34.83, 35.59, 31.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.24, 0.0, 45.43, 0.0, 30.13, 29.07, 34.26, 0.0], "audiomae_on_audioset": [[["music", 29.77], ["speech", 29.1], ["hum", 7.08]], [["music", 40.13], ["hum", 13.71], ["mains hum", 10.9]], [["speech", 44.51], ["music", 8.94], ["fart", 7.28]], [["livestock, farm animals, working animals", 52.4], ["cattle, bovinae", 28.73], ["moo", 16.36]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.71], ["trombone", 7.02], ["brass instrument", 6.65]], null, [["livestock, farm animals, working animals", 42.2], ["moo", 23.81], ["cattle, bovinae", 18.34]], [["mains hum", 42.74], ["hum", 21.81], ["music", 15.78]], [["cattle, bovinae", 51.45], ["moo", 31.5], ["livestock, farm animals, working animals", 10.78]], null], "duration": [7.54, 7.48, 3.09, 11.97, 0.21, 0.24, -0.01, 0.67, 1.72, 0.24, 0.06, 0.43, 0.48, 0.18, 0.79, 0.01, 2.03, 0.27, 6.15, 1.13, 15.51, 4.15, 3.12, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/mHGHJwXWh1k_filtered.json b/annotations_filtered/mHGHJwXWh1k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6fe861aed5757d51726c69ab4a4761b7f3665dc4 --- /dev/null +++ b/annotations_filtered/mHGHJwXWh1k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.35], [14.0, 14.39], [23.0, 25.25], [25.0, 25.29], [26.0, 25.64], [26.0, 26.1], [26.0, 28.93], [30.0, 41.34], [45.0, 45.89], [46.0, 48.24], [50.0, 99.22], [103.0, 105.39], [110.0, 109.7], [110.0, 117.68], [121.0, 122.1], [123.0, 144.21]], "keep_status": [false, false, true, false, false, false, false, false, false, true, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 31.92, 0.0, 0.0, 0.0, 34.51, 35.28, 0.0, 32.08, 0.0, 36.14, 0.0, 32.81, 0.0, 32.73], "audiomae_on_audioset": [null, null, [["speech", 57.54], ["fly, housefly", 6.31], ["insect", 3.69]], null, null, null, [["cattle, bovinae", 42.94], ["livestock, farm animals, working animals", 23.92], ["moo", 21.87]], [["music", 67.87], ["speech", 8.71], ["synthesizer", 3.59]], null, [["moo", 25.28], ["cattle, bovinae", 21.59], ["music", 12.32]], null, [["music", 37.52], ["synthesizer", 7.8], ["didgeridoo", 6.18]], null, [["music", 70.01], ["theremin", 6.48], ["didgeridoo", 5.79]], null, [["speech", 35.83], ["music", 23.66], ["musical instrument", 9.17]]], "duration": [0.35, 0.39, 2.25, 0.29, -0.36, 0.1, 2.93, 11.34, 0.89, 2.24, 49.22, 2.39, -0.3, 7.68, 1.1, 21.21]} \ No newline at end of file diff --git a/annotations_filtered/mHJH39bjALk_filtered.json b/annotations_filtered/mHJH39bjALk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f3354ad7f02edce79cb9e0ae30803db5643eafe7 --- /dev/null +++ b/annotations_filtered/mHJH39bjALk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.15], [4.0, 5.93], [12.0, 11.84], [12.0, 11.94], [17.0, 18.13], [24.0, 24.58], [50.0, 50.73], [72.0, 71.83], [78.0, 77.87], [114.0, 114.86], [123.0, 124.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [0.15, 1.93, -0.16, -0.06, 1.13, 0.58, 0.73, -0.17, -0.13, 0.86, 1.71]} \ No newline at end of file diff --git a/annotations_filtered/mHRbCgVCbIA_filtered.json b/annotations_filtered/mHRbCgVCbIA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eca838ee6b3f9c2eced630dc1d3d24195b04d5ab --- /dev/null +++ b/annotations_filtered/mHRbCgVCbIA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.1], [21.0, 21.03], [29.0, 29.93], [32.0, 33.37], [34.0, 33.99], [44.0, 44.17], [44.0, 44.36], [59.0, 59.68], [62.0, 71.63], [74.0, 75.61], [83.0, 83.3], [89.0, 89.73], [102.0, 103.06], [106.0, 107.08], [109.0, 109.16], [114.0, 113.9], [116.0, 117.86], [119.0, 119.04], [120.0, 121.37], [133.0, 133.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 77.62], ["animal", 11.03], ["roaring cats (lions, tigers)", 1.27]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.1, 0.03, 0.93, 1.37, -0.01, 0.17, 0.36, 0.68, 9.63, 1.61, 0.3, 0.73, 1.06, 1.08, 0.16, -0.1, 1.86, 0.04, 1.37, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/mHa1zTLrXO8_filtered.json b/annotations_filtered/mHa1zTLrXO8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..057ba3bb9275f48fe0a0571e5d5c644eb9cdb91b --- /dev/null +++ b/annotations_filtered/mHa1zTLrXO8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.51], [8.0, 11.23], [12.0, 12.8], [24.0, 25.44], [29.0, 29.66], [33.0, 33.84], [36.0, 36.29], [49.0, 50.99], [59.0, 59.48], [64.0, 64.35], [65.0, 65.42], [66.0, 70.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.96], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.51, 3.23, 0.8, 1.44, 0.66, 0.84, 0.29, 1.99, 0.48, 0.35, 0.42, 4.66]} \ No newline at end of file diff --git a/annotations_filtered/mHh8PKWMQEw_filtered.json b/annotations_filtered/mHh8PKWMQEw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..064ecac64ab0399d387fea50238fc810d325b43e --- /dev/null +++ b/annotations_filtered/mHh8PKWMQEw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.6], [6.0, 6.76], [10.0, 15.13], [17.0, 19.04], [19.0, 51.07], [56.0, 58.5], [59.0, 60.83], [64.0, 66.06], [68.0, 68.94], [70.0, 86.7], [87.0, 89.7], [93.0, 96.72], [97.0, 98.31], [101.0, 104.28], [107.0, 107.42], [111.0, 116.16], [116.0, 116.92], [118.0, 119.92], [122.0, 123.57], [124.0, 159.76], [162.0, 166.87], [168.0, 168.69], [171.0, 178.98]], "keep_status": [false, false, true, true, false, true, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 34.46, 46.75, 0.0, 43.13, 0.0, 40.54, 0.0, 37.64, 43.82, 42.65, 0.0, 33.94, 0.0, 32.53, 0.0, 0.0, 0.0, 0.0, 31.27, 0.0, 30.34], "audiomae_on_audioset": [null, null, [["speech", 42.48], ["music", 21.47], ["whale vocalization", 4.83]], [["hum", 30.02], ["mains hum", 23.25], ["music", 13.97]], null, [["music", 53.12], ["synthesizer", 5.83], ["electronic music", 4.92]], null, [["mains hum", 32.32], ["hum", 19.75], ["music", 11.9]], null, [["music", 57.47], ["hum", 18.37], ["mains hum", 5.85]], [["mains hum", 69.98], ["hum", 21.25], ["cat", 1.46]], [["hum", 40.08], ["music", 14.67], ["mains hum", 12.08]], null, [["music", 64.43], ["speech", 27.39], ["inside, small room", 1.11]], null, [["hum", 40.65], ["mains hum", 19.95], ["speech", 18.35]], null, null, null, null, [["theremin", 65.11], ["music", 22.66], ["musical instrument", 2.94]], null, [["music", 53.87], ["theremin", 26.38], ["musical instrument", 5.64]]], "duration": [1.6, 0.76, 5.13, 2.04, 32.07, 2.5, 1.83, 2.06, 0.94, 16.7, 2.7, 3.72, 1.31, 3.28, 0.42, 5.16, 0.92, 1.92, 1.57, 35.76, 4.87, 0.69, 7.98]} \ No newline at end of file diff --git a/annotations_filtered/mI3QaSoJado_filtered.json b/annotations_filtered/mI3QaSoJado_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b91f00b0d31c64176ba9203898b1306cc78f0114 --- /dev/null +++ b/annotations_filtered/mI3QaSoJado_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.47], [9.0, 9.36], [15.0, 15.52], [16.0, 17.44], [20.0, 20.31], [23.0, 23.36], [35.0, 36.48], [38.0, 44.14], [46.0, 47.19], [50.0, 51.0], [53.0, 53.4], [55.0, 55.58], [57.0, 57.1], [64.0, 65.06], [71.0, 72.08], [81.0, 82.21], [89.0, 89.14], [92.0, 92.52], [98.0, 99.2], [102.0, 102.61], [107.0, 106.69], [109.0, 111.37]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.41], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 34.58], ["hum", 14.97], ["sidetone", 13.4]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.47, 0.36, 0.52, 1.44, 0.31, 0.36, 1.48, 6.14, 1.19, 1.0, 0.4, 0.58, 0.1, 1.06, 1.08, 1.21, 0.14, 0.52, 1.2, 0.61, -0.31, 2.37]} \ No newline at end of file diff --git a/annotations_filtered/mI6O2d4Ieok_filtered.json b/annotations_filtered/mI6O2d4Ieok_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..68dacbeafd1ef30258064e164e4f47ef10b752a0 --- /dev/null +++ b/annotations_filtered/mI6O2d4Ieok_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.17], [8.0, 17.86], [18.0, 25.44], [31.0, 34.4], [37.0, 42.99], [48.0, 48.84], [49.0, 51.85], [55.0, 59.09], [63.0, 63.51], [73.0, 85.83], [89.0, 93.72], [100.0, 102.68], [105.0, 116.45], [117.0, 117.29], [118.0, 118.5], [120.0, 134.23], [136.0, 137.4], [146.0, 154.62], [159.0, 174.46]], "keep_status": [false, false, false, true, true, false, true, false, false, true, false, true, true, false, false, false, false, true, true], "silence_prob": [0.0, 33.64, 34.5, 31.45, 32.22, 0.0, 33.15, 31.22, 0.0, 31.62, 34.53, 31.34, 31.63, 0.0, 0.0, 32.35, 0.0, 34.65, 32.26], "audiomae_on_audioset": [null, [["sidetone", 35.38], ["music", 24.63], ["speech", 13.3]], [["music", 46.45], ["hum", 17.03], ["throbbing", 16.29]], [["music", 25.92], ["speech", 15.48], ["electronic music", 8.32]], [["cattle, bovinae", 22.69], ["music", 20.65], ["moo", 20.61]], null, [["music", 41.68], ["speech", 10.68], ["fly, housefly", 4.44]], [["music", 54.44], ["speech", 19.29], ["electronic music", 2.36]], null, [["music", 29.29], ["speech", 18.03], ["hum", 7.02]], [["music", 61.44], ["throbbing", 6.48], ["hum", 6.29]], [["speech", 54.22], ["vehicle", 5.77], ["breaking", 3.89]], [["cattle, bovinae", 26.86], ["livestock, farm animals, working animals", 17.43], ["music", 17.2]], null, null, [["music", 45.34], ["speech", 27.88], ["electric shaver, electric razor", 5.18]], null, [["hum", 34.61], ["mains hum", 27.16], ["speech", 4.45]], [["music", 28.16], ["livestock, farm animals, working animals", 9.21], ["fly, housefly", 6.93]]], "duration": [1.17, 9.86, 7.44, 3.4, 5.99, 0.84, 2.85, 4.09, 0.51, 12.83, 4.72, 2.68, 11.45, 0.29, 0.5, 14.23, 1.4, 8.62, 15.46]} \ No newline at end of file diff --git a/annotations_filtered/mIGCgzqFR0s_filtered.json b/annotations_filtered/mIGCgzqFR0s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5bb88932fcae499056b171299baaa5e24fe3dfaa --- /dev/null +++ b/annotations_filtered/mIGCgzqFR0s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 10.83], [12.0, 19.28], [20.0, 41.03], [42.0, 42.13], [44.0, 44.63], [46.0, 52.19], [53.0, 54.11], [57.0, 58.33], [63.0, 63.0], [65.0, 64.81], [67.0, 67.76], [71.0, 71.1], [78.0, 79.68], [80.0, 80.89], [85.0, 86.37], [89.0, 88.92], [94.0, 95.69], [96.0, 97.04], [104.0, 104.4], [106.0, 106.3], [110.0, 113.05], [113.0, 113.1], [113.0, 113.16], [114.0, 117.1], [120.0, 120.83], [123.0, 123.92], [131.0, 130.86], [132.0, 133.79], [135.0, 135.53], [140.0, 141.69], [151.0, 151.98], [155.0, 155.22], [169.0, 170.36], [175.0, 175.17], [177.0, 177.75], [180.0, 180.3], [181.0, 181.58], [183.0, 191.78], [193.0, 193.75], [196.0, 195.83], [208.0, 210.37], [213.0, 213.21], [222.0, 222.34], [228.0, 228.6], [235.0, 236.26], [239.0, 239.52], [240.0, 241.47], [246.0, 248.32], [255.0, 255.01], [270.0, 271.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 45.24, 29.16, 0.0, 0.0, 32.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.68, 0.0, 0.0, 35.57, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.38, 0.0, 0.0, 44.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.72, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 54.51], ["electronic music", 9.42], ["noise", 6.97]], [["music", 64.11], ["synthesizer", 3.51], ["musical instrument", 3.48]], null, null, [["music", 64.81], ["speech", 10.88], ["animal", 2.66]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 40.28], ["music", 37.16], ["theremin", 6.05]], null, null, [["boing", 37.77], ["music", 29.73], ["speech", 7.59]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 53.13], ["throat clearing", 10.02], ["oink", 7.27]], null, null, null, null, null, null, [["music", 42.88], ["speech", 18.7], ["synthesizer", 5.93]], null, null], "duration": [-0.17, 7.28, 21.03, 0.13, 0.63, 6.19, 1.11, 1.33, 0.0, -0.19, 0.76, 0.1, 1.68, 0.89, 1.37, -0.08, 1.69, 1.04, 0.4, 0.3, 3.05, 0.1, 0.16, 3.1, 0.83, 0.92, -0.14, 1.79, 0.53, 1.69, 0.98, 0.22, 1.36, 0.17, 0.75, 0.3, 0.58, 8.78, 0.75, -0.17, 2.37, 0.21, 0.34, 0.6, 1.26, 0.52, 1.47, 2.32, 0.01, 1.61]} \ No newline at end of file diff --git a/annotations_filtered/mIIZqCaHUFI_filtered.json b/annotations_filtered/mIIZqCaHUFI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0b3d8aa6e35dfaf4c06675df43d87f8b11691e12 --- /dev/null +++ b/annotations_filtered/mIIZqCaHUFI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.15], [8.0, 12.19], [17.0, 17.02], [18.0, 18.44], [25.0, 28.71], [30.0, 31.28], [34.0, 34.94], [38.0, 39.38], [40.0, 40.9], [43.0, 43.29], [46.0, 47.73], [49.0, 50.95], [52.0, 52.44], [53.0, 56.56], [58.0, 59.97], [61.0, 62.8], [66.0, 68.71], [72.0, 73.41], [76.0, 77.14], [79.0, 80.32], [81.0, 83.66], [84.0, 84.35], [85.0, 85.33], [86.0, 86.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [70.86, 55.67, 0.0, 0.0, 86.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.07, 0.0, 0.0, 42.46, 0.0, 0.0, 0.0, 65.91, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 14.71], ["speech", 9.87], ["groan", 6.15]], null, null, null, null, null, null, null], "duration": [3.15, 4.19, 0.02, 0.44, 3.71, 1.28, 0.94, 1.38, 0.9, 0.29, 1.73, 1.95, 0.44, 3.56, 1.97, 1.8, 2.71, 1.41, 1.14, 1.32, 2.66, 0.35, 0.33, 0.56]} \ No newline at end of file diff --git a/annotations_filtered/mIJdrHpr3_Q_filtered.json b/annotations_filtered/mIJdrHpr3_Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..50728316525fd32ecd80108efb46912639ac6115 --- /dev/null +++ b/annotations_filtered/mIJdrHpr3_Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.48], [12.0, 13.96], [19.0, 20.53], [21.0, 27.99], [29.0, 43.17], [55.0, 55.22], [65.0, 72.67]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 90.43, 82.07, 0.0, 73.21], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [1.48, 1.96, 1.53, 6.99, 14.17, 0.22, 7.67]} \ No newline at end of file diff --git a/annotations_filtered/mIZOUXRYVyE_filtered.json b/annotations_filtered/mIZOUXRYVyE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b4ed1f2418641d4df01e5740cf0a205bfb190eb3 --- /dev/null +++ b/annotations_filtered/mIZOUXRYVyE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.02], [6.0, 9.53], [10.0, 10.22], [11.0, 11.55], [12.0, 13.22], [14.0, 14.2], [15.0, 16.34], [26.0, 27.72], [35.0, 36.69], [38.0, 38.3], [49.0, 50.6]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 39.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 32.0], ["mains hum", 13.45], ["hum", 11.62]], null, null, null, null, null, null, null, null, null], "duration": [0.02, 3.53, 0.22, 0.55, 1.22, 0.2, 1.34, 1.72, 1.69, 0.3, 1.6]} \ No newline at end of file diff --git a/annotations_filtered/mIeU7y3CGKQ_filtered.json b/annotations_filtered/mIeU7y3CGKQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8dfeee5298a3849c9621e9b58999deeb91efbfac --- /dev/null +++ b/annotations_filtered/mIeU7y3CGKQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.14], [7.0, 10.29], [13.0, 17.31], [17.0, 17.37], [24.0, 26.59], [27.0, 29.78], [31.0, 33.42], [38.0, 43.71], [46.0, 57.37], [58.0, 58.5], [59.0, 58.55], [59.0, 58.62], [63.0, 68.2], [71.0, 83.94]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [30.84, 29.75, 29.89, 0.0, 30.02, 30.06, 30.07, 29.14, 29.08, 0.0, 0.0, 0.0, 29.45, 29.35], "audiomae_on_audioset": [[["music", 67.34], ["electronic music", 4.61], ["speech", 4.0]], [["music", 67.73], ["electronic music", 4.69], ["house music", 3.88]], [["music", 64.78], ["trance music", 10.31], ["sampler", 3.77]], null, [["music", 80.66], ["trance music", 4.76], ["electronic music", 2.94]], [["music", 77.7], ["trance music", 2.85], ["electronic music", 2.67]], [["music", 71.27], ["trance music", 5.42], ["electronic music", 3.91]], [["music", 55.9], ["throbbing", 5.51], ["hum", 4.06]], [["music", 76.47], ["electronic music", 1.73], ["trance music", 1.34]], null, null, null, [["music", 69.19], ["electronic music", 5.57], ["trance music", 2.93]], [["music", 77.99], ["trance music", 3.57], ["house music", 2.44]]], "duration": [2.14, 3.29, 4.31, 0.37, 2.59, 2.78, 2.42, 5.71, 11.37, 0.5, -0.45, -0.38, 5.2, 12.94]} \ No newline at end of file diff --git a/annotations_filtered/mIqXkwxzUB4_filtered.json b/annotations_filtered/mIqXkwxzUB4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a0d81f2cc6b7de7e0a63a7ce69b40d85c0e1201c --- /dev/null +++ b/annotations_filtered/mIqXkwxzUB4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.95], [8.0, 11.94], [14.0, 19.33], [20.0, 26.57], [28.0, 29.39], [33.0, 32.9], [34.0, 39.23], [40.0, 43.07], [44.0, 45.94], [51.0, 52.68], [56.0, 56.94], [59.0, 60.39], [63.0, 64.42], [65.0, 67.88], [75.0, 76.57], [79.0, 79.71], [87.0, 86.91], [88.0, 89.9], [96.0, 96.99], [98.0, 98.64], [99.0, 102.2], [103.0, 110.2], [111.0, 111.37], [115.0, 115.35], [117.0, 117.8], [118.0, 119.37], [122.0, 123.23], [125.0, 127.47]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 60.98, 50.51, 47.62, 0.0, 0.0, 77.87, 83.16, 0.0, 0.0, 0.0, 0.0, 0.0, 38.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.3, 74.6, 0.0, 0.0, 0.0, 0.0, 0.0, 99.76], "audiomae_on_audioset": [null, null, null, [["music", 25.67], ["hum", 23.79], ["throbbing", 8.1]], null, null, null, null, null, null, null, null, null, [["didgeridoo", 61.11], ["music", 18.77], ["speech", 5.57]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.95, 3.94, 5.33, 6.57, 1.39, -0.1, 5.23, 3.07, 1.94, 1.68, 0.94, 1.39, 1.42, 2.88, 1.57, 0.71, -0.09, 1.9, 0.99, 0.64, 3.2, 7.2, 0.37, 0.35, 0.8, 1.37, 1.23, 2.47]} \ No newline at end of file diff --git a/annotations_filtered/mIvQRRVbt9E_filtered.json b/annotations_filtered/mIvQRRVbt9E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..be42341872260fba34f39e020e8a76f6e9c373bc --- /dev/null +++ b/annotations_filtered/mIvQRRVbt9E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.04], [9.0, 28.98], [30.0, 36.86], [40.0, 40.93], [42.0, 42.48], [51.0, 52.15], [53.0, 53.86], [57.0, 57.67], [59.0, 59.17], [60.0, 62.01], [67.0, 67.63], [73.0, 74.78], [78.0, 78.8], [85.0, 87.59], [89.0, 89.5], [92.0, 97.23], [105.0, 106.73], [108.0, 126.4], [129.0, 129.84]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false], "silence_prob": [0.0, 30.54, 43.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.52, 0.0, 0.0, 0.0, 38.51, 0.0, 35.42, 0.0, 31.19, 0.0], "audiomae_on_audioset": [null, [["speech", 63.4], ["hum", 12.14], ["mains hum", 5.03]], [["music", 31.31], ["cowbell", 8.32], ["hum", 7.31]], null, null, null, null, null, null, [["speech", 57.21], ["music", 11.39], ["hum", 3.95]], null, null, null, [["music", 40.39], ["speech", 13.81], ["fly, housefly", 8.63]], null, [["music", 74.57], ["soundtrack music", 4.5], ["theremin", 1.74]], null, [["music", 47.21], ["hum", 9.34], ["explosion", 5.37]], null], "duration": [1.04, 19.98, 6.86, 0.93, 0.48, 1.15, 0.86, 0.67, 0.17, 2.01, 0.63, 1.78, 0.8, 2.59, 0.5, 5.23, 1.73, 18.4, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/mJbFV5i5ay8_filtered.json b/annotations_filtered/mJbFV5i5ay8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ffdc25d8bacf7353d5fc5cebf125849951999ec --- /dev/null +++ b/annotations_filtered/mJbFV5i5ay8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 41.45], [43.0, 52.81], [56.0, 56.62], [57.0, 62.16], [64.0, 152.71]], "keep_status": [false, true, false, false, false], "silence_prob": [0.0, 32.29, 0.0, 31.63, 0.0], "audiomae_on_audioset": [null, [["music", 26.7], ["hum", 21.39], ["throbbing", 9.46]], null, [["music", 64.49], ["speech", 6.32], ["musical instrument", 3.49]], null], "duration": [0.45, 9.81, 0.62, 5.16, 88.71]} \ No newline at end of file diff --git a/annotations_filtered/mK10Ze-mcQo_filtered.json b/annotations_filtered/mK10Ze-mcQo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c38eccbb71ad542a19d68edf194616fc99f0ee9 --- /dev/null +++ b/annotations_filtered/mK10Ze-mcQo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.62], [7.0, 7.4], [9.0, 10.44], [22.0, 22.98], [25.0, 25.73], [27.0, 28.51], [30.0, 31.26], [33.0, 33.93], [35.0, 35.97], [38.0, 38.89], [46.0, 48.88], [50.0, 50.97], [52.0, 53.72], [55.0, 56.02], [59.0, 61.99], [65.0, 65.85], [67.0, 67.91], [70.0, 70.85], [72.0, 74.38], [79.0, 79.59], [83.0, 83.94], [85.0, 86.07], [87.0, 87.78], [90.0, 90.64], [92.0, 92.8], [102.0, 102.41], [107.0, 108.04], [109.0, 109.9], [113.0, 113.83], [115.0, 115.72], [117.0, 118.1], [121.0, 121.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.11, 0.0, 0.0, 0.0, 42.88, 0.0, 0.0, 0.0, 52.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["didgeridoo", 22.82], ["music", 22.55], ["mains hum", 9.94]], null, null, null, [["music", 40.45], ["mains hum", 6.78], ["hum", 6.18]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.62, 0.4, 1.44, 0.98, 0.73, 1.51, 1.26, 0.93, 0.97, 0.89, 2.88, 0.97, 1.72, 1.02, 2.99, 0.85, 0.91, 0.85, 2.38, 0.59, 0.94, 1.07, 0.78, 0.64, 0.8, 0.41, 1.04, 0.9, 0.83, 0.72, 1.1, 0.24]} \ No newline at end of file diff --git a/annotations_filtered/mK8ad1nYFQA_filtered.json b/annotations_filtered/mK8ad1nYFQA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56227c11bd1509d7a9e339bc189802fe02bd483e --- /dev/null +++ b/annotations_filtered/mK8ad1nYFQA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.52], [5.0, 5.53], [6.0, 7.62], [10.0, 10.47], [12.0, 13.96], [17.0, 18.1], [19.0, 20.92], [27.0, 28.22], [29.0, 30.4], [31.0, 33.49], [35.0, 36.76], [40.0, 40.98], [43.0, 44.15], [45.0, 47.01], [48.0, 49.86], [50.0, 54.8], [56.0, 62.53], [63.0, 65.18], [66.0, 66.46], [68.0, 72.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.94, 0.0, 0.0, 0.0, 45.85, 0.0, 34.51, 68.8, 42.74, 0.0, 39.27], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["sidetone", 58.5], ["speech", 13.98], ["chirp tone", 4.65]], null, null, null, [["cattle, bovinae", 12.18], ["sine wave", 7.57], ["caw", 6.79]], null, [["sidetone", 83.83], ["hum", 5.93], ["speech", 5.03]], null, [["dial tone", 37.8], ["speech", 27.49], ["hum", 4.71]], null, [["whale vocalization", 19.81], ["hum", 17.33], ["noise", 11.21]]], "duration": [0.52, 0.53, 1.62, 0.47, 1.96, 1.1, 1.92, 1.22, 1.4, 2.49, 1.76, 0.98, 1.15, 2.01, 1.86, 4.8, 6.53, 2.18, 0.46, 4.99]} \ No newline at end of file diff --git a/annotations_filtered/mKDqrUqOe8Y_filtered.json b/annotations_filtered/mKDqrUqOe8Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..778586970b77741b1d124b446722067265ff7de8 --- /dev/null +++ b/annotations_filtered/mKDqrUqOe8Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[93.0, 105.0], [105.0, 120.24], [120.0, 123.63], [124.0, 124.48]], "keep_status": [false, true, true, false], "silence_prob": [62.78, 36.02, 36.21, 0.0], "audiomae_on_audioset": [null, [["hum", 26.86], ["music", 17.08], ["throbbing", 14.05]], [["speech", 39.39], ["rumble", 9.19], ["music", 7.52]], null], "duration": [12.0, 15.24, 3.63, 0.48]} \ No newline at end of file diff --git a/annotations_filtered/mKgy5W3S6nw_filtered.json b/annotations_filtered/mKgy5W3S6nw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..64e36717373dd57b8a129b5a290d7404cf0463b2 --- /dev/null +++ b/annotations_filtered/mKgy5W3S6nw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.0], [2.0, 3.54], [5.0, 5.76], [6.0, 10.07], [11.0, 11.5], [12.0, 15.94], [17.0, 18.42], [22.0, 26.65], [27.0, 28.43], [32.0, 33.45], [36.0, 38.31], [40.0, 40.41], [49.0, 49.23], [80.0, 81.84], [90.0, 91.57], [92.0, 95.28], [97.0, 97.87], [99.0, 100.03], [104.0, 105.19], [106.0, 117.71], [121.0, 121.58]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 35.44, 0.0, 43.48, 0.0, 64.18, 0.0, 0.0, 70.86, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 85.35, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 65.25], ["fart", 3.38], ["thunk", 2.87]], null, [["fly, housefly", 18.17], ["speech", 15.37], ["insect", 8.18]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.0, 1.54, 0.76, 4.07, 0.5, 3.94, 1.42, 4.65, 1.43, 1.45, 2.31, 0.41, 0.23, 1.84, 1.57, 3.28, 0.87, 1.03, 1.19, 11.71, 0.58]} \ No newline at end of file diff --git a/annotations_filtered/mKl11EzMTAE_filtered.json b/annotations_filtered/mKl11EzMTAE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..126fd23f608fe061f3348d64926f8797adce0242 --- /dev/null +++ b/annotations_filtered/mKl11EzMTAE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 53.72], [54.0, 55.63], [56.0, 57.99], [59.0, 65.47], [67.0, 69.7]], "keep_status": [true, false, false, true, true], "silence_prob": [31.19, 0.0, 0.0, 37.59, 37.01], "audiomae_on_audioset": [[["rumble", 17.56], ["music", 12.15], ["mains hum", 7.5]], null, null, [["speech", 27.95], ["noise", 16.73], ["music", 15.85]], [["noise", 13.37], ["music", 12.73], ["animal", 11.0]]], "duration": [19.72, 1.63, 1.99, 6.47, 2.7]} \ No newline at end of file diff --git a/annotations_filtered/mLKA_BX6xKo_filtered.json b/annotations_filtered/mLKA_BX6xKo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a749c99856a30451b62c1fb9a2cf9bcfafc02e64 --- /dev/null +++ b/annotations_filtered/mLKA_BX6xKo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.22], [17.0, 18.17], [24.0, 24.11], [26.0, 29.67], [31.0, 32.26], [35.0, 36.61], [39.0, 39.36], [48.0, 48.74], [50.0, 50.06], [52.0, 52.66], [59.0, 62.13], [63.0, 62.83], [63.0, 64.13], [65.0, 64.81], [65.0, 67.26], [72.0, 72.96], [82.0, 83.78], [85.0, 90.05], [91.0, 91.89], [93.0, 93.33], [100.0, 101.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 92.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.33, 0.0, 0.0, 0.0, 85.17, 0.0, 0.0, 52.27, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 53.52], ["speech", 21.18], ["musical instrument", 1.89]], null, null, null, null, null, null, null, null, null, null], "duration": [0.22, 1.17, 0.11, 3.67, 1.26, 1.61, 0.36, 0.74, 0.06, 0.66, 3.13, -0.17, 1.13, -0.19, 2.26, 0.96, 1.78, 5.05, 0.89, 0.33, 1.49]} \ No newline at end of file diff --git a/annotations_filtered/mLk_txo4sYc_filtered.json b/annotations_filtered/mLk_txo4sYc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..416db0fcb12974a9e8786710f0e283d7c167f94b --- /dev/null +++ b/annotations_filtered/mLk_txo4sYc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[44.0, 103.52]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [59.52]} \ No newline at end of file diff --git a/annotations_filtered/mLl9jkYywZY_filtered.json b/annotations_filtered/mLl9jkYywZY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4dee4867e93901ed7f94ba57d572745d3c2933dd --- /dev/null +++ b/annotations_filtered/mLl9jkYywZY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 13.32], [15.0, 20.76], [22.0, 28.88], [30.0, 32.24], [34.0, 36.71], [40.0, 121.24]], "keep_status": [true, false, false, false, false, false], "silence_prob": [32.55, 35.18, 65.55, 72.01, 77.2, 0.0], "audiomae_on_audioset": [[["music", 23.08], ["whack, thwack", 10.06], ["fly, housefly", 8.16]], [["whale vocalization", 63.42], ["theremin", 12.06], ["music", 5.46]], null, null, null, null], "duration": [10.32, 5.76, 6.88, 2.24, 2.71, 81.24]} \ No newline at end of file diff --git a/annotations_filtered/mLsptorbPUg_filtered.json b/annotations_filtered/mLsptorbPUg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b7c07f66eec34106b36f44b437cf1312606d21f --- /dev/null +++ b/annotations_filtered/mLsptorbPUg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 58.28], [60.0, 83.19], [85.0, 95.86], [99.0, 130.2]], "keep_status": [false, true, false, false], "silence_prob": [0.0, 35.49, 31.66, 0.0], "audiomae_on_audioset": [null, [["hum", 35.31], ["music", 23.86], ["throbbing", 6.47]], [["music", 50.22], ["hum", 21.57], ["throbbing", 8.44]], null], "duration": [38.28, 23.19, 10.86, 31.2]} \ No newline at end of file diff --git a/annotations_filtered/mM5dRMY2u28_filtered.json b/annotations_filtered/mM5dRMY2u28_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..883264843d44f4878c4049face3691171a5aeeb3 --- /dev/null +++ b/annotations_filtered/mM5dRMY2u28_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.04], [16.0, 16.7], [18.0, 19.11], [20.0, 21.49], [45.0, 45.47], [50.0, 50.26], [51.0, 51.56], [52.0, 52.91], [54.0, 54.8], [72.0, 72.4], [84.0, 84.43], [86.0, 87.29], [90.0, 90.71], [109.0, 109.34], [116.0, 117.0], [119.0, 125.51], [126.0, 129.1], [136.0, 137.37], [140.0, 141.81], [147.0, 148.53], [151.0, 151.12], [154.0, 154.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.3, 43.61, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 73.72], ["singing", 1.71], ["folk music", 1.62]], [["music", 82.81], ["singing", 1.74], ["musical instrument", 1.07]], null, null, null, null, null], "duration": [0.04, 0.7, 1.11, 1.49, 0.47, 0.26, 0.56, 0.91, 0.8, 0.4, 0.43, 1.29, 0.71, 0.34, 1.0, 6.51, 3.1, 1.37, 1.81, 1.53, 0.12, 0.89]} \ No newline at end of file diff --git a/annotations_filtered/mMRQdL_xvME_filtered.json b/annotations_filtered/mMRQdL_xvME_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa6fc73b166a38e12492098fae63cb18bbedc0af --- /dev/null +++ b/annotations_filtered/mMRQdL_xvME_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.04], [5.0, 8.43], [9.0, 17.76], [21.0, 22.44], [23.0, 24.0], [25.0, 26.28], [28.0, 29.02], [29.0, 29.81], [31.0, 32.98], [38.0, 38.55], [43.0, 44.88], [48.0, 49.0], [49.0, 51.49], [52.0, 52.05], [53.0, 54.21], [68.0, 70.19], [72.0, 73.2], [75.0, 82.75], [84.0, 85.01]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 40.26, 72.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.1, 0.0, 0.0, 94.81, 0.0, 40.28, 0.0], "audiomae_on_audioset": [null, [["sidetone", 35.22], ["speech", 22.77], ["whale vocalization", 9.36]], null, null, null, null, null, null, null, null, null, null, [["speech", 52.45], ["music", 16.27], ["hum", 5.12]], null, null, null, null, [["music", 54.15], ["ambient music", 8.71], ["singing bowl", 6.27]], null], "duration": [1.04, 3.43, 8.76, 1.44, 1.0, 1.28, 1.02, 0.81, 1.98, 0.55, 1.88, 1.0, 2.49, 0.05, 1.21, 2.19, 1.2, 7.75, 1.01]} \ No newline at end of file diff --git a/annotations_filtered/mMyrxQNItpY_filtered.json b/annotations_filtered/mMyrxQNItpY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..96e8f6af688954d783ae77ab68ca96c33836412c --- /dev/null +++ b/annotations_filtered/mMyrxQNItpY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.8], [11.0, 12.09], [16.0, 17.24], [19.0, 18.93], [29.0, 29.08], [30.0, 30.3], [34.0, 40.05], [41.0, 44.15], [45.0, 53.82], [57.0, 59.86], [60.0, 63.34], [64.0, 66.39], [68.0, 71.2], [72.0, 73.94], [74.0, 77.46], [79.0, 79.49], [80.0, 81.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 100.0, 100.0, 99.97, 100.0, 100.0, 0.0, 99.84, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.8, 1.09, 1.24, -0.07, 0.08, 0.3, 6.05, 3.15, 8.82, 2.86, 3.34, 2.39, 3.2, 1.94, 3.46, 0.49, 1.77]} \ No newline at end of file diff --git a/annotations_filtered/mNQx3KPxifQ_filtered.json b/annotations_filtered/mNQx3KPxifQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60fa95091bb99bd4fafc0c55664af20ea0e543aa --- /dev/null +++ b/annotations_filtered/mNQx3KPxifQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.35], [34.0, 38.5], [39.0, 39.95], [43.0, 43.46], [44.0, 44.86], [46.0, 46.7], [47.0, 48.19], [49.0, 49.71], [52.0, 53.45], [56.0, 56.07], [67.0, 68.25], [88.0, 88.37], [90.0, 91.3], [96.0, 96.87], [101.0, 100.9], [102.0, 102.79], [103.0, 103.74], [106.0, 112.77]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 29.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.55], "audiomae_on_audioset": [null, [["music", 47.32], ["grunt", 4.6], ["throbbing", 3.36]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["whack, thwack", 28.72], ["speech", 11.81], ["groan", 8.06]]], "duration": [0.35, 4.5, 0.95, 0.46, 0.86, 0.7, 1.19, 0.71, 1.45, 0.07, 1.25, 0.37, 1.3, 0.87, -0.1, 0.79, 0.74, 6.77]} \ No newline at end of file diff --git a/annotations_filtered/mNUnCTKwS8Q_filtered.json b/annotations_filtered/mNUnCTKwS8Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1652671dc78d85d451c0ef6400f48738ae0a973e --- /dev/null +++ b/annotations_filtered/mNUnCTKwS8Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 30.4], [31.0, 31.92], [33.0, 45.22], [46.0, 48.88], [49.0, 50.68], [54.0, 54.53], [55.0, 55.95], [58.0, 58.23], [59.0, 59.39], [70.0, 71.96], [78.0, 78.68], [80.0, 80.38], [81.0, 82.12], [83.0, 83.83], [94.0, 97.41], [99.0, 99.28], [99.0, 100.35], [112.0, 122.61], [128.0, 128.98], [130.0, 130.32], [131.0, 133.32], [136.0, 153.77], [159.0, 160.79], [161.0, 160.83], [161.0, 160.86], [164.0, 168.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [30.14, 0.0, 58.13, 65.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.97, 0.0, 0.0, 84.43, 0.0, 0.0, 74.76, 34.39, 0.0, 0.0, 0.0, 29.8], "audiomae_on_audioset": [[["music", 47.14], ["hum", 18.36], ["mains hum", 11.93]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 40.1], ["throbbing", 25.61], ["music", 11.29]], null, null, null, [["speech", 40.61], ["music", 20.56], ["whack, thwack", 4.15]]], "duration": [29.4, 0.92, 12.22, 2.88, 1.68, 0.53, 0.95, 0.23, 0.39, 1.96, 0.68, 0.38, 1.12, 0.83, 3.41, 0.28, 1.35, 10.61, 0.98, 0.32, 2.32, 17.77, 1.79, -0.17, -0.14, 4.42]} \ No newline at end of file diff --git a/annotations_filtered/mNd16XocjBg_filtered.json b/annotations_filtered/mNd16XocjBg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..247dfdd759ff3518071f256373660453908fc7ab --- /dev/null +++ b/annotations_filtered/mNd16XocjBg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.57], [3.0, 3.89], [5.0, 6.64], [8.0, 8.14], [10.0, 10.59], [15.0, 14.99], [17.0, 17.69], [19.0, 18.87], [20.0, 20.6], [23.0, 23.82], [26.0, 27.43], [29.0, 29.51], [33.0, 34.38], [38.0, 38.13], [45.0, 45.86], [48.0, 48.71], [52.0, 54.19], [56.0, 57.52], [61.0, 61.16], [63.0, 63.32], [67.0, 67.22], [70.0, 70.6], [76.0, 77.45], [80.0, 80.86], [82.0, 82.63], [86.0, 85.9], [87.0, 87.56], [92.0, 92.87], [94.0, 94.37], [97.0, 99.66], [102.0, 102.59], [109.0, 109.8], [110.0, 111.57], [115.0, 115.94], [117.0, 117.98], [120.0, 120.48], [121.0, 122.66], [123.0, 124.02], [127.0, 128.98], [133.0, 133.34], [135.0, 135.84], [140.0, 142.03], [143.0, 143.73], [146.0, 146.96], [152.0, 152.54], [153.0, 156.49], [158.0, 160.2], [162.0, 164.47], [170.0, 170.88], [172.0, 173.13], [175.0, 177.65], [179.0, 184.45], [185.0, 187.27], [188.0, 188.55], [190.0, 191.0], [192.0, 192.6], [194.0, 194.83], [197.0, 196.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.48, 0.0, 0.0, 0.0, 100.0, 85.72, 79.76, 0.0, 0.0, 55.11, 64.41, 51.39, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.57, 0.89, 1.64, 0.14, 0.59, -0.01, 0.69, -0.13, 0.6, 0.82, 1.43, 0.51, 1.38, 0.13, 0.86, 0.71, 2.19, 1.52, 0.16, 0.32, 0.22, 0.6, 1.45, 0.86, 0.63, -0.1, 0.56, 0.87, 0.37, 2.66, 0.59, 0.8, 1.57, 0.94, 0.98, 0.48, 1.66, 1.02, 1.98, 0.34, 0.84, 2.03, 0.73, 0.96, 0.54, 3.49, 2.2, 2.47, 0.88, 1.13, 2.65, 5.45, 2.27, 0.55, 1.0, 0.6, 0.83, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/mNtK6UvRjO8_filtered.json b/annotations_filtered/mNtK6UvRjO8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3c70324614a82e8ee555fae36e7e971fbf6bed74 --- /dev/null +++ b/annotations_filtered/mNtK6UvRjO8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.32], [8.0, 9.02], [15.0, 16.5], [19.0, 19.45], [20.0, 21.07], [27.0, 29.05], [35.0, 35.97], [37.0, 37.77], [43.0, 42.7], [47.0, 48.39], [58.0, 59.04], [59.0, 60.15], [68.0, 69.92], [71.0, 70.85], [73.0, 73.58], [77.0, 78.26], [80.0, 80.2], [83.0, 83.08], [84.0, 85.35], [87.0, 87.18], [88.0, 87.99], [88.0, 88.3], [88.0, 89.26], [95.0, 95.15], [96.0, 96.4], [97.0, 97.48], [100.0, 100.48], [102.0, 103.86], [105.0, 106.08], [107.0, 109.05], [111.0, 112.28], [114.0, 115.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.48, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.32, 1.02, 1.5, 0.45, 1.07, 2.05, 0.97, 0.77, -0.3, 1.39, 1.04, 1.15, 1.92, -0.15, 0.58, 1.26, 0.2, 0.08, 1.35, 0.18, -0.01, 0.3, 1.26, 0.15, 0.4, 0.48, 0.48, 1.86, 1.08, 2.05, 1.28, 1.3]} \ No newline at end of file diff --git a/annotations_filtered/mO5UNbKzcpQ_filtered.json b/annotations_filtered/mO5UNbKzcpQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eb9c17e5ba341399ed765e6e36337e0ffab2b9fc --- /dev/null +++ b/annotations_filtered/mO5UNbKzcpQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.49], [10.0, 11.94], [15.0, 15.42], [31.0, 31.63], [32.0, 39.8], [41.0, 46.48], [47.0, 49.35], [50.0, 51.61], [55.0, 63.0], [65.0, 65.96], [70.0, 70.73], [75.0, 81.99], [84.0, 88.26], [89.0, 98.36], [102.0, 104.46], [106.0, 111.18], [119.0, 121.83], [123.0, 124.66], [126.0, 128.14], [134.0, 133.98], [136.0, 146.1], [150.0, 151.33], [156.0, 162.09], [163.0, 165.55], [166.0, 169.21], [172.0, 172.49]], "keep_status": [false, false, false, false, true, false, true, false, true, false, false, true, true, false, true, true, true, false, true, false, true, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 48.44, 35.57, 39.66, 0.0, 32.56, 0.0, 0.0, 32.15, 31.34, 32.8, 30.79, 36.21, 40.92, 0.0, 30.58, 0.0, 31.09, 0.0, 33.72, 31.05, 33.05, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 56.48], ["musical instrument", 6.76], ["hum", 3.71]], [["music", 57.6], ["guitar", 8.38], ["musical instrument", 5.26]], [["music", 32.94], ["hum", 5.68], ["crackle", 4.3]], null, [["music", 45.75], ["synthesizer", 6.49], ["hum", 5.37]], null, null, [["music", 32.27], ["hum", 8.51], ["mains hum", 7.71]], [["hum", 32.96], ["mains hum", 19.05], ["throbbing", 7.91]], [["music", 47.42], ["mains hum", 15.38], ["hum", 9.51]], [["music", 38.76], ["speech", 25.57], ["theremin", 4.64]], [["hum", 28.63], ["mains hum", 21.37], ["music", 15.29]], [["music", 36.62], ["hum", 23.57], ["throbbing", 7.19]], null, [["music", 40.18], ["synthesizer", 7.98], ["hum", 7.35]], null, [["music", 25.76], ["hum", 14.18], ["mains hum", 12.83]], null, [["music", 59.85], ["musical instrument", 6.74], ["guitar", 5.52]], [["music", 24.91], ["hum", 14.56], ["mains hum", 11.76]], [["hum", 20.89], ["music", 18.45], ["mains hum", 9.8]], null], "duration": [1.49, 1.94, 0.42, 0.63, 7.8, 5.48, 2.35, 1.61, 8.0, 0.96, 0.73, 6.99, 4.26, 9.36, 2.46, 5.18, 2.83, 1.66, 2.14, -0.02, 10.1, 1.33, 6.09, 2.55, 3.21, 0.49]} \ No newline at end of file diff --git a/annotations_filtered/mO8roISHjJo_filtered.json b/annotations_filtered/mO8roISHjJo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8a4dd87a6bb6e8afab112990758c7c9d8d2b59cd --- /dev/null +++ b/annotations_filtered/mO8roISHjJo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.56], [21.0, 23.67], [26.0, 27.63], [28.0, 29.19], [31.0, 33.27], [34.0, 34.45], [38.0, 38.53], [40.0, 41.82], [42.0, 44.14], [48.0, 49.6], [54.0, 55.12], [56.0, 56.51], [64.0, 64.35], [69.0, 70.23], [84.0, 91.91], [108.0, 108.92], [110.0, 111.0], [111.0, 112.01], [117.0, 116.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 98.93, 0.0, 0.0, 78.89, 0.0, 0.0, 0.0, 75.39, 0.0, 0.0, 0.0, 0.0, 0.0, 99.76, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.56, 2.67, 1.63, 1.19, 2.27, 0.45, 0.53, 1.82, 2.14, 1.6, 1.12, 0.51, 0.35, 1.23, 7.91, 0.92, 1.0, 1.01, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/mOicvmEloyY_filtered.json b/annotations_filtered/mOicvmEloyY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..77965f8e141ab7058ded28a42f550e95016b45e0 --- /dev/null +++ b/annotations_filtered/mOicvmEloyY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.34], [10.0, 21.49], [29.0, 31.13], [34.0, 34.8], [37.0, 37.61], [40.0, 43.46], [45.0, 46.14], [47.0, 47.29], [49.0, 49.67], [50.0, 50.65], [53.0, 55.05], [56.0, 57.06], [59.0, 60.2], [61.0, 66.85], [68.0, 69.82], [72.0, 87.08], [88.0, 88.42], [89.0, 111.25], [112.0, 112.65], [113.0, 115.89], [117.0, 118.2], [125.0, 125.85], [127.0, 128.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 86.64, 59.15, 0.0, 0.0, 99.8, 0.0, 0.0, 0.0, 0.0, 87.0, 0.0, 0.0, 46.22, 0.0, 71.43, 0.0, 98.8, 0.0, 37.67, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 34.74], ["radio", 18.59], ["noise", 12.12]], null, null, null, null, null, [["bee, wasp, etc.", 46.94], ["fly, housefly", 28.35], ["insect", 17.37]], null, null, null], "duration": [1.34, 11.49, 2.13, 0.8, 0.61, 3.46, 1.14, 0.29, 0.67, 0.65, 2.05, 1.06, 1.2, 5.85, 1.82, 15.08, 0.42, 22.25, 0.65, 2.89, 1.2, 0.85, 1.24]} \ No newline at end of file diff --git a/annotations_filtered/mOpvoWxjz90_filtered.json b/annotations_filtered/mOpvoWxjz90_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..50a939a390aca34e5ad156c362d5e4cd70c2b154 --- /dev/null +++ b/annotations_filtered/mOpvoWxjz90_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 29.52], [44.0, 44.04], [55.0, 57.27], [57.0, 57.3], [62.0, 62.29], [63.0, 63.66], [65.0, 65.35], [69.0, 69.82], [73.0, 73.33], [74.0, 76.57], [77.0, 77.55], [79.0, 79.66], [82.0, 83.69], [88.0, 88.7], [90.0, 90.68], [91.0, 94.86], [96.0, 96.11], [97.0, 98.54], [100.0, 101.61], [117.0, 117.75], [119.0, 120.39], [121.0, 121.66], [123.0, 124.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 39.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.56, 0.0, 0.0, 0.0, 0.0, 0.0, 42.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["alarm clock", 49.68], ["alarm", 14.53], ["telephone bell ringing", 12.9]], null, null, null, null, null, null, [["speech", 89.03], ["boing", 6.24], ["inside, small room", 1.11]], null, null, null, null, null, [["speech", 90.38], ["inside, small room", 2.05], ["telephone", 1.44]], null, null, null, null, null, null, null], "duration": [0.52, 0.04, 2.27, 0.3, 0.29, 0.66, 0.35, 0.82, 0.33, 2.57, 0.55, 0.66, 1.69, 0.7, 0.68, 3.86, 0.11, 1.54, 1.61, 0.75, 1.39, 0.66, 1.66]} \ No newline at end of file diff --git a/annotations_filtered/mPWo1Dsti3c_filtered.json b/annotations_filtered/mPWo1Dsti3c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0156d2aa951311df033b8abcc390f1ed355e1427 --- /dev/null +++ b/annotations_filtered/mPWo1Dsti3c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.53], [3.0, 4.29], [6.0, 6.91], [10.0, 10.56], [17.0, 19.85], [20.0, 37.96], [39.0, 40.8], [41.0, 41.81], [51.0, 51.95], [55.0, 55.93], [57.0, 57.32], [58.0, 58.35], [61.0, 76.22], [85.0, 85.36]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.22, 29.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.18, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 16.74], ["noise", 15.54], ["hum", 12.22]], [["music", 36.78], ["speech", 28.92], ["sidetone", 6.89]], null, null, null, null, null, null, [["music", 31.71], ["speech", 23.72], ["throbbing", 18.2]], null], "duration": [1.53, 1.29, 0.91, 0.56, 2.85, 17.96, 1.8, 0.81, 0.95, 0.93, 0.32, 0.35, 15.22, 0.36]} \ No newline at end of file diff --git a/annotations_filtered/mPxTwqzr1sw_filtered.json b/annotations_filtered/mPxTwqzr1sw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..57be2bbdf09dc9d6f3bacddf4aa016bbe6a8a9c4 --- /dev/null +++ b/annotations_filtered/mPxTwqzr1sw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 18.77], [20.0, 26.1], [31.0, 49.33], [52.0, 65.33], [68.0, 70.29]], "keep_status": [false, false, false, false, false], "silence_prob": [35.86, 36.71, 38.62, 38.2, 76.7], "audiomae_on_audioset": [[["music", 65.51], ["brass instrument", 7.34], ["speech", 5.18]], [["music", 68.01], ["speech", 9.6], ["electronic music", 2.24]], [["music", 56.66], ["speech", 14.35], ["throbbing", 4.23]], [["music", 86.2], ["didgeridoo", 1.58], ["musical instrument", 1.55]], null], "duration": [11.77, 6.1, 18.33, 13.33, 2.29]} \ No newline at end of file diff --git a/annotations_filtered/mQ3tgtzkz_U_filtered.json b/annotations_filtered/mQ3tgtzkz_U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..899c12b733f214a482ae1140827f14ac31aae192 --- /dev/null +++ b/annotations_filtered/mQ3tgtzkz_U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 46.53], [48.0, 48.44], [48.0, 64.81], [67.0, 70.41], [73.0, 79.42], [83.0, 100.3]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 77.2, 98.1, 58.72, 54.04], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [32.53, 0.44, 16.81, 3.41, 6.42, 17.3]} \ No newline at end of file diff --git a/annotations_filtered/mQAlpiB3_FQ_filtered.json b/annotations_filtered/mQAlpiB3_FQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b09153c811b7463c90317239898dc86ab446e7b8 --- /dev/null +++ b/annotations_filtered/mQAlpiB3_FQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.82], [7.0, 8.4], [12.0, 12.48], [16.0, 98.31], [99.0, 115.91]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.48], "audiomae_on_audioset": [null, null, null, null, [["music", 69.66], ["musical instrument", 3.8], ["drum", 2.02]]], "duration": [-0.18, 1.4, 0.48, 82.31, 16.91]} \ No newline at end of file diff --git a/annotations_filtered/mQTPziHf9Qc_filtered.json b/annotations_filtered/mQTPziHf9Qc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..71f8815e063084e58f9f9a5db64bf97c1c561774 --- /dev/null +++ b/annotations_filtered/mQTPziHf9Qc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.08], [9.0, 9.78], [19.0, 20.44], [23.0, 24.11], [36.0, 37.83], [40.0, 41.44], [44.0, 43.63], [45.0, 45.42], [49.0, 51.98], [53.0, 53.89], [57.0, 58.11], [63.0, 67.41], [80.0, 80.69], [84.0, 92.1], [95.0, 96.15], [98.0, 100.03], [102.0, 103.86], [110.0, 111.55], [112.0, 116.26], [124.0, 152.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.1, 0.0, 0.0, 55.31, 0.0, 33.07, 0.0, 33.95, 0.0, 0.0, 33.92, 48.19], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 84.09], ["singing", 1.77], ["soul music", 1.37]], null, [["music", 66.13], ["bass guitar", 3.48], ["musical instrument", 3.25]], null, null, [["music", 73.89], ["singing", 6.4], ["song", 1.56]], [["music", 60.15], ["effects unit", 4.3], ["musical instrument", 3.29]]], "duration": [1.08, 0.78, 1.44, 1.11, 1.83, 1.44, -0.37, 0.42, 2.98, 0.89, 1.11, 4.41, 0.69, 8.1, 1.15, 2.03, 1.86, 1.55, 4.26, 28.86]} \ No newline at end of file diff --git a/annotations_filtered/mQpZdtspStY_filtered.json b/annotations_filtered/mQpZdtspStY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..503081561ef1e3ff4dafbe71fde768b08228a3da --- /dev/null +++ b/annotations_filtered/mQpZdtspStY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 16.9], [17.0, 19.06], [20.0, 110.51], [113.0, 114.24], [118.0, 118.72], [120.0, 124.16], [127.0, 127.62], [129.0, 129.73], [133.0, 135.36], [139.0, 144.26], [146.0, 150.47], [152.0, 152.61], [155.0, 157.33]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [44.4, 44.34, 0.0, 0.0, 0.0, 89.36, 0.0, 0.0, 65.09, 84.62, 73.51, 0.0, 67.89], "audiomae_on_audioset": [[["speech", 49.69], ["music", 11.21], ["effects unit", 6.09]], [["speech", 37.58], ["music", 25.69], ["guitar", 3.89]], null, null, null, null, null, null, null, null, null, null, null], "duration": [2.9, 2.06, 90.51, 1.24, 0.72, 4.16, 0.62, 0.73, 2.36, 5.26, 4.47, 0.61, 2.33]} \ No newline at end of file diff --git a/annotations_filtered/mR4FXksKdKg_filtered.json b/annotations_filtered/mR4FXksKdKg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..280f8d7e2243d8276e0f134131b56d1950f94331 --- /dev/null +++ b/annotations_filtered/mR4FXksKdKg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 24.33], [26.0, 27.36], [30.0, 30.69], [33.0, 34.37], [37.0, 36.93], [38.0, 38.42], [40.0, 39.55], [40.0, 40.83], [41.0, 41.08], [41.0, 41.32], [42.0, 42.18], [43.0, 44.47], [50.0, 49.74], [54.0, 54.62], [58.0, 58.63], [60.0, 60.08], [75.0, 74.93], [78.0, 115.7], [118.0, 118.13], [119.0, 119.28], [121.0, 120.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [82.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [13.33, 1.36, 0.69, 1.37, -0.07, 0.42, -0.45, 0.83, 0.08, 0.32, 0.18, 1.47, -0.26, 0.62, 0.63, 0.08, -0.07, 37.7, 0.13, 0.28, -0.1]} \ No newline at end of file diff --git a/annotations_filtered/mRIaK9Vf0Ns_filtered.json b/annotations_filtered/mRIaK9Vf0Ns_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f3a3d7b1a411fecb3bf0c5fb3028d50f50b8978d --- /dev/null +++ b/annotations_filtered/mRIaK9Vf0Ns_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 23.35], [25.0, 32.37], [33.0, 41.0], [43.0, 43.66], [44.0, 48.86], [51.0, 98.66], [100.0, 100.8], [107.0, 106.69], [107.0, 109.95], [110.0, 110.94], [114.0, 128.29], [133.0, 136.48], [140.0, 140.86], [142.0, 142.82], [146.0, 147.07], [149.0, 157.96], [159.0, 159.11], [159.0, 159.14], [159.0, 159.17], [159.0, 159.21], [159.0, 159.24], [159.0, 164.93], [167.0, 168.03], [171.0, 172.17], [173.0, 182.11], [183.0, 184.5]], "keep_status": [false, true, true, false, true, false, false, false, true, false, false, true, false, false, false, true, false, false, false, false, false, true, false, false, true, false], "silence_prob": [32.61, 33.15, 37.03, 0.0, 36.59, 0.0, 0.0, 0.0, 33.48, 0.0, 32.27, 31.73, 0.0, 0.0, 0.0, 35.93, 0.0, 0.0, 0.0, 0.0, 0.0, 33.46, 0.0, 0.0, 32.07, 0.0], "audiomae_on_audioset": [[["hum", 31.14], ["throbbing", 28.24], ["music", 15.22]], [["speech", 24.89], ["music", 15.82], ["mosquito", 12.01]], [["music", 15.2], ["hum", 9.79], ["fly, housefly", 8.96]], null, [["music", 28.38], ["whale vocalization", 6.28], ["rumble", 3.71]], null, null, null, [["music", 21.22], ["hum", 17.76], ["animal", 7.37]], null, [["music", 33.71], ["speech", 30.13], ["hum", 9.55]], [["music", 41.31], ["hum", 7.8], ["animal", 7.74]], null, null, null, [["speech", 18.17], ["music", 14.95], ["noise", 7.66]], null, null, null, null, null, [["music", 29.91], ["didgeridoo", 9.21], ["cacophony", 7.19]], null, null, [["music", 15.73], ["whale vocalization", 13.17], ["speech", 12.66]], null], "duration": [22.35, 7.37, 8.0, 0.66, 4.86, 47.66, 0.8, -0.31, 2.95, 0.94, 14.29, 3.48, 0.86, 0.82, 1.07, 8.96, 0.11, 0.14, 0.17, 0.21, 0.24, 5.93, 1.03, 1.17, 9.11, 1.5]} \ No newline at end of file diff --git a/annotations_filtered/mRmLfuhXHR8_filtered.json b/annotations_filtered/mRmLfuhXHR8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..50633a791671cab4f43d29609a60abf381e0a9ea --- /dev/null +++ b/annotations_filtered/mRmLfuhXHR8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.99], [6.0, 8.13], [9.0, 11.2], [15.0, 15.52], [18.0, 19.58], [22.0, 23.33], [24.0, 24.51], [26.0, 26.76], [28.0, 29.67], [32.0, 35.68], [37.0, 40.85], [42.0, 43.53], [45.0, 44.91], [45.0, 46.57], [49.0, 76.92], [82.0, 119.75], [120.0, 132.39], [135.0, 155.34], [156.0, 157.65], [158.0, 158.94], [161.0, 161.05], [162.0, 163.05], [164.0, 165.05], [169.0, 169.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 56.55, 64.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.25, 57.09, 0.0, 0.0, 0.0, 31.62, 0.0, 32.96, 30.32, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 54.27], ["gong", 14.29], ["music", 5.73]], null, [["music", 33.05], ["synthesizer", 17.02], ["effects unit", 5.08]], [["music", 15.9], ["echo", 14.03], ["effects unit", 12.88]], null, null, null, null, null, null], "duration": [0.99, 2.13, 2.2, 0.52, 1.58, 1.33, 0.51, 0.76, 1.67, 3.68, 3.85, 1.53, -0.09, 1.57, 27.92, 37.75, 12.39, 20.34, 1.65, 0.94, 0.05, 1.05, 1.05, 0.94]} \ No newline at end of file diff --git a/annotations_filtered/mRoffE53BJk_filtered.json b/annotations_filtered/mRoffE53BJk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..04ed30121152a6b5c01efb63fb3d685029ea5569 --- /dev/null +++ b/annotations_filtered/mRoffE53BJk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [5.0, 12.21], [14.0, 14.64], [23.0, 25.42], [26.0, 27.19], [28.0, 31.14], [40.0, 40.59], [45.0, 55.14], [62.0, 63.44], [65.0, 66.31], [71.0, 85.67], [88.0, 87.62], [91.0, 113.63], [117.0, 125.47], [137.0, 139.19]], "keep_status": [false, true, false, true, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.19, 0.0, 36.82, 0.0, 30.85, 0.0, 29.58, 0.0, 0.0, 28.96, 0.0, 29.34, 29.43, 37.75], "audiomae_on_audioset": [null, [["hum", 28.47], ["throbbing", 15.61], ["rumble", 9.42]], null, [["music", 44.17], ["didgeridoo", 17.54], ["throbbing", 6.4]], null, [["music", 47.21], ["noise", 12.21], ["hum", 6.01]], null, [["music", 75.99], ["throbbing", 5.84], ["hum", 2.61]], null, null, [["music", 76.99], ["hum", 3.47], ["mains hum", 2.85]], null, [["music", 52.12], ["hum", 18.21], ["throbbing", 15.71]], [["music", 50.83], ["throbbing", 26.04], ["hum", 6.81]], [["music", 58.25], ["speech", 8.09], ["sidetone", 7.25]]], "duration": [0.5, 7.21, 0.64, 2.42, 1.19, 3.14, 0.59, 10.14, 1.44, 1.31, 14.67, -0.38, 22.63, 8.47, 2.19]} \ No newline at end of file diff --git a/annotations_filtered/mRwKWTGCd7Y_filtered.json b/annotations_filtered/mRwKWTGCd7Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c3323689684689be498e7947fd7ab70e583b8b57 --- /dev/null +++ b/annotations_filtered/mRwKWTGCd7Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 16.01], [18.0, 40.12], [41.0, 46.18], [51.0, 53.81], [56.0, 56.46], [62.0, 62.07], [62.0, 76.08], [79.0, 99.76]], "keep_status": [false, false, true, true, false, false, true, true], "silence_prob": [54.63, 45.59, 29.11, 31.92, 0.0, 0.0, 29.51, 30.18], "audiomae_on_audioset": [null, [["music", 36.45], ["hum", 35.53], ["mains hum", 5.96]], [["whack, thwack", 44.12], ["music", 10.69], ["speech", 8.77]], [["music", 30.76], ["speech", 17.36], ["pulse", 17.09]], null, null, [["whack, thwack", 27.11], ["groan", 18.5], ["fly, housefly", 8.82]], [["whack, thwack", 28.15], ["music", 27.8], ["speech", 4.54]]], "duration": [9.01, 22.12, 5.18, 2.81, 0.46, 0.07, 14.08, 20.76]} \ No newline at end of file diff --git a/annotations_filtered/mS-uVaGMOtw_filtered.json b/annotations_filtered/mS-uVaGMOtw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/mS-uVaGMOtw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/mS1u_E53e10_filtered.json b/annotations_filtered/mS1u_E53e10_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3f4503f5a5c351bda0e9fdb89c7a8896e383a10c --- /dev/null +++ b/annotations_filtered/mS1u_E53e10_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.65], [8.0, 8.23], [12.0, 12.95], [15.0, 19.38], [24.0, 24.21], [27.0, 29.83], [33.0, 36.49], [40.0, 41.1], [48.0, 49.47], [51.0, 51.6], [61.0, 64.25], [76.0, 80.89], [82.0, 87.32], [92.0, 94.83], [96.0, 96.72], [108.0, 110.0]], "keep_status": [false, false, false, false, false, true, true, false, false, false, true, true, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 43.23, 0.0, 46.61, 32.1, 0.0, 0.0, 0.0, 35.14, 29.82, 30.55, 32.73, 0.0, 64.18], "audiomae_on_audioset": [null, null, null, [["fart", 35.63], ["speech", 33.22], ["fly, housefly", 5.28]], null, [["speech", 17.21], ["fly, housefly", 12.22], ["music", 10.56]], [["speech", 38.5], ["vehicle", 7.78], ["music", 4.54]], null, null, null, [["speech", 30.59], ["animal", 6.55], ["radio", 4.48]], [["moo", 26.88], ["cattle, bovinae", 23.83], ["livestock, farm animals, working animals", 12.43]], [["music", 41.16], ["speech", 36.05], ["electronic music", 5.84]], [["speech", 38.55], ["whale vocalization", 13.66], ["cattle, bovinae", 9.99]], null, null], "duration": [1.65, 0.23, 0.95, 4.38, 0.21, 2.83, 3.49, 1.1, 1.47, 0.6, 3.25, 4.89, 5.32, 2.83, 0.72, 2.0]} \ No newline at end of file diff --git a/annotations_filtered/mS4njwcS4dw_filtered.json b/annotations_filtered/mS4njwcS4dw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f4ff89bd527fca00365999d05636e5a6f844af06 --- /dev/null +++ b/annotations_filtered/mS4njwcS4dw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 18.69]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [-0.31]} \ No newline at end of file diff --git a/annotations_filtered/mSa_kUf6cxs_filtered.json b/annotations_filtered/mSa_kUf6cxs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8d93b09a6c6c38c3570c037a013544eec7e69da1 --- /dev/null +++ b/annotations_filtered/mSa_kUf6cxs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.57], [19.0, 19.35], [21.0, 21.3], [26.0, 27.36], [28.0, 28.29], [28.0, 30.0], [31.0, 32.66], [35.0, 37.74], [42.0, 47.19]], "keep_status": [false, false, false, false, false, true, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 31.58, 0.0, 30.39, 31.76], "audiomae_on_audioset": [null, null, null, null, null, [["music", 18.45], ["whale vocalization", 16.22], ["speech", 15.58]], null, [["vehicle", 15.32], ["whale vocalization", 13.99], ["music", 13.98]], [["music", 17.7], ["theremin", 13.62], ["speech", 13.32]]], "duration": [0.57, 0.35, 0.3, 1.36, 0.29, 2.0, 1.66, 2.74, 5.19]} \ No newline at end of file diff --git a/annotations_filtered/mSd_B5ZTP3s_filtered.json b/annotations_filtered/mSd_B5ZTP3s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e15886a00dea15d0da937faabdc2adbdc13251c --- /dev/null +++ b/annotations_filtered/mSd_B5ZTP3s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 11.99], [13.0, 15.03], [16.0, 17.0], [19.0, 19.85], [21.0, 26.7], [27.0, 29.94], [31.0, 34.1], [36.0, 37.0], [38.0, 41.23], [45.0, 48.34], [50.0, 55.04], [59.0, 61.15], [66.0, 76.11], [78.0, 99.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.93, 99.84, 0.0, 0.0, 93.76, 71.87, 84.8, 0.0, 98.1, 99.73, 97.92, 98.36, 88.64, 65.55], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.99, 2.03, 1.0, 0.85, 5.7, 2.94, 3.1, 1.0, 3.23, 3.34, 5.04, 2.15, 10.11, 21.49]} \ No newline at end of file diff --git a/annotations_filtered/mSeeLOr1GKI_filtered.json b/annotations_filtered/mSeeLOr1GKI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ffba6081e5ce3bbf05f4405864bc822b57a043af --- /dev/null +++ b/annotations_filtered/mSeeLOr1GKI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.2], [5.0, 6.22], [8.0, 8.51], [12.0, 12.5], [14.0, 15.36], [16.0, 17.27], [20.0, 20.53], [21.0, 22.55], [24.0, 24.63], [26.0, 27.84], [31.0, 33.02], [36.0, 37.67], [39.0, 39.7], [41.0, 42.63], [44.0, 44.74], [46.0, 46.04], [47.0, 47.43], [49.0, 49.96], [51.0, 52.81], [56.0, 56.93], [60.0, 61.1], [63.0, 66.75], [70.0, 71.64], [74.0, 74.51], [75.0, 75.05], [76.0, 76.84], [80.0, 80.92], [84.0, 84.4], [86.0, 86.16], [87.0, 87.76], [89.0, 90.91], [92.0, 93.51], [95.0, 96.94], [100.0, 101.36], [105.0, 105.97], [106.0, 107.92], [110.0, 110.59], [115.0, 115.77], [118.0, 118.72], [123.0, 123.16], [127.0, 127.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.2, 1.22, 0.51, 0.5, 1.36, 1.27, 0.53, 1.55, 0.63, 1.84, 2.02, 1.67, 0.7, 1.63, 0.74, 0.04, 0.43, 0.96, 1.81, 0.93, 1.1, 3.75, 1.64, 0.51, 0.05, 0.84, 0.92, 0.4, 0.16, 0.76, 1.91, 1.51, 1.94, 1.36, 0.97, 1.92, 0.59, 0.77, 0.72, 0.16, 0.4]} \ No newline at end of file diff --git a/annotations_filtered/mT1QTyuTr-M_filtered.json b/annotations_filtered/mT1QTyuTr-M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9bf03c0b312078ec2769a7e3fb1c54773c7c52c8 --- /dev/null +++ b/annotations_filtered/mT1QTyuTr-M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[56.0, 56.98], [59.0, 60.59], [61.0, 62.26], [63.0, 67.73], [68.0, 70.77], [74.0, 74.38], [77.0, 88.5], [92.0, 97.43], [98.0, 99.13], [100.0, 100.95], [103.0, 105.06], [107.0, 108.35], [110.0, 114.49], [115.0, 117.49], [118.0, 119.57], [123.0, 123.8], [126.0, 130.18]], "keep_status": [false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 38.56, 38.33, 0.0, 56.1, 68.54, 0.0, 0.0, 82.07, 0.0, 73.21, 83.16, 0.0, 0.0, 70.02], "audiomae_on_audioset": [null, null, null, [["speech", 42.33], ["radio", 21.79], ["sidetone", 5.62]], [["speech", 18.53], ["radio", 16.58], ["sidetone", 13.78]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.98, 1.59, 1.26, 4.73, 2.77, 0.38, 11.5, 5.43, 1.13, 0.95, 2.06, 1.35, 4.49, 2.49, 1.57, 0.8, 4.18]} \ No newline at end of file diff --git a/annotations_filtered/mT3_2sDEBJQ_filtered.json b/annotations_filtered/mT3_2sDEBJQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8a41d40ca591356a3240003f907aeae0c495381e --- /dev/null +++ b/annotations_filtered/mT3_2sDEBJQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.2], [8.0, 8.65], [10.0, 9.88], [22.0, 22.0], [35.0, 34.72], [72.0, 73.01]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.2, 0.65, -0.12, 0.0, -0.28, 1.01]} \ No newline at end of file diff --git a/annotations_filtered/mT5NiDGbnVM_filtered.json b/annotations_filtered/mT5NiDGbnVM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17f100921a3e9e70e22b4f660cd60ba360430daa --- /dev/null +++ b/annotations_filtered/mT5NiDGbnVM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.33], [10.0, 10.15], [27.0, 28.36], [49.0, 57.64], [89.0, 89.16], [91.0, 96.75], [103.0, 103.05], [108.0, 111.18], [113.0, 113.95], [117.0, 117.15], [120.0, 121.68], [124.0, 124.9], [126.0, 128.53], [132.0, 132.49], [135.0, 135.04], [136.0, 139.5], [141.0, 140.78], [147.0, 148.22], [149.0, 151.39]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [35.52, 0.0, 0.0, 30.82, 0.0, 40.41, 0.0, 58.22, 0.0, 0.0, 0.0, 0.0, 33.96, 0.0, 0.0, 62.78, 0.0, 0.0, 85.72], "audiomae_on_audioset": [[["speech", 46.06], ["beatboxing", 14.41], ["music", 10.44]], null, null, [["speech", 53.09], ["fart", 9.94], ["music", 7.1]], null, [["speech", 28.39], ["fart", 12.15], ["fly, housefly", 11.89]], null, null, null, null, null, null, [["speech", 71.72], ["dial tone", 2.37], ["inside, small room", 1.79]], null, null, null, null, null, null], "duration": [4.33, 0.15, 1.36, 8.64, 0.16, 5.75, 0.05, 3.18, 0.95, 0.15, 1.68, 0.9, 2.53, 0.49, 0.04, 3.5, -0.22, 1.22, 2.39]} \ No newline at end of file diff --git a/annotations_filtered/mTVRho54mAg_filtered.json b/annotations_filtered/mTVRho54mAg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..38fdf4a01c545702201afaf626dbfea65c13386c --- /dev/null +++ b/annotations_filtered/mTVRho54mAg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.52], [9.0, 10.05], [10.0, 11.01], [14.0, 15.96], [17.0, 19.09], [20.0, 23.65], [24.0, 39.45], [40.0, 41.57], [43.0, 45.22], [46.0, 46.21], [47.0, 47.95]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [60.6, 0.0, 0.0, 0.0, 52.56, 63.31, 44.55, 0.0, 35.95, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 51.05], ["hum", 9.27], ["mains hum", 3.57]], null, [["music", 56.4], ["didgeridoo", 12.01], ["effects unit", 3.28]], null, null], "duration": [2.52, 1.05, 1.01, 1.96, 2.09, 3.65, 15.45, 1.57, 2.22, 0.21, 0.95]} \ No newline at end of file diff --git a/annotations_filtered/mTYe5PvlRno_filtered.json b/annotations_filtered/mTYe5PvlRno_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..19d2556d36f8dfc51f0518334dd4f6a157f87f73 --- /dev/null +++ b/annotations_filtered/mTYe5PvlRno_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 6.98], [12.0, 14.61], [16.0, 16.71], [18.0, 19.67], [21.0, 22.0], [26.0, 29.37], [30.0, 31.31], [33.0, 33.79], [37.0, 37.32], [52.0, 53.11], [55.0, 58.19], [62.0, 62.23], [63.0, 64.02], [65.0, 66.53], [67.0, 68.49], [71.0, 71.37], [75.0, 77.73], [79.0, 79.95], [81.0, 82.32], [83.0, 84.6], [89.0, 89.67], [103.0, 103.28], [105.0, 106.41], [120.0, 131.87], [134.0, 134.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 62.47, 0.0, 0.0, 0.0, 62.47, 0.0, 0.0, 0.0, 0.0, 40.16, 0.0, 0.0, 0.0, 0.0, 0.0, 33.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.54, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 11.2], ["burping, eructation", 7.16], ["groan", 6.71]], null, null, null, null, null, [["speech", 38.72], ["quack", 12.79], ["laughter", 6.75]], null, null, null, null, null, null, null, null], "duration": [-0.02, 2.61, 0.71, 1.67, 1.0, 3.37, 1.31, 0.79, 0.32, 1.11, 3.19, 0.23, 1.02, 1.53, 1.49, 0.37, 2.73, 0.95, 1.32, 1.6, 0.67, 0.28, 1.41, 11.87, 0.72]} \ No newline at end of file diff --git a/annotations_filtered/mTYwZEhFwu0_filtered.json b/annotations_filtered/mTYwZEhFwu0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e930473edda77df605f4f087db36fe3c5923091e --- /dev/null +++ b/annotations_filtered/mTYwZEhFwu0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.21], [5.0, 7.18], [8.0, 11.74], [13.0, 13.81], [14.0, 15.94], [18.0, 20.14], [21.0, 21.44], [29.0, 30.82], [35.0, 34.89], [36.0, 36.31], [37.0, 37.37], [38.0, 38.62], [48.0, 48.0], [50.0, 51.02], [56.0, 57.64], [59.0, 58.7], [63.0, 63.95], [74.0, 75.52], [78.0, 78.44], [84.0, 83.91], [88.0, 88.43], [94.0, 95.35], [100.0, 101.01], [105.0, 105.93], [107.0, 109.73], [110.0, 112.26], [119.0, 119.67], [123.0, 123.36], [125.0, 126.06], [129.0, 129.78], [134.0, 134.25], [136.0, 136.24], [138.0, 138.2], [140.0, 140.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 95.78, 81.71, 0.0, 0.0, 99.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.15, 54.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.21, 2.18, 3.74, 0.81, 1.94, 2.14, 0.44, 1.82, -0.11, 0.31, 0.37, 0.62, 0.0, 1.02, 1.64, -0.3, 0.95, 1.52, 0.44, -0.09, 0.43, 1.35, 1.01, 0.93, 2.73, 2.26, 0.67, 0.36, 1.06, 0.78, 0.25, 0.24, 0.2, 0.85]} \ No newline at end of file diff --git a/annotations_filtered/mTr1vpzU00Q_filtered.json b/annotations_filtered/mTr1vpzU00Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e257adcf7f651da4aaf7a7ce61e78f2ae6bbaaa --- /dev/null +++ b/annotations_filtered/mTr1vpzU00Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.26], [2.0, 3.79], [5.0, 5.51], [6.0, 6.62], [8.0, 7.86], [9.0, 9.53], [12.0, 14.01], [15.0, 16.11], [17.0, 18.32], [20.0, 20.55], [21.0, 22.62], [25.0, 25.61], [36.0, 40.59], [45.0, 51.41], [54.0, 54.77], [57.0, 60.37], [62.0, 83.39], [84.0, 84.91], [86.0, 86.78], [88.0, 89.01], [92.0, 93.92], [94.0, 94.74], [95.0, 96.82], [98.0, 99.67], [101.0, 101.6], [102.0, 102.96], [104.0, 105.68], [108.0, 108.58], [110.0, 111.16], [112.0, 112.46], [114.0, 114.88], [118.0, 120.53], [124.0, 124.53], [126.0, 126.22], [130.0, 131.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.05, 0.0, 0.0, 0.0, 0.0, 0.0, 95.78, 45.69, 0.0, 84.07, 94.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.96, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 25.98], ["sidetone", 13.36], ["speech", 12.66]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.26, 1.79, 0.51, 0.62, -0.14, 0.53, 2.01, 1.11, 1.32, 0.55, 1.62, 0.61, 4.59, 6.41, 0.77, 3.37, 21.39, 0.91, 0.78, 1.01, 1.92, 0.74, 1.82, 1.67, 0.6, 0.96, 1.68, 0.58, 1.16, 0.46, 0.88, 2.53, 0.53, 0.22, 1.18]} \ No newline at end of file diff --git a/annotations_filtered/mTx6_XT9Hns_filtered.json b/annotations_filtered/mTx6_XT9Hns_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc7cc1cc6a709cd300b94f1c36148b0625e1d046 --- /dev/null +++ b/annotations_filtered/mTx6_XT9Hns_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 21.36], [23.0, 27.72], [28.0, 80.97], [82.0, 117.85], [119.0, 129.83]], "keep_status": [true, false, false, false, true], "silence_prob": [30.95, 68.67, 0.0, 0.0, 30.17], "audiomae_on_audioset": [[["sound effect", 10.07], ["reverberation", 9.51], ["effects unit", 8.6]], null, null, null, [["whale vocalization", 47.37], ["animal", 5.75], ["music", 4.95]]], "duration": [7.36, 4.72, 52.97, 35.85, 10.83]} \ No newline at end of file diff --git a/annotations_filtered/mUVup2pr_eM_filtered.json b/annotations_filtered/mUVup2pr_eM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a29a293c4a4a5006273c3be77db87845dd458e8 --- /dev/null +++ b/annotations_filtered/mUVup2pr_eM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.67], [1.0, 7.5], [8.0, 9.41], [11.0, 11.84], [12.0, 53.05], [55.0, 55.05], [57.0, 57.13], [58.0, 60.51], [63.0, 71.0], [77.0, 117.37], [119.0, 119.75], [127.0, 127.3], [128.0, 129.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 40.04, 0.0, 0.0, 0.0, 0.0, 0.0, 33.8, 30.31, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["neigh, whinny", 41.02], ["animal", 22.15], ["horse", 15.68]], null, null, null, null, null, [["music", 70.42], ["didgeridoo", 3.15], ["synthesizer", 3.04]], [["music", 76.18], ["didgeridoo", 6.56], ["musical instrument", 5.89]], null, null, null, null], "duration": [0.67, 6.5, 1.41, 0.84, 41.05, 0.05, 0.13, 2.51, 8.0, 40.37, 0.75, 0.3, 1.73]} \ No newline at end of file diff --git a/annotations_filtered/mUtHkSw9nEY_filtered.json b/annotations_filtered/mUtHkSw9nEY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f04c34c7c7daac16571b6e3f08b44f68a9ae101 --- /dev/null +++ b/annotations_filtered/mUtHkSw9nEY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.78], [7.0, 9.1], [11.0, 11.91], [13.0, 13.04], [14.0, 13.98], [14.0, 14.79], [16.0, 17.54], [20.0, 21.63], [23.0, 23.55], [25.0, 25.83], [26.0, 27.99], [29.0, 29.24], [31.0, 32.22], [34.0, 35.38], [36.0, 37.44], [38.0, 41.79], [44.0, 48.0], [49.0, 51.76], [55.0, 55.38], [57.0, 57.0], [63.0, 65.28], [66.0, 66.8], [67.0, 68.44], [70.0, 70.51], [72.0, 72.6], [74.0, 74.76], [79.0, 80.64], [83.0, 84.06], [87.0, 88.35], [90.0, 90.59], [92.0, 92.67], [95.0, 95.1], [100.0, 100.25], [104.0, 104.94], [106.0, 106.73], [108.0, 108.73], [110.0, 110.22], [111.0, 111.82], [120.0, 120.7], [125.0, 125.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.43, 100.0, 97.73, 0.0, 0.0, 92.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.78, 2.1, 0.91, 0.04, -0.02, 0.79, 1.54, 1.63, 0.55, 0.83, 1.99, 0.24, 1.22, 1.38, 1.44, 3.79, 4.0, 2.76, 0.38, 0.0, 2.28, 0.8, 1.44, 0.51, 0.6, 0.76, 1.64, 1.06, 1.35, 0.59, 0.67, 0.1, 0.25, 0.94, 0.73, 0.73, 0.22, 0.82, 0.7, 0.61]} \ No newline at end of file diff --git a/annotations_filtered/mUxLZWWRKUI_filtered.json b/annotations_filtered/mUxLZWWRKUI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c4e8579a7f2084a6d1b4454b218a93ef7c33ed61 --- /dev/null +++ b/annotations_filtered/mUxLZWWRKUI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.91], [4.0, 5.86], [7.0, 7.7], [9.0, 11.52], [13.0, 13.93], [14.0, 17.68], [19.0, 20.82], [22.0, 22.72], [24.0, 25.71], [27.0, 28.44], [35.0, 37.45], [39.0, 39.5], [45.0, 46.04], [49.0, 49.42], [52.0, 52.79], [53.0, 54.3], [57.0, 58.4], [61.0, 60.94], [62.0, 65.01], [73.0, 73.95], [75.0, 76.42], [78.0, 79.46], [82.0, 84.89], [87.0, 87.71], [89.0, 89.6], [91.0, 91.74], [93.0, 95.2], [101.0, 102.46], [104.0, 104.33], [106.0, 108.6], [111.0, 113.29], [115.0, 116.24], [118.0, 119.72], [121.0, 121.15], [122.0, 124.5], [127.0, 128.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 78.04, 0.0, 0.0, 0.0, 0.0, 63.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 74.76, 0.0, 0.0, 0.0, 96.54, 0.0, 0.0, 100.0, 99.56, 0.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.91, 1.86, 0.7, 2.52, 0.93, 3.68, 1.82, 0.72, 1.71, 1.44, 2.45, 0.5, 1.04, 0.42, 0.79, 1.3, 1.4, -0.06, 3.01, 0.95, 1.42, 1.46, 2.89, 0.71, 0.6, 0.74, 2.2, 1.46, 0.33, 2.6, 2.29, 1.24, 1.72, 0.15, 2.5, 1.88]} \ No newline at end of file diff --git a/annotations_filtered/mUzu93AhMuE_filtered.json b/annotations_filtered/mUzu93AhMuE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7afe07efd317c7c2af0065c037c45ca7793afc3e --- /dev/null +++ b/annotations_filtered/mUzu93AhMuE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.14], [6.0, 5.85], [7.0, 8.13], [9.0, 9.81], [11.0, 12.78], [16.0, 18.25], [21.0, 21.93], [23.0, 24.29], [29.0, 29.69], [31.0, 33.61], [35.0, 35.87], [37.0, 37.86], [41.0, 41.84], [46.0, 47.39], [52.0, 52.2], [54.0, 56.02], [63.0, 71.49], [73.0, 75.66], [77.0, 76.81], [79.0, 85.02], [87.0, 89.6], [91.0, 92.28], [95.0, 94.96], [103.0, 103.44], [110.0, 110.12], [116.0, 119.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 65.91, 0.0, 0.0, 0.0, 60.05, 0.0, 0.0, 0.0, 0.0, 0.0, 52.22, 63.64, 74.92, 0.0, 50.21, 100.0, 0.0, 0.0, 0.0, 0.0, 75.55], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.14, -0.15, 1.13, 0.81, 1.78, 2.25, 0.93, 1.29, 0.69, 2.61, 0.87, 0.86, 0.84, 1.39, 0.2, 2.02, 8.49, 2.66, -0.19, 6.02, 2.6, 1.28, -0.04, 0.44, 0.12, 3.7]} \ No newline at end of file diff --git a/annotations_filtered/mVUQ88T2S6E_filtered.json b/annotations_filtered/mVUQ88T2S6E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d87e472a2b9d88532ff6ba02813d0871779d61ec --- /dev/null +++ b/annotations_filtered/mVUQ88T2S6E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.29], [5.0, 6.27], [11.0, 12.88], [19.0, 23.45], [24.0, 27.14], [28.0, 33.96], [40.0, 43.55], [53.0, 54.43], [57.0, 56.78], [64.0, 64.56], [66.0, 79.14], [82.0, 113.32]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 44.55, 43.25, 39.19, 40.75, 0.0, 0.0, 0.0, 28.4, 0.0], "audiomae_on_audioset": [null, null, null, [["telephone dialing, dtmf", 34.36], ["speech", 27.04], ["sidetone", 13.57]], [["speech", 23.92], ["sidetone", 18.3], ["music", 15.3]], [["speech", 58.3], ["radio", 19.75], ["sidetone", 9.14]], [["sidetone", 54.72], ["speech", 16.75], ["radio", 14.65]], null, null, null, [["mains hum", 58.5], ["hum", 21.25], ["music", 7.69]], null], "duration": [0.29, 1.27, 1.88, 4.45, 3.14, 5.96, 3.55, 1.43, -0.22, 0.56, 13.14, 31.32]} \ No newline at end of file diff --git a/annotations_filtered/mV__PXYxQYY_filtered.json b/annotations_filtered/mV__PXYxQYY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..87b982b5bf7f42620e8c0d5b79df4b677b889441 --- /dev/null +++ b/annotations_filtered/mV__PXYxQYY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.83], [12.0, 12.43], [14.0, 15.06], [19.0, 18.86], [23.0, 23.7], [26.0, 27.55], [34.0, 34.37], [37.0, 38.55], [40.0, 41.39], [42.0, 42.9], [43.0, 43.88], [45.0, 47.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.63], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["whale vocalization", 35.96], ["music", 21.3], ["musical instrument", 3.96]]], "duration": [0.83, 0.43, 1.06, -0.14, 0.7, 1.55, 0.37, 1.55, 1.39, 0.9, 0.88, 2.48]} \ No newline at end of file diff --git a/annotations_filtered/mVbGpzsuNjE_filtered.json b/annotations_filtered/mVbGpzsuNjE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..764edb437fab60c9cafb2c2e5cdd39cea1756ad3 --- /dev/null +++ b/annotations_filtered/mVbGpzsuNjE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.38], [5.0, 9.39], [10.0, 11.25], [18.0, 18.79], [22.0, 32.48], [42.0, 42.69], [46.0, 47.51], [53.0, 56.67], [61.0, 62.26], [64.0, 63.93], [67.0, 68.05], [71.0, 72.64], [77.0, 79.76], [81.0, 81.68], [85.0, 85.18], [86.0, 86.37], [90.0, 90.1], [91.0, 91.76], [98.0, 99.81], [103.0, 103.2], [104.0, 105.12], [110.0, 110.51], [112.0, 112.02], [113.0, 114.45], [117.0, 121.95], [123.0, 127.47]], "keep_status": [false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 31.83, 0.0, 0.0, 49.68, 0.0, 0.0, 67.51, 0.0, 0.0, 0.0, 0.0, 72.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.98, 34.63], "audiomae_on_audioset": [null, [["music", 34.5], ["carnatic music", 17.89], ["chant", 7.1]], null, null, [["music", 18.05], ["mains hum", 15.72], ["telephone", 12.2]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 39.67], ["radio", 14.47], ["speech", 10.91]], [["moo", 50.44], ["cattle, bovinae", 37.25], ["livestock, farm animals, working animals", 8.97]]], "duration": [0.38, 4.39, 1.25, 0.79, 10.48, 0.69, 1.51, 3.67, 1.26, -0.07, 1.05, 1.64, 2.76, 0.68, 0.18, 0.37, 0.1, 0.76, 1.81, 0.2, 1.12, 0.51, 0.02, 1.45, 4.95, 4.47]} \ No newline at end of file diff --git a/annotations_filtered/mVcHdILwsXQ_filtered.json b/annotations_filtered/mVcHdILwsXQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..66cb744dd11661620ae3d78dd4f22f2843741ce0 --- /dev/null +++ b/annotations_filtered/mVcHdILwsXQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 31.72]], "keep_status": [true], "silence_prob": [31.34], "audiomae_on_audioset": [[["hum", 30.02], ["mains hum", 19.62], ["speech", 9.79]]], "duration": [28.72]} \ No newline at end of file diff --git a/annotations_filtered/mVdTVvgW4EM_filtered.json b/annotations_filtered/mVdTVvgW4EM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..711880f47d4986fa9235f2c54e03f77682303fc9 --- /dev/null +++ b/annotations_filtered/mVdTVvgW4EM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.79], [21.0, 21.91], [23.0, 25.0], [26.0, 44.95], [48.0, 75.1], [75.0, 89.21], [89.0, 106.76], [107.0, 106.95], [107.0, 107.79], [109.0, 125.52], [130.0, 147.65], [149.0, 157.81], [161.0, 160.68], [162.0, 162.24], [170.0, 172.76]], "keep_status": [false, false, false, false, true, true, true, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 85.54, 29.36, 36.76, 36.72, 39.41, 0.0, 0.0, 48.56, 40.55, 40.77, 0.0, 0.0, 78.55], "audiomae_on_audioset": [null, null, null, [["music", 59.44], ["cacophony", 10.29], ["didgeridoo", 7.22]], [["music", 55.12], ["musical instrument", 5.94], ["brass instrument", 3.94]], [["music", 24.82], ["singing bowl", 17.67], ["theremin", 9.06]], [["music", 57.11], ["fart", 7.74], ["sidetone", 4.24]], null, null, [["music", 44.88], ["theremin", 26.12], ["singing bowl", 6.94]], [["music", 71.28], ["scary music", 4.5], ["soundtrack music", 2.72]], [["music", 35.45], ["hum", 11.88], ["throbbing", 5.95]], null, null, null], "duration": [0.79, 0.91, 2.0, 18.95, 27.1, 14.21, 17.76, -0.05, 0.79, 16.52, 17.65, 8.81, -0.32, 0.24, 2.76]} \ No newline at end of file diff --git a/annotations_filtered/mVqKHUtKh8Y_filtered.json b/annotations_filtered/mVqKHUtKh8Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a632932c045989a2159925b3cc782b9ef219cd11 --- /dev/null +++ b/annotations_filtered/mVqKHUtKh8Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.22], [6.0, 6.44], [10.0, 10.17], [12.0, 13.46], [17.0, 18.42], [19.0, 24.24], [25.0, 25.54], [26.0, 27.26], [28.0, 30.45], [32.0, 40.14], [42.0, 42.8], [44.0, 44.34], [46.0, 48.41], [50.0, 51.44], [54.0, 57.32], [60.0, 60.57], [63.0, 63.81], [65.0, 65.75], [67.0, 66.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 55.96, 0.0, 0.0, 70.16, 63.96, 0.0, 0.0, 65.2, 0.0, 55.18, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.22, 0.44, 0.17, 1.46, 1.42, 5.24, 0.54, 1.26, 2.45, 8.14, 0.8, 0.34, 2.41, 1.44, 3.32, 0.57, 0.81, 0.75, -0.17]} \ No newline at end of file diff --git a/annotations_filtered/mVv14yZ1c44_filtered.json b/annotations_filtered/mVv14yZ1c44_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..91c89265a975725f5f91b2d7aaa1dd22fa82420f --- /dev/null +++ b/annotations_filtered/mVv14yZ1c44_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.51], [16.0, 17.71], [22.0, 22.54], [25.0, 28.97], [29.0, 36.15], [37.0, 40.2], [41.0, 57.0], [59.0, 61.06], [64.0, 70.53], [72.0, 75.41], [76.0, 76.76], [77.0, 79.66], [80.0, 81.75], [82.0, 106.08], [107.0, 108.21], [110.0, 123.15], [125.0, 125.91], [127.0, 129.95], [131.0, 132.9], [133.0, 136.51], [138.0, 138.28], [138.0, 138.59], [142.0, 142.75], [143.0, 144.53], [146.0, 146.69], [149.0, 152.47], [155.0, 157.64], [163.0, 162.97], [163.0, 167.22], [169.0, 169.87]], "keep_status": [false, false, false, true, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 49.87, 42.67, 64.29, 98.44, 41.05, 99.4, 99.4, 0.0, 89.72, 0.0, 89.9, 0.0, 68.67, 0.0, 82.07, 0.0, 49.27, 0.0, 0.0, 0.0, 0.0, 0.0, 49.82, 51.18, 0.0, 47.82, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 12.84], ["mains hum", 12.7], ["creak", 6.64]], [["mains hum", 27.3], ["speech", 20.84], ["hum", 16.4]], null, null, [["effects unit", 26.3], ["music", 14.55], ["speech", 12.97]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 39.1], ["music", 25.75], ["sidetone", 9.35]], null, null, null, null, null, [["music", 59.71], ["musical instrument", 5.8], ["synthesizer", 4.15]], null, null, [["music", 20.07], ["synthesizer", 6.16], ["speech", 6.1]], null], "duration": [1.51, 1.71, 0.54, 3.97, 7.15, 3.2, 16.0, 2.06, 6.53, 3.41, 0.76, 2.66, 1.75, 24.08, 1.21, 13.15, 0.91, 2.95, 1.9, 3.51, 0.28, 0.59, 0.75, 1.53, 0.69, 3.47, 2.64, -0.03, 4.22, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/mVybomocIw4_filtered.json b/annotations_filtered/mVybomocIw4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc200abc84c333b62738cfe888e04f7711b95823 --- /dev/null +++ b/annotations_filtered/mVybomocIw4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 19.75], [20.0, 23.4], [25.0, 28.83], [31.0, 32.26], [36.0, 36.22], [37.0, 38.64], [40.0, 43.93], [46.0, 47.49], [49.0, 51.11], [52.0, 53.6], [55.0, 56.86], [58.0, 59.36], [62.0, 69.77], [71.0, 76.72], [77.0, 81.13], [82.0, 82.34], [95.0, 110.59], [112.0, 112.55], [113.0, 114.08], [115.0, 115.32], [117.0, 116.67], [120.0, 121.85], [125.0, 126.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [90.25, 99.94, 99.36, 0.0, 0.0, 0.0, 97.73, 0.0, 99.48, 0.0, 0.0, 0.0, 100.0, 99.91, 96.17, 0.0, 98.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [18.75, 3.4, 3.83, 1.26, 0.22, 1.64, 3.93, 1.49, 2.11, 1.6, 1.86, 1.36, 7.77, 5.72, 4.13, 0.34, 15.59, 0.55, 1.08, 0.32, -0.33, 1.85, 1.66]} \ No newline at end of file diff --git a/annotations_filtered/mVzdHEhC8YI_filtered.json b/annotations_filtered/mVzdHEhC8YI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dffa6fd2a32735d8cec409ab76a54d24e04e19a4 --- /dev/null +++ b/annotations_filtered/mVzdHEhC8YI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 27.62], [29.0, 29.54], [30.0, 69.97], [73.0, 73.67], [75.0, 76.01], [78.0, 81.9]], "keep_status": [true, false, false, false, false, true], "silence_prob": [29.21, 0.0, 0.0, 0.0, 0.0, 30.03], "audiomae_on_audioset": [[["music", 32.86], ["speech", 22.78], ["livestock, farm animals, working animals", 7.81]], null, null, null, null, [["music", 44.67], ["hum", 14.36], ["theremin", 5.75]]], "duration": [16.62, 0.54, 39.97, 0.67, 1.01, 3.9]} \ No newline at end of file diff --git a/annotations_filtered/mWqZWXSj-s0_filtered.json b/annotations_filtered/mWqZWXSj-s0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17cb4a5d08fb2eeea048c711987b2e06e5719bf4 --- /dev/null +++ b/annotations_filtered/mWqZWXSj-s0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.32], [5.0, 6.2], [7.0, 12.11], [14.0, 28.09], [40.0, 47.33], [48.0, 51.33], [52.0, 52.66], [55.0, 55.53], [57.0, 59.32], [61.0, 61.37], [68.0, 69.01], [70.0, 70.66], [72.0, 71.91], [75.0, 75.56]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.92, 35.72, 97.64, 88.83, 0.0, 0.0, 85.9, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["whack, thwack", 21.91], ["speech", 19.56], ["fart", 7.02]], null, null, null, null, null, null, null, null, null, null], "duration": [0.32, 1.2, 5.11, 14.09, 7.33, 3.33, 0.66, 0.53, 2.32, 0.37, 1.01, 0.66, -0.09, 0.56]} \ No newline at end of file diff --git a/annotations_filtered/mX5Vqy1ETgM_filtered.json b/annotations_filtered/mX5Vqy1ETgM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a70f854dcb5776a558cfaf6f00de303a149c366d --- /dev/null +++ b/annotations_filtered/mX5Vqy1ETgM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.88], [4.0, 4.19], [5.0, 7.53], [10.0, 11.21], [12.0, 14.64], [16.0, 16.26], [17.0, 18.5], [21.0, 21.37], [24.0, 24.19], [28.0, 28.04], [38.0, 38.6], [48.0, 49.0], [55.0, 54.95], [55.0, 55.76], [57.0, 57.32], [58.0, 58.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 91.64, 0.0, 50.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.88, 0.19, 2.53, 1.21, 2.64, 0.26, 1.5, 0.37, 0.19, 0.04, 0.6, 1.0, -0.05, 0.76, 0.32, 0.46]} \ No newline at end of file diff --git a/annotations_filtered/mXLSLzeu-mM_filtered.json b/annotations_filtered/mXLSLzeu-mM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed12dc621decc26e749e0f50c5fba469036412a0 --- /dev/null +++ b/annotations_filtered/mXLSLzeu-mM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.94], [4.0, 4.92], [8.0, 26.28], [27.0, 27.89], [30.0, 52.79], [54.0, 64.98], [68.0, 68.79], [69.0, 96.57], [97.0, 97.68], [101.0, 115.92], [118.0, 119.8], [121.0, 124.02], [125.0, 126.72], [128.0, 132.36], [135.0, 135.26], [139.0, 139.6], [141.0, 143.95], [145.0, 146.01], [148.0, 152.64]], "keep_status": [false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 33.19, 0.0, 36.85, 32.4, 0.0, 40.24, 0.0, 58.72, 0.0, 74.29, 0.0, 86.64, 0.0, 0.0, 80.29, 0.0, 80.11], "audiomae_on_audioset": [null, null, [["music", 55.64], ["timpani", 3.53], ["musical instrument", 3.28]], null, [["music", 71.29], ["percussion", 6.32], ["tabla", 3.55]], [["music", 29.67], ["thunk", 11.09], ["speech", 9.01]], null, [["music", 81.42], ["musical instrument", 2.43], ["timpani", 2.32]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.94, 0.92, 18.28, 0.89, 22.79, 10.98, 0.79, 27.57, 0.68, 14.92, 1.8, 3.02, 1.72, 4.36, 0.26, 0.6, 2.95, 1.01, 4.64]} \ No newline at end of file diff --git a/annotations_filtered/mXp99jJtyII_filtered.json b/annotations_filtered/mXp99jJtyII_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f5aeafe9ccc34d4ee49212d90a4f4e4086231d9b --- /dev/null +++ b/annotations_filtered/mXp99jJtyII_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.99], [5.0, 8.95], [10.0, 10.56], [14.0, 17.41], [18.0, 30.84], [34.0, 36.91], [38.0, 38.53], [42.0, 45.57], [46.0, 46.85], [51.0, 52.24], [54.0, 55.38], [57.0, 57.99], [60.0, 67.26], [68.0, 70.31], [72.0, 73.85], [74.0, 76.52], [78.0, 80.0], [81.0, 88.64], [90.0, 92.8], [94.0, 97.09], [98.0, 100.41], [102.0, 104.13], [107.0, 108.99], [110.0, 113.53]], "keep_status": [false, false, false, true, true, true, false, false, false, false, false, false, false, true, false, true, true, false, false, true, true, true, false, false], "silence_prob": [0.0, 43.45, 0.0, 33.23, 37.64, 40.77, 0.0, 42.02, 0.0, 0.0, 0.0, 0.0, 36.27, 33.55, 0.0, 42.15, 42.35, 47.86, 46.12, 38.4, 42.3, 46.57, 0.0, 52.68], "audiomae_on_audioset": [null, [["hum", 40.95], ["mains hum", 25.92], ["throbbing", 7.29]], null, [["aircraft", 15.87], ["propeller, airscrew", 13.37], ["vehicle", 13.36]], [["music", 46.05], ["scary music", 7.47], ["hum", 7.41]], [["music", 41.27], ["mains hum", 7.48], ["didgeridoo", 5.48]], null, [["frog", 49.15], ["croak", 29.14], ["didgeridoo", 4.51]], null, null, null, null, [["speech", 41.16], ["music", 34.96], ["hum", 6.86]], [["hum", 33.8], ["mains hum", 12.21], ["speech", 10.94]], null, [["speech", 24.16], ["hum", 23.86], ["mains hum", 20.71]], [["music", 33.21], ["frog", 15.95], ["croak", 3.65]], [["hum", 30.52], ["mains hum", 27.68], ["music", 20.64]], [["music", 43.26], ["didgeridoo", 27.18], ["animal", 3.5]], [["didgeridoo", 24.11], ["music", 20.97], ["hum", 17.76]], [["music", 15.83], ["whale vocalization", 9.38], ["speech", 9.34]], [["mains hum", 25.56], ["speech", 14.97], ["music", 13.21]], null, null], "duration": [1.99, 3.95, 0.56, 3.41, 12.84, 2.91, 0.53, 3.57, 0.85, 1.24, 1.38, 0.99, 7.26, 2.31, 1.85, 2.52, 2.0, 7.64, 2.8, 3.09, 2.41, 2.13, 1.99, 3.53]} \ No newline at end of file diff --git a/annotations_filtered/mXvst0jlR9Q_filtered.json b/annotations_filtered/mXvst0jlR9Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f797f93b39297fc73113450b8a9836eee98189c3 --- /dev/null +++ b/annotations_filtered/mXvst0jlR9Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.53], [8.0, 8.07], [9.0, 9.78], [19.0, 18.82], [19.0, 20.16], [21.0, 20.75], [22.0, 22.55], [23.0, 23.46], [24.0, 25.95], [26.0, 27.04], [28.0, 28.44], [29.0, 30.7], [32.0, 34.4], [35.0, 37.02], [38.0, 39.43], [44.0, 45.82], [49.0, 49.54], [51.0, 52.07], [52.0, 52.62], [54.0, 54.53], [56.0, 56.96], [60.0, 68.47], [69.0, 70.28], [70.0, 73.85], [74.0, 75.98], [78.0, 78.92], [80.0, 81.04], [84.0, 100.82], [101.0, 102.37], [103.0, 115.67], [118.0, 121.85], [126.0, 128.44], [129.0, 132.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.67, 60.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.59, 0.0, 83.34, 0.0, 0.0, 0.0, 98.59, 0.0, 95.37, 80.64, 97.73, 91.13], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.53, 0.07, 0.78, -0.18, 1.16, -0.25, 0.55, 0.46, 1.95, 1.04, 0.44, 1.7, 2.4, 2.02, 1.43, 1.82, 0.54, 1.07, 0.62, 0.53, 0.96, 8.47, 1.28, 3.85, 1.98, 0.92, 1.04, 16.82, 1.37, 12.67, 3.85, 2.44, 3.83]} \ No newline at end of file diff --git a/annotations_filtered/mXz39lQAEmY_filtered.json b/annotations_filtered/mXz39lQAEmY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..72f28e0ebf425746cd4bb894426d241e4deea3c9 --- /dev/null +++ b/annotations_filtered/mXz39lQAEmY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.63], [6.0, 9.51], [11.0, 11.69], [12.0, 15.08], [19.0, 24.19], [25.0, 26.84], [29.0, 30.82], [37.0, 40.93], [42.0, 43.19], [44.0, 45.1], [46.0, 48.05], [50.0, 53.76], [57.0, 57.42], [60.0, 61.18], [64.0, 66.53], [69.0, 70.34], [75.0, 75.14], [77.0, 78.11], [81.0, 82.58], [83.0, 84.96], [86.0, 88.42], [89.0, 90.9], [92.0, 94.37], [99.0, 101.71], [106.0, 108.04], [113.0, 117.58], [119.0, 119.75], [122.0, 122.99], [123.0, 125.54], [126.0, 128.95], [131.0, 132.92], [134.0, 135.67], [137.0, 139.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [87.19, 98.27, 0.0, 89.72, 95.64, 0.0, 0.0, 90.43, 0.0, 0.0, 82.43, 91.81, 0.0, 0.0, 78.38, 0.0, 0.0, 0.0, 0.0, 0.0, 90.6, 0.0, 84.25, 97.73, 79.07, 83.7, 0.0, 0.0, 66.27, 57.01, 0.0, 0.0, 73.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.63, 3.51, 0.69, 3.08, 5.19, 1.84, 1.82, 3.93, 1.19, 1.1, 2.05, 3.76, 0.42, 1.18, 2.53, 1.34, 0.14, 1.11, 1.58, 1.96, 2.42, 1.9, 2.37, 2.71, 2.04, 4.58, 0.75, 0.99, 2.54, 2.95, 1.92, 1.67, 2.83]} \ No newline at end of file diff --git a/annotations_filtered/mYS3zyHIxqA_filtered.json b/annotations_filtered/mYS3zyHIxqA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2121f2e5b20519f7d1b687790abdd6598aa537e1 --- /dev/null +++ b/annotations_filtered/mYS3zyHIxqA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 42.77]], "keep_status": [true], "silence_prob": [28.34], "audiomae_on_audioset": [[["music", 15.66], ["speech", 15.61], ["rumble", 8.5]]], "duration": [12.77]} \ No newline at end of file diff --git a/annotations_filtered/mYhkrT5de2Y_filtered.json b/annotations_filtered/mYhkrT5de2Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..051acf1fb5912f9d73d7fbc334bf37e0c0dab343 --- /dev/null +++ b/annotations_filtered/mYhkrT5de2Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.86], [5.0, 5.81], [9.0, 9.75], [28.0, 30.79], [36.0, 37.17]], "keep_status": [false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 47.43, 0.0], "audiomae_on_audioset": [null, null, null, [["fly, housefly", 15.34], ["speech", 15.1], ["insect", 8.49]], null], "duration": [1.86, 0.81, 0.75, 2.79, 1.17]} \ No newline at end of file diff --git a/annotations_filtered/mZ2kxdQf3t0_filtered.json b/annotations_filtered/mZ2kxdQf3t0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/mZ2kxdQf3t0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/mZHlantNtwg_filtered.json b/annotations_filtered/mZHlantNtwg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aea677e2057c726929710231977794acf016d8e8 --- /dev/null +++ b/annotations_filtered/mZHlantNtwg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 10.67], [15.0, 17.41], [23.0, 41.22], [47.0, 47.9], [60.0, 60.54], [62.0, 65.52], [66.0, 81.09], [83.0, 89.99], [94.0, 95.2], [96.0, 97.26], [99.0, 99.3], [103.0, 106.27], [109.0, 109.27], [119.0, 118.84], [146.0, 149.23], [151.0, 153.62]], "keep_status": [true, true, false, false, false, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [34.46, 30.03, 33.06, 0.0, 0.0, 44.84, 31.13, 30.91, 0.0, 0.0, 0.0, 73.97, 0.0, 0.0, 68.02, 35.74], "audiomae_on_audioset": [[["music", 34.03], ["throbbing", 8.81], ["theremin", 7.28]], [["groan", 27.51], ["speech", 18.45], ["music", 18.35]], [["speech", 65.84], ["music", 19.84], ["explosion", 1.37]], null, null, [["speech", 22.21], ["fly, housefly", 19.66], ["insect", 14.04]], [["music", 55.42], ["speech", 20.31], ["fart", 3.12]], [["music", 54.91], ["hum", 5.53], ["musical instrument", 3.66]], null, null, null, null, null, null, null, [["speech", 45.21], ["chirp tone", 15.39], ["sine wave", 15.33]]], "duration": [4.67, 2.41, 18.22, 0.9, 0.54, 3.52, 15.09, 6.99, 1.2, 1.26, 0.3, 3.27, 0.27, -0.16, 3.23, 2.62]} \ No newline at end of file diff --git a/annotations_filtered/mZYTLYXT-CQ_filtered.json b/annotations_filtered/mZYTLYXT-CQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e77f53c96df3e36dce1251230d0e80cf12a91799 --- /dev/null +++ b/annotations_filtered/mZYTLYXT-CQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 16.77], [18.0, 17.74], [20.0, 24.98], [31.0, 34.82], [40.0, 44.76], [51.0, 52.25], [53.0, 59.49], [61.0, 63.05], [63.0, 73.35], [75.0, 79.44], [82.0, 91.42], [94.0, 117.73], [119.0, 120.34], [121.0, 122.82], [127.0, 128.82], [132.0, 132.71], [134.0, 137.34], [140.0, 144.88], [146.0, 146.92], [148.0, 150.31], [150.0, 152.15], [152.0, 161.49], [162.0, 170.4], [176.0, 176.59]], "keep_status": [true, false, true, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, true, true, true, false, false], "silence_prob": [37.61, 0.0, 34.32, 59.15, 52.68, 0.0, 39.66, 40.04, 49.36, 53.59, 48.61, 53.91, 0.0, 0.0, 0.0, 0.0, 78.55, 54.04, 0.0, 37.26, 38.83, 49.87, 71.57, 0.0], "audiomae_on_audioset": [[["animal", 21.29], ["dog", 17.32], ["domestic animals, pets", 13.82]], null, [["music", 40.51], ["theremin", 14.33], ["speech", 6.61]], null, null, null, [["whale vocalization", 54.29], ["speech", 17.57], ["theremin", 12.45]], [["whale vocalization", 36.16], ["music", 18.08], ["theremin", 17.91]], [["music", 54.86], ["theremin", 6.99], ["speech", 3.61]], null, [["music", 45.77], ["whale vocalization", 10.86], ["speech", 10.2]], null, null, null, null, null, null, null, null, [["fly, housefly", 15.88], ["livestock, farm animals, working animals", 15.25], ["bee, wasp, etc.", 12.85]], [["hum", 31.73], ["speech", 15.17], ["mains hum", 6.35]], [["livestock, farm animals, working animals", 33.79], ["animal", 26.09], ["cattle, bovinae", 7.88]], null, null], "duration": [10.77, -0.26, 4.98, 3.82, 4.76, 1.25, 6.49, 2.05, 10.35, 4.44, 9.42, 23.73, 1.34, 1.82, 1.82, 0.71, 3.34, 4.88, 0.92, 2.31, 2.15, 9.49, 8.4, 0.59]} \ No newline at end of file diff --git a/annotations_filtered/mZwKEa09xTc_filtered.json b/annotations_filtered/mZwKEa09xTc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e64021c39d57fb17e3027f10a6080203740f97b --- /dev/null +++ b/annotations_filtered/mZwKEa09xTc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 52.64], [56.0, 56.47], [72.0, 73.84], [75.0, 75.42], [75.0, 77.73], [78.0, 79.03], [86.0, 87.15], [95.0, 95.96], [102.0, 102.81], [109.0, 109.48], [117.0, 117.09], [119.0, 119.48], [120.0, 121.41], [122.0, 124.17], [125.0, 126.64]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [34.84, 0.0, 0.0, 0.0, 39.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.55, 0.0], "audiomae_on_audioset": [[["music", 83.44], ["thunk", 2.85], ["boing", 2.13]], null, null, null, [["throbbing", 24.07], ["hum", 18.73], ["speech", 15.9]], null, null, null, null, null, null, null, null, null, null], "duration": [11.64, 0.47, 1.84, 0.42, 2.73, 1.03, 1.15, 0.96, 0.81, 0.48, 0.09, 0.48, 1.41, 2.17, 1.64]} \ No newline at end of file diff --git a/annotations_filtered/mZzkE03B64o_filtered.json b/annotations_filtered/mZzkE03B64o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..57e0d2c9f2c552f80df6e77da6995295221200ca --- /dev/null +++ b/annotations_filtered/mZzkE03B64o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.8], [16.0, 17.49], [22.0, 23.72], [25.0, 26.81], [32.0, 34.03], [37.0, 39.16], [41.0, 42.63], [51.0, 63.21], [64.0, 108.94], [113.0, 123.16]], "keep_status": [false, false, false, false, true, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 38.7, 40.17, 0.0, 53.34, 0.0, 35.26], "audiomae_on_audioset": [null, null, null, null, [["music", 19.82], ["crushing", 11.14], ["hands", 8.06]], [["effects unit", 6.86], ["noise", 4.51], ["music", 4.3]], null, null, null, [["music", 15.24], ["effects unit", 11.4], ["sound effect", 5.85]]], "duration": [0.8, 1.49, 1.72, 1.81, 2.03, 2.16, 1.63, 12.21, 44.94, 10.16]} \ No newline at end of file diff --git a/annotations_filtered/m_7Bm1gyq2c_filtered.json b/annotations_filtered/m_7Bm1gyq2c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..987b6160def6e52890d0a7209ac3bf95ffe8b9fd --- /dev/null +++ b/annotations_filtered/m_7Bm1gyq2c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.75], [15.0, 15.89], [24.0, 24.31], [50.0, 50.09], [52.0, 52.39], [59.0, 61.94], [65.0, 65.45], [70.0, 71.74], [72.0, 73.57], [75.0, 77.25], [78.0, 80.37], [84.0, 83.83], [85.0, 85.29], [93.0, 93.66], [98.0, 102.19], [105.0, 106.35], [108.0, 111.05], [115.0, 115.37], [129.0, 130.99], [132.0, 131.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 98.99, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.75, 0.89, 0.31, 0.09, 0.39, 2.94, 0.45, 1.74, 1.57, 2.25, 2.37, -0.17, 0.29, 0.66, 4.19, 1.35, 3.05, 0.37, 1.99, -0.27]} \ No newline at end of file diff --git a/annotations_filtered/m_C2cbqPkx0_filtered.json b/annotations_filtered/m_C2cbqPkx0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dabc50d37ccdd65cd9088696fe98c0fcf2004d59 --- /dev/null +++ b/annotations_filtered/m_C2cbqPkx0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.05], [10.0, 11.06], [14.0, 14.93], [18.0, 18.05], [19.0, 20.55], [21.0, 21.73], [23.0, 24.04], [26.0, 25.76], [27.0, 31.18], [32.0, 33.61], [34.0, 37.17], [39.0, 41.61], [43.0, 44.95], [47.0, 48.74], [54.0, 54.45], [55.0, 56.74], [58.0, 59.32], [60.0, 61.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.27, 0.0, 99.98, 97.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.05, 1.06, 0.93, 0.05, 1.55, 0.73, 1.04, -0.24, 4.18, 1.61, 3.17, 2.61, 1.95, 1.74, 0.45, 1.74, 1.32, 1.38]} \ No newline at end of file diff --git a/annotations_filtered/m_PeQCPq8QA_filtered.json b/annotations_filtered/m_PeQCPq8QA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7c090e768d382b73043eb5ff1366949801ca814e --- /dev/null +++ b/annotations_filtered/m_PeQCPq8QA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.62], [5.0, 5.7], [6.0, 8.68], [16.0, 58.82], [61.0, 61.16], [71.0, 71.44], [73.0, 72.99], [74.0, 128.49], [132.0, 144.12], [145.0, 145.98], [147.0, 150.18]], "keep_status": [false, false, true, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 32.4, 0.0, 0.0, 0.0, 0.0, 0.0, 35.19, 0.0, 35.09], "audiomae_on_audioset": [null, null, [["music", 55.03], ["speech", 7.69], ["synthesizer", 5.26]], null, null, null, null, null, [["livestock, farm animals, working animals", 15.64], ["vehicle", 10.27], ["fly, housefly", 6.08]], null, [["whale vocalization", 11.47], ["gurgling", 4.54], ["speech", 4.07]]], "duration": [0.62, 0.7, 2.68, 42.82, 0.16, 0.44, -0.01, 54.49, 12.12, 0.98, 3.18]} \ No newline at end of file diff --git a/annotations_filtered/ma7zprvD7UA_filtered.json b/annotations_filtered/ma7zprvD7UA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a55f1fa252a37ed0126bf1b16e11c1be2316063a --- /dev/null +++ b/annotations_filtered/ma7zprvD7UA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[70.0, 108.11], [112.0, 113.09], [115.0, 115.79], [123.0, 124.68], [129.0, 131.5], [132.0, 155.85], [157.0, 166.51]], "keep_status": [false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.33, 29.66, 30.07], "audiomae_on_audioset": [null, null, null, null, [["music", 43.39], ["speech", 13.54], ["hum", 6.33]], [["music", 42.36], ["crowd", 14.93], ["electronic music", 7.86]], [["music", 51.84], ["speech", 15.12], ["civil defense siren", 3.18]]], "duration": [38.11, 1.09, 0.79, 1.68, 2.5, 23.85, 9.51]} \ No newline at end of file diff --git a/annotations_filtered/ma_XNn1bwOM_filtered.json b/annotations_filtered/ma_XNn1bwOM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d10bba3a658eec3f3ca9ddaf767f0245e59a71c0 --- /dev/null +++ b/annotations_filtered/ma_XNn1bwOM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 12.8], [18.0, 21.51], [23.0, 22.91], [27.0, 30.86], [32.0, 32.36], [38.0, 71.58], [75.0, 99.5], [104.0, 105.51]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 55.67, 0.0, 67.38, 0.0, 0.0, 99.99, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [-0.2, 3.51, -0.09, 3.86, 0.36, 33.58, 24.5, 1.51]} \ No newline at end of file diff --git a/annotations_filtered/mb2bzOdITdU_filtered.json b/annotations_filtered/mb2bzOdITdU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af2d10fe51900b3c6aa2040fb7ebde1b64835716 --- /dev/null +++ b/annotations_filtered/mb2bzOdITdU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.51], [18.0, 27.46], [30.0, 83.66], [84.0, 92.8], [94.0, 101.82], [103.0, 103.64], [107.0, 110.17], [111.0, 112.9], [116.0, 119.01]], "keep_status": [false, false, false, false, false, false, true, false, false], "silence_prob": [58.38, 34.21, 0.0, 57.25, 59.42, 0.0, 37.74, 0.0, 67.89], "audiomae_on_audioset": [null, [["music", 62.93], ["thunk", 6.55], ["animal", 3.48]], null, null, null, null, [["horse", 36.93], ["neigh, whinny", 18.04], ["animal", 10.73]], null, null], "duration": [2.51, 9.46, 53.66, 8.8, 7.82, 0.64, 3.17, 1.9, 3.01]} \ No newline at end of file diff --git a/annotations_filtered/mb63Ds-XWQE_filtered.json b/annotations_filtered/mb63Ds-XWQE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7472792d599998be34169db3ecb9591648b372f1 --- /dev/null +++ b/annotations_filtered/mb63Ds-XWQE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 27.9], [30.0, 60.37], [62.0, 63.71], [66.0, 119.33], [123.0, 126.5]], "keep_status": [true, false, false, false, true], "silence_prob": [34.15, 0.0, 0.0, 0.0, 30.99], "audiomae_on_audioset": [[["music", 35.23], ["hum", 22.65], ["mains hum", 10.94]], null, null, null, [["music", 59.8], ["synthesizer", 5.53], ["keyboard (musical)", 4.57]]], "duration": [22.9, 30.37, 1.71, 53.33, 3.5]} \ No newline at end of file diff --git a/annotations_filtered/mbBhikLj86Y_filtered.json b/annotations_filtered/mbBhikLj86Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5cd4800145edd95ca4ba6a3f0c37b57b4b32c6c7 --- /dev/null +++ b/annotations_filtered/mbBhikLj86Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 17.27], [19.0, 18.74], [21.0, 21.95], [23.0, 26.0], [28.0, 32.93], [34.0, 42.38], [45.0, 45.79], [47.0, 55.46], [57.0, 58.36], [59.0, 63.27], [64.0, 64.99], [65.0, 72.55], [87.0, 89.04], [92.0, 92.64], [95.0, 96.25], [97.0, 97.09], [97.0, 97.44], [97.0, 99.17], [102.0, 102.07], [103.0, 103.2], [108.0, 108.24], [110.0, 109.98], [115.0, 117.85], [119.0, 119.23]], "keep_status": [true, false, false, true, false, false, false, true, false, true, false, false, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [32.14, 0.0, 0.0, 32.61, 31.93, 31.91, 0.0, 44.26, 0.0, 42.96, 0.0, 34.04, 33.38, 0.0, 0.0, 0.0, 0.0, 32.28, 0.0, 0.0, 0.0, 0.0, 36.08, 0.0], "audiomae_on_audioset": [[["music", 48.58], ["cello", 5.66], ["musical instrument", 5.62]], null, null, [["music", 43.23], ["cello", 10.14], ["bowed string instrument", 5.64]], [["music", 65.69], ["cello", 2.99], ["musical instrument", 2.92]], [["speech", 55.6], ["fart", 19.44], ["whack, thwack", 2.96]], null, [["music", 29.57], ["animal", 10.31], ["frog", 10.23]], null, [["music", 45.6], ["chime", 15.15], ["marimba, xylophone", 4.57]], null, [["speech", 83.0], ["telephone", 1.94], ["fart", 1.85]], [["radio", 7.7], ["telephone", 6.34], ["boing", 6.08]], null, null, null, null, [["speech", 42.67], ["music", 40.63], ["inside, small room", 2.03]], null, null, null, null, [["music", 28.78], ["cello", 14.73], ["musical instrument", 11.59]], null], "duration": [2.27, -0.26, 0.95, 3.0, 4.93, 8.38, 0.79, 8.46, 1.36, 4.27, 0.99, 7.55, 2.04, 0.64, 1.25, 0.09, 0.44, 2.17, 0.07, 0.2, 0.24, -0.02, 2.85, 0.23]} \ No newline at end of file diff --git a/annotations_filtered/mbFx0CbaIlY_filtered.json b/annotations_filtered/mbFx0CbaIlY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef610142f8415d82f423b99f664cdbb27b46ecd1 --- /dev/null +++ b/annotations_filtered/mbFx0CbaIlY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.37], [13.0, 30.32], [33.0, 33.91], [34.0, 34.33], [35.0, 35.5], [37.0, 37.44], [38.0, 39.85], [41.0, 41.98], [42.0, 44.2], [45.0, 46.26], [47.0, 47.38], [48.0, 49.76], [50.0, 53.5], [54.0, 57.42], [63.0, 64.69], [65.0, 68.71], [69.0, 69.35], [71.0, 73.14], [75.0, 75.22], [76.0, 76.22], [78.0, 78.14], [93.0, 92.96], [96.0, 96.04], [99.0, 102.12], [111.0, 112.9], [124.0, 126.37], [127.0, 127.67], [128.0, 128.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [59.07, 76.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.59, 0.0, 0.0, 0.0, 93.76, 72.75, 0.0, 43.58, 0.0, 74.6, 0.0, 0.0, 0.0, 0.0, 0.0, 91.3, 0.0, 50.97, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 53.79], ["boing", 4.25], ["speech", 4.17]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.37, 17.32, 0.91, 0.33, 0.5, 0.44, 1.85, 0.98, 2.2, 1.26, 0.38, 1.76, 3.5, 3.42, 1.69, 3.71, 0.35, 2.14, 0.22, 0.22, 0.14, -0.04, 0.04, 3.12, 1.9, 2.37, 0.67, 0.71]} \ No newline at end of file diff --git a/annotations_filtered/mbKEarx9CCs_filtered.json b/annotations_filtered/mbKEarx9CCs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a6a93659135d9521f1067d420df8cd2d52ea5549 --- /dev/null +++ b/annotations_filtered/mbKEarx9CCs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[66.0, 68.88], [71.0, 72.87], [76.0, 77.38], [80.0, 81.55], [83.0, 82.9], [86.0, 87.84], [89.0, 103.72], [105.0, 105.22], [106.0, 105.73], [107.0, 109.0], [110.0, 111.77], [113.0, 115.13], [116.0, 133.0], [135.0, 140.27], [140.0, 141.15], [142.0, 142.86], [145.0, 144.78]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false], "silence_prob": [43.45, 0.0, 0.0, 0.0, 0.0, 0.0, 32.67, 0.0, 0.0, 40.92, 0.0, 38.1, 33.45, 31.46, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 42.01], ["mains hum", 17.53], ["throbbing", 7.26]], null, null, null, null, null, [["music", 31.45], ["hum", 29.07], ["mains hum", 21.63]], null, null, [["music", 57.97], ["theremin", 26.93], ["didgeridoo", 1.34]], null, [["music", 24.86], ["hum", 14.52], ["throbbing", 10.6]], [["music", 41.9], ["speech", 6.53], ["mains hum", 5.3]], [["music", 51.93], ["hum", 12.25], ["throbbing", 9.77]], null, null, null], "duration": [2.88, 1.87, 1.38, 1.55, -0.1, 1.84, 14.72, 0.22, -0.27, 2.0, 1.77, 2.13, 17.0, 5.27, 1.15, 0.86, -0.22]} \ No newline at end of file diff --git a/annotations_filtered/mbKiHp_ljJY_filtered.json b/annotations_filtered/mbKiHp_ljJY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cff073438e3b28456cfb864d2e30172fe3dcde04 --- /dev/null +++ b/annotations_filtered/mbKiHp_ljJY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 14.49], [15.0, 19.57], [21.0, 25.27], [27.0, 34.67], [36.0, 36.98], [41.0, 41.76], [44.0, 44.44], [48.0, 49.06], [50.0, 50.57], [53.0, 54.46]], "keep_status": [true, false, false, false, false, false, false, false, false, false], "silence_prob": [38.83, 63.1, 66.88, 50.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 44.24], ["speech", 16.54], ["effects unit", 4.65]], null, null, null, null, null, null, null, null, null], "duration": [9.49, 4.57, 4.27, 7.67, 0.98, 0.76, 0.44, 1.06, 0.57, 1.46]} \ No newline at end of file diff --git a/annotations_filtered/mbPEuV3NJIg_filtered.json b/annotations_filtered/mbPEuV3NJIg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..81b8b3ff610ba21e13757163cce445c4681a418f --- /dev/null +++ b/annotations_filtered/mbPEuV3NJIg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.59], [8.0, 9.34], [11.0, 11.92], [14.0, 13.78], [27.0, 27.28], [36.0, 36.51], [38.0, 38.96], [46.0, 47.09], [49.0, 49.5], [54.0, 54.06], [57.0, 58.38], [59.0, 58.68], [59.0, 58.72], [59.0, 58.92], [59.0, 59.02], [59.0, 59.05], [59.0, 59.09], [59.0, 59.19], [59.0, 59.39], [59.0, 65.26], [70.0, 75.09], [80.0, 101.07], [103.0, 105.16], [108.0, 110.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.14, 33.15, 30.92, 32.37, 37.5], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 67.78], ["boing", 7.99], ["speech", 3.5]], [["music", 27.91], ["speech", 25.29], ["throbbing", 8.41]], [["music", 41.15], ["sidetone", 28.28], ["speech", 20.39]], [["throbbing", 22.32], ["music", 14.33], ["hum", 10.5]], [["cattle, bovinae", 34.28], ["livestock, farm animals, working animals", 13.25], ["moo", 13.25]]], "duration": [1.59, 1.34, 0.92, -0.22, 0.28, 0.51, 0.96, 1.09, 0.5, 0.06, 1.38, -0.32, -0.28, -0.08, 0.02, 0.05, 0.09, 0.19, 0.39, 6.26, 5.09, 21.07, 2.16, 2.98]} \ No newline at end of file diff --git a/annotations_filtered/mbTKo5Ylypw_filtered.json b/annotations_filtered/mbTKo5Ylypw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3dfc6497a2ef148602cf97a727b2037d80cf896f --- /dev/null +++ b/annotations_filtered/mbTKo5Ylypw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.88], [10.0, 10.74], [11.0, 12.65], [18.0, 21.63], [23.0, 23.5], [33.0, 40.71], [44.0, 45.1], [48.0, 48.37], [52.0, 52.02], [61.0, 61.33], [62.0, 62.7], [65.0, 65.58], [70.0, 70.83], [72.0, 73.84], [74.0, 76.77], [78.0, 79.62], [81.0, 88.89], [90.0, 92.08], [93.0, 92.82], [93.0, 95.13], [97.0, 98.9], [102.0, 102.84], [103.0, 104.04], [109.0, 109.41], [110.0, 111.13], [113.0, 115.26], [116.0, 121.37], [123.0, 125.17], [126.0, 125.93], [127.0, 128.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [99.95, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 43.51, 96.17, 0.0, 91.3, 0.0, 0.0, 0.0, 0.0, 0.0, 43.79, 44.63, 68.93, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["explosion", 19.35], ["hum", 12.16], ["eruption", 8.86]], null, null, null, null, null, null, null, null, [["speech", 89.69], ["dial tone", 2.54], ["telephone", 1.52]], [["speech", 31.4], ["stomach rumble", 10.12], ["hum", 8.68]], null, null, null], "duration": [2.88, 0.74, 1.65, 3.63, 0.5, 7.71, 1.1, 0.37, 0.02, 0.33, 0.7, 0.58, 0.83, 1.84, 2.77, 1.62, 7.89, 2.08, -0.18, 2.13, 1.9, 0.84, 1.04, 0.41, 1.13, 2.26, 5.37, 2.17, -0.07, 1.6]} \ No newline at end of file diff --git a/annotations_filtered/mbWtLBLt1ro_filtered.json b/annotations_filtered/mbWtLBLt1ro_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/mbWtLBLt1ro_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/mbkWniWSpR0_filtered.json b/annotations_filtered/mbkWniWSpR0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b9e787908a813ff891ef2578580e44b4b69aad24 --- /dev/null +++ b/annotations_filtered/mbkWniWSpR0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.41], [7.0, 7.16], [9.0, 11.04], [14.0, 17.17], [18.0, 18.74], [28.0, 33.72], [36.0, 41.79], [43.0, 43.12], [44.0, 44.95], [48.0, 47.93], [51.0, 51.49], [53.0, 53.13], [55.0, 55.68], [59.0, 60.02], [63.0, 63.86], [66.0, 66.88], [67.0, 67.91], [70.0, 72.18], [73.0, 74.58], [77.0, 77.53], [81.0, 83.81], [84.0, 89.34], [90.0, 90.24], [91.0, 92.52], [96.0, 95.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [99.52, 0.0, 99.4, 99.85, 0.0, 99.26, 99.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.01, 0.0, 0.0, 31.38, 58.05, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 51.94], ["gunshot, gunfire", 8.12], ["explosion", 7.43]], null, null, null, null], "duration": [3.41, 0.16, 2.04, 3.17, 0.74, 5.72, 5.79, 0.12, 0.95, -0.07, 0.49, 0.13, 0.68, 1.02, 0.86, 0.88, 0.91, 2.18, 1.58, 0.53, 2.81, 5.34, 0.24, 1.52, -0.07]} \ No newline at end of file diff --git a/annotations_filtered/mbzNdI-1iUc_filtered.json b/annotations_filtered/mbzNdI-1iUc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/mbzNdI-1iUc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/mcUWG23hqvw_filtered.json b/annotations_filtered/mcUWG23hqvw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9ca0aefb54fd8b25bc45b2f2f57d1cc844a3402 --- /dev/null +++ b/annotations_filtered/mcUWG23hqvw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.11], [5.0, 5.64], [7.0, 7.55], [8.0, 8.88], [10.0, 9.86], [12.0, 18.54], [21.0, 29.57], [30.0, 31.92], [34.0, 35.46], [38.0, 40.19], [42.0, 43.82], [51.0, 53.03], [54.0, 54.35], [55.0, 55.44], [57.0, 58.99], [60.0, 61.92], [63.0, 70.66], [73.0, 73.52], [75.0, 75.44], [76.0, 88.43], [89.0, 89.56], [90.0, 91.12], [92.0, 92.52], [93.0, 94.17], [99.0, 110.4], [113.0, 113.73], [117.0, 118.29], [127.0, 128.01], [131.0, 131.84], [137.0, 137.96], [138.0, 147.11], [152.0, 152.64], [157.0, 157.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [92.64, 0.0, 0.0, 0.0, 0.0, 80.29, 33.64, 0.0, 0.0, 74.29, 0.0, 72.46, 0.0, 0.0, 0.0, 0.0, 37.91, 0.0, 0.0, 84.62, 0.0, 0.0, 0.0, 0.0, 52.8, 0.0, 0.0, 0.0, 0.0, 0.0, 39.15, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 88.34], ["music", 5.38], ["electric shaver, electric razor", 0.68]], null, null, null, null, null, null, null, null, null, [["speech", 59.11], ["fart", 20.92], ["frog", 4.61]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["animal", 20.08], ["stomach rumble", 11.29], ["speech", 10.52]], null, null], "duration": [2.11, 0.64, 0.55, 0.88, -0.14, 6.54, 8.57, 1.92, 1.46, 2.19, 1.82, 2.03, 0.35, 0.44, 1.99, 1.92, 7.66, 0.52, 0.44, 12.43, 0.56, 1.12, 0.52, 1.17, 11.4, 0.73, 1.29, 1.01, 0.84, 0.96, 9.11, 0.64, 0.01]} \ No newline at end of file diff --git a/annotations_filtered/mcWrZOrafnA_filtered.json b/annotations_filtered/mcWrZOrafnA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3ff11a4aef3950597aab19a1d520d733535e1644 --- /dev/null +++ b/annotations_filtered/mcWrZOrafnA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.42], [9.0, 12.04], [16.0, 16.88], [17.0, 18.37], [19.0, 20.58], [22.0, 22.22], [26.0, 27.11], [33.0, 34.94], [37.0, 37.91], [41.0, 41.86], [43.0, 43.61], [47.0, 47.24], [49.0, 49.33], [67.0, 68.1], [73.0, 75.03], [84.0, 84.01], [90.0, 93.39], [98.0, 100.84], [103.0, 106.17], [110.0, 110.73], [113.0, 116.68], [129.0, 129.12]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 46.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.1, 0.0, 79.76, 96.66, 92.97, 0.0, 77.36, 0.0], "audiomae_on_audioset": [null, [["throbbing", 22.3], ["music", 12.09], ["speech", 11.26]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.42, 3.04, 0.88, 1.37, 1.58, 0.22, 1.11, 1.94, 0.91, 0.86, 0.61, 0.24, 0.33, 1.1, 2.03, 0.01, 3.39, 2.84, 3.17, 0.73, 3.68, 0.12]} \ No newline at end of file diff --git a/annotations_filtered/mcerWHb94yo_filtered.json b/annotations_filtered/mcerWHb94yo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e2058f7b638e9cb94e6d2bf98fbb7d13b5284ded --- /dev/null +++ b/annotations_filtered/mcerWHb94yo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.22], [7.0, 19.18], [21.0, 23.55], [27.0, 28.36], [31.0, 32.8], [35.0, 42.38], [50.0, 53.47], [56.0, 56.37], [61.0, 70.17], [80.0, 80.65], [83.0, 112.18], [115.0, 116.11], [118.0, 121.91], [125.0, 125.85], [129.0, 141.88], [147.0, 148.47], [150.0, 161.94], [163.0, 227.75]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 71.43, 64.75, 0.0, 0.0, 31.61, 33.33, 0.0, 30.29, 0.0, 29.25, 0.0, 29.51, 0.0, 29.32, 0.0, 28.86, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 45.45], ["guitar", 12.89], ["musical instrument", 8.4]], [["music", 50.73], ["mantra", 17.98], ["chant", 3.14]], null, [["music", 76.43], ["hum", 2.51], ["throbbing", 1.84]], null, [["music", 79.21], ["musical instrument", 6.91], ["carnatic music", 3.91]], null, [["music", 77.27], ["synthesizer", 1.66], ["boing", 1.11]], null, [["music", 83.3], ["synthetic singing", 1.2], ["musical instrument", 0.79]], null, [["music", 46.22], ["didgeridoo", 22.08], ["theremin", 4.95]], null], "duration": [0.22, 12.18, 2.55, 1.36, 1.8, 7.38, 3.47, 0.37, 9.17, 0.65, 29.18, 1.11, 3.91, 0.85, 12.88, 1.47, 11.94, 64.75]} \ No newline at end of file diff --git a/annotations_filtered/mdHpbI8Y7Oo_filtered.json b/annotations_filtered/mdHpbI8Y7Oo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84b89781423593b1e40347b14505f15e725255c9 --- /dev/null +++ b/annotations_filtered/mdHpbI8Y7Oo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.21], [2.0, 2.4], [3.0, 3.25], [5.0, 5.27], [6.0, 6.67], [8.0, 8.04], [12.0, 14.1], [18.0, 20.41], [24.0, 26.6], [28.0, 41.42], [44.0, 45.18], [49.0, 49.37], [50.0, 50.73], [53.0, 53.64], [63.0, 64.4], [70.0, 70.71], [77.0, 76.72], [79.0, 80.22], [84.0, 84.55], [103.0, 106.34], [108.0, 109.61], [112.0, 112.35], [114.0, 113.98], [116.0, 116.23], [118.0, 118.56], [120.0, 120.82], [123.0, 123.01], [124.0, 124.28], [129.0, 129.24], [132.0, 132.97], [137.0, 150.13], [154.0, 159.68], [161.0, 164.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 100.0, 99.96, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.71, 42.76, 36.62], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 72.26], ["music", 6.54], ["busy signal", 5.83]], [["animal", 33.37], ["speech", 25.95], ["sheep", 8.41]], [["vehicle", 25.84], ["fly, housefly", 6.45], ["car", 6.05]]], "duration": [0.21, 0.4, 0.25, 0.27, 0.67, 0.04, 2.1, 2.41, 2.6, 13.42, 1.18, 0.37, 0.73, 0.64, 1.4, 0.71, -0.28, 1.22, 0.55, 3.34, 1.61, 0.35, -0.02, 0.23, 0.56, 0.82, 0.01, 0.28, 0.24, 0.97, 13.13, 5.68, 3.96]} \ No newline at end of file diff --git a/annotations_filtered/mdcXOlUMfq0_filtered.json b/annotations_filtered/mdcXOlUMfq0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..160ea2e98bf9b78268024be3de18e35570c8c3eb --- /dev/null +++ b/annotations_filtered/mdcXOlUMfq0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.8], [6.0, 9.39], [18.0, 20.46], [23.0, 25.24], [28.0, 29.56], [33.0, 34.64], [43.0, 44.25], [54.0, 60.34], [61.0, 62.19], [62.0, 70.92], [72.0, 72.93], [78.0, 80.23], [81.0, 82.92], [85.0, 86.66], [90.0, 90.76], [93.0, 94.29], [95.0, 96.63], [98.0, 100.68], [103.0, 104.6], [105.0, 106.83], [109.0, 110.05], [113.0, 114.32], [120.0, 122.93], [127.0, 129.22]], "keep_status": [true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [39.07, 40.92, 47.58, 45.24, 0.0, 0.0, 0.0, 34.19, 0.0, 35.03, 0.0, 57.48, 0.0, 0.0, 0.0, 0.0, 0.0, 42.65, 0.0, 0.0, 0.0, 0.0, 66.76, 46.15], "audiomae_on_audioset": [[["noise", 20.77], ["grunt", 10.41], ["music", 10.18]], [["music", 38.6], ["speech", 6.22], ["hum", 5.46]], [["music", 12.42], ["whale vocalization", 8.54], ["theremin", 5.91]], [["music", 11.33], ["hum", 5.97], ["cattle, bovinae", 4.81]], null, null, null, [["speech", 44.05], ["music", 15.47], ["hum", 13.59]], null, [["speech", 43.59], ["noise", 25.0], ["siren", 5.88]], null, null, null, null, null, null, null, [["hum", 23.86], ["mains hum", 6.9], ["speech", 6.18]], null, null, null, null, null, [["hum", 52.87], ["mains hum", 17.33], ["throbbing", 12.15]]], "duration": [3.8, 3.39, 2.46, 2.24, 1.56, 1.64, 1.25, 6.34, 1.19, 8.92, 0.93, 2.23, 1.92, 1.66, 0.76, 1.29, 1.63, 2.68, 1.6, 1.83, 1.05, 1.32, 2.93, 2.22]} \ No newline at end of file diff --git a/annotations_filtered/mdgbtrpVBm8_filtered.json b/annotations_filtered/mdgbtrpVBm8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..63d40a3669ff7466e170a904db02ad6ab704a04b --- /dev/null +++ b/annotations_filtered/mdgbtrpVBm8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.55], [12.0, 13.69], [15.0, 15.67], [17.0, 18.52], [20.0, 22.59], [23.0, 22.91], [26.0, 26.28], [30.0, 30.0], [31.0, 31.6], [38.0, 41.71], [43.0, 44.25], [45.0, 46.84], [47.0, 48.63], [50.0, 50.52], [52.0, 52.17], [53.0, 54.18], [56.0, 56.12], [58.0, 58.48], [59.0, 59.68], [60.0, 66.02], [74.0, 77.8], [79.0, 82.19], [85.0, 86.49], [88.0, 88.87], [90.0, 92.58], [94.0, 95.44], [99.0, 99.62], [100.0, 103.27], [105.0, 106.35], [107.0, 106.89], [107.0, 108.4], [111.0, 112.33], [115.0, 115.1], [120.0, 120.16], [124.0, 125.19]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [44.57, 0.0, 0.0, 0.0, 50.46, 0.0, 0.0, 0.0, 0.0, 86.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.9, 98.99, 38.25, 0.0, 0.0, 100.0, 0.0, 0.0, 94.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 15.97], ["livestock, farm animals, working animals", 15.3], ["hum", 8.46]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 48.28], ["vehicle", 5.47], ["door", 5.27]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.55, 1.69, 0.67, 1.52, 2.59, -0.09, 0.28, 0.0, 0.6, 3.71, 1.25, 1.84, 1.63, 0.52, 0.17, 1.18, 0.12, 0.48, 0.68, 6.02, 3.8, 3.19, 1.49, 0.87, 2.58, 1.44, 0.62, 3.27, 1.35, -0.11, 1.4, 1.33, 0.1, 0.16, 1.19]} \ No newline at end of file diff --git a/annotations_filtered/mdsLJ_ciPHI_filtered.json b/annotations_filtered/mdsLJ_ciPHI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..79c72e4a5b7edc5498e87c0a45cd68751a1289f2 --- /dev/null +++ b/annotations_filtered/mdsLJ_ciPHI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.54], [14.0, 18.89], [19.0, 36.78], [61.0, 61.35], [62.0, 64.56], [66.0, 67.66], [75.0, 75.59], [79.0, 81.97], [83.0, 84.27]], "keep_status": [false, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 50.41, 32.54, 0.0, 34.38, 0.0, 0.0, 38.7, 0.0], "audiomae_on_audioset": [null, null, [["music", 66.95], ["speech", 5.39], ["whale vocalization", 4.42]], null, [["moo", 26.39], ["cattle, bovinae", 22.55], ["livestock, farm animals, working animals", 9.18]], null, null, [["music", 23.55], ["ambient music", 18.11], ["gong", 15.06]], null], "duration": [1.54, 4.89, 17.78, 0.35, 2.56, 1.66, 0.59, 2.97, 1.27]} \ No newline at end of file diff --git a/annotations_filtered/mdwLxOK7xLc_filtered.json b/annotations_filtered/mdwLxOK7xLc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95edc81a927be975f8cc914e424d0129f3fe534d --- /dev/null +++ b/annotations_filtered/mdwLxOK7xLc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 34.72], [37.0, 38.7], [48.0, 57.96], [70.0, 70.39], [81.0, 87.76], [89.0, 94.09], [100.0, 107.18], [126.0, 126.74]], "keep_status": [false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 32.09, 0.0, 31.11, 32.15, 31.14, 0.0], "audiomae_on_audioset": [null, null, [["speech", 56.01], ["music", 22.6], ["animal", 2.65]], null, [["music", 65.56], ["throbbing", 5.87], ["hum", 3.7]], [["speech", 43.34], ["boing", 8.38], ["vehicle", 6.13]], [["music", 38.04], ["speech", 24.32], ["boing", 10.63]], null], "duration": [0.72, 1.7, 9.96, 0.39, 6.76, 5.09, 7.18, 0.74]} \ No newline at end of file diff --git a/annotations_filtered/me7nuXZfXVM_filtered.json b/annotations_filtered/me7nuXZfXVM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dd9e797148309d778291dc50987392ad5966e69f --- /dev/null +++ b/annotations_filtered/me7nuXZfXVM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.06], [9.0, 13.66], [16.0, 33.3], [36.0, 52.03], [53.0, 54.23], [56.0, 65.45], [66.0, 65.85], [66.0, 65.89], [68.0, 79.66]], "keep_status": [false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 31.09, 31.16, 30.53, 0.0, 30.35, 0.0, 0.0, 30.38], "audiomae_on_audioset": [null, [["speech", 47.12], ["music", 37.96], ["throbbing", 2.34]], [["music", 71.77], ["speech", 4.58], ["musical instrument", 2.88]], [["music", 23.06], ["didgeridoo", 16.32], ["fart", 9.84]], null, [["speech", 73.24], ["fart", 10.88], ["outside, rural or natural", 1.7]], null, null, [["speech", 67.93], ["fart", 15.61], ["animal", 4.29]]], "duration": [1.06, 4.66, 17.3, 16.03, 1.23, 9.45, -0.15, -0.11, 11.66]} \ No newline at end of file diff --git a/annotations_filtered/me9Vweatkto_filtered.json b/annotations_filtered/me9Vweatkto_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0b7979edba3e93a8e250e636ee3f4f3a2571176d --- /dev/null +++ b/annotations_filtered/me9Vweatkto_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.13], [10.0, 13.69], [16.0, 17.64], [21.0, 21.09], [23.0, 23.63], [25.0, 28.71], [31.0, 44.39], [46.0, 90.31], [93.0, 121.02], [130.0, 131.09], [134.0, 138.55], [142.0, 142.84], [144.0, 145.03]], "keep_status": [false, false, false, false, false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 54.56, 0.0, 0.0, 0.0, 30.25, 28.44, 0.0, 28.68, 0.0, 29.49, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["didgeridoo", 46.2], ["music", 15.03], ["theremin", 5.55]], [["music", 51.46], ["musical instrument", 27.99], ["didgeridoo", 7.1]], null, [["speech", 28.84], ["vehicle", 21.37], ["music", 18.7]], null, [["music", 71.0], ["sound effect", 3.11], ["musical instrument", 2.23]], null, null], "duration": [0.13, 3.69, 1.64, 0.09, 0.63, 3.71, 13.39, 44.31, 28.02, 1.09, 4.55, 0.84, 1.03]} \ No newline at end of file diff --git a/annotations_filtered/meEN8tfT7b4_filtered.json b/annotations_filtered/meEN8tfT7b4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..34e5a68342c46e8d39dd0f1afdf1a9ac6344898b --- /dev/null +++ b/annotations_filtered/meEN8tfT7b4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 21.27], [24.0, 24.54], [43.0, 42.63], [49.0, 49.52], [51.0, 52.07], [54.0, 54.72], [61.0, 61.53], [67.0, 68.0], [70.0, 70.5], [72.0, 74.12], [81.0, 82.12], [83.0, 84.32], [86.0, 86.78], [88.0, 89.5], [94.0, 94.22], [99.0, 100.74], [102.0, 103.05], [106.0, 107.05]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [39.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 39.66], ["grunt", 6.45], ["music", 4.34]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.27, 0.54, -0.37, 0.52, 1.07, 0.72, 0.53, 1.0, 0.5, 2.12, 1.12, 1.32, 0.78, 1.5, 0.22, 1.74, 1.05, 1.05]} \ No newline at end of file diff --git a/annotations_filtered/meSIVfOyerg_filtered.json b/annotations_filtered/meSIVfOyerg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70c18c0c0fd13c0226f50ebd185cef99c739f8f8 --- /dev/null +++ b/annotations_filtered/meSIVfOyerg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.27], [7.0, 7.57], [10.0, 11.1], [26.0, 26.64], [27.0, 27.82], [28.0, 28.76], [30.0, 32.88], [33.0, 34.3], [35.0, 35.8], [42.0, 43.11], [44.0, 49.3], [60.0, 60.69], [61.0, 62.13], [63.0, 63.91], [67.0, 68.07], [74.0, 74.36], [84.0, 84.99], [88.0, 90.8], [92.0, 94.29]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.18, 0.0, 0.0, 0.0, 35.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.2, 42.51], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 11.07], ["hum", 8.49], ["mains hum", 7.66]], null, null, null, [["speech", 73.64], ["fly, housefly", 4.31], ["fart", 4.02]], null, null, null, null, null, null, null, [["fly, housefly", 27.16], ["bee, wasp, etc.", 15.97], ["insect", 15.63]]], "duration": [0.27, 0.57, 1.1, 0.64, 0.82, 0.76, 2.88, 1.3, 0.8, 1.11, 5.3, 0.69, 1.13, 0.91, 1.07, 0.36, 0.99, 2.8, 2.29]} \ No newline at end of file diff --git a/annotations_filtered/meZXqa_CE_o_filtered.json b/annotations_filtered/meZXqa_CE_o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dde564cef1aa224712c7b9a21022ca53af329d22 --- /dev/null +++ b/annotations_filtered/meZXqa_CE_o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.13], [2.0, 7.77], [11.0, 15.77], [16.0, 19.6], [22.0, 23.16], [26.0, 35.95], [37.0, 49.62], [52.0, 53.54], [55.0, 58.5], [63.0, 63.41], [64.0, 65.69], [67.0, 68.5], [70.0, 70.61], [72.0, 72.87], [75.0, 76.17], [79.0, 80.69], [81.0, 81.48], [83.0, 83.07], [88.0, 88.86], [92.0, 93.55], [97.0, 97.17], [101.0, 102.64], [105.0, 109.98], [112.0, 112.67]], "keep_status": [false, false, true, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 31.9, 32.58, 36.5, 0.0, 32.52, 47.74, 0.0, 55.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.81, 0.0], "audiomae_on_audioset": [null, [["speech", 59.47], ["sidetone", 8.42], ["vehicle", 5.92]], [["vehicle", 27.12], ["car", 23.36], ["race car, auto racing", 6.62]], [["speech", 32.78], ["hum", 15.64], ["whale vocalization", 6.66]], null, [["music", 32.15], ["speech", 29.22], ["musical instrument", 7.51]], [["music", 67.02], ["synthesizer", 4.71], ["harmonic", 4.58]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.13, 5.77, 4.77, 3.6, 1.16, 9.95, 12.62, 1.54, 3.5, 0.41, 1.69, 1.5, 0.61, 0.87, 1.17, 1.69, 0.48, 0.07, 0.86, 1.55, 0.17, 1.64, 4.98, 0.67]} \ No newline at end of file diff --git a/annotations_filtered/melCNhYmwII_filtered.json b/annotations_filtered/melCNhYmwII_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73ab3386947d69728cfb03df61eba7589f9898b1 --- /dev/null +++ b/annotations_filtered/melCNhYmwII_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.58], [12.0, 13.68], [14.0, 15.74], [17.0, 18.1], [21.0, 21.51], [25.0, 25.76], [26.0, 27.9], [29.0, 29.35], [30.0, 43.19], [44.0, 47.01], [48.0, 49.72], [58.0, 59.71], [60.0, 59.76], [60.0, 88.65], [89.0, 93.45], [96.0, 100.43], [121.0, 120.9]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false], "silence_prob": [51.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.14, 99.97, 0.0, 0.0, 0.0, 86.64, 40.12, 39.17, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["thunk", 24.83], ["electric shaver, electric razor", 8.07], ["whack, thwack", 7.08]], null, null, null, null, null, [["mains hum", 53.27], ["hum", 42.14], ["speech", 0.65]], [["hum", 30.18], ["mains hum", 26.5], ["speech", 12.52]], null], "duration": [2.58, 1.68, 1.74, 1.1, 0.51, 0.76, 1.9, 0.35, 13.19, 3.01, 1.72, 1.71, -0.24, 28.65, 4.45, 4.43, -0.1]} \ No newline at end of file diff --git a/annotations_filtered/mfCwgYR1yS8_filtered.json b/annotations_filtered/mfCwgYR1yS8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8defb0c40839016d1f183b601390b1d6de4acae7 --- /dev/null +++ b/annotations_filtered/mfCwgYR1yS8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[113.0, 117.61]], "keep_status": [false], "silence_prob": [35.72], "audiomae_on_audioset": [[["throbbing", 32.64], ["hum", 28.01], ["music", 19.41]]], "duration": [4.61]} \ No newline at end of file diff --git a/annotations_filtered/mfg2O0A6L4g_filtered.json b/annotations_filtered/mfg2O0A6L4g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..31b4120cbcf748ae886d827a8ec217a9c29bf4fa --- /dev/null +++ b/annotations_filtered/mfg2O0A6L4g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.36], [6.0, 9.63], [16.0, 23.57], [24.0, 26.84], [27.0, 70.46], [72.0, 73.55], [75.0, 78.16], [79.0, 81.9], [84.0, 84.91], [87.0, 89.34], [91.0, 93.09], [94.0, 96.74], [98.0, 98.52], [100.0, 100.72], [102.0, 102.19], [103.0, 104.33], [105.0, 108.85], [110.0, 111.33], [112.0, 114.51], [116.0, 116.48], [120.0, 123.96], [125.0, 126.47]], "keep_status": [false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [69.34, 34.78, 76.53, 91.98, 0.0, 0.0, 46.4, 65.79, 0.0, 71.87, 53.59, 53.04, 0.0, 0.0, 0.0, 0.0, 60.7, 0.0, 62.89, 0.0, 62.89, 0.0], "audiomae_on_audioset": [null, [["throbbing", 22.99], ["hum", 22.72], ["speech", 13.74]], null, null, null, null, [["hum", 9.72], ["fly, housefly", 8.23], ["throbbing", 6.38]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.36, 3.63, 7.57, 2.84, 43.46, 1.55, 3.16, 2.9, 0.91, 2.34, 2.09, 2.74, 0.52, 0.72, 0.19, 1.33, 3.85, 1.33, 2.51, 0.48, 3.96, 1.47]} \ No newline at end of file diff --git a/annotations_filtered/mfkzA9zjRdM_filtered.json b/annotations_filtered/mfkzA9zjRdM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dacd07f70103c38ccb53826ea9d3581cdd6a460a --- /dev/null +++ b/annotations_filtered/mfkzA9zjRdM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 39.58], [40.0, 40.9], [42.0, 42.92], [44.0, 46.52], [47.0, 53.55], [55.0, 61.43], [64.0, 69.45], [76.0, 93.92], [100.0, 100.97], [103.0, 104.19], [105.0, 105.68], [107.0, 112.63], [117.0, 119.69], [121.0, 121.31]], "keep_status": [true, false, false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [30.21, 0.0, 0.0, 49.87, 40.99, 31.7, 30.83, 29.89, 0.0, 0.0, 0.0, 29.64, 37.64, 0.0], "audiomae_on_audioset": [[["music", 60.22], ["synthesizer", 4.24], ["effects unit", 2.87]], null, null, [["music", 47.59], ["synthesizer", 7.15], ["musical instrument", 4.33]], [["music", 37.84], ["speech", 11.83], ["sidetone", 8.77]], [["music", 67.79], ["throbbing", 5.21], ["hum", 4.76]], [["music", 58.62], ["ambient music", 10.52], ["theremin", 6.35]], [["music", 73.15], ["musical instrument", 5.31], ["ambient music", 2.28]], null, null, null, [["music", 59.07], ["musical instrument", 10.44], ["synthesizer", 8.85]], [["speech", 40.68], ["music", 23.51], ["foghorn", 8.48]], null], "duration": [8.58, 0.9, 0.92, 2.52, 6.55, 6.43, 5.45, 17.92, 0.97, 1.19, 0.68, 5.63, 2.69, 0.31]} \ No newline at end of file diff --git a/annotations_filtered/mgSDir-wcGk_filtered.json b/annotations_filtered/mgSDir-wcGk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d0ed739ada0738b7c09df3f1da5a9e01a0dd0480 --- /dev/null +++ b/annotations_filtered/mgSDir-wcGk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.36], [5.0, 5.02], [6.0, 6.79], [9.0, 10.13], [11.0, 11.2], [16.0, 19.89], [27.0, 30.82], [33.0, 33.39], [35.0, 35.4], [37.0, 38.47], [43.0, 43.29], [49.0, 49.69], [53.0, 53.5], [57.0, 60.1], [61.0, 72.94], [73.0, 74.48], [77.0, 77.67], [80.0, 81.46], [82.0, 85.53], [86.0, 86.98], [87.0, 89.92], [90.0, 98.71], [100.0, 103.96], [105.0, 106.24], [106.0, 107.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.85, 99.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.85, 99.91, 0.0, 0.0, 0.0, 96.66, 0.0, 83.34, 99.1, 99.68, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.36, 0.02, 0.79, 1.13, 0.2, 3.89, 3.82, 0.39, 0.4, 1.47, 0.29, 0.69, 0.5, 3.1, 11.94, 1.48, 0.67, 1.46, 3.53, 0.98, 2.92, 8.71, 3.96, 1.24, 1.0]} \ No newline at end of file diff --git a/annotations_filtered/mgSQQjO5pwI_filtered.json b/annotations_filtered/mgSQQjO5pwI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..38987fccdeb9eb437c6ab991b0030d86bc08459e --- /dev/null +++ b/annotations_filtered/mgSQQjO5pwI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.77], [7.0, 7.82], [9.0, 10.86], [13.0, 16.55], [20.0, 20.61], [29.0, 29.86], [32.0, 32.1], [34.0, 34.23], [37.0, 38.97], [39.0, 40.54], [47.0, 47.92], [53.0, 56.25], [57.0, 57.69], [58.0, 59.39], [60.0, 64.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.52, 0.0, 0.0, 99.44], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.77, 0.82, 1.86, 3.55, 0.61, 0.86, 0.1, 0.23, 1.97, 1.54, 0.92, 3.25, 0.69, 1.39, 4.1]} \ No newline at end of file diff --git a/annotations_filtered/mgr2tLYYha4_filtered.json b/annotations_filtered/mgr2tLYYha4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..464d0729ff6e97506887ec69879101ee505ba9c7 --- /dev/null +++ b/annotations_filtered/mgr2tLYYha4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.58], [15.0, 15.55], [18.0, 18.84], [20.0, 20.88], [24.0, 38.72], [39.0, 44.0], [45.0, 46.75], [49.0, 50.95], [51.0, 53.16], [54.0, 56.3], [57.0, 59.41], [60.0, 61.26], [62.0, 75.19], [76.0, 81.53], [82.0, 89.13], [89.0, 92.4], [93.0, 109.48], [110.0, 111.6], [113.0, 113.91]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 58.64, 53.84, 0.0, 0.0, 40.55, 74.92, 35.0, 0.0, 36.26, 34.21, 34.83, 34.8, 32.23, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 18.69], ["mains hum", 15.65], ["didgeridoo", 13.08]], null, [["fly, housefly", 42.9], ["insect", 20.91], ["mosquito", 9.69]], null, [["music", 74.03], ["ambient music", 6.4], ["theremin", 4.13]], [["music", 71.27], ["ambient music", 6.3], ["synthesizer", 3.71]], [["music", 34.97], ["theremin", 16.81], ["hum", 7.76]], [["music", 41.81], ["ambient music", 14.06], ["didgeridoo", 11.35]], [["music", 54.33], ["ambient music", 14.02], ["didgeridoo", 6.91]], null, null], "duration": [0.58, 0.55, 0.84, 0.88, 14.72, 5.0, 1.75, 1.95, 2.16, 2.3, 2.41, 1.26, 13.19, 5.53, 7.13, 3.4, 16.48, 1.6, 0.91]} \ No newline at end of file diff --git a/annotations_filtered/mgyypjEpK6U_filtered.json b/annotations_filtered/mgyypjEpK6U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f97464b22bbb99d4df0ca7c7783a1411fc321747 --- /dev/null +++ b/annotations_filtered/mgyypjEpK6U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.83], [2.0, 2.76], [4.0, 4.5], [7.0, 8.92], [10.0, 10.45], [18.0, 18.86], [21.0, 21.37], [22.0, 22.96], [25.0, 26.55], [33.0, 33.67], [35.0, 35.14], [38.0, 37.99], [39.0, 39.66], [46.0, 47.98], [48.0, 50.45], [51.0, 52.54], [55.0, 55.98], [57.0, 56.86], [57.0, 57.97], [59.0, 60.03], [73.0, 73.67], [74.0, 75.32], [76.0, 76.49], [78.0, 79.12], [80.0, 80.91], [85.0, 84.84], [94.0, 94.63], [99.0, 99.54], [102.0, 101.66], [110.0, 111.21], [112.0, 114.57], [115.0, 115.86], [119.0, 119.57], [123.0, 124.11], [130.0, 130.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.07, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.83, 0.76, 0.5, 1.92, 0.45, 0.86, 0.37, 0.96, 1.55, 0.67, 0.14, -0.01, 0.66, 1.98, 2.45, 1.54, 0.98, -0.14, 0.97, 1.03, 0.67, 1.32, 0.49, 1.12, 0.91, -0.16, 0.63, 0.54, -0.34, 1.21, 2.57, 0.86, 0.57, 1.11, 0.18]} \ No newline at end of file diff --git a/annotations_filtered/mh7fUlkkX68_filtered.json b/annotations_filtered/mh7fUlkkX68_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b454b4d8c90f42a73d807943c84b2226514338f6 --- /dev/null +++ b/annotations_filtered/mh7fUlkkX68_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.04], [20.0, 21.39], [25.0, 25.3], [25.0, 25.34], [25.0, 26.08], [28.0, 28.44], [36.0, 36.51], [51.0, 51.46], [57.0, 57.81], [59.0, 59.39], [64.0, 64.44], [66.0, 65.84], [73.0, 73.8], [80.0, 80.18], [99.0, 98.63], [105.0, 105.24], [109.0, 109.54], [114.0, 114.99], [117.0, 117.66], [120.0, 121.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.04, 1.39, 0.3, 0.34, 1.08, 0.44, 0.51, 0.46, 0.81, 0.39, 0.44, -0.16, 0.8, 0.18, -0.37, 0.24, 0.54, 0.99, 0.66, 1.74]} \ No newline at end of file diff --git a/annotations_filtered/mhCiFB07I2w_filtered.json b/annotations_filtered/mhCiFB07I2w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..407b536a6bad68edcb38194404e8ff8f2557386c --- /dev/null +++ b/annotations_filtered/mhCiFB07I2w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 37.52], [40.0, 41.49], [42.0, 53.06], [56.0, 75.54], [81.0, 81.04], [83.0, 83.62], [85.0, 85.53], [87.0, 114.47], [119.0, 119.67], [125.0, 129.98], [130.0, 131.26], [134.0, 135.53]], "keep_status": [false, false, true, false, false, false, false, true, false, false, false, false], "silence_prob": [52.05, 0.0, 32.61, 34.64, 0.0, 0.0, 0.0, 31.69, 0.0, 30.68, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 12.17], ["police car (siren)", 7.74], ["emergency vehicle", 7.48]], [["hum", 35.96], ["mains hum", 21.98], ["throbbing", 19.87]], null, null, null, [["speech", 49.47], ["noise", 11.07], ["sidetone", 5.59]], null, [["explosion", 43.13], ["speech", 25.68], ["artillery fire", 9.96]], null, null], "duration": [19.52, 1.49, 11.06, 19.54, 0.04, 0.62, 0.53, 27.47, 0.67, 4.98, 1.26, 1.53]} \ No newline at end of file diff --git a/annotations_filtered/mha0N1Cx1Ck_filtered.json b/annotations_filtered/mha0N1Cx1Ck_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..50e608acc48242d71b270c8622fd0c364dc2abee --- /dev/null +++ b/annotations_filtered/mha0N1Cx1Ck_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 23.11], [24.0, 24.65], [28.0, 44.91], [46.0, 52.34], [54.0, 98.85], [100.0, 100.5], [102.0, 102.59], [104.0, 109.98]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [62.47, 0.0, 78.72, 77.87, 0.0, 0.0, 0.0, 76.37], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [5.11, 0.65, 16.91, 6.34, 44.85, 0.5, 0.59, 5.98]} \ No newline at end of file diff --git a/annotations_filtered/mhaxNZs5MGc_filtered.json b/annotations_filtered/mhaxNZs5MGc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..421880a755f85714895ee663ddeccbaffaba0853 --- /dev/null +++ b/annotations_filtered/mhaxNZs5MGc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[82.0, 93.11], [94.0, 102.91], [104.0, 104.13]], "keep_status": [false, false, false], "silence_prob": [83.88, 61.08, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [11.11, 8.91, 0.13]} \ No newline at end of file diff --git a/annotations_filtered/miJ26dYcbBw_filtered.json b/annotations_filtered/miJ26dYcbBw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/miJ26dYcbBw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/mjbxL_v2DPk_filtered.json b/annotations_filtered/mjbxL_v2DPk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..28126df7f97390e4870e8f626cf8defcd8b4f0b1 --- /dev/null +++ b/annotations_filtered/mjbxL_v2DPk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.37], [12.0, 12.9], [26.0, 26.55], [32.0, 33.07], [33.0, 34.4], [42.0, 41.96], [43.0, 45.22], [49.0, 49.15], [52.0, 53.38], [56.0, 65.72], [68.0, 69.13], [71.0, 72.32], [73.0, 75.56], [81.0, 84.96], [88.0, 92.3], [94.0, 94.91]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [41.28, 0.0, 0.0, 0.0, 0.0, 0.0, 41.01, 0.0, 0.0, 51.94, 0.0, 0.0, 51.55, 29.97, 37.82, 0.0], "audiomae_on_audioset": [[["speech", 21.41], ["mains hum", 18.4], ["hum", 12.53]], null, null, null, null, null, [["fly, housefly", 54.39], ["insect", 19.08], ["mosquito", 17.27]], null, null, null, null, null, null, [["explosion", 14.31], ["throbbing", 7.98], ["stomach rumble", 7.52]], [["mains hum", 19.52], ["crushing", 16.36], ["hum", 14.78]], null], "duration": [2.37, 0.9, 0.55, 1.07, 1.4, -0.04, 2.22, 0.15, 1.38, 9.72, 1.13, 1.32, 2.56, 3.96, 4.3, 0.91]} \ No newline at end of file diff --git a/annotations_filtered/mjdgDECpWr4_filtered.json b/annotations_filtered/mjdgDECpWr4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f898961f746c84a22cdbfc6aff7691194da7abd4 --- /dev/null +++ b/annotations_filtered/mjdgDECpWr4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.98], [3.0, 3.55], [6.0, 12.46], [13.0, 20.6], [21.0, 21.81], [23.0, 24.36], [29.0, 29.51], [31.0, 32.44], [35.0, 35.78], [37.0, 37.05], [38.0, 38.31], [39.0, 40.51], [41.0, 42.96], [48.0, 48.1], [50.0, 50.53], [51.0, 52.81], [53.0, 54.7], [58.0, 58.31], [65.0, 65.79], [73.0, 73.7], [74.0, 78.98], [84.0, 84.97], [86.0, 87.1], [88.0, 88.86], [90.0, 93.66], [95.0, 96.28], [99.0, 100.11], [106.0, 106.03], [107.0, 107.59], [109.0, 109.83], [115.0, 115.94], [118.0, 118.0], [119.0, 119.15], [122.0, 122.27], [125.0, 126.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 39.55, 78.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.45, 0.0, 0.0, 0.0, 99.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 42.06], ["foghorn", 27.33], ["musical instrument", 6.94]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.02, 0.55, 6.46, 7.6, 0.81, 1.36, 0.51, 1.44, 0.78, 0.05, 0.31, 1.51, 1.96, 0.1, 0.53, 1.81, 1.7, 0.31, 0.79, 0.7, 4.98, 0.97, 1.1, 0.86, 3.66, 1.28, 1.11, 0.03, 0.59, 0.83, 0.94, 0.0, 0.15, 0.27, 1.17]} \ No newline at end of file diff --git a/annotations_filtered/mjo4d488_yE_filtered.json b/annotations_filtered/mjo4d488_yE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2cce2a62cdee95b3287ad3a7db6c714892199686 --- /dev/null +++ b/annotations_filtered/mjo4d488_yE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 21.56], [42.0, 50.94], [51.0, 80.65], [83.0, 92.45], [93.0, 100.7], [103.0, 109.43], [110.0, 111.27], [113.0, 113.12], [114.0, 122.4], [123.0, 123.63], [128.0, 130.35]], "keep_status": [false, false, true, false, true, false, false, false, true, false, false], "silence_prob": [44.9, 64.52, 31.13, 31.75, 34.92, 48.87, 0.0, 0.0, 42.76, 0.0, 64.18], "audiomae_on_audioset": [[["sidetone", 57.12], ["frog", 18.59], ["speech", 4.67]], null, [["music", 40.51], ["whack, thwack", 8.52], ["speech", 6.59]], [["music", 74.32], ["explosion", 2.63], ["musical instrument", 2.61]], [["music", 24.12], ["livestock, farm animals, working animals", 7.54], ["cattle, bovinae", 7.29]], [["music", 67.67], ["musical instrument", 6.4], ["hum", 2.24]], null, null, [["speech", 36.3], ["music", 20.43], ["breaking", 8.41]], null, null], "duration": [4.56, 8.94, 29.65, 9.45, 7.7, 6.43, 1.27, 0.12, 8.4, 0.63, 2.35]} \ No newline at end of file diff --git a/annotations_filtered/mjt0iNTJrWE_filtered.json b/annotations_filtered/mjt0iNTJrWE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..648a2794f9475d055c3460a529ddfdc9f39e7995 --- /dev/null +++ b/annotations_filtered/mjt0iNTJrWE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.2], [11.0, 13.74], [14.0, 16.9], [30.0, 31.51], [36.0, 37.32], [39.0, 40.49], [56.0, 56.52], [58.0, 58.58], [61.0, 64.08], [68.0, 68.3], [70.0, 82.44], [96.0, 96.47], [98.0, 98.12], [99.0, 100.47], [105.0, 105.34], [110.0, 112.09], [113.0, 114.44], [120.0, 121.19], [128.0, 128.55]], "keep_status": [true, true, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false], "silence_prob": [45.98, 41.83, 39.66, 0.0, 0.0, 0.0, 0.0, 0.0, 42.33, 0.0, 41.01, 0.0, 0.0, 0.0, 0.0, 43.64, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["mechanical fan", 9.18], ["creak", 7.75], ["speech", 7.67]], [["creak", 11.61], ["mechanisms", 10.43], ["hum", 6.51]], [["speech", 31.54], ["whale vocalization", 24.64], ["stomach rumble", 21.1]], null, null, null, null, null, [["hum", 18.88], ["speech", 13.13], ["throbbing", 10.53]], null, [["hum", 29.89], ["whale vocalization", 20.93], ["mains hum", 19.32]], null, null, null, null, [["hum", 25.91], ["throbbing", 17.26], ["mains hum", 8.58]], null, null, null], "duration": [2.2, 2.74, 2.9, 1.51, 1.32, 1.49, 0.52, 0.58, 3.08, 0.3, 12.44, 0.47, 0.12, 1.47, 0.34, 2.09, 1.44, 1.19, 0.55]} \ No newline at end of file diff --git a/annotations_filtered/mjuNE5wyMzY_filtered.json b/annotations_filtered/mjuNE5wyMzY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b8b06c7fb353b18ee297074ca051c0879c7f79c --- /dev/null +++ b/annotations_filtered/mjuNE5wyMzY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 16.93], [17.0, 24.39], [26.0, 35.99], [39.0, 64.13], [69.0, 105.39], [108.0, 110.54], [115.0, 114.99], [116.0, 131.19], [131.0, 137.59], [140.0, 143.82], [144.0, 148.56], [155.0, 172.66]], "keep_status": [true, false, false, false, false, true, false, false, true, false, false, true], "silence_prob": [33.05, 32.33, 31.12, 30.44, 0.0, 33.77, 0.0, 34.18, 31.58, 61.87, 50.76, 30.46], "audiomae_on_audioset": [[["bee, wasp, etc.", 14.47], ["music", 12.37], ["fly, housefly", 11.41]], [["hum", 32.66], ["speech", 23.73], ["music", 20.18]], [["music", 49.18], ["speech", 32.71], ["hum", 2.42]], [["speech", 56.49], ["music", 18.43], ["hum", 4.14]], null, [["music", 37.56], ["didgeridoo", 11.03], ["musical instrument", 6.83]], null, [["music", 80.4], ["didgeridoo", 5.66], ["theremin", 5.29]], [["music", 40.5], ["trombone", 4.87], ["fly, housefly", 4.77]], null, null, [["music", 33.91], ["foghorn", 6.09], ["hum", 4.23]]], "duration": [12.93, 7.39, 9.99, 25.13, 36.39, 2.54, -0.01, 15.19, 6.59, 3.82, 4.56, 17.66]} \ No newline at end of file diff --git a/annotations_filtered/mk2OptcsXuo_filtered.json b/annotations_filtered/mk2OptcsXuo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..47e3e9194f57f65324fe09d4bb05f816234543ed --- /dev/null +++ b/annotations_filtered/mk2OptcsXuo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[75.0, 123.77], [124.0, 123.87], [124.0, 142.37], [144.0, 163.92]], "keep_status": [false, false, true, false], "silence_prob": [0.0, 0.0, 31.78, 29.18], "audiomae_on_audioset": [null, null, [["music", 39.84], ["whack, thwack", 7.95], ["mains hum", 6.94]], [["music", 65.23], ["speech", 13.84], ["didgeridoo", 5.92]]], "duration": [48.77, -0.13, 18.37, 19.92]} \ No newline at end of file diff --git a/annotations_filtered/mkG2YdCogPY_filtered.json b/annotations_filtered/mkG2YdCogPY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..78c0f00af27a850f244287022b8eb4f1d0c01bfc --- /dev/null +++ b/annotations_filtered/mkG2YdCogPY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.16], [9.0, 8.85], [12.0, 13.59], [14.0, 15.16], [17.0, 21.15], [28.0, 28.98], [30.0, 31.06], [32.0, 33.37], [35.0, 35.19], [37.0, 37.86], [40.0, 40.93], [42.0, 43.33], [46.0, 47.41], [48.0, 48.15], [49.0, 49.64], [51.0, 52.88], [58.0, 59.48], [60.0, 60.32], [62.0, 63.22], [65.0, 66.36], [67.0, 67.69], [69.0, 70.38], [74.0, 78.58], [79.0, 81.09], [84.0, 85.01], [87.0, 87.42], [90.0, 90.42], [91.0, 91.71], [96.0, 95.89], [99.0, 100.77], [103.0, 103.37], [105.0, 107.37], [112.0, 113.14], [119.0, 119.47], [122.0, 122.3], [123.0, 123.18], [125.0, 126.79], [128.0, 127.9], [130.0, 130.45], [131.0, 132.48], [134.0, 135.06], [136.0, 137.56], [138.0, 139.67], [141.0, 142.3], [144.0, 144.44], [145.0, 145.27], [146.0, 147.39], [148.0, 148.51], [149.0, 149.72], [150.0, 150.36], [152.0, 152.49], [155.0, 155.56], [156.0, 158.53], [159.0, 159.6], [163.0, 163.38], [165.0, 165.28], [166.0, 167.21], [168.0, 169.1], [169.0, 170.02], [170.0, 171.75], [173.0, 173.96], [174.0, 175.04], [176.0, 176.49], [178.0, 178.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 97.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 52.8], ["boing", 9.54], ["inside, small room", 8.57]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.16, -0.15, 1.59, 1.16, 4.15, 0.98, 1.06, 1.37, 0.19, 0.86, 0.93, 1.33, 1.41, 0.15, 0.64, 1.88, 1.48, 0.32, 1.22, 1.36, 0.69, 1.38, 4.58, 2.09, 1.01, 0.42, 0.42, 0.71, -0.11, 1.77, 0.37, 2.37, 1.14, 0.47, 0.3, 0.18, 1.79, -0.1, 0.45, 1.48, 1.06, 1.56, 1.67, 1.3, 0.44, 0.27, 1.39, 0.51, 0.72, 0.36, 0.49, 0.56, 2.53, 0.6, 0.38, 0.28, 1.21, 1.1, 1.02, 1.75, 0.96, 1.04, 0.49, 0.7]} \ No newline at end of file diff --git a/annotations_filtered/mkNO5Y4LOMs_filtered.json b/annotations_filtered/mkNO5Y4LOMs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..372e44e355d47c27ad1609e03857223f52dcd89c --- /dev/null +++ b/annotations_filtered/mkNO5Y4LOMs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.83], [8.0, 8.45], [28.0, 28.61], [32.0, 33.78], [47.0, 47.7], [48.0, 48.2], [49.0, 48.95]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [-0.17, 0.45, 0.61, 1.78, 0.7, 0.2, -0.05]} \ No newline at end of file diff --git a/annotations_filtered/mkYNhZvlHv0_filtered.json b/annotations_filtered/mkYNhZvlHv0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c02ddcc56b7521ace501fdd3a158011b3515778 --- /dev/null +++ b/annotations_filtered/mkYNhZvlHv0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.13], [4.0, 30.75], [33.0, 34.06], [34.0, 41.52], [42.0, 44.69], [55.0, 55.71], [58.0, 59.43], [62.0, 64.27], [67.0, 70.7], [74.0, 115.16], [116.0, 116.94], [117.0, 118.08]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [72.6, 44.01, 0.0, 99.31, 99.85, 0.0, 0.0, 74.92, 99.36, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 33.06], ["synthesizer", 9.76], ["cattle, bovinae", 9.07]], null, null, null, null, null, null, null, null, null, null], "duration": [3.13, 26.75, 1.06, 7.52, 2.69, 0.71, 1.43, 2.27, 3.7, 41.16, 0.94, 1.08]} \ No newline at end of file diff --git a/annotations_filtered/mklRbf1JoGY_filtered.json b/annotations_filtered/mklRbf1JoGY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..05e60cc0b97b1bab617b6faed0a7504cb6b26d1c --- /dev/null +++ b/annotations_filtered/mklRbf1JoGY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.26], [8.0, 10.91], [13.0, 14.3], [17.0, 18.32], [20.0, 23.84], [26.0, 29.56], [30.0, 32.02], [33.0, 35.41], [36.0, 38.91], [41.0, 41.94], [43.0, 45.71], [48.0, 49.32], [51.0, 53.77], [55.0, 57.08], [58.0, 59.46], [61.0, 65.23], [66.0, 67.81], [72.0, 73.33], [74.0, 77.55], [79.0, 82.11], [83.0, 85.56], [89.0, 92.28], [93.0, 101.83], [103.0, 108.41], [110.0, 113.78], [118.0, 118.2]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 79.59, 0.0, 0.0, 81.89, 71.72, 34.62, 51.39, 71.57, 0.0, 70.02, 0.0, 67.76, 36.82, 0.0, 59.24, 0.0, 0.0, 55.81, 57.17, 62.37, 45.05, 46.57, 39.49, 33.97, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 35.49], ["music", 23.66], ["sidetone", 9.64]], null, null, null, null, null, null, [["music", 38.22], ["speech", 21.25], ["synthesizer", 6.05]], null, null, null, null, null, null, null, [["mains hum", 28.84], ["hum", 24.11], ["music", 16.37]], [["music", 41.33], ["speech", 16.66], ["hum", 10.19]], [["theremin", 40.19], ["music", 39.46], ["musical instrument", 2.54]], [["theremin", 41.88], ["music", 33.55], ["ambient music", 3.97]], null], "duration": [0.26, 2.91, 1.3, 1.32, 3.84, 3.56, 2.02, 2.41, 2.91, 0.94, 2.71, 1.32, 2.77, 2.08, 1.46, 4.23, 1.81, 1.33, 3.55, 3.11, 2.56, 3.28, 8.83, 5.41, 3.78, 0.2]} \ No newline at end of file diff --git a/annotations_filtered/mkn6s-f8PqM_filtered.json b/annotations_filtered/mkn6s-f8PqM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..51fe2285eb727caadca89b23ef21e5a730a39f05 --- /dev/null +++ b/annotations_filtered/mkn6s-f8PqM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.11], [8.0, 8.33], [24.0, 25.27], [27.0, 30.64], [33.0, 35.02], [37.0, 37.89], [41.0, 51.63], [52.0, 54.85], [56.0, 61.72]], "keep_status": [true, false, false, true, true, false, true, true, true], "silence_prob": [29.8, 0.0, 0.0, 41.72, 32.2, 0.0, 30.4, 29.79, 29.16], "audiomae_on_audioset": [[["didgeridoo", 35.99], ["speech", 8.52], ["music", 7.94]], null, null, [["speech", 44.39], ["foghorn", 9.3], ["fly, housefly", 5.4]], [["synthesizer", 26.59], ["music", 21.14], ["sonar", 14.06]], null, [["speech", 17.75], ["music", 16.85], ["sound effect", 16.53]], [["whack, thwack", 11.02], ["speech", 10.18], ["sidetone", 7.59]], [["music", 20.44], ["sonar", 16.92], ["synthesizer", 8.07]]], "duration": [4.11, 0.33, 1.27, 3.64, 2.02, 0.89, 10.63, 2.85, 5.72]} \ No newline at end of file diff --git a/annotations_filtered/mksJyq7Z-mQ_filtered.json b/annotations_filtered/mksJyq7Z-mQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dec46c23685a6508a81811f43a6932a241bdcf57 --- /dev/null +++ b/annotations_filtered/mksJyq7Z-mQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.11], [35.0, 37.07], [42.0, 47.01], [86.0, 86.53], [93.0, 94.22], [101.0, 101.7], [117.0, 117.15], [124.0, 124.98], [155.0, 155.36], [170.0, 171.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.4, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.11, 2.07, 5.01, 0.53, 1.22, 0.7, 0.15, 0.98, 0.36, 1.31]} \ No newline at end of file diff --git a/annotations_filtered/mlHF0Vv7yEc_filtered.json b/annotations_filtered/mlHF0Vv7yEc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..665c3fe2de4d055df7e21eef8c6170515f6b9569 --- /dev/null +++ b/annotations_filtered/mlHF0Vv7yEc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.79], [16.0, 18.67], [25.0, 27.46], [30.0, 39.21], [42.0, 54.45], [55.0, 87.94], [95.0, 95.25], [98.0, 110.12], [111.0, 110.76], [111.0, 110.79], [111.0, 110.83], [111.0, 118.71], [119.0, 120.31], [125.0, 127.65], [130.0, 133.83], [134.0, 136.21], [140.0, 170.95]], "keep_status": [false, true, false, false, true, false, false, true, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 34.88, 31.72, 32.37, 32.54, 0.0, 0.0, 30.97, 0.0, 0.0, 0.0, 53.34, 0.0, 31.09, 32.24, 32.39, 0.0], "audiomae_on_audioset": [null, [["music", 20.45], ["speech", 11.41], ["boing", 3.2]], [["music", 46.07], ["speech", 30.16], ["cattle, bovinae", 1.75]], [["hum", 46.67], ["throbbing", 18.7], ["speech", 9.03]], [["speech", 37.79], ["music", 16.2], ["buzz", 11.98]], null, null, [["music", 19.41], ["livestock, farm animals, working animals", 17.38], ["sound effect", 7.34]], null, null, null, null, null, [["speech", 26.37], ["crowd", 10.21], ["music", 7.99]], [["vehicle", 33.88], ["speech", 24.69], ["aircraft", 7.56]], [["quack", 43.87], ["music", 36.21], ["duck", 9.18]], null], "duration": [0.79, 2.67, 2.46, 9.21, 12.45, 32.94, 0.25, 12.12, -0.24, -0.21, -0.17, 7.71, 1.31, 2.65, 3.83, 2.21, 30.95]} \ No newline at end of file diff --git a/annotations_filtered/ml_zSw6yWOE_filtered.json b/annotations_filtered/ml_zSw6yWOE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..265f5cb504e531a0a17598d6657754762b5f434f --- /dev/null +++ b/annotations_filtered/ml_zSw6yWOE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.76], [8.0, 8.58], [12.0, 12.45], [15.0, 16.87], [19.0, 21.22], [24.0, 27.24], [32.0, 33.71], [36.0, 38.04], [42.0, 44.47], [45.0, 46.28], [46.0, 51.83], [53.0, 55.85], [57.0, 59.02], [64.0, 94.98], [95.0, 95.59], [96.0, 96.08], [96.0, 96.21], [96.0, 104.28], [106.0, 118.37], [121.0, 123.47], [128.0, 129.69], [130.0, 135.95], [137.0, 138.28], [139.0, 139.62], [142.0, 141.96], [147.0, 155.93], [157.0, 157.74], [159.0, 161.3]], "keep_status": [false, false, false, false, true, true, false, false, true, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 38.31, 28.96, 0.0, 29.21, 28.7, 0.0, 28.74, 29.06, 29.54, 0.0, 0.0, 0.0, 0.0, 46.61, 92.64, 45.02, 0.0, 50.26, 0.0, 0.0, 0.0, 76.2, 0.0, 88.64], "audiomae_on_audioset": [null, null, null, null, [["speech", 48.31], ["rumble", 9.58], ["music", 8.01]], [["hum", 28.24], ["mains hum", 14.85], ["throbbing", 12.6]], null, [["hum", 36.38], ["throbbing", 25.3], ["mains hum", 10.76]], [["whack, thwack", 33.59], ["music", 8.95], ["door", 5.05]], null, [["speech", 32.79], ["livestock, farm animals, working animals", 16.85], ["cattle, bovinae", 7.27]], [["music", 39.54], ["throbbing", 23.32], ["hum", 7.56]], [["music", 25.19], ["beatboxing", 16.71], ["speech", 5.43]], null, null, null, null, [["gong", 53.82], ["singing bowl", 13.62], ["music", 7.45]], null, [["speech", 63.69], ["sidetone", 6.05], ["hum", 3.34]], null, null, null, null, null, null, null, null], "duration": [0.76, 0.58, 0.45, 1.87, 2.22, 3.24, 1.71, 2.04, 2.47, 1.28, 5.83, 2.85, 2.02, 30.98, 0.59, 0.08, 0.21, 8.28, 12.37, 2.47, 1.69, 5.95, 1.28, 0.62, -0.04, 8.93, 0.74, 2.3]} \ No newline at end of file diff --git a/annotations_filtered/mlc2UyZdalQ_filtered.json b/annotations_filtered/mlc2UyZdalQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b20a12055ba57f85b960cb4153622ab61e8495cb --- /dev/null +++ b/annotations_filtered/mlc2UyZdalQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.11], [4.0, 6.91], [10.0, 11.67], [12.0, 21.09], [23.0, 23.03], [28.0, 28.53], [31.0, 31.16], [35.0, 37.1], [38.0, 39.02], [41.0, 42.26], [44.0, 46.63], [52.0, 57.37], [59.0, 59.75], [61.0, 61.47], [62.0, 63.15], [67.0, 69.2], [71.0, 71.73], [77.0, 79.42], [80.0, 83.76], [98.0, 98.71], [99.0, 100.06], [101.0, 101.38], [102.0, 102.03], [103.0, 104.19], [105.0, 105.97], [113.0, 113.04], [117.0, 117.42], [118.0, 127.14]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 76.37, 0.0, 30.45, 0.0, 0.0, 0.0, 36.03, 0.0, 0.0, 37.72, 31.0, 0.0, 0.0, 0.0, 38.02, 0.0, 71.43, 71.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.6], "audiomae_on_audioset": [null, null, null, [["music", 40.58], ["speech", 20.85], ["throbbing", 8.32]], null, null, null, [["speech", 40.49], ["sidetone", 33.67], ["busy signal", 3.02]], null, null, [["speech", 54.89], ["chirp tone", 8.46], ["sine wave", 7.35]], [["speech", 21.19], ["music", 9.49], ["foghorn", 8.36]], null, null, null, [["music", 23.78], ["theremin", 16.3], ["synthesizer", 13.02]], null, null, null, null, null, null, null, null, null, null, null, [["music", 67.26], ["theremin", 18.87], ["opera", 6.94]]], "duration": [0.11, 2.91, 1.67, 9.09, 0.03, 0.53, 0.16, 2.1, 1.02, 1.26, 2.63, 5.37, 0.75, 0.47, 1.15, 2.2, 0.73, 2.42, 3.76, 0.71, 1.06, 0.38, 0.03, 1.19, 0.97, 0.04, 0.42, 9.14]} \ No newline at end of file diff --git a/annotations_filtered/mlcBwNHilHE_filtered.json b/annotations_filtered/mlcBwNHilHE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e61d1ce69feaffc6b51ffd488382a0d529f5856e --- /dev/null +++ b/annotations_filtered/mlcBwNHilHE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 26.97], [30.0, 30.5], [38.0, 50.94], [54.0, 56.74], [59.0, 63.83], [67.0, 79.83], [80.0, 81.72], [83.0, 83.35], [85.0, 85.82], [88.0, 90.46], [91.0, 104.06], [107.0, 126.6]], "keep_status": [true, false, false, false, true, false, false, false, false, true, true, true], "silence_prob": [33.3, 0.0, 31.48, 82.97, 33.51, 38.83, 0.0, 0.0, 0.0, 42.55, 33.17, 33.02], "audiomae_on_audioset": [[["music", 36.52], ["whack, thwack", 19.59], ["hum", 3.93]], null, [["music", 84.82], ["speech", 3.22], ["electronic music", 1.76]], null, [["hum", 46.52], ["mains hum", 11.88], ["music", 9.8]], [["music", 62.17], ["speech", 10.82], ["scary music", 3.4]], null, null, null, [["music", 26.41], ["mains hum", 15.68], ["hum", 10.44]], [["speech", 22.43], ["music", 20.93], ["hum", 13.91]], [["ding", 31.18], ["clang", 23.23], ["music", 10.33]]], "duration": [10.97, 0.5, 12.94, 2.74, 4.83, 12.83, 1.72, 0.35, 0.82, 2.46, 13.06, 19.6]} \ No newline at end of file diff --git a/annotations_filtered/mlkWgiyQ-8g_filtered.json b/annotations_filtered/mlkWgiyQ-8g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b1949cbe932d61dfe5797704eb183aa4333f803 --- /dev/null +++ b/annotations_filtered/mlkWgiyQ-8g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.08], [8.0, 8.48], [10.0, 10.77], [18.0, 17.71], [19.0, 33.22], [34.0, 35.58], [38.0, 38.8], [42.0, 42.35], [44.0, 45.62], [46.0, 46.26], [47.0, 57.67], [59.0, 59.27], [62.0, 62.41], [64.0, 65.62], [66.0, 66.68], [68.0, 68.82], [71.0, 71.25], [72.0, 72.74], [77.0, 77.08], [78.0, 78.71], [87.0, 87.22], [94.0, 93.95], [96.0, 96.8], [98.0, 98.71], [101.0, 102.36], [103.0, 104.57], [105.0, 106.49], [107.0, 109.34], [110.0, 111.08], [112.0, 113.48], [117.0, 117.73], [121.0, 121.14], [124.0, 123.84], [128.0, 127.87], [131.0, 132.26], [133.0, 133.64], [136.0, 136.88], [143.0, 142.8], [149.0, 149.03], [151.0, 152.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [79.07, 0.0, 0.0, 0.0, 73.36, 0.0, 0.0, 0.0, 0.0, 0.0, 92.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 72.32], ["hum", 4.16], ["inside, small room", 3.78]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.08, 0.48, 0.77, -0.29, 14.22, 1.58, 0.8, 0.35, 1.62, 0.26, 10.67, 0.27, 0.41, 1.62, 0.68, 0.82, 0.25, 0.74, 0.08, 0.71, 0.22, -0.05, 0.8, 0.71, 1.36, 1.57, 1.49, 2.34, 1.08, 1.48, 0.73, 0.14, -0.16, -0.13, 1.26, 0.64, 0.88, -0.2, 0.03, 1.51]} \ No newline at end of file diff --git a/annotations_filtered/mlpkQuvDJbs_filtered.json b/annotations_filtered/mlpkQuvDJbs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6366a042518d02ecb656bcc1bd5e7d565e31e5d8 --- /dev/null +++ b/annotations_filtered/mlpkQuvDJbs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[42.0, 78.22], [82.0, 82.14], [83.0, 83.05], [85.0, 86.12], [87.0, 96.42], [101.0, 109.63], [110.0, 118.37], [120.0, 120.56], [122.0, 123.42], [127.0, 128.21], [131.0, 142.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 40.41, 53.78, 35.48, 0.0, 0.0, 0.0, 30.24], "audiomae_on_audioset": [null, null, null, null, [["hum", 40.38], ["mains hum", 35.09], ["music", 12.57]], null, [["music", 30.75], ["throbbing", 29.01], ["hum", 27.69]], null, null, null, [["noise", 24.26], ["music", 22.71], ["mains hum", 5.47]]], "duration": [36.22, 0.14, 0.05, 1.12, 9.42, 8.63, 8.37, 0.56, 1.42, 1.21, 11.23]} \ No newline at end of file diff --git a/annotations_filtered/mm93ELyLN1w_filtered.json b/annotations_filtered/mm93ELyLN1w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..33c084fee207de54e9ee3ae66073f508af994f3e --- /dev/null +++ b/annotations_filtered/mm93ELyLN1w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.5], [16.0, 19.75], [26.0, 25.93], [28.0, 28.56]], "keep_status": [false, true, false, false], "silence_prob": [0.0, 30.65, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 40.64], ["thunk", 14.22], ["music", 6.06]], null, null], "duration": [0.5, 3.75, -0.07, 0.56]} \ No newline at end of file diff --git a/annotations_filtered/mmH76155CuU_filtered.json b/annotations_filtered/mmH76155CuU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5ff8e6a689d7130dd272ff3e071174b5beb4787 --- /dev/null +++ b/annotations_filtered/mmH76155CuU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.42], [21.0, 22.54], [24.0, 25.68], [27.0, 81.48]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [0.42, 1.54, 1.68, 54.48]} \ No newline at end of file diff --git a/annotations_filtered/mmdPZs0Nvvg_filtered.json b/annotations_filtered/mmdPZs0Nvvg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..07c38918a312190d8fe007c87556cf0442f0e92f --- /dev/null +++ b/annotations_filtered/mmdPZs0Nvvg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 28.05], [29.0, 34.01], [37.0, 39.39], [41.0, 42.6], [43.0, 75.64], [77.0, 77.23], [79.0, 85.4], [87.0, 88.77], [90.0, 93.55]], "keep_status": [false, false, false, false, false, false, false, false, true], "silence_prob": [98.36, 66.51, 96.66, 0.0, 0.0, 0.0, 66.15, 0.0, 44.93], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["singing bowl", 28.83], ["music", 18.66], ["speech", 16.76]]], "duration": [15.05, 5.01, 2.39, 1.6, 32.64, 0.23, 6.4, 1.77, 3.55]} \ No newline at end of file diff --git a/annotations_filtered/mmuJb30cigQ_filtered.json b/annotations_filtered/mmuJb30cigQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa8a548def3533244086c2996f3d268ce16c2832 --- /dev/null +++ b/annotations_filtered/mmuJb30cigQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.49], [19.0, 19.7], [20.0, 21.0], [22.0, 22.5], [23.0, 26.32], [28.0, 28.63], [29.0, 29.2], [39.0, 42.57], [43.0, 43.17], [44.0, 45.55], [47.0, 49.72], [51.0, 52.15], [53.0, 55.04], [56.0, 57.54], [58.0, 59.98], [61.0, 61.5], [63.0, 63.39], [65.0, 66.09], [68.0, 69.84], [70.0, 72.59], [76.0, 76.5], [78.0, 78.44], [80.0, 80.33], [81.0, 84.35], [85.0, 85.58], [98.0, 99.01], [100.0, 100.5], [102.0, 102.93]], "keep_status": [false, false, false, false, true, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 38.94, 0.0, 0.0, 35.35, 0.0, 0.0, 81.71, 0.0, 48.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.79, 0.0, 0.0, 0.0, 32.67, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["sine wave", 23.17], ["chirp tone", 20.35], ["speech", 16.27]], null, null, [["livestock, farm animals, working animals", 20.79], ["hum", 11.86], ["electric shaver, electric razor", 8.25]], null, null, null, null, [["music", 37.38], ["speech", 23.94], ["musical instrument", 6.0]], null, null, null, null, null, null, [["music", 46.42], ["speech", 26.18], ["musical instrument", 3.7]], null, null, null, [["animal", 28.77], ["music", 16.47], ["roaring cats (lions, tigers)", 15.38]], null, null, null, null], "duration": [0.49, 0.7, 1.0, 0.5, 3.32, 0.63, 0.2, 3.57, 0.17, 1.55, 2.72, 1.15, 2.04, 1.54, 1.98, 0.5, 0.39, 1.09, 1.84, 2.59, 0.5, 0.44, 0.33, 3.35, 0.58, 1.01, 0.5, 0.93]} \ No newline at end of file diff --git a/annotations_filtered/mn5crhTusSA_filtered.json b/annotations_filtered/mn5crhTusSA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9aa8af13f718153e8a474987f680b3b2723bea5b --- /dev/null +++ b/annotations_filtered/mn5crhTusSA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.13], [10.0, 10.15], [12.0, 12.65], [13.0, 13.74], [17.0, 18.62], [21.0, 21.44], [22.0, 23.55], [25.0, 25.49], [31.0, 30.86], [35.0, 35.04], [42.0, 43.11], [45.0, 45.59], [48.0, 48.46], [50.0, 55.02], [57.0, 57.52], [61.0, 63.39], [65.0, 66.88], [69.0, 70.06], [71.0, 71.79], [75.0, 76.27], [78.0, 78.88], [80.0, 81.19], [82.0, 82.63], [109.0, 112.01], [112.0, 116.87], [117.0, 117.48], [121.0, 122.66], [127.0, 127.99], [132.0, 132.68], [136.0, 137.44], [140.0, 140.54], [141.0, 142.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.1, 0.0, 58.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.36, 97.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.13, 0.15, 0.65, 0.74, 1.62, 0.44, 1.55, 0.49, -0.14, 0.04, 1.11, 0.59, 0.46, 5.02, 0.52, 2.39, 1.88, 1.06, 0.79, 1.27, 0.88, 1.19, 0.63, 3.01, 4.87, 0.48, 1.66, 0.99, 0.68, 1.44, 0.54, 1.52]} \ No newline at end of file diff --git a/annotations_filtered/mn60YWO218k_filtered.json b/annotations_filtered/mn60YWO218k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f404f8d3d055f0faa5fce3f141399d7e69da1729 --- /dev/null +++ b/annotations_filtered/mn60YWO218k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.56], [9.0, 9.83], [13.0, 13.1], [15.0, 15.82], [16.0, 16.97], [18.0, 18.79], [21.0, 21.64], [24.0, 24.16], [27.0, 29.13], [47.0, 50.03], [52.0, 52.02], [55.0, 56.15], [58.0, 59.73], [61.0, 61.84], [63.0, 64.27], [67.0, 67.09], [70.0, 71.04], [76.0, 77.28], [80.0, 81.13], [83.0, 82.78], [85.0, 86.31], [88.0, 90.0], [92.0, 92.1], [94.0, 94.81], [96.0, 96.79], [101.0, 101.55], [103.0, 103.25], [105.0, 106.89], [107.0, 107.96], [110.0, 114.78], [118.0, 118.94], [122.0, 121.64], [124.0, 128.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 93.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.93, 0.0, 0.0, 43.82], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["tuning fork", 71.48], ["sine wave", 14.07], ["chirp tone", 9.06]], null, null, null, null, null, null, null, [["music", 39.91], ["hum", 28.34], ["mains hum", 6.23]], null, null, [["music", 41.02], ["didgeridoo", 11.02], ["speech", 8.58]]], "duration": [1.56, 0.83, 0.1, 0.82, 0.97, 0.79, 0.64, 0.16, 2.13, 3.03, 0.02, 1.15, 1.73, 0.84, 1.27, 0.09, 1.04, 1.28, 1.13, -0.22, 1.31, 2.0, 0.1, 0.81, 0.79, 0.55, 0.25, 1.89, 0.96, 4.78, 0.94, -0.36, 4.97]} \ No newline at end of file diff --git a/annotations_filtered/mn6Wmceebfc_filtered.json b/annotations_filtered/mn6Wmceebfc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bbaf2358726751d95786029d86cac77c6d4bc5b7 --- /dev/null +++ b/annotations_filtered/mn6Wmceebfc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.95], [10.0, 10.59], [13.0, 13.47], [16.0, 15.94], [18.0, 19.72], [24.0, 24.9], [25.0, 27.3], [28.0, 29.96], [31.0, 33.08], [34.0, 34.6], [37.0, 72.05], [73.0, 77.09], [78.0, 131.58], [135.0, 135.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.17, 0.0, 94.52, 0.0, 0.0, 63.85, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.95, 0.59, 0.47, -0.06, 1.72, 0.9, 2.3, 1.96, 2.08, 0.6, 35.05, 4.09, 53.58, 0.33]} \ No newline at end of file diff --git a/annotations_filtered/mnUfDpO87Y0_filtered.json b/annotations_filtered/mnUfDpO87Y0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..44a0f9eae341b593e6503a91610d672cdadac595 --- /dev/null +++ b/annotations_filtered/mnUfDpO87Y0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 27.16], [29.0, 34.77], [36.0, 40.56], [42.0, 47.65], [52.0, 57.54], [60.0, 60.34], [60.0, 62.11], [64.0, 64.39], [64.0, 64.42], [64.0, 64.45], [77.0, 78.16]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [68.41, 33.05, 29.93, 29.72, 31.14, 0.0, 40.88, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 59.54], ["synthesizer", 6.46], ["musical instrument", 4.88]], [["music", 83.12], ["musical instrument", 1.64], ["drum machine", 1.37]], [["music", 68.11], ["drum machine", 6.74], ["synthesizer", 3.03]], [["music", 46.36], ["musical instrument", 19.12], ["drum", 3.71]], null, [["whale vocalization", 59.87], ["stomach rumble", 7.92], ["music", 5.95]], null, null, null, null], "duration": [9.16, 5.77, 4.56, 5.65, 5.54, 0.34, 2.11, 0.39, 0.42, 0.45, 1.16]} \ No newline at end of file diff --git a/annotations_filtered/mnuJ_YVLL64_filtered.json b/annotations_filtered/mnuJ_YVLL64_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..61cb34cbe45f4e188017c3949d94f67dd8758dfc --- /dev/null +++ b/annotations_filtered/mnuJ_YVLL64_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.83], [9.0, 9.75], [34.0, 35.77], [54.0, 55.21], [57.0, 57.37], [62.0, 65.21], [66.0, 67.07], [96.0, 96.15], [110.0, 111.28], [115.0, 115.94], [120.0, 120.26], [136.0, 138.1], [139.0, 150.21], [151.0, 150.94], [154.0, 154.89], [155.0, 162.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 30.45, 0.0, 0.0, 0.0, 0.0, 0.0, 38.59, 44.72, 0.0, 0.0, 40.82], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 59.45], ["music", 16.79], ["sidetone", 2.32]], null, null, null, null, null, [["frog", 10.97], ["quack", 10.39], ["animal", 6.87]], [["theremin", 67.61], ["howl", 8.57], ["music", 5.06]], null, null, [["theremin", 36.08], ["music", 11.96], ["animal", 8.49]]], "duration": [0.83, 0.75, 1.77, 1.21, 0.37, 3.21, 1.07, 0.15, 1.28, 0.94, 0.26, 2.1, 11.21, -0.06, 0.89, 7.03]} \ No newline at end of file diff --git a/annotations_filtered/moH3FSt88FY_filtered.json b/annotations_filtered/moH3FSt88FY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..153e162de176a0aa69ff31091f1ca5614a346509 --- /dev/null +++ b/annotations_filtered/moH3FSt88FY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [6.0, 14.79], [15.0, 43.5], [45.0, 48.42], [50.0, 51.73], [52.0, 55.39], [58.0, 60.89], [61.0, 69.45], [76.0, 76.99], [84.0, 84.72], [88.0, 97.9]], "keep_status": [false, true, true, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 35.26, 28.87, 49.68, 0.0, 57.25, 50.56, 28.7, 0.0, 0.0, 39.4], "audiomae_on_audioset": [null, [["mains hum", 33.24], ["hum", 28.55], ["fly, housefly", 5.75]], [["hum", 35.51], ["mains hum", 21.81], ["rumble", 11.43]], [["music", 77.38], ["ambient music", 3.14], ["didgeridoo", 2.4]], null, null, null, [["machine gun", 42.89], ["speech", 17.67], ["music", 6.58]], null, null, [["music", 38.76], ["animal", 13.92], ["grunt", 4.96]]], "duration": [0.5, 8.79, 28.5, 3.42, 1.73, 3.39, 2.89, 8.45, 0.99, 0.72, 9.9]} \ No newline at end of file diff --git a/annotations_filtered/moJvW1-7_Cw_filtered.json b/annotations_filtered/moJvW1-7_Cw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f72a70e9e98e2111f5d03cf368b5ce0834a1923 --- /dev/null +++ b/annotations_filtered/moJvW1-7_Cw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.89], [10.0, 11.37], [13.0, 14.44], [16.0, 16.6], [29.0, 29.32], [30.0, 31.31], [32.0, 32.26], [35.0, 51.78], [52.0, 52.71], [53.0, 58.04], [66.0, 66.01], [69.0, 69.77], [73.0, 73.53], [79.0, 80.96], [83.0, 91.29], [102.0, 101.8], [106.0, 108.04], [117.0, 117.32], [118.0, 118.59], [122.0, 123.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.65, 0.0, 54.9, 0.0, 0.0, 0.0, 0.0, 36.22, 0.0, 49.4, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 37.05], ["hum", 34.27], ["music", 11.55]], null, [["hum", 42.08], ["throbbing", 28.4], ["music", 10.78]], null, null, null], "duration": [0.89, 1.37, 1.44, 0.6, 0.32, 1.31, 0.26, 16.78, 0.71, 5.04, 0.01, 0.77, 0.53, 1.96, 8.29, -0.2, 2.04, 0.32, 0.59, 1.45]} \ No newline at end of file diff --git a/annotations_filtered/moYXL6hX8vI_filtered.json b/annotations_filtered/moYXL6hX8vI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..80f45299dc27b290d2a66c47e02fa45ca5c2429c --- /dev/null +++ b/annotations_filtered/moYXL6hX8vI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 33.89], [36.0, 35.87], [39.0, 46.55], [48.0, 51.27], [52.0, 53.23], [55.0, 56.66], [63.0, 63.42], [66.0, 65.92], [67.0, 67.96], [76.0, 76.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 59.68, 40.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 31.91], ["mains hum", 22.35], ["music", 21.23]], null, null, null, null, null, null], "duration": [0.89, -0.13, 7.55, 3.27, 1.23, 1.66, 0.42, -0.08, 0.96, 0.17]} \ No newline at end of file diff --git a/annotations_filtered/moeAot5_Q_U_filtered.json b/annotations_filtered/moeAot5_Q_U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..90ae66151ffafc4db7334d6eccfa6389ecdf3c8e --- /dev/null +++ b/annotations_filtered/moeAot5_Q_U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.77], [14.0, 14.22], [19.0, 19.03], [26.0, 26.64], [30.0, 30.55], [48.0, 48.44], [55.0, 56.05], [64.0, 64.13], [65.0, 65.74], [68.0, 68.61], [71.0, 71.22], [74.0, 77.04], [78.0, 80.11], [83.0, 83.67], [99.0, 99.28], [100.0, 101.7], [107.0, 107.89], [113.0, 115.59], [117.0, 117.27], [118.0, 119.45], [123.0, 126.28], [130.0, 130.71], [132.0, 132.97], [134.0, 134.49], [135.0, 137.34], [142.0, 142.15], [157.0, 158.23], [160.0, 159.97], [161.0, 162.14], [163.0, 165.55], [166.0, 167.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.16, 39.77, 0.0, 0.0, 0.0, 0.0, 41.85, 0.0, 0.0, 37.95, 0.0, 0.0, 0.0, 39.01, 0.0, 0.0, 0.0, 0.0, 72.6, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 23.91], ["music", 22.63], ["throbbing", 11.47]], null, null, null, null, [["music", 64.41], ["musical instrument", 7.63], ["foghorn", 3.5]], null, null, [["mains hum", 33.41], ["hum", 27.53], ["music", 15.16]], null, null, null, [["music", 63.11], ["didgeridoo", 3.93], ["theremin", 3.76]], null, null, null, null, null, null], "duration": [0.77, 0.22, 0.03, 0.64, 0.55, 0.44, 1.05, 0.13, 0.74, 0.61, 0.22, 3.04, 2.11, 0.67, 0.28, 1.7, 0.89, 2.59, 0.27, 1.45, 3.28, 0.71, 0.97, 0.49, 2.34, 0.15, 1.23, -0.03, 1.14, 2.55, 1.91]} \ No newline at end of file diff --git a/annotations_filtered/mohoyRj_VpU_filtered.json b/annotations_filtered/mohoyRj_VpU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..75f733819ab902b6aa846ea7d8e9339b8639fadb --- /dev/null +++ b/annotations_filtered/mohoyRj_VpU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 18.82], [25.0, 25.22], [27.0, 32.43]], "keep_status": [false, false, false], "silence_prob": [97.92, 0.0, 85.35], "audiomae_on_audioset": [null, null, null], "duration": [2.82, 0.22, 5.43]} \ No newline at end of file diff --git a/annotations_filtered/mokXxWsIsWg_filtered.json b/annotations_filtered/mokXxWsIsWg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a7220a111d8ff17824a6fb9123526fe5ecd0989b --- /dev/null +++ b/annotations_filtered/mokXxWsIsWg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.25], [5.0, 6.86], [8.0, 10.93], [12.0, 15.09], [23.0, 23.48], [27.0, 27.68], [30.0, 30.3], [33.0, 34.94], [39.0, 39.45], [40.0, 42.18], [49.0, 49.25], [54.0, 54.01], [61.0, 61.2], [78.0, 78.02], [78.0, 78.36], [85.0, 84.7], [86.0, 86.98], [102.0, 102.42], [120.0, 120.66], [121.0, 123.87], [135.0, 135.48], [139.0, 139.38], [146.0, 145.59], [151.0, 152.74]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.84, 37.75, 0.0, 0.0, 0.0, 0.0, 0.0, 98.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.43, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["chuckle, chortle", 13.91], ["speech", 11.08], ["snicker", 10.39]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.25, 1.86, 2.93, 3.09, 0.48, 0.68, 0.3, 1.94, 0.45, 2.18, 0.25, 0.01, 0.2, 0.02, 0.36, -0.3, 0.98, 0.42, 0.66, 2.87, 0.48, 0.38, -0.41, 1.74]} \ No newline at end of file diff --git a/annotations_filtered/mpBQ883QIUs_filtered.json b/annotations_filtered/mpBQ883QIUs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..90d4d2e7de23e94be7f20936e0310156a6923e22 --- /dev/null +++ b/annotations_filtered/mpBQ883QIUs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.66], [12.0, 12.58], [14.0, 19.84], [21.0, 38.87], [40.0, 43.55], [50.0, 50.19], [52.0, 53.59], [67.0, 69.72], [76.0, 76.87], [82.0, 83.25], [84.0, 84.52], [85.0, 85.6], [88.0, 88.94], [94.0, 94.14], [95.0, 100.28], [102.0, 109.22], [114.0, 120.01], [121.0, 121.32], [123.0, 122.98], [136.0, 145.56], [150.0, 152.74], [159.0, 164.08], [165.0, 167.97], [171.0, 176.94], [179.0, 179.14], [183.0, 183.98], [186.0, 197.41], [198.0, 201.24]], "keep_status": [false, false, false, true, true, false, false, true, false, false, false, false, false, false, false, true, false, false, false, true, true, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 87.55, 32.61, 48.44, 0.0, 0.0, 34.06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.74, 33.31, 32.73, 0.0, 0.0, 36.37, 37.36, 37.28, 38.36, 42.58, 0.0, 0.0, 63.1, 97.73], "audiomae_on_audioset": [null, null, null, [["music", 33.29], ["speech", 12.79], ["groan", 9.13]], [["speech", 29.7], ["inside, small room", 6.16], ["insect", 5.87]], null, null, [["speech", 30.95], ["music", 21.68], ["boing", 8.62]], null, null, null, null, null, null, null, [["speech", 29.33], ["music", 23.8], ["foghorn", 13.44]], [["music", 56.8], ["speech", 19.53], ["whale vocalization", 2.25]], null, null, [["music", 49.02], ["speech", 8.34], ["musical instrument", 3.28]], [["music", 52.19], ["musical instrument", 2.55], ["brass instrument", 2.42]], [["music", 78.44], ["throbbing", 2.11], ["fart", 1.86]], [["speech", 21.47], ["music", 14.23], ["cowbell", 6.81]], [["music", 46.85], ["speech", 26.97], ["synthesizer", 3.41]], null, null, null, null], "duration": [0.66, 0.58, 5.84, 17.87, 3.55, 0.19, 1.59, 2.72, 0.87, 1.25, 0.52, 0.6, 0.94, 0.14, 5.28, 7.22, 6.01, 0.32, -0.02, 9.56, 2.74, 5.08, 2.97, 5.94, 0.14, 0.98, 11.41, 3.24]} \ No newline at end of file diff --git a/annotations_filtered/mpDGnFwbw0U_filtered.json b/annotations_filtered/mpDGnFwbw0U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f0d9a25dcf9dad207245c19d63eab0d0eef8765 --- /dev/null +++ b/annotations_filtered/mpDGnFwbw0U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.37], [8.0, 8.83], [11.0, 11.5], [13.0, 16.6], [22.0, 22.64], [23.0, 25.49], [32.0, 34.94], [38.0, 39.88], [44.0, 52.42], [55.0, 55.85], [56.0, 57.03], [57.0, 58.7], [62.0, 62.46], [91.0, 91.59], [97.0, 101.78], [123.0, 123.36]], "keep_status": [false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 55.04, 0.0, 42.79, 37.62, 0.0, 44.69, 0.0, 0.0, 0.0, 0.0, 0.0, 37.57, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["creak", 25.14], ["fly, housefly", 15.3], ["insect", 5.84]], [["rumble", 14.01], ["throbbing", 8.43], ["vehicle horn, car horn, honking", 7.2]], null, [["hum", 41.63], ["throbbing", 15.61], ["rumble", 12.77]], null, null, null, null, null, [["speech", 45.32], ["rumble", 17.23], ["hum", 14.94]], null], "duration": [1.37, 0.83, 0.5, 3.6, 0.64, 2.49, 2.94, 1.88, 8.42, 0.85, 1.03, 1.7, 0.46, 0.59, 4.78, 0.36]} \ No newline at end of file diff --git a/annotations_filtered/mpDnD5Pp90I_filtered.json b/annotations_filtered/mpDnD5Pp90I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dea8575017ca650cbd77242a7ce098e6c303b8df --- /dev/null +++ b/annotations_filtered/mpDnD5Pp90I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.24], [10.0, 10.39], [13.0, 12.73], [23.0, 23.14], [28.0, 28.22], [30.0, 30.82], [33.0, 34.1], [37.0, 38.03], [42.0, 52.54], [54.0, 54.35], [58.0, 58.18], [64.0, 64.89], [67.0, 67.58], [70.0, 78.16], [85.0, 85.72], [89.0, 94.37], [95.0, 96.01], [98.0, 98.69], [100.0, 101.26], [103.0, 108.01], [108.0, 111.1], [112.0, 112.24], [113.0, 113.73], [120.0, 120.61], [123.0, 123.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.43, 0.0, 0.0, 0.0, 0.0, 86.09, 0.0, 57.56, 0.0, 0.0, 0.0, 63.85, 60.98, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 34.17], ["music", 27.79], ["hum", 11.31]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.24, 0.39, -0.27, 0.14, 0.22, 0.82, 1.1, 1.03, 10.54, 0.35, 0.18, 0.89, 0.58, 8.16, 0.72, 5.37, 1.01, 0.69, 1.26, 5.01, 3.1, 0.24, 0.73, 0.61, 0.13]} \ No newline at end of file diff --git a/annotations_filtered/mpG7K909Gi4_filtered.json b/annotations_filtered/mpG7K909Gi4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf4de8b958757b6367d0b4acf1a4518adc649ddd --- /dev/null +++ b/annotations_filtered/mpG7K909Gi4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 15.92], [23.0, 27.7], [29.0, 29.47], [31.0, 31.5], [36.0, 36.81], [38.0, 50.11], [51.0, 51.65], [52.0, 54.8], [60.0, 69.99], [72.0, 77.03], [78.0, 78.36], [80.0, 80.57], [83.0, 83.42], [84.0, 90.24], [93.0, 95.0], [96.0, 97.82], [99.0, 103.2], [104.0, 125.37], [127.0, 127.57], [128.0, 129.86]], "keep_status": [false, true, false, false, false, false, false, true, true, true, false, false, false, true, true, false, false, false, false, false], "silence_prob": [30.96, 30.79, 0.0, 0.0, 0.0, 29.91, 0.0, 32.03, 28.68, 30.02, 0.0, 0.0, 0.0, 35.45, 32.01, 0.0, 32.0, 28.96, 0.0, 0.0], "audiomae_on_audioset": [[["fly, housefly", 40.11], ["insect", 35.46], ["bee, wasp, etc.", 10.27]], [["music", 32.41], ["hum", 13.3], ["gong", 9.22]], null, null, null, [["hum", 45.25], ["throbbing", 24.08], ["mains hum", 13.87]], null, [["music", 12.55], ["speech", 11.65], ["animal", 8.66]], [["music", 42.73], ["whale vocalization", 20.46], ["throbbing", 3.8]], [["music", 35.48], ["hum", 17.53], ["throbbing", 16.76]], null, null, null, [["music", 42.9], ["whale vocalization", 14.06], ["theremin", 5.55]], [["music", 46.0], ["giggle", 3.68], ["hum", 3.54]], null, [["hum", 44.15], ["mains hum", 17.67], ["throbbing", 14.6]], [["music", 38.54], ["speech", 30.92], ["buzz", 3.54]], null, null], "duration": [5.92, 4.7, 0.47, 0.5, 0.81, 12.11, 0.65, 2.8, 9.99, 5.03, 0.36, 0.57, 0.42, 6.24, 2.0, 1.82, 4.2, 21.37, 0.57, 1.86]} \ No newline at end of file diff --git a/annotations_filtered/mpfBH5WLlOA_filtered.json b/annotations_filtered/mpfBH5WLlOA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bacf228eaf6f064c9a12ab060aef84c05309a18a --- /dev/null +++ b/annotations_filtered/mpfBH5WLlOA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.69], [15.0, 14.84], [15.0, 15.99], [20.0, 20.46], [20.0, 20.51], [21.0, 20.61], [22.0, 26.59], [27.0, 28.38], [29.0, 38.06], [39.0, 43.73], [49.0, 89.72], [90.0, 96.38], [97.0, 105.36], [106.0, 111.11], [112.0, 116.01], [120.0, 124.68], [126.0, 128.07], [131.0, 131.9]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, true, false, true, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.37, 0.0, 40.52, 34.23, 0.0, 35.22, 28.88, 28.39, 29.47, 30.23, 35.98, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["hum", 42.79], ["mains hum", 15.43], ["throbbing", 11.82]], [["sine wave", 27.93], ["chirp tone", 15.18], ["speech", 11.37]], null, [["music", 24.23], ["glass", 9.52], ["speech", 7.79]], [["speech", 77.06], ["music", 5.43], ["thunk", 2.0]], [["whack, thwack", 15.57], ["breaking", 15.0], ["hammer", 13.01]], [["gong", 16.91], ["speech", 15.1], ["music", 14.8]], [["whale vocalization", 57.6], ["speech", 10.82], ["music", 9.02]], [["speech", 33.36], ["creak", 13.17], ["music", 11.8]], null], "duration": [1.69, -0.16, 0.99, 0.46, 0.51, -0.39, 4.59, 1.38, 9.06, 4.73, 40.72, 6.38, 8.36, 5.11, 4.01, 4.68, 2.07, 0.9]} \ No newline at end of file diff --git a/annotations_filtered/mpgaMjGOeJg_filtered.json b/annotations_filtered/mpgaMjGOeJg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6f4f555458cb85c6abda350457dff8fe1bb0427 --- /dev/null +++ b/annotations_filtered/mpgaMjGOeJg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.98], [11.0, 12.48], [13.0, 14.03], [17.0, 19.97], [23.0, 23.67], [26.0, 25.98], [30.0, 31.06], [34.0, 34.43], [38.0, 38.31], [45.0, 46.06], [47.0, 47.71], [48.0, 49.76], [53.0, 53.62], [57.0, 61.89], [63.0, 65.25], [68.0, 68.89], [72.0, 73.36], [76.0, 77.35], [84.0, 88.23], [89.0, 89.77], [92.0, 102.0], [103.0, 111.27], [116.0, 142.91], [146.0, 152.17], [156.0, 157.96], [159.0, 159.78], [162.0, 165.23], [166.0, 171.51], [173.0, 173.77], [175.0, 193.99], [196.0, 212.65], [217.0, 222.44], [223.0, 223.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 60.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 33.13, 0.0, 0.0, 0.0, 30.92, 0.0, 30.87, 30.52, 94.66, 82.79, 0.0, 0.0, 94.22, 68.93, 0.0, 48.19, 35.49, 33.46, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 60.39], ["groan", 5.58], ["rumble", 2.55]], null, null, null, [["wind instrument, woodwind instrument", 57.65], ["music", 15.01], ["didgeridoo", 10.83]], null, [["animal", 49.45], ["dog", 20.48], ["domestic animals, pets", 12.11]], [["music", 45.02], ["didgeridoo", 9.84], ["wind instrument, woodwind instrument", 9.69]], null, null, null, null, null, null, null, [["music", 75.2], ["synthesizer", 4.05], ["ambient music", 3.49]], [["music", 74.38], ["synthesizer", 5.36], ["soundtrack music", 4.11]], [["music", 65.56], ["speech", 4.07], ["explosion", 3.55]], null], "duration": [-0.02, 1.48, 1.03, 2.97, 0.67, -0.02, 1.06, 0.43, 0.31, 1.06, 0.71, 1.76, 0.62, 4.89, 2.25, 0.89, 1.36, 1.35, 4.23, 0.77, 10.0, 8.27, 26.91, 6.17, 1.96, 0.78, 3.23, 5.51, 0.77, 18.99, 16.65, 5.44, 0.82]} \ No newline at end of file diff --git a/annotations_filtered/mpr3XG5Tzmk_filtered.json b/annotations_filtered/mpr3XG5Tzmk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9a08cca41cf0dea9ae3e54508965728ce0d329ce --- /dev/null +++ b/annotations_filtered/mpr3XG5Tzmk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.45], [15.0, 15.6], [17.0, 18.1], [21.0, 24.34], [26.0, 51.92], [53.0, 91.29], [96.0, 97.41], [103.0, 105.19], [110.0, 112.68], [125.0, 126.47], [128.0, 130.67]], "keep_status": [false, false, false, true, false, false, false, true, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 28.98, 29.66, 0.0, 0.0, 33.02, 30.73, 0.0, 28.57], "audiomae_on_audioset": [null, null, null, [["livestock, farm animals, working animals", 12.77], ["explosion", 8.68], ["insect", 8.44]], [["music", 47.85], ["hum", 14.36], ["electronic music", 8.04]], null, null, [["music", 20.74], ["moo", 7.36], ["frog", 6.44]], [["hum", 25.05], ["music", 25.0], ["mains hum", 11.82]], null, [["buzz", 11.84], ["hum", 8.93], ["fly, housefly", 8.62]]], "duration": [0.45, 0.6, 1.1, 3.34, 25.92, 38.29, 1.41, 2.19, 2.68, 1.47, 2.67]} \ No newline at end of file diff --git a/annotations_filtered/mq2cz9Xvzcw_filtered.json b/annotations_filtered/mq2cz9Xvzcw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..12fde2fc1ccbcf6b7eb9c329fa7690f53908f157 --- /dev/null +++ b/annotations_filtered/mq2cz9Xvzcw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.96], [12.0, 13.17], [15.0, 16.17], [21.0, 21.64], [23.0, 28.41], [33.0, 40.63], [49.0, 50.09], [52.0, 53.27], [56.0, 56.94], [59.0, 59.81], [61.0, 61.53], [64.0, 64.47], [65.0, 71.32], [74.0, 74.7], [76.0, 76.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.78, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.05, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.96, 1.17, 1.17, 0.64, 5.41, 7.63, 1.09, 1.27, 0.94, 0.81, 0.53, 0.47, 6.32, 0.7, 0.96]} \ No newline at end of file diff --git a/annotations_filtered/mqQ8Y9Sjp7o_filtered.json b/annotations_filtered/mqQ8Y9Sjp7o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..deaa58e0ebcdb3a67670de2f2abae61601685542 --- /dev/null +++ b/annotations_filtered/mqQ8Y9Sjp7o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.08], [15.0, 84.37], [86.0, 88.45], [89.0, 89.67], [90.0, 91.27], [93.0, 130.72], [135.0, 147.31], [152.0, 155.19], [157.0, 157.64]], "keep_status": [false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 54.36, 0.0, 0.0, 0.0, 29.95, 41.54, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 25.38], ["sidetone", 18.39], ["hum", 9.1]], [["sidetone", 33.06], ["music", 16.75], ["radio", 14.16]], null], "duration": [1.08, 69.37, 2.45, 0.67, 1.27, 37.72, 12.31, 3.19, 0.64]} \ No newline at end of file diff --git a/annotations_filtered/mqYkD0nMs04_filtered.json b/annotations_filtered/mqYkD0nMs04_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..050218e3a9324744febc7de1dbd3bf1b9e72fe0d --- /dev/null +++ b/annotations_filtered/mqYkD0nMs04_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.18], [10.0, 10.22], [10.0, 15.16], [26.0, 27.28], [40.0, 40.58], [42.0, 43.04], [44.0, 45.47], [50.0, 52.93], [55.0, 55.36], [58.0, 59.21], [79.0, 78.66], [80.0, 81.24], [84.0, 84.18], [89.0, 89.09], [90.0, 90.22]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 36.59, 0.0, 0.0, 0.0, 0.0, 48.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 65.65], ["speech", 14.66], ["electronic music", 5.37]], null, null, null, null, [["boing", 42.19], ["speech", 16.88], ["dog", 3.81]], null, null, null, null, null, null, null], "duration": [0.18, 0.22, 5.16, 1.28, 0.58, 1.04, 1.47, 2.93, 0.36, 1.21, -0.34, 1.24, 0.18, 0.09, 0.22]} \ No newline at end of file diff --git a/annotations_filtered/mqhpZ30uNic_filtered.json b/annotations_filtered/mqhpZ30uNic_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18a99747db3a7106ac19977bbf72583f8b6cbf42 --- /dev/null +++ b/annotations_filtered/mqhpZ30uNic_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.66], [3.0, 121.0], [122.0, 130.55], [146.0, 146.1], [152.0, 153.57], [157.0, 163.75], [165.0, 170.78], [172.0, 173.85], [175.0, 184.62]], "keep_status": [false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 32.45, 0.0, 0.0, 56.4, 36.21, 0.0, 48.27], "audiomae_on_audioset": [null, null, [["music", 34.72], ["hum", 12.78], ["whale vocalization", 5.66]], null, null, null, [["dog", 27.09], ["animal", 26.22], ["bow-wow", 19.09]], null, [["whale vocalization", 85.24], ["speech", 5.43], ["animal", 1.21]]], "duration": [0.66, 118.0, 8.55, 0.1, 1.57, 6.75, 5.78, 1.85, 9.62]} \ No newline at end of file diff --git a/annotations_filtered/mqkYeGeQ1f4_filtered.json b/annotations_filtered/mqkYeGeQ1f4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41ada88a4b84fffc2a6af406d805ec29a34021f7 --- /dev/null +++ b/annotations_filtered/mqkYeGeQ1f4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 26.5], [27.0, 45.87], [47.0, 80.01], [85.0, 98.98]], "keep_status": [false, true, false, false], "silence_prob": [0.0, 30.3, 0.0, 30.58], "audiomae_on_audioset": [null, [["music", 35.05], ["hum", 12.21], ["mains hum", 6.24]], null, [["music", 51.07], ["hum", 19.01], ["throbbing", 9.3]]], "duration": [0.5, 18.87, 33.01, 13.98]} \ No newline at end of file diff --git a/annotations_filtered/mqnB2ef3S6M_filtered.json b/annotations_filtered/mqnB2ef3S6M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f778a650b0af0ad8c4584e389baaba82fc2fa2e5 --- /dev/null +++ b/annotations_filtered/mqnB2ef3S6M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.07], [8.0, 8.78], [13.0, 13.14], [14.0, 18.64], [21.0, 23.77], [25.0, 27.9], [30.0, 32.17], [36.0, 38.21], [40.0, 40.49], [41.0, 42.72], [44.0, 45.35], [46.0, 46.67], [51.0, 50.87], [55.0, 56.08], [61.0, 62.68], [63.0, 63.39], [65.0, 65.82], [67.0, 78.19], [80.0, 84.35], [86.0, 86.43], [87.0, 87.42], [88.0, 88.55], [90.0, 90.29], [93.0, 96.16], [99.0, 102.61], [104.0, 105.61], [107.0, 107.92], [110.0, 111.03], [125.0, 125.9]], "keep_status": [false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 51.66, 56.7, 46.33, 37.41, 44.69, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.96, 40.47, 0.0, 0.0, 0.0, 0.0, 36.28, 47.5, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 23.64], ["theremin", 12.87], ["foghorn", 5.64]], [["speech", 34.94], ["music", 14.83], ["hum", 12.46]], [["mains hum", 42.69], ["hum", 23.79], ["speech", 10.12]], null, null, null, null, null, null, null, null, null, [["music", 69.32], ["speech", 8.95], ["mains hum", 7.18]], [["music", 31.87], ["speech", 13.03], ["hum", 4.86]], null, null, null, null, [["speech", 35.78], ["music", 34.65], ["hiccup", 4.79]], [["music", 46.89], ["frog", 10.34], ["croak", 6.36]], null, null, null, null], "duration": [0.07, 0.78, 0.14, 4.64, 2.77, 2.9, 2.17, 2.21, 0.49, 1.72, 1.35, 0.67, -0.13, 1.08, 1.68, 0.39, 0.82, 11.19, 4.35, 0.43, 0.42, 0.55, 0.29, 3.16, 3.61, 1.61, 0.92, 1.03, 0.9]} \ No newline at end of file diff --git a/annotations_filtered/mqpQgFfidcA_filtered.json b/annotations_filtered/mqpQgFfidcA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..83d6c7e1d479a4fa1aa528ed33693a8257afb169 --- /dev/null +++ b/annotations_filtered/mqpQgFfidcA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.13], [10.0, 10.84], [22.0, 22.76], [36.0, 36.42], [37.0, 39.19], [45.0, 47.53], [59.0, 62.68], [65.0, 68.01], [71.0, 73.5], [81.0, 81.51], [99.0, 100.14], [119.0, 119.2], [133.0, 136.19], [141.0, 142.16], [144.0, 145.57], [147.0, 147.72], [149.0, 150.69], [156.0, 156.34], [161.0, 167.85], [169.0, 174.14]], "keep_status": [true, false, false, false, true, true, true, true, false, false, false, false, true, false, false, false, false, false, true, true], "silence_prob": [33.43, 0.0, 0.0, 0.0, 32.73, 33.0, 33.86, 31.39, 31.04, 0.0, 0.0, 0.0, 35.33, 0.0, 0.0, 0.0, 0.0, 0.0, 36.16, 31.62], "audiomae_on_audioset": [[["music", 35.32], ["clang", 18.66], ["smash, crash", 8.32]], null, null, null, [["music", 28.81], ["speech", 14.83], ["electronic music", 6.57]], [["music", 24.13], ["speech", 12.5], ["moo", 6.86]], [["sidetone", 18.78], ["speech", 17.57], ["hum", 15.62]], [["music", 38.49], ["hum", 11.52], ["mains hum", 10.54]], [["music", 43.86], ["speech", 42.98], ["vehicle", 0.49]], null, null, null, [["music", 35.88], ["speech", 29.58], ["scary music", 3.27]], null, null, null, null, null, [["music", 25.82], ["hum", 21.65], ["mains hum", 21.37]], [["music", 55.0], ["scary music", 3.3], ["hum", 2.58]]], "duration": [2.13, 0.84, 0.76, 0.42, 2.19, 2.53, 3.68, 3.01, 2.5, 0.51, 1.14, 0.2, 3.19, 1.16, 1.57, 0.72, 1.69, 0.34, 6.85, 5.14]} \ No newline at end of file diff --git a/annotations_filtered/mqzu3AI7Dow_filtered.json b/annotations_filtered/mqzu3AI7Dow_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d730eed86f27eaebf6db04b76782f705736027f --- /dev/null +++ b/annotations_filtered/mqzu3AI7Dow_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 13.05], [15.0, 16.66], [24.0, 27.99], [37.0, 47.61], [51.0, 104.55], [106.0, 108.3], [112.0, 118.44]], "keep_status": [true, false, true, true, false, true, true], "silence_prob": [33.44, 0.0, 32.44, 32.21, 0.0, 37.42, 33.9], "audiomae_on_audioset": [[["music", 24.87], ["hum", 12.41], ["electronic music", 5.85]], null, [["speech", 16.52], ["vehicle", 11.3], ["music", 7.49]], [["vehicle", 12.26], ["speech", 11.77], ["music", 9.22]], null, [["whack, thwack", 10.27], ["music", 6.52], ["sound effect", 6.51]], [["speech", 10.56], ["vehicle", 6.07], ["animal", 4.43]]], "duration": [3.05, 1.66, 3.99, 10.61, 53.55, 2.3, 6.44]} \ No newline at end of file diff --git a/annotations_filtered/mr1bVID2qao_filtered.json b/annotations_filtered/mr1bVID2qao_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c96376d4ee14d08f2ee0f5bc666f6fbcd831328 --- /dev/null +++ b/annotations_filtered/mr1bVID2qao_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.91], [12.0, 13.17], [15.0, 15.38], [28.0, 28.43], [59.0, 69.4], [98.0, 97.83], [100.0, 100.62], [129.0, 130.13], [144.0, 144.14], [144.0, 144.17], [145.0, 145.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [34.21, 0.0, 0.0, 0.0, 32.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 73.61], ["synthesizer", 5.84], ["musical instrument", 3.62]], null, null, null, [["music", 80.57], ["musical instrument", 1.51], ["cello", 1.26]], null, null, null, null, null, null], "duration": [5.91, 1.17, 0.38, 0.43, 10.4, -0.17, 0.62, 1.13, 0.14, 0.17, 0.39]} \ No newline at end of file diff --git a/annotations_filtered/mr3L2D4yv-0_filtered.json b/annotations_filtered/mr3L2D4yv-0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2d994c5d8769a0b76cb92043d4f7628606fe875e --- /dev/null +++ b/annotations_filtered/mr3L2D4yv-0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 57.05], [58.0, 64.42], [65.0, 66.04], [66.0, 76.08], [78.0, 83.12], [85.0, 93.38], [95.0, 96.38], [96.0, 96.47], [96.0, 96.52]], "keep_status": [false, true, false, true, false, true, false, false, false], "silence_prob": [0.0, 30.43, 0.0, 31.79, 98.36, 33.21, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 38.92], ["speech", 15.03], ["hum", 4.33]], null, [["music", 42.64], ["smash, crash", 5.61], ["sound effect", 5.28]], null, [["hum", 16.13], ["machine gun", 13.99], ["breaking", 12.44]], null, null, null], "duration": [55.05, 6.42, 1.04, 10.08, 5.12, 8.38, 1.38, 0.47, 0.52]} \ No newline at end of file diff --git a/annotations_filtered/mrx4SwMyGdQ_filtered.json b/annotations_filtered/mrx4SwMyGdQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a5d36821360b605918bc620a9e635733c21c971 --- /dev/null +++ b/annotations_filtered/mrx4SwMyGdQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.58], [5.0, 7.15], [8.0, 8.97], [16.0, 22.69], [23.0, 24.07], [27.0, 28.48], [32.0, 33.79], [38.0, 38.33], [44.0, 44.78], [51.0, 53.15], [54.0, 57.48], [66.0, 66.99], [68.0, 69.82]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 53.84, 0.0, 37.35, 0.0, 0.0, 0.0, 0.0, 0.0, 73.06, 56.33, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 39.03], ["theremin", 9.87], ["synthesizer", 9.43]], null, null, null, null, null, null, null, null, null], "duration": [0.58, 2.15, 0.97, 6.69, 1.07, 1.48, 1.79, 0.33, 0.78, 2.15, 3.48, 0.99, 1.82]} \ No newline at end of file diff --git a/annotations_filtered/msSsPzKVzW0_filtered.json b/annotations_filtered/msSsPzKVzW0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..46ede202a6de4be4134f01d40ad48a9c6fb05103 --- /dev/null +++ b/annotations_filtered/msSsPzKVzW0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.8], [7.0, 7.55], [9.0, 9.73], [13.0, 14.05], [25.0, 25.35], [30.0, 31.92], [38.0, 38.38], [43.0, 43.06], [47.0, 46.65], [47.0, 48.51], [49.0, 49.05], [53.0, 53.32], [56.0, 56.13], [57.0, 57.55], [59.0, 58.99], [60.0, 60.52], [62.0, 63.14], [67.0, 67.36], [68.0, 68.71], [73.0, 73.21], [75.0, 75.59], [76.0, 77.03], [83.0, 83.12], [93.0, 92.99], [104.0, 104.94], [105.0, 105.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.8, 0.55, 0.73, 1.05, 0.35, 1.92, 0.38, 0.06, -0.35, 1.51, 0.05, 0.32, 0.13, 0.55, -0.01, 0.52, 1.14, 0.36, 0.71, 0.21, 0.59, 1.03, 0.12, -0.01, 0.94, 0.76]} \ No newline at end of file diff --git a/annotations_filtered/msWWI02CG-o_filtered.json b/annotations_filtered/msWWI02CG-o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bbd208f5f0da6ce8d261954af073ede6de45afd7 --- /dev/null +++ b/annotations_filtered/msWWI02CG-o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.94], [14.0, 15.3], [22.0, 23.08], [26.0, 27.09], [35.0, 35.36], [36.0, 37.66], [38.0, 39.55], [44.0, 48.81], [49.0, 50.14], [51.0, 51.41], [52.0, 52.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.47, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 65.26], ["electronic music", 5.81], ["techno", 3.01]], null, null, null], "duration": [1.94, 1.3, 1.08, 1.09, 0.36, 1.66, 1.55, 4.81, 1.14, 0.41, 0.22]} \ No newline at end of file diff --git a/annotations_filtered/ms_ERfOYnqI_filtered.json b/annotations_filtered/ms_ERfOYnqI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b100fee9f10f5afd48a3e5faa60afbd7f0d334c4 --- /dev/null +++ b/annotations_filtered/ms_ERfOYnqI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 55.75], [58.0, 70.43], [72.0, 72.4], [73.0, 76.77], [78.0, 79.27], [80.0, 84.28], [87.0, 92.3], [95.0, 101.48]], "keep_status": [false, true, false, false, false, false, false, false], "silence_prob": [0.0, 29.27, 0.0, 57.72, 0.0, 63.53, 51.94, 57.32], "audiomae_on_audioset": [null, [["sound effect", 12.76], ["speech", 10.79], ["explosion", 9.59]], null, null, null, null, null, null], "duration": [40.75, 12.43, 0.4, 3.77, 1.27, 4.28, 5.3, 6.48]} \ No newline at end of file diff --git a/annotations_filtered/msaelEZ_eEs_filtered.json b/annotations_filtered/msaelEZ_eEs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9bebd3169635f5bdb6c2be2e8e21aefe0b86ff0f --- /dev/null +++ b/annotations_filtered/msaelEZ_eEs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.75], [7.0, 37.76], [42.0, 50.06], [52.0, 73.36], [76.0, 95.44], [99.0, 118.86], [119.0, 172.96], [175.0, 177.62], [180.0, 180.33]], "keep_status": [false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 34.29, 32.32, 34.33, 34.81, 0.0, 52.92, 0.0], "audiomae_on_audioset": [null, null, [["speech", 44.11], ["music", 33.89], ["synthesizer", 2.26]], [["music", 46.74], ["theremin", 14.21], ["hum", 8.33]], [["music", 21.53], ["hum", 10.81], ["mains hum", 10.26]], [["music", 67.4], ["synthesizer", 4.03], ["musical instrument", 3.14]], null, null, null], "duration": [0.75, 30.76, 8.06, 21.36, 19.44, 19.86, 53.96, 2.62, 0.33]} \ No newline at end of file diff --git a/annotations_filtered/msoyjm3gCBM_filtered.json b/annotations_filtered/msoyjm3gCBM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cecdd8993d441d11afd04b2051b709e997e1e6fb --- /dev/null +++ b/annotations_filtered/msoyjm3gCBM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[60.0, 120.66], [124.0, 129.22], [131.0, 135.11], [138.0, 139.01], [143.0, 160.57]], "keep_status": [false, true, false, false, false], "silence_prob": [0.0, 28.16, 28.42, 0.0, 28.29], "audiomae_on_audioset": [null, [["music", 47.76], ["speech", 9.24], ["crowd", 3.85]], [["music", 46.87], ["throbbing", 17.09], ["hum", 12.87]], null, [["music", 66.75], ["vehicle", 3.99], ["car", 3.02]]], "duration": [60.66, 5.22, 4.11, 1.01, 17.57]} \ No newline at end of file diff --git a/annotations_filtered/msqRzlYXXQE_filtered.json b/annotations_filtered/msqRzlYXXQE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92faf37425291c4d8fd9a260ff94c0201e3baa73 --- /dev/null +++ b/annotations_filtered/msqRzlYXXQE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 72.74]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [58.74]} \ No newline at end of file diff --git a/annotations_filtered/mszANpbvdM8_filtered.json b/annotations_filtered/mszANpbvdM8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d50e04eb76d54fe6f00bd73205df561046367239 --- /dev/null +++ b/annotations_filtered/mszANpbvdM8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 55.12], [56.0, 87.86], [89.0, 89.01], [90.0, 89.95], [106.0, 106.68], [107.0, 108.14], [112.0, 112.41], [113.0, 114.81], [116.0, 117.26], [118.0, 175.76], [176.0, 176.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [55.12, 31.86, 0.01, -0.05, 0.68, 1.14, 0.41, 1.81, 1.26, 57.76, 0.94]} \ No newline at end of file diff --git a/annotations_filtered/mszPMVP_qcw_filtered.json b/annotations_filtered/mszPMVP_qcw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dc41f24107cd977da5a596824266fcd2681b0f37 --- /dev/null +++ b/annotations_filtered/mszPMVP_qcw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 13.07], [15.0, 17.42], [19.0, 21.56], [22.0, 22.45], [23.0, 24.49], [27.0, 28.88], [32.0, 33.37], [37.0, 37.79], [46.0, 46.48], [61.0, 61.15], [63.0, 64.3], [68.0, 70.63], [75.0, 76.35], [77.0, 78.31], [86.0, 86.73], [95.0, 95.17], [101.0, 101.9], [104.0, 104.18], [104.0, 104.6], [108.0, 107.77], [111.0, 110.74], [128.0, 128.46], [132.0, 132.41], [137.0, 138.16], [142.0, 143.28], [145.0, 148.1], [154.0, 156.2], [157.0, 158.03], [159.0, 159.17], [161.0, 162.19], [165.0, 168.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [67.38, 74.13, 95.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.88, 50.11, 0.0, 0.0, 0.0, 95.09], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 40.36], ["moo", 25.41], ["animal", 9.67]], null, null, null, null, null], "duration": [3.07, 2.42, 2.56, 0.45, 1.49, 1.88, 1.37, 0.79, 0.48, 0.15, 1.3, 2.63, 1.35, 1.31, 0.73, 0.17, 0.9, 0.18, 0.6, -0.23, -0.26, 0.46, 0.41, 1.16, 1.28, 3.1, 2.2, 1.03, 0.17, 1.19, 3.98]} \ No newline at end of file diff --git a/annotations_filtered/mt0zR2uOAB8_filtered.json b/annotations_filtered/mt0zR2uOAB8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f3e19585811d7e84235b03675adc35bd88920ee --- /dev/null +++ b/annotations_filtered/mt0zR2uOAB8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [8.0, 9.29], [10.0, 10.93], [17.0, 17.02], [22.0, 26.08], [30.0, 30.5], [33.0, 33.45], [36.0, 36.63], [48.0, 48.96], [50.0, 50.87], [51.0, 55.48], [57.0, 61.99], [65.0, 75.19], [77.0, 79.95], [83.0, 86.64], [94.0, 98.22], [100.0, 106.46], [111.0, 115.69], [116.0, 138.45], [139.0, 141.39], [142.0, 143.58], [145.0, 147.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, true, true, false, true, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 87.74, 0.0, 0.0, 0.0, 0.0, 0.0, 40.7, 35.72, 34.67, 80.11, 31.76, 31.91, 32.77, 42.48, 32.74, 43.28, 0.0, 41.62], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 28.61], ["music", 27.37], ["synthesizer", 12.53]], [["sidetone", 60.8], ["speech", 7.66], ["coin (dropping)", 6.19]], [["hum", 35.97], ["speech", 17.0], ["mains hum", 8.63]], null, [["music", 31.66], ["speech", 24.83], ["musical instrument", 14.93]], [["music", 49.6], ["hum", 9.94], ["synthesizer", 8.17]], [["hum", 40.27], ["music", 13.87], ["throbbing", 12.93]], [["speech", 34.75], ["music", 30.99], ["hum", 9.0]], [["music", 16.73], ["sidetone", 13.83], ["explosion", 8.87]], [["music", 50.66], ["throbbing", 4.58], ["hum", 3.57]], null, [["speech", 38.63], ["hum", 10.55], ["fly, housefly", 5.06]]], "duration": [0.5, 1.29, 0.93, 0.02, 4.08, 0.5, 0.45, 0.63, 0.96, 0.87, 4.48, 4.99, 10.19, 2.95, 3.64, 4.22, 6.46, 4.69, 22.45, 2.39, 1.58, 2.56]} \ No newline at end of file diff --git a/annotations_filtered/mtkuDgE-qOI_filtered.json b/annotations_filtered/mtkuDgE-qOI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8323ef3bd57315257b64c7127fb82a0c2d3c357 --- /dev/null +++ b/annotations_filtered/mtkuDgE-qOI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 20.46], [21.0, 21.2], [22.0, 78.38], [80.0, 112.6], [114.0, 115.69]], "keep_status": [false, false, false, false, false], "silence_prob": [99.94, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [6.46, 0.2, 56.38, 32.6, 1.69]} \ No newline at end of file diff --git a/annotations_filtered/mtsQ0CR4Z28_filtered.json b/annotations_filtered/mtsQ0CR4Z28_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..add54beeff18f2339ad3673c41aebf4834f02b93 --- /dev/null +++ b/annotations_filtered/mtsQ0CR4Z28_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 68.44], [71.0, 71.83], [72.0, 84.48], [85.0, 86.0], [96.0, 97.23], [99.0, 101.29], [102.0, 108.82], [118.0, 119.75], [120.0, 121.47]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.46, 0.0, 0.0, 67.13, 43.85, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 48.01], ["buzz", 19.7], ["speech", 4.53]], null, null, null, [["music", 60.19], ["theremin", 10.74], ["musical instrument", 5.34]], null, null], "duration": [54.44, 0.83, 12.48, 1.0, 1.23, 2.29, 6.82, 1.75, 1.47]} \ No newline at end of file diff --git a/annotations_filtered/mtuBqolFOVs_filtered.json b/annotations_filtered/mtuBqolFOVs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..450efc2669dab21e53282f26d8d9232d03413281 --- /dev/null +++ b/annotations_filtered/mtuBqolFOVs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.12], [5.0, 6.67], [7.0, 13.49], [14.0, 15.21], [16.0, 18.87], [19.0, 20.33], [25.0, 27.48], [35.0, 38.21], [39.0, 40.44], [40.0, 43.21], [45.0, 45.23], [46.0, 47.95], [53.0, 53.49], [55.0, 57.94], [58.0, 59.9], [61.0, 61.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 90.78, 0.0, 64.41, 0.0, 99.56, 99.82, 0.0, 60.05, 0.0, 0.0, 0.0, 99.71, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.12, 1.67, 6.49, 1.21, 2.87, 1.33, 2.48, 3.21, 1.44, 3.21, 0.23, 1.95, 0.49, 2.94, 1.9, 0.6]} \ No newline at end of file diff --git a/annotations_filtered/mtuuOV4FtKY_filtered.json b/annotations_filtered/mtuuOV4FtKY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..acd635a5f6d1944b62e018a5cab53abd336fe812 --- /dev/null +++ b/annotations_filtered/mtuuOV4FtKY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.94], [4.0, 4.04], [5.0, 7.96], [9.0, 15.11], [16.0, 16.09], [16.0, 20.09], [21.0, 23.38], [28.0, 38.65], [40.0, 40.41], [49.0, 49.94], [50.0, 52.46], [53.0, 54.58], [55.0, 55.44], [60.0, 74.66], [75.0, 78.9], [80.0, 93.75], [95.0, 113.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 61.57, 98.99, 0.0, 75.88, 100.0, 52.22, 0.0, 0.0, 94.37, 0.0, 0.0, 44.6, 93.76, 99.92, 35.77], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 28.88], ["hum", 9.01], ["throbbing", 7.41]], null, null, [["speech", 17.82], ["fly, housefly", 17.7], ["insect", 10.4]]], "duration": [0.94, 0.04, 2.96, 6.11, 0.09, 4.09, 2.38, 10.65, 0.41, 0.94, 2.46, 1.58, 0.44, 14.66, 3.9, 13.75, 18.53]} \ No newline at end of file diff --git a/annotations_filtered/mu-YLZpB6is_filtered.json b/annotations_filtered/mu-YLZpB6is_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa7b41dbeffc96f23a118766b3afcaf93d4153f3 --- /dev/null +++ b/annotations_filtered/mu-YLZpB6is_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 34.52], [37.0, 42.82], [46.0, 47.01], [49.0, 54.38], [55.0, 54.57], [55.0, 63.19], [66.0, 121.2], [122.0, 123.15], [125.0, 125.19], [127.0, 129.32]], "keep_status": [false, false, false, true, false, false, false, false, false, false], "silence_prob": [31.1, 34.09, 0.0, 32.5, 0.0, 32.94, 0.0, 0.0, 0.0, 44.26], "audiomae_on_audioset": [[["music", 70.23], ["animal", 6.13], ["dog", 3.41]], [["music", 68.62], ["theremin", 11.87], ["musical instrument", 2.11]], null, [["music", 18.37], ["whale vocalization", 18.08], ["vehicle", 17.07]], null, [["music", 44.32], ["didgeridoo", 21.78], ["fart", 11.81]], null, null, null, [["speech", 60.0], ["boing", 5.91], ["echo", 4.28]]], "duration": [22.52, 5.82, 1.01, 5.38, -0.43, 8.19, 55.2, 1.15, 0.19, 2.32]} \ No newline at end of file diff --git a/annotations_filtered/muVopS3Yn7s_filtered.json b/annotations_filtered/muVopS3Yn7s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..96642d7f6afe5739bde5d9cd370ffbee8d2d9c75 --- /dev/null +++ b/annotations_filtered/muVopS3Yn7s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 14.52], [27.0, 26.69], [29.0, 44.61], [46.0, 46.75], [49.0, 55.56], [62.0, 62.56], [63.0, 63.32], [66.0, 66.53], [86.0, 86.04], [88.0, 88.82], [93.0, 94.22], [105.0, 107.54], [111.0, 111.75], [114.0, 116.13], [116.0, 117.93]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [41.09, 0.0, 31.88, 0.0, 31.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.66, 0.0, 37.95, 0.0], "audiomae_on_audioset": [[["music", 41.1], ["hum", 9.96], ["throbbing", 8.81]], null, [["cattle, bovinae", 42.09], ["moo", 33.12], ["livestock, farm animals, working animals", 15.92]], null, [["music", 29.62], ["throbbing", 26.11], ["hum", 21.4]], null, null, null, null, null, null, [["cattle, bovinae", 36.76], ["moo", 29.42], ["livestock, farm animals, working animals", 27.56]], null, [["moo", 45.34], ["cattle, bovinae", 32.74], ["livestock, farm animals, working animals", 19.29]], null], "duration": [3.52, -0.31, 15.61, 0.75, 6.56, 0.56, 0.32, 0.53, 0.04, 0.82, 1.22, 2.54, 0.75, 2.13, 1.93]} \ No newline at end of file diff --git a/annotations_filtered/mudt7nvWwo4_filtered.json b/annotations_filtered/mudt7nvWwo4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a249ecc27c8425a0564eeb8201547f28b402b73 --- /dev/null +++ b/annotations_filtered/mudt7nvWwo4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.73], [6.0, 7.11], [7.0, 12.51], [13.0, 15.2], [16.0, 17.37], [18.0, 22.01], [24.0, 25.79], [27.0, 29.27], [32.0, 40.26], [43.0, 45.25], [49.0, 50.3], [52.0, 53.28]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 64.52, 51.88, 0.0, 41.5, 0.0, 33.28, 32.66, 31.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 50.01], ["synthesizer", 12.15], ["electronic music", 4.78]], null, [["music", 41.27], ["speech", 20.6], ["foghorn", 9.23]], [["music", 56.41], ["synthesizer", 20.03], ["theremin", 3.88]], [["music", 29.29], ["speech", 19.73], ["foghorn", 11.91]], null, null], "duration": [0.73, 1.11, 5.51, 2.2, 1.37, 4.01, 1.79, 2.27, 8.26, 2.25, 1.3, 1.28]} \ No newline at end of file diff --git a/annotations_filtered/mvAkLCKYvwU_filtered.json b/annotations_filtered/mvAkLCKYvwU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..14db6a65ae68c4ed4232db0d0f7351116101d735 --- /dev/null +++ b/annotations_filtered/mvAkLCKYvwU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.87], [6.0, 7.18], [15.0, 18.42], [23.0, 23.97], [27.0, 28.93], [30.0, 34.52], [43.0, 44.12], [47.0, 47.11], [48.0, 60.83]], "keep_status": [false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 49.59, 0.0, 0.0, 32.92, 0.0, 0.0, 33.36], "audiomae_on_audioset": [null, null, [["music", 35.18], ["theremin", 32.01], ["foghorn", 7.65]], null, null, [["music", 49.78], ["hum", 7.21], ["musical instrument", 6.69]], null, null, [["music", 30.04], ["trombone", 21.61], ["brass instrument", 20.37]]], "duration": [1.87, 1.18, 3.42, 0.97, 1.93, 4.52, 1.12, 0.11, 12.83]} \ No newline at end of file diff --git a/annotations_filtered/mvH6IhKpehk_filtered.json b/annotations_filtered/mvH6IhKpehk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..792049977dced172ca16befcc5cf1f41fc5f97a7 --- /dev/null +++ b/annotations_filtered/mvH6IhKpehk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.92], [10.0, 11.1], [12.0, 13.17], [18.0, 18.28], [19.0, 19.75], [20.0, 20.88], [21.0, 34.05], [40.0, 44.81], [53.0, 53.25], [63.0, 63.17], [65.0, 65.26], [80.0, 80.57], [91.0, 90.75], [92.0, 92.23], [105.0, 105.68], [108.0, 108.73], [111.0, 112.04], [113.0, 113.19], [133.0, 132.73], [138.0, 138.75], [139.0, 139.53], [140.0, 140.58], [146.0, 146.57], [154.0, 154.14]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.7, 35.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 45.08], ["didgeridoo", 8.71], ["musical instrument", 5.41]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.92, 1.1, 1.17, 0.28, 0.75, 0.88, 13.05, 4.81, 0.25, 0.17, 0.26, 0.57, -0.25, 0.23, 0.68, 0.73, 1.04, 0.19, -0.27, 0.75, 0.53, 0.58, 0.57, 0.14]} \ No newline at end of file diff --git a/annotations_filtered/mvWdOSJ7l2c_filtered.json b/annotations_filtered/mvWdOSJ7l2c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..16c91bcfd36dc20fc1fce2b26b64a449122c641b --- /dev/null +++ b/annotations_filtered/mvWdOSJ7l2c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 47.97], [54.0, 73.77], [82.0, 84.08], [86.0, 88.47], [92.0, 94.04], [96.0, 103.91], [104.0, 106.89], [108.0, 111.11], [113.0, 117.07], [119.0, 120.88], [124.0, 124.29], [128.0, 129.05]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.78, 41.87, 99.99, 100.0, 100.0, 100.0, 99.99, 100.0, 99.96, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 41.92], ["didgeridoo", 11.43], ["cattle, bovinae", 6.94]], null, null, null, null, null, null, null, null, null, null], "duration": [12.97, 19.77, 2.08, 2.47, 2.04, 7.91, 2.89, 3.11, 4.07, 1.88, 0.29, 1.05]} \ No newline at end of file diff --git a/annotations_filtered/mvYdMO5ZfYM_filtered.json b/annotations_filtered/mvYdMO5ZfYM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a14ee4be26cc45ed1ff7e9b81fa8ef0110dbde53 --- /dev/null +++ b/annotations_filtered/mvYdMO5ZfYM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.86], [10.0, 11.65], [16.0, 18.35], [19.0, 24.06], [29.0, 30.47], [32.0, 34.64], [36.0, 36.36], [39.0, 40.71], [46.0, 47.31], [48.0, 49.91], [51.0, 53.1], [54.0, 57.1], [60.0, 61.43], [63.0, 64.42], [67.0, 70.44], [71.0, 73.48], [75.0, 78.46], [81.0, 81.16], [82.0, 87.64], [88.0, 91.89], [93.0, 95.05], [97.0, 97.92], [101.0, 103.79], [108.0, 110.13], [113.0, 115.72], [116.0, 118.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [88.83, 0.0, 80.82, 77.2, 0.0, 61.87, 0.0, 0.0, 0.0, 0.0, 73.51, 98.73, 0.0, 0.0, 84.62, 99.31, 95.78, 0.0, 98.66, 64.86, 76.2, 0.0, 87.92, 88.83, 72.6, 59.77], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.86, 1.65, 2.35, 5.06, 1.47, 2.64, 0.36, 1.71, 1.31, 1.91, 2.1, 3.1, 1.43, 1.42, 3.44, 2.48, 3.46, 0.16, 5.64, 3.89, 2.05, 0.92, 2.79, 2.13, 2.72, 2.59]} \ No newline at end of file diff --git a/annotations_filtered/mvbLx0pbohk_filtered.json b/annotations_filtered/mvbLx0pbohk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17042b9a901dfe4ef3ae34d79b993530309bf2ad --- /dev/null +++ b/annotations_filtered/mvbLx0pbohk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 83.17], [83.0, 93.51], [97.0, 117.76], [121.0, 125.14]], "keep_status": [false, true, true, true], "silence_prob": [0.0, 29.71, 30.36, 29.9], "audiomae_on_audioset": [null, [["vehicle", 16.83], ["buzz", 10.66], ["outside, rural or natural", 5.07]], [["music", 30.83], ["cacophony", 13.49], ["noise", 6.46]], [["hum", 16.2], ["speech", 13.05], ["buzzer", 8.58]]], "duration": [66.17, 10.51, 20.76, 4.14]} \ No newline at end of file diff --git a/annotations_filtered/mvgKGY5m71w_filtered.json b/annotations_filtered/mvgKGY5m71w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e4a8471883ea5d90506697b4092d40be18344d7 --- /dev/null +++ b/annotations_filtered/mvgKGY5m71w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.32], [7.0, 11.74], [14.0, 18.17], [21.0, 22.0], [23.0, 24.29], [26.0, 28.05], [31.0, 30.86], [32.0, 35.09], [41.0, 46.7], [48.0, 49.08], [51.0, 52.27], [54.0, 57.28], [60.0, 60.49], [61.0, 65.82], [67.0, 67.54], [69.0, 70.48], [71.0, 75.12], [78.0, 82.56], [86.0, 86.58], [89.0, 90.98], [93.0, 95.13], [96.0, 98.24], [101.0, 101.68], [104.0, 106.57], [108.0, 110.42], [113.0, 116.18], [117.0, 119.45], [120.0, 122.25], [124.0, 126.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 100.0, 0.0, 0.0, 100.0, 0.0, 100.0, 100.0, 0.0, 0.0, 100.0, 0.0, 99.99, 0.0, 0.0, 99.68, 100.0, 0.0, 0.0, 71.72, 100.0, 0.0, 100.0, 100.0, 100.0, 86.82, 63.85, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.32, 4.74, 4.17, 1.0, 1.29, 2.05, -0.14, 3.09, 5.7, 1.08, 1.27, 3.28, 0.49, 4.82, 0.54, 1.48, 4.12, 4.56, 0.58, 1.98, 2.13, 2.24, 0.68, 2.57, 2.42, 3.18, 2.45, 2.25, 2.93]} \ No newline at end of file diff --git a/annotations_filtered/mvmAa1cYZK4_filtered.json b/annotations_filtered/mvmAa1cYZK4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2d3a5eb31e9bfc8265df3eb30663bc64bdeab250 --- /dev/null +++ b/annotations_filtered/mvmAa1cYZK4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.23], [6.0, 7.15], [9.0, 10.86], [12.0, 11.77], [15.0, 18.15], [19.0, 20.38], [25.0, 25.91], [26.0, 27.14], [27.0, 27.87], [29.0, 29.66], [30.0, 36.1], [37.0, 38.06], [40.0, 48.95], [49.0, 53.5], [55.0, 59.14], [61.0, 62.68], [65.0, 66.61], [77.0, 78.92], [81.0, 89.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, true, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.44, 0.0, 33.37, 32.24, 31.25, 0.0, 0.0, 0.0, 30.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 31.7], ["animal", 4.48], ["dog", 4.15]], null, [["music", 35.0], ["gong", 16.4], ["hum", 10.89]], [["music", 61.87], ["mains hum", 12.51], ["hum", 7.9]], [["music", 49.6], ["synthesizer", 11.51], ["hum", 4.69]], null, null, null, [["music", 37.14], ["synthesizer", 15.32], ["sidetone", 12.73]]], "duration": [0.23, 1.15, 1.86, -0.23, 3.15, 1.38, 0.91, 1.14, 0.87, 0.66, 6.1, 1.06, 8.95, 4.5, 4.14, 1.68, 1.61, 1.92, 8.18]} \ No newline at end of file diff --git a/annotations_filtered/mw3M1fIiegc_filtered.json b/annotations_filtered/mw3M1fIiegc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..628969152f48ca3c4e56a951414ec82a5d96a5fe --- /dev/null +++ b/annotations_filtered/mw3M1fIiegc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.43], [5.0, 6.56], [9.0, 10.25], [12.0, 13.44], [15.0, 15.57], [17.0, 18.52], [20.0, 21.98], [24.0, 25.59], [28.0, 30.69], [32.0, 34.11], [35.0, 35.55], [38.0, 38.42], [39.0, 40.54], [42.0, 44.1], [46.0, 46.28], [47.0, 47.49], [50.0, 50.35], [52.0, 56.1], [58.0, 60.54], [61.0, 63.1], [67.0, 67.54], [68.0, 70.9], [73.0, 73.5], [75.0, 76.32], [80.0, 81.57], [83.0, 89.07], [89.0, 93.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.04, 97.73, 0.0, 0.0, 0.0, 82.07, 0.0, 0.0, 0.0, 94.37, 95.51, 96.42, 0.0, 64.41, 0.0, 0.0, 0.0, 99.21, 79.94], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.43, 1.56, 1.25, 1.44, 0.57, 1.52, 1.98, 1.59, 2.69, 2.11, 0.55, 0.42, 1.54, 2.1, 0.28, 0.49, 0.35, 4.1, 2.54, 2.1, 0.54, 2.9, 0.5, 1.32, 1.57, 6.07, 4.18]} \ No newline at end of file diff --git a/annotations_filtered/mw7xjHBJOvs_filtered.json b/annotations_filtered/mw7xjHBJOvs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a8f735a1ed92b9d3535e414ef9ef9e4a564d6271 --- /dev/null +++ b/annotations_filtered/mw7xjHBJOvs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.67], [11.0, 11.03], [17.0, 17.81], [21.0, 21.51], [29.0, 29.19], [36.0, 36.46], [44.0, 47.83], [52.0, 55.04], [55.0, 55.11], [55.0, 55.14], [80.0, 80.87], [86.0, 87.02], [90.0, 97.29], [98.0, 104.7], [108.0, 108.9]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.07, 30.05, 0.0, 0.0, 0.0, 0.0, 33.11, 54.36, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 50.35], ["sidetone", 7.24], ["busy signal", 6.22]], [["speech", 90.86], ["sheep", 1.54], ["whimper", 1.44]], null, null, null, null, [["moo", 33.41], ["cattle, bovinae", 30.95], ["livestock, farm animals, working animals", 24.44]], null, null], "duration": [-0.33, 0.03, 0.81, 0.51, 0.19, 0.46, 3.83, 3.04, 0.11, 0.14, 0.87, 1.02, 7.29, 6.7, 0.9]} \ No newline at end of file diff --git a/annotations_filtered/mw96cSYo9dU_filtered.json b/annotations_filtered/mw96cSYo9dU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e48298993e5535362e008e4d0d3e5ff0d7ce87b2 --- /dev/null +++ b/annotations_filtered/mw96cSYo9dU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 17.46], [20.0, 21.91], [23.0, 23.7], [25.0, 26.7], [29.0, 29.96], [32.0, 32.44], [34.0, 35.34], [39.0, 40.07], [41.0, 42.82], [45.0, 47.06], [48.0, 51.53], [52.0, 52.83], [54.0, 54.41], [56.0, 58.8], [61.0, 61.99], [64.0, 65.26], [67.0, 68.76], [74.0, 74.36], [78.0, 79.44], [81.0, 81.01], [82.0, 109.39], [110.0, 110.96], [112.0, 113.91], [114.0, 114.13], [116.0, 117.41], [119.0, 120.18], [122.0, 122.28], [123.0, 123.94], [127.0, 127.06], [129.0, 129.54]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [29.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.44, 30.0, 0.0, 0.0, 29.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["explosion", 25.16], ["hum", 20.08], ["throbbing", 16.61]], null, null, null, null, null, null, null, null, null, [["speech", 54.97], ["explosion", 11.77], ["burst, pop", 7.16]], null, null, [["speech", 40.17], ["hum", 9.18], ["explosion", 6.06]], null, null, null, null, null, null, [["hum", 37.42], ["explosion", 14.55], ["throbbing", 11.48]], null, null, null, null, null, null, null, null, null], "duration": [13.46, 1.91, 0.7, 1.7, 0.96, 0.44, 1.34, 1.07, 1.82, 2.06, 3.53, 0.83, 0.41, 2.8, 0.99, 1.26, 1.76, 0.36, 1.44, 0.01, 27.39, 0.96, 1.91, 0.13, 1.41, 1.18, 0.28, 0.94, 0.06, 0.54]} \ No newline at end of file diff --git a/annotations_filtered/mwAlagYhRV8_filtered.json b/annotations_filtered/mwAlagYhRV8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95770eb0ad56a218cad2a982d60914fa405420f2 --- /dev/null +++ b/annotations_filtered/mwAlagYhRV8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 35.31], [63.0, 69.9], [71.0, 71.83], [73.0, 79.66], [82.0, 83.24], [87.0, 88.69], [95.0, 98.0], [101.0, 104.68], [106.0, 114.91], [117.0, 123.45], [128.0, 129.42], [133.0, 133.78], [139.0, 141.08], [143.0, 143.67], [145.0, 152.79], [159.0, 163.97], [170.0, 171.36]], "keep_status": [false, true, false, true, false, false, true, true, true, false, false, false, false, false, false, false, false], "silence_prob": [33.21, 30.6, 0.0, 30.73, 0.0, 0.0, 33.28, 32.47, 30.67, 30.9, 0.0, 0.0, 30.59, 0.0, 29.36, 29.73, 0.0], "audiomae_on_audioset": [[["music", 66.34], ["mains hum", 10.82], ["hum", 8.51]], [["music", 30.05], ["mains hum", 20.46], ["hum", 14.14]], null, [["mains hum", 31.16], ["hum", 21.45], ["music", 16.87]], null, null, [["music", 31.08], ["hum", 17.13], ["mains hum", 13.61]], [["music", 36.68], ["whale vocalization", 12.23], ["speech", 4.16]], [["speech", 25.5], ["hum", 23.41], ["music", 11.25]], [["music", 44.11], ["speech", 25.04], ["mains hum", 7.38]], null, null, [["music", 53.02], ["mains hum", 12.57], ["hum", 7.56]], null, [["speech", 27.9], ["eruption", 24.83], ["explosion", 17.68]], [["eruption", 41.45], ["speech", 20.12], ["explosion", 15.43]], null], "duration": [22.31, 6.9, 0.83, 6.66, 1.24, 1.69, 3.0, 3.68, 8.91, 6.45, 1.42, 0.78, 2.08, 0.67, 7.79, 4.97, 1.36]} \ No newline at end of file diff --git a/annotations_filtered/mwHOh0YPpBU_filtered.json b/annotations_filtered/mwHOh0YPpBU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/mwHOh0YPpBU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/mwMmZ8dtWNM_filtered.json b/annotations_filtered/mwMmZ8dtWNM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a54c90c18021fa2cc0c8abd734a397d341249ee --- /dev/null +++ b/annotations_filtered/mwMmZ8dtWNM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.44], [8.0, 8.82], [17.0, 17.49], [22.0, 22.82], [45.0, 45.45], [47.0, 47.95], [54.0, 55.32], [62.0, 62.63], [64.0, 64.0], [71.0, 73.09], [74.0, 77.79], [80.0, 80.99], [84.0, 87.67], [89.0, 91.5], [92.0, 96.4], [103.0, 104.26], [105.0, 105.16], [106.0, 116.21], [122.0, 122.49], [124.0, 140.12], [142.0, 142.64], [144.0, 145.02], [147.0, 150.31], [153.0, 153.66], [168.0, 167.97], [170.0, 171.37], [178.0, 178.85], [185.0, 185.16], [187.0, 187.52], [192.0, 192.89], [194.0, 197.09], [200.0, 201.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [62.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.44, 99.87, 0.0, 100.0, 98.1, 82.97, 0.0, 0.0, 79.59, 0.0, 50.02, 0.0, 0.0, 46.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.29, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 56.26], ["speech", 6.91], ["musical instrument", 2.62]], null, null, null, null, null, null, null, null, null], "duration": [3.44, 0.82, 0.49, 0.82, 0.45, 0.95, 1.32, 0.63, 0.0, 2.09, 3.79, 0.99, 3.67, 2.5, 4.4, 1.26, 0.16, 10.21, 0.49, 16.12, 0.64, 1.02, 3.31, 0.66, -0.03, 1.37, 0.85, 0.16, 0.52, 0.89, 3.09, 1.23]} \ No newline at end of file diff --git a/annotations_filtered/mwqxM-ccpNE_filtered.json b/annotations_filtered/mwqxM-ccpNE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8566ec5fbfe1d675eb1abf6f05945fe033b703cb --- /dev/null +++ b/annotations_filtered/mwqxM-ccpNE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.0], [4.0, 4.14], [12.0, 12.02], [18.0, 18.67], [22.0, 22.3], [27.0, 27.78], [29.0, 29.37], [33.0, 33.3]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [51.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [2.0, 0.14, 0.02, 0.67, 0.3, 0.78, 0.37, 0.3]} \ No newline at end of file diff --git a/annotations_filtered/mwrMEQnMRCQ_filtered.json b/annotations_filtered/mwrMEQnMRCQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..779cfcc8db9102901371f2b230fb35c3ce873bd4 --- /dev/null +++ b/annotations_filtered/mwrMEQnMRCQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.51], [27.0, 34.05], [37.0, 63.8], [66.0, 84.89], [85.0, 93.43], [94.0, 105.76], [112.0, 113.64], [115.0, 117.21], [120.0, 124.06], [131.0, 130.79], [131.0, 132.73]], "keep_status": [false, false, false, false, true, false, false, true, true, false, false], "silence_prob": [0.0, 29.69, 29.15, 28.97, 29.28, 29.62, 0.0, 40.84, 31.83, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 49.03], ["throbbing", 20.92], ["hum", 11.98]], [["music", 62.93], ["throbbing", 9.52], ["hum", 6.24]], [["music", 49.01], ["throbbing", 20.75], ["electronic music", 5.92]], [["music", 55.57], ["buzz", 6.49], ["speech", 5.44]], [["music", 71.21], ["buzz", 5.9], ["hum", 2.64]], null, [["fly, housefly", 20.75], ["insect", 13.35], ["hum", 8.61]], [["music", 28.62], ["speech", 14.1], ["throbbing", 9.76]], null, null], "duration": [0.51, 7.05, 26.8, 18.89, 8.43, 11.76, 1.64, 2.21, 4.06, -0.21, 1.73]} \ No newline at end of file diff --git a/annotations_filtered/mx15l4L4Zlk_filtered.json b/annotations_filtered/mx15l4L4Zlk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f271c115744fb0e3eb56edda06415fa9492d6f06 --- /dev/null +++ b/annotations_filtered/mx15l4L4Zlk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 29.47], [30.0, 35.95], [37.0, 39.07], [40.0, 40.93], [42.0, 42.26], [44.0, 46.85], [50.0, 50.19], [52.0, 52.44], [58.0, 58.7], [60.0, 61.03], [63.0, 64.03], [65.0, 67.41], [69.0, 70.01], [72.0, 72.39], [73.0, 125.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.0, 57.89, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.63, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 45.7], ["music", 15.54], ["mains hum", 13.01]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [16.47, 5.95, 2.07, 0.93, 0.26, 2.85, 0.19, 0.44, 0.7, 1.03, 1.03, 2.41, 1.01, 0.39, 52.52]} \ No newline at end of file diff --git a/annotations_filtered/mxJtFvNByKw_filtered.json b/annotations_filtered/mxJtFvNByKw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d1e42c7a8fcbb44203a013e6a639a27ec8f100b3 --- /dev/null +++ b/annotations_filtered/mxJtFvNByKw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.44], [7.0, 7.57], [10.0, 10.47], [13.0, 13.19], [18.0, 20.28], [27.0, 28.86], [29.0, 32.19]], "keep_status": [false, false, false, false, true, false, true], "silence_prob": [41.38, 0.0, 0.0, 0.0, 41.01, 0.0, 39.07], "audiomae_on_audioset": [[["music", 54.78], ["didgeridoo", 19.81], ["speech", 3.35]], null, null, null, [["music", 48.19], ["theremin", 12.39], ["ambient music", 4.8]], null, [["music", 20.04], ["speech", 18.69], ["hum", 16.63]]], "duration": [3.44, 0.57, 0.47, 0.19, 2.28, 1.86, 3.19]} \ No newline at end of file diff --git a/annotations_filtered/mxz_RfabdUo_filtered.json b/annotations_filtered/mxz_RfabdUo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e8960e61349848707711f592c951dc743074060 --- /dev/null +++ b/annotations_filtered/mxz_RfabdUo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.01], [13.0, 13.86], [14.0, 14.23], [23.0, 25.24], [29.0, 29.47], [32.0, 32.24], [33.0, 33.52], [35.0, 36.0], [37.0, 37.22], [39.0, 47.58], [49.0, 50.25], [51.0, 55.09], [56.0, 56.73], [58.0, 58.16], [72.0, 72.22], [75.0, 74.95], [77.0, 76.81], [77.0, 77.38], [80.0, 80.01], [83.0, 83.4], [87.0, 87.76], [94.0, 94.15], [96.0, 97.12], [103.0, 103.94], [106.0, 106.2], [114.0, 115.28], [117.0, 117.41], [131.0, 131.35], [133.0, 133.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 87.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.95, 0.0, 91.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.01, 0.86, 0.23, 2.24, 0.47, 0.24, 0.52, 1.0, 0.22, 8.58, 1.25, 4.09, 0.73, 0.16, 0.22, -0.05, -0.19, 0.38, 0.01, 0.4, 0.76, 0.15, 1.12, 0.94, 0.2, 1.28, 0.41, 0.35, 0.47]} \ No newline at end of file diff --git a/annotations_filtered/myOTp1wr3Bg_filtered.json b/annotations_filtered/myOTp1wr3Bg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3ae2e155a99a37daa5f0f230105f5283dd94a67 --- /dev/null +++ b/annotations_filtered/myOTp1wr3Bg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.31], [10.0, 10.52], [11.0, 17.96], [20.0, 29.88], [35.0, 35.55], [36.0, 38.06], [44.0, 44.63], [45.0, 47.65], [52.0, 52.88], [61.0, 64.13], [65.0, 68.13], [69.0, 69.3], [74.0, 74.28], [76.0, 76.23], [80.0, 92.84]], "keep_status": [false, false, false, true, false, false, false, false, false, true, true, false, false, false, true], "silence_prob": [0.0, 0.0, 64.75, 31.23, 0.0, 75.39, 0.0, 62.47, 0.0, 43.79, 48.23, 0.0, 0.0, 0.0, 36.92], "audiomae_on_audioset": [null, null, null, [["machine gun", 18.34], ["noise", 15.01], ["speech", 9.33]], null, null, null, null, null, [["vehicle", 21.16], ["aircraft", 7.38], ["speech", 7.19]], [["frog", 21.14], ["electric shaver, electric razor", 13.49], ["whale vocalization", 10.89]], null, null, null, [["music", 23.85], ["hum", 9.86], ["noise", 6.35]]], "duration": [0.31, 0.52, 6.96, 9.88, 0.55, 2.06, 0.63, 2.65, 0.88, 3.13, 3.13, 0.3, 0.28, 0.23, 12.84]} \ No newline at end of file diff --git a/annotations_filtered/mySMw3VkEBE_filtered.json b/annotations_filtered/mySMw3VkEBE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b288832a6a4df4e5350c8f284df9a05bde6b734d --- /dev/null +++ b/annotations_filtered/mySMw3VkEBE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.31], [5.0, 9.96], [11.0, 14.35], [16.0, 21.54], [24.0, 27.11], [28.0, 30.15], [31.0, 34.26], [36.0, 37.2], [38.0, 39.02], [43.0, 44.51], [46.0, 46.06], [47.0, 48.46], [51.0, 51.26], [54.0, 54.6], [56.0, 61.01], [62.0, 72.06], [77.0, 89.31], [100.0, 101.53], [104.0, 104.82], [120.0, 129.07], [130.0, 132.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [79.94, 53.72, 99.16, 75.72, 70.86, 99.05, 52.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.92, 56.63, 37.93, 0.0, 0.0, 72.16, 52.92], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["busy signal", 31.57], ["dial tone", 30.06], ["sine wave", 12.16]], null, [["speech", 43.58], ["telephone", 25.47], ["telephone bell ringing", 16.28]], null, null, null, null], "duration": [3.31, 4.96, 3.35, 5.54, 3.11, 2.15, 3.26, 1.2, 1.02, 1.51, 0.06, 1.46, 0.26, 0.6, 5.01, 10.06, 12.31, 1.53, 0.82, 9.07, 2.16]} \ No newline at end of file diff --git a/annotations_filtered/myZDn8fFRLY_filtered.json b/annotations_filtered/myZDn8fFRLY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..75dabbc259706ba17d32554aff22c9775dd4c971 --- /dev/null +++ b/annotations_filtered/myZDn8fFRLY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 18.44], [26.0, 27.35], [50.0, 63.58], [69.0, 70.07], [73.0, 72.94], [104.0, 104.25], [107.0, 107.81], [112.0, 112.31], [113.0, 114.12], [115.0, 116.02], [131.0, 132.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [53.47, 0.0, 32.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 55.49], ["speech", 18.28], ["groan", 6.54]], null, null, null, null, null, null, null, null], "duration": [13.44, 1.35, 13.58, 1.07, -0.06, 0.25, 0.81, 0.31, 1.12, 1.02, 1.71]} \ No newline at end of file diff --git a/annotations_filtered/mycAsRhAr_M_filtered.json b/annotations_filtered/mycAsRhAr_M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..539bb68871bfd32402fd75705846edb96aff8dcf --- /dev/null +++ b/annotations_filtered/mycAsRhAr_M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.7], [8.0, 7.74], [8.0, 7.77], [8.0, 7.8], [8.0, 13.78], [15.0, 16.02], [17.0, 19.28], [23.0, 24.38], [26.0, 26.74], [27.0, 32.32], [34.0, 39.26], [40.0, 41.15], [44.0, 45.81], [49.0, 53.43], [54.0, 56.88], [58.0, 62.9], [65.0, 70.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 56.4, 0.0, 62.99, 0.0, 0.0, 78.21, 95.37, 0.0, 0.0, 51.82, 48.69, 43.1, 43.74], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 26.22], ["theremin", 18.15], ["shofar", 13.29]], [["theremin", 50.28], ["music", 22.98], ["speech", 5.53]], [["music", 65.09], ["theremin", 19.74], ["musical instrument", 3.06]]], "duration": [-0.3, -0.26, -0.23, -0.2, 5.78, 1.02, 2.28, 1.38, 0.74, 5.32, 5.26, 1.15, 1.81, 4.43, 2.88, 4.9, 5.28]} \ No newline at end of file diff --git a/annotations_filtered/mydc8K7yaZI_filtered.json b/annotations_filtered/mydc8K7yaZI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa779d15aacdb575c7544fc93878f78f37a370c1 --- /dev/null +++ b/annotations_filtered/mydc8K7yaZI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.12], [10.0, 10.39], [15.0, 15.97], [17.0, 16.98], [24.0, 24.56], [27.0, 27.31], [28.0, 41.08], [45.0, 45.06]], "keep_status": [false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.09, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 20.86], ["moo", 7.38], ["cattle, bovinae", 6.1]], null], "duration": [0.12, 0.39, 0.97, -0.02, 0.56, 0.31, 13.08, 0.06]} \ No newline at end of file diff --git a/annotations_filtered/mz6dgt11n-E_filtered.json b/annotations_filtered/mz6dgt11n-E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13ed034baf16b0358f15f9b1290ba5d625e9085c --- /dev/null +++ b/annotations_filtered/mz6dgt11n-E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.8], [11.0, 12.51], [14.0, 14.84], [15.0, 15.74], [19.0, 22.35], [23.0, 23.77], [24.0, 25.46], [27.0, 29.0], [29.0, 30.55], [37.0, 37.71], [43.0, 43.16], [44.0, 45.03], [51.0, 51.85], [53.0, 53.1], [54.0, 55.21], [56.0, 60.35], [64.0, 65.48], [72.0, 71.88], [75.0, 76.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 99.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.82, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.8, 1.51, 0.84, 0.74, 3.35, 0.77, 1.46, 2.0, 1.55, 0.71, 0.16, 1.03, 0.85, 0.1, 1.21, 4.35, 1.48, -0.12, 1.94]} \ No newline at end of file diff --git a/annotations_filtered/mzNUbT2sQT4_filtered.json b/annotations_filtered/mzNUbT2sQT4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..847e2cabac02229404098e8b6a766ad5fc4e3435 --- /dev/null +++ b/annotations_filtered/mzNUbT2sQT4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.74], [12.0, 12.97], [14.0, 14.91], [16.0, 16.14], [18.0, 21.46], [26.0, 26.77], [30.0, 31.09], [33.0, 33.83], [37.0, 37.2], [43.0, 43.82], [46.0, 47.36], [52.0, 52.81], [53.0, 54.18], [55.0, 60.2], [64.0, 63.96], [68.0, 68.71], [74.0, 74.16], [75.0, 76.2], [78.0, 78.54], [81.0, 84.55], [90.0, 92.7], [95.0, 96.82], [100.0, 101.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.1, 0.0, 0.0, 0.0, 0.0, 0.0, 46.9, 97.33, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 17.91], ["creak", 16.6], ["mosquito", 13.36]], null, null, null], "duration": [0.74, 0.97, 0.91, 0.14, 3.46, 0.77, 1.09, 0.83, 0.2, 0.82, 1.36, 0.81, 1.18, 5.2, -0.04, 0.71, 0.16, 1.2, 0.54, 3.55, 2.7, 1.82, 1.43]} \ No newline at end of file diff --git a/annotations_filtered/mzP8haJXI5A_filtered.json b/annotations_filtered/mzP8haJXI5A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c7c03a86702ad62c32272e29bf36e82d1a8942c --- /dev/null +++ b/annotations_filtered/mzP8haJXI5A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.29], [3.0, 27.63], [29.0, 36.41], [36.0, 43.73], [44.0, 44.32], [44.0, 49.77]], "keep_status": [false, false, true, false, false, false], "silence_prob": [0.0, 29.12, 39.34, 30.37, 0.0, 30.51], "audiomae_on_audioset": [null, [["music", 41.93], ["sitar", 21.16], ["speech", 12.33]], [["music", 25.33], ["speech", 24.51], ["sidetone", 15.63]], [["music", 39.25], ["boing", 23.9], ["speech", 23.57]], null, [["boing", 41.07], ["music", 26.25], ["speech", 21.25]]], "duration": [1.29, 24.63, 7.41, 7.73, 0.32, 5.77]} \ No newline at end of file diff --git a/annotations_filtered/mzddAYYDZkk_filtered.json b/annotations_filtered/mzddAYYDZkk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e4724f3f2fc0f4cad48b1fc90c1e78de38bb1a85 --- /dev/null +++ b/annotations_filtered/mzddAYYDZkk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.0], [8.0, 7.91], [8.0, 9.04], [10.0, 11.01], [12.0, 12.23], [13.0, 13.61], [16.0, 17.69], [20.0, 20.56], [25.0, 25.05], [26.0, 25.98], [29.0, 29.29], [32.0, 32.37], [38.0, 38.16], [43.0, 49.11], [52.0, 52.15], [54.0, 56.54], [59.0, 59.75], [64.0, 64.27], [71.0, 71.9], [73.0, 73.8], [76.0, 76.77], [79.0, 80.01], [80.0, 80.76], [83.0, 83.61], [86.0, 95.67], [96.0, 97.06], [101.0, 101.82], [106.0, 106.52], [107.0, 108.04], [109.0, 109.54], [113.0, 120.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.38, 0.0, 35.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.63, 0.0, 0.0, 0.0, 0.0, 0.0, 42.62], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["fart", 33.35], ["speech", 9.97], ["sidetone", 7.02]], null, [["speech", 65.38], ["telephone", 9.59], ["dial tone", 8.2]], null, null, null, null, null, null, null, null, [["fart", 28.18], ["hum", 9.21], ["skateboard", 5.88]], null, null, null, null, null, [["hum", 25.47], ["heart sounds, heartbeat", 7.56], ["mains hum", 7.56]]], "duration": [1.0, -0.09, 1.04, 1.01, 0.23, 0.61, 1.69, 0.56, 0.05, -0.02, 0.29, 0.37, 0.16, 6.11, 0.15, 2.54, 0.75, 0.27, 0.9, 0.8, 0.77, 1.01, 0.76, 0.61, 9.67, 1.06, 0.82, 0.52, 1.04, 0.54, 7.04]} \ No newline at end of file diff --git a/annotations_filtered/mzuVsHCLSOg_filtered.json b/annotations_filtered/mzuVsHCLSOg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..380a26b5672ca3b838f850e3d55ef54e4e18e9c3 --- /dev/null +++ b/annotations_filtered/mzuVsHCLSOg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.13], [6.0, 6.24], [8.0, 9.12], [12.0, 12.21], [12.0, 13.15], [14.0, 15.01], [18.0, 20.97], [23.0, 24.22], [31.0, 31.89], [34.0, 34.3], [38.0, 39.87], [41.0, 42.15], [43.0, 43.92], [48.0, 49.22], [53.0, 55.7], [56.0, 57.21], [61.0, 62.85], [64.0, 67.29], [68.0, 68.81], [71.0, 72.66], [73.0, 73.94], [79.0, 85.35], [86.0, 115.84], [118.0, 118.54], [120.0, 122.35], [123.0, 123.74], [124.0, 124.85], [126.0, 127.35], [129.0, 129.61], [130.0, 130.99]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.2, 0.0, 0.0, 58.55, 0.0, 0.0, 0.0, 45.05, 70.16, 0.0, 36.3, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["fart", 24.26], ["throat clearing", 12.57], ["cough", 9.35]], null, null, null, null, null, null, null, [["hum", 37.05], ["speech", 19.4], ["mains hum", 6.67]], null, null, null, null, null, null, [["frog", 17.56], ["speech", 14.6], ["grunt", 12.8]], null, null, [["speech", 82.09], ["dial tone", 3.49], ["busy signal", 3.17]], null, null, null, null, null], "duration": [1.13, 0.24, 1.12, 0.21, 1.15, 1.01, 2.97, 1.22, 0.89, 0.3, 1.87, 1.15, 0.92, 1.22, 2.7, 1.21, 1.85, 3.29, 0.81, 1.66, 0.94, 6.35, 29.84, 0.54, 2.35, 0.74, 0.85, 1.35, 0.61, 0.99]} \ No newline at end of file