diff --git a/annotations_filtered/a-9990dlfvo_filtered.json b/annotations_filtered/a-9990dlfvo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..680883a26962b98d2b3856609b92ed6e3279ac7c --- /dev/null +++ b/annotations_filtered/a-9990dlfvo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.94], [11.0, 10.61], [11.0, 11.87], [13.0, 16.95], [18.0, 22.4], [24.0, 33.08], [35.0, 37.17], [38.0, 89.46], [92.0, 92.28], [96.0, 96.38], [97.0, 97.48], [99.0, 99.6], [101.0, 103.76], [110.0, 110.24], [111.0, 111.2], [116.0, 116.87], [122.0, 122.61], [123.0, 123.58], [125.0, 124.97], [126.0, 126.6], [130.0, 130.76], [131.0, 138.55], [142.0, 142.01], [145.0, 148.96], [149.0, 150.15], [154.0, 154.97], [155.0, 156.32], [157.0, 159.51], [161.0, 165.47], [167.0, 167.04], [167.0, 167.1], [167.0, 173.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, true, false, false, true], "silence_prob": [62.89, 0.0, 0.0, 58.13, 53.04, 56.18, 73.21, 0.0, 0.0, 0.0, 0.0, 0.0, 31.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.13, 0.0, 32.35, 0.0, 0.0, 0.0, 33.09, 31.81, 0.0, 0.0, 31.14], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 34.65], ["speech", 4.74], ["meow", 4.68]], null, null, null, null, null, null, null, null, [["music", 36.25], ["livestock, farm animals, working animals", 9.95], ["hum", 6.28]], null, [["speech", 47.96], ["music", 22.24], ["musical instrument", 10.32]], null, null, null, [["music", 33.5], ["wind instrument, woodwind instrument", 8.27], ["musical instrument", 6.59]], [["music", 36.18], ["musical instrument", 16.14], ["shofar", 6.98]], null, null, [["speech", 53.16], ["music", 11.99], ["electric shaver, electric razor", 4.51]]], "duration": [2.94, -0.39, 0.87, 3.95, 4.4, 9.08, 2.17, 51.46, 0.28, 0.38, 0.48, 0.6, 2.76, 0.24, 0.2, 0.87, 0.61, 0.58, -0.03, 0.6, 0.76, 7.55, 0.01, 3.96, 1.15, 0.97, 1.32, 2.51, 4.47, 0.04, 0.1, 6.31]} \ No newline at end of file diff --git a/annotations_filtered/a-CS6CjnEw8_filtered.json b/annotations_filtered/a-CS6CjnEw8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2fab5d544b4f14b8b5ef74ef7bc6c40d95d43ed0 --- /dev/null +++ b/annotations_filtered/a-CS6CjnEw8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.62], [23.0, 23.8], [25.0, 26.2], [27.0, 30.47], [35.0, 36.68], [38.0, 38.57], [40.0, 40.19], [41.0, 42.09], [43.0, 49.52], [51.0, 51.53], [52.0, 52.71], [53.0, 56.1], [58.0, 58.29], [59.0, 76.6], [78.0, 80.28], [82.0, 84.13], [87.0, 89.06], [98.0, 99.23], [101.0, 108.38], [109.0, 115.26], [116.0, 131.16], [132.0, 133.62], [135.0, 137.0], [142.0, 142.65], [143.0, 146.42]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 48.74, 0.0, 0.0, 0.0, 0.0, 99.9, 0.0, 0.0, 49.54, 0.0, 72.01, 96.54, 100.0, 94.81, 0.0, 100.0, 96.89, 99.93, 0.0, 97.54, 0.0, 88.28], "audiomae_on_audioset": [null, null, null, [["music", 25.28], ["didgeridoo", 11.68], ["guitar", 7.89]], null, null, null, null, null, null, null, [["sidetone", 50.03], ["busy signal", 18.45], ["speech", 16.24]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.62, 0.8, 1.2, 3.47, 1.68, 0.57, 0.19, 1.09, 6.52, 0.53, 0.71, 3.1, 0.29, 17.6, 2.28, 2.13, 2.06, 1.23, 7.38, 6.26, 15.16, 1.62, 2.0, 0.65, 3.42]} \ No newline at end of file diff --git a/annotations_filtered/a-IU2mBY1_4_filtered.json b/annotations_filtered/a-IU2mBY1_4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c6f76275439322d3495ff21a7381ecff155ec47b --- /dev/null +++ b/annotations_filtered/a-IU2mBY1_4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.94], [12.0, 26.69], [29.0, 47.36], [48.0, 52.79], [53.0, 56.42], [58.0, 67.27], [71.0, 70.87], [72.0, 74.95], [76.0, 79.0], [82.0, 85.99], [88.0, 91.0], [92.0, 95.89], [98.0, 106.78], [107.0, 110.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 76.53, 89.19, 99.99, 95.91, 97.73, 0.0, 99.68, 99.59, 54.7, 57.64, 66.27, 64.52, 44.78], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 22.05], ["hiccup", 12.11], ["theremin", 7.62]]], "duration": [0.94, 14.69, 18.36, 4.79, 3.42, 9.27, -0.13, 2.95, 3.0, 3.99, 3.0, 3.89, 8.78, 3.71]} \ No newline at end of file diff --git a/annotations_filtered/a-KQ5h6WmJg_filtered.json b/annotations_filtered/a-KQ5h6WmJg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84a8324f1d053e8789d074a3079e5eb46c95d035 --- /dev/null +++ b/annotations_filtered/a-KQ5h6WmJg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.44], [5.0, 5.16], [6.0, 6.56], [8.0, 8.55], [9.0, 12.68], [13.0, 17.04], [18.0, 19.8], [22.0, 22.81], [25.0, 24.98], [27.0, 31.51], [32.0, 32.31], [34.0, 35.53], [36.0, 37.32], [40.0, 40.02], [42.0, 42.9], [49.0, 48.86], [51.0, 57.65], [61.0, 62.18], [65.0, 65.6], [68.0, 71.71], [80.0, 80.64], [81.0, 82.38], [83.0, 83.96], [91.0, 91.64], [93.0, 93.18], [98.0, 98.69], [102.0, 102.39], [104.0, 104.03], [106.0, 106.08], [111.0, 112.87], [115.0, 115.8], [117.0, 116.99], [121.0, 121.59], [124.0, 126.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 86.09, 51.28, 0.0, 0.0, 0.0, 54.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 85.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.44, 0.16, 0.56, 0.55, 3.68, 4.04, 1.8, 0.81, -0.02, 4.51, 0.31, 1.53, 1.32, 0.02, 0.9, -0.14, 6.65, 1.18, 0.6, 3.71, 0.64, 1.38, 0.96, 0.64, 0.18, 0.69, 0.39, 0.03, 0.08, 1.87, 0.8, -0.01, 0.59, 2.45]} \ No newline at end of file diff --git a/annotations_filtered/a-SnsqKFHLY_filtered.json b/annotations_filtered/a-SnsqKFHLY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3291225131b21ab3e8c61ebae734e006344fbf5 --- /dev/null +++ b/annotations_filtered/a-SnsqKFHLY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.27], [21.0, 30.08], [31.0, 32.76], [33.0, 36.46], [46.0, 49.15], [57.0, 58.58], [60.0, 82.49], [85.0, 85.43], [87.0, 88.25], [89.0, 89.78], [92.0, 94.34], [96.0, 97.58], [102.0, 107.2], [109.0, 109.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 58.05, 0.0, 58.98, 67.51, 0.0, 62.37, 0.0, 0.0, 0.0, 98.19, 0.0, 57.17, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.27, 9.08, 1.76, 3.46, 3.15, 1.58, 22.49, 0.43, 1.25, 0.78, 2.34, 1.58, 5.2, 0.32]} \ No newline at end of file diff --git a/annotations_filtered/a-VqYtkvmzw_filtered.json b/annotations_filtered/a-VqYtkvmzw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2653c1d602ccc07d227263c1b1f813151451f7d5 --- /dev/null +++ b/annotations_filtered/a-VqYtkvmzw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 32.91], [35.0, 36.17], [38.0, 38.11], [39.0, 39.39], [41.0, 41.66], [44.0, 43.95], [45.0, 46.99], [52.0, 52.69], [64.0, 64.35], [66.0, 72.69]], "keep_status": [false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.77], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["rumble", 48.11], ["hum", 13.72], ["mains hum", 3.13]]], "duration": [1.91, 1.17, 0.11, 0.39, 0.66, -0.05, 1.99, 0.69, 0.35, 6.69]} \ No newline at end of file diff --git a/annotations_filtered/a-Z66uN97Ds_filtered.json b/annotations_filtered/a-Z66uN97Ds_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b6a7953666fbc3a3dc46250e00bcfa1f9a659c8f --- /dev/null +++ b/annotations_filtered/a-Z66uN97Ds_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[51.0, 51.0], [58.0, 77.82], [82.0, 83.35], [88.0, 88.43], [90.0, 90.37], [92.0, 96.31], [102.0, 102.86], [104.0, 104.68]], "keep_status": [false, false, false, false, false, true, false, false], "silence_prob": [0.0, 33.85, 0.0, 0.0, 0.0, 35.73, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 37.6], ["throbbing", 26.77], ["hum", 16.89]], null, null, null, [["fly, housefly", 22.33], ["insect", 18.13], ["music", 15.21]], null, null], "duration": [0.0, 19.82, 1.35, 0.43, 0.37, 4.31, 0.86, 0.68]} \ No newline at end of file diff --git a/annotations_filtered/a-h2glY0jyg_filtered.json b/annotations_filtered/a-h2glY0jyg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..61fddcae7e3b851253e89b9562ef4dc4d16eec6b --- /dev/null +++ b/annotations_filtered/a-h2glY0jyg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.0], [4.0, 5.49], [8.0, 8.6], [9.0, 10.86], [12.0, 12.8], [14.0, 15.21], [17.0, 18.4], [21.0, 23.08], [23.0, 29.29], [30.0, 32.22], [33.0, 35.28], [36.0, 36.75], [37.0, 38.53], [40.0, 41.55], [44.0, 45.18], [46.0, 46.85], [48.0, 49.23], [50.0, 58.14], [60.0, 60.4], [61.0, 62.13], [63.0, 63.49], [64.0, 64.49], [66.0, 66.75], [68.0, 69.01], [70.0, 71.29], [74.0, 73.89], [75.0, 75.44], [76.0, 76.91], [78.0, 78.98], [80.0, 81.45], [83.0, 84.11], [86.0, 86.05], [87.0, 89.18], [95.0, 95.44], [97.0, 98.22], [101.0, 101.02], [106.0, 109.19], [110.0, 113.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.07, 86.27, 88.28, 73.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.48, 0.0, 0.0, 0.0, 68.28, 98.51], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.0, 1.49, 0.6, 1.86, 0.8, 1.21, 1.4, 2.08, 6.29, 2.22, 2.28, 0.75, 1.53, 1.55, 1.18, 0.85, 1.23, 8.14, 0.4, 1.13, 0.49, 0.49, 0.75, 1.01, 1.29, -0.11, 0.44, 0.91, 0.98, 1.45, 1.11, 0.05, 2.18, 0.44, 1.22, 0.02, 3.19, 3.27]} \ No newline at end of file diff --git a/annotations_filtered/a1Bx9nyw35w_filtered.json b/annotations_filtered/a1Bx9nyw35w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f0adca9f55405f9dfacce687da5c24000e9b74b --- /dev/null +++ b/annotations_filtered/a1Bx9nyw35w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 24.34], [26.0, 32.93], [34.0, 34.55], [43.0, 45.5], [47.0, 46.9], [53.0, 86.19], [90.0, 100.9], [103.0, 103.79], [105.0, 127.36], [129.0, 132.8], [135.0, 185.3], [187.0, 188.03], [188.0, 192.18]], "keep_status": [true, true, false, false, false, false, true, false, true, true, false, false, false], "silence_prob": [34.11, 35.62, 0.0, 54.23, 0.0, 0.0, 35.39, 0.0, 30.76, 37.72, 0.0, 0.0, 46.43], "audiomae_on_audioset": [[["music", 23.3], ["noise", 10.22], ["whale vocalization", 8.51]], [["speech", 26.07], ["dog", 6.21], ["bouncing", 5.96]], null, null, null, null, [["music", 38.47], ["speech", 19.93], ["brass instrument", 6.6]], null, [["music", 33.67], ["mains hum", 14.46], ["hum", 13.77]], [["music", 46.82], ["hum", 9.03], ["didgeridoo", 3.25]], null, null, [["music", 72.37], ["musical instrument", 4.85], ["bowed string instrument", 2.66]]], "duration": [21.34, 6.93, 0.55, 2.5, -0.1, 33.19, 10.9, 0.79, 22.36, 3.8, 50.3, 1.03, 4.18]} \ No newline at end of file diff --git a/annotations_filtered/a1GeB9y9zzo_filtered.json b/annotations_filtered/a1GeB9y9zzo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e35d0ba5add7d53c0b585e245f1a59965d3d7742 --- /dev/null +++ b/annotations_filtered/a1GeB9y9zzo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 111.92]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [106.92]} \ No newline at end of file diff --git a/annotations_filtered/a1REfTIc5po_filtered.json b/annotations_filtered/a1REfTIc5po_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..07c9d0c7bcfb0e4d0b323e4157f81a477e3b3f7e --- /dev/null +++ b/annotations_filtered/a1REfTIc5po_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 13.78], [18.0, 18.69], [20.0, 20.75], [22.0, 25.07], [25.0, 26.47], [30.0, 30.48], [33.0, 34.35], [39.0, 40.86], [42.0, 42.99], [44.0, 45.06], [47.0, 64.83], [73.0, 74.87], [83.0, 82.83], [86.0, 86.63], [87.0, 90.21], [90.0, 90.95], [102.0, 102.17], [107.0, 108.08], [109.0, 112.14], [120.0, 120.75], [122.0, 122.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false], "silence_prob": [99.99, 0.0, 0.0, 96.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.2, 0.0, 0.0, 0.0, 32.08, 0.0, 0.0, 0.0, 39.86, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 43.3], ["throbbing", 11.73], ["hum", 10.69]], null, null, null, [["music", 50.04], ["speech", 13.67], ["electronic music", 1.64]], null, null, null, [["music", 52.07], ["didgeridoo", 12.94], ["hum", 5.72]], null, null], "duration": [7.78, 0.69, 0.75, 3.07, 1.47, 0.48, 1.35, 1.86, 0.99, 1.06, 17.83, 1.87, -0.17, 0.63, 3.21, 0.95, 0.17, 1.08, 3.14, 0.75, 0.12]} \ No newline at end of file diff --git a/annotations_filtered/a1iQDKCkh6k_filtered.json b/annotations_filtered/a1iQDKCkh6k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..11550235254f357ec07a37093abaf0f0e8899f07 --- /dev/null +++ b/annotations_filtered/a1iQDKCkh6k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 20.65], [21.0, 48.98], [49.0, 49.57], [52.0, 51.98], [53.0, 53.6], [54.0, 74.02], [77.0, 142.05], [144.0, 146.23], [150.0, 152.17], [153.0, 157.01]], "keep_status": [false, true, false, false, false, false, false, true, false, false], "silence_prob": [95.51, 30.38, 0.0, 0.0, 0.0, 30.37, 0.0, 35.79, 55.39, 37.73], "audiomae_on_audioset": [null, [["speech", 37.39], ["music", 15.48], ["boing", 5.38]], null, null, null, [["speech", 60.27], ["machine gun", 11.31], ["sidetone", 8.12]], null, [["music", 15.79], ["noise", 14.32], ["hum", 6.65]], null, [["sidetone", 61.57], ["speech", 18.95], ["explosion", 3.82]]], "duration": [3.65, 27.98, 0.57, -0.02, 0.6, 20.02, 65.05, 2.23, 2.17, 4.01]} \ No newline at end of file diff --git a/annotations_filtered/a2872XpfqKY_filtered.json b/annotations_filtered/a2872XpfqKY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c74154da8d409dcc679c1eef532cae42bd68bb24 --- /dev/null +++ b/annotations_filtered/a2872XpfqKY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[108.0, 108.75]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [0.75]} \ No newline at end of file diff --git a/annotations_filtered/a2ZdXUZt3iw_filtered.json b/annotations_filtered/a2ZdXUZt3iw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..df29d7f48b70aeb32f211d1ddcc3e4c015939f30 --- /dev/null +++ b/annotations_filtered/a2ZdXUZt3iw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 39.45], [40.0, 43.63], [45.0, 47.29], [49.0, 52.35], [53.0, 54.14], [56.0, 56.29], [58.0, 58.26], [59.0, 60.34], [63.0, 64.5], [65.0, 67.56], [68.0, 67.61], [68.0, 96.58], [99.0, 105.02], [107.0, 107.49], [109.0, 111.32], [114.0, 115.69]], "keep_status": [true, true, true, true, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [33.27, 45.92, 36.01, 41.42, 0.0, 0.0, 0.0, 0.0, 0.0, 79.76, 0.0, 28.85, 34.88, 0.0, 76.7, 0.0], "audiomae_on_audioset": [[["speech", 47.4], ["explosion", 10.71], ["music", 7.53]], [["music", 27.49], ["didgeridoo", 20.73], ["speech", 14.26]], [["didgeridoo", 18.3], ["speech", 16.09], ["mains hum", 14.86]], [["fart", 28.8], ["speech", 11.53], ["dog", 10.47]], null, null, null, null, null, null, null, [["speech", 57.29], ["music", 17.27], ["hum", 5.81]], [["music", 33.04], ["hum", 23.44], ["mains hum", 9.14]], null, null, null], "duration": [21.45, 3.63, 2.29, 3.35, 1.14, 0.29, 0.26, 1.34, 1.5, 2.56, -0.39, 28.58, 6.02, 0.49, 2.32, 1.69]} \ No newline at end of file diff --git a/annotations_filtered/a2_9fQ0U57w_filtered.json b/annotations_filtered/a2_9fQ0U57w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6e636cd51c13089b1185fb7db2a97dc54f42c48f --- /dev/null +++ b/annotations_filtered/a2_9fQ0U57w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.08], [4.0, 10.0], [11.0, 13.39], [14.0, 20.38], [22.0, 29.86], [30.0, 29.93], [30.0, 34.3], [35.0, 34.96], [36.0, 37.96], [38.0, 42.38], [45.0, 48.05], [49.0, 57.43], [59.0, 73.77], [74.0, 73.8], [74.0, 86.61], [87.0, 101.73], [102.0, 112.19], [113.0, 122.45], [124.0, 125.93], [127.0, 133.3], [135.0, 142.94], [143.0, 143.41], [148.0, 154.11], [156.0, 158.46], [165.0, 172.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 98.1, 99.56, 99.95, 99.93, 0.0, 99.97, 0.0, 0.0, 99.48, 99.99, 99.84, 90.08, 0.0, 99.97, 99.95, 100.0, 100.0, 0.0, 88.64, 59.07, 0.0, 54.56, 34.26, 33.38], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 48.12], ["ambient music", 23.31], ["synthesizer", 4.62]], [["music", 83.17], ["ambient music", 7.73], ["scary music", 1.93]]], "duration": [1.08, 6.0, 2.39, 6.38, 7.86, -0.07, 4.3, -0.04, 1.96, 4.38, 3.05, 8.43, 14.77, -0.2, 12.61, 14.73, 10.19, 9.45, 1.93, 6.3, 7.94, 0.41, 6.11, 2.46, 7.84]} \ No newline at end of file diff --git a/annotations_filtered/a2gMY3TRx8s_filtered.json b/annotations_filtered/a2gMY3TRx8s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6e26ac99e349cc0b2f55b4b5c4b4f2b515f56e6d --- /dev/null +++ b/annotations_filtered/a2gMY3TRx8s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.42], [4.0, 6.76], [9.0, 9.9], [11.0, 12.07], [13.0, 14.84], [16.0, 19.18], [22.0, 24.73], [27.0, 27.8], [29.0, 30.28], [32.0, 33.05], [35.0, 36.12], [38.0, 39.66], [41.0, 41.88], [43.0, 45.87], [47.0, 48.76], [51.0, 53.15], [54.0, 57.69], [58.0, 58.72], [60.0, 60.03], [63.0, 64.1], [66.0, 68.42], [69.0, 79.03], [81.0, 82.71], [84.0, 89.18], [91.0, 92.45], [94.0, 97.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 52.86, 0.0, 0.0, 0.0, 85.54, 59.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.63, 0.0, 96.77, 70.16, 0.0, 0.0, 0.0, 94.95, 39.4, 0.0, 79.24, 0.0, 45.59], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["animal", 23.73], ["speech", 18.38], ["dog", 17.71]], null, null, null, [["music", 43.2], ["theremin", 8.45], ["synthesizer", 7.36]]], "duration": [1.42, 2.76, 0.9, 1.07, 1.84, 3.18, 2.73, 0.8, 1.28, 1.05, 1.12, 1.66, 0.88, 2.87, 1.76, 2.15, 3.69, 0.72, 0.03, 1.1, 2.42, 10.03, 1.71, 5.18, 1.45, 3.53]} \ No newline at end of file diff --git a/annotations_filtered/a2lb_3-fYFc_filtered.json b/annotations_filtered/a2lb_3-fYFc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..980cacc587616dc428311015f21e685836fa86b6 --- /dev/null +++ b/annotations_filtered/a2lb_3-fYFc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.13], [9.0, 9.78], [12.0, 13.12], [13.0, 13.51], [18.0, 18.57], [20.0, 20.71], [22.0, 23.06], [25.0, 26.96], [30.0, 30.43], [34.0, 34.11], [38.0, 38.01], [41.0, 41.45], [43.0, 43.48], [45.0, 45.01], [46.0, 47.09], [54.0, 58.41], [61.0, 61.48], [70.0, 70.77], [76.0, 76.06], [80.0, 80.87], [84.0, 85.5], [88.0, 88.05], [89.0, 92.55], [95.0, 97.26], [99.0, 100.06], [101.0, 100.94], [101.0, 101.88], [103.0, 107.3], [108.0, 109.85], [110.0, 111.0], [112.0, 112.53], [116.0, 116.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.53, 58.22, 0.0, 0.0, 0.0, 39.18, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 42.1], ["radio", 11.16], ["animal", 10.19]], null, null, null, null, null, null, [["sidetone", 60.73], ["music", 8.81], ["speech", 4.22]], null, null, null, null, [["fly, housefly", 25.32], ["insect", 20.5], ["hum", 9.34]], null, null, null, null], "duration": [0.13, 0.78, 1.12, 0.51, 0.57, 0.71, 1.06, 1.96, 0.43, 0.11, 0.01, 0.45, 0.48, 0.01, 1.09, 4.41, 0.48, 0.77, 0.06, 0.87, 1.5, 0.05, 3.55, 2.26, 1.06, -0.06, 0.88, 4.3, 1.85, 1.0, 0.53, 0.11]} \ No newline at end of file diff --git a/annotations_filtered/a2qE4hG9XCk_filtered.json b/annotations_filtered/a2qE4hG9XCk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..72ba4c7dc702e0957e0e8673a725365a84854f41 --- /dev/null +++ b/annotations_filtered/a2qE4hG9XCk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.51], [7.0, 16.28], [17.0, 44.27], [44.0, 48.25], [49.0, 49.55], [51.0, 62.7], [66.0, 68.79], [75.0, 78.66], [82.0, 87.18], [93.0, 93.24], [95.0, 98.24], [99.0, 101.66], [103.0, 103.11], [109.0, 109.53], [113.0, 121.42], [125.0, 140.16]], "keep_status": [false, true, true, true, false, false, true, true, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 34.06, 31.04, 31.35, 0.0, 35.1, 37.56, 30.82, 30.25, 0.0, 32.35, 30.67, 0.0, 0.0, 30.43, 30.69], "audiomae_on_audioset": [null, [["hum", 23.84], ["music", 23.15], ["speech", 15.4]], [["music", 43.75], ["speech", 17.57], ["motorcycle", 6.65]], [["music", 46.49], ["throbbing", 9.02], ["hum", 6.22]], null, [["music", 42.89], ["whale vocalization", 15.88], ["speech", 15.0]], [["whale vocalization", 24.0], ["speech", 18.08], ["noise", 10.59]], [["music", 31.6], ["throbbing", 17.26], ["hum", 10.33]], [["music", 61.56], ["throbbing", 4.44], ["hum", 4.18]], null, [["music", 54.62], ["throbbing", 15.17], ["hum", 7.45]], [["music", 46.12], ["hum", 9.91], ["mains hum", 8.59]], null, null, [["speech", 23.11], ["buzz", 19.19], ["fly, housefly", 11.27]], [["music", 52.58], ["speech", 15.87], ["throbbing", 2.57]]], "duration": [0.51, 9.28, 27.27, 4.25, 0.55, 11.7, 2.79, 3.66, 5.18, 0.24, 3.24, 2.66, 0.11, 0.53, 8.42, 15.16]} \ No newline at end of file diff --git a/annotations_filtered/a38HZFbhB-M_filtered.json b/annotations_filtered/a38HZFbhB-M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0f5548d379aede28789ced0d249445f79174ca0 --- /dev/null +++ b/annotations_filtered/a38HZFbhB-M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.51], [5.0, 5.93], [8.0, 8.23], [10.0, 9.75], [11.0, 11.5], [13.0, 13.46], [14.0, 16.65], [17.0, 18.1], [26.0, 26.05], [28.0, 35.18], [38.0, 43.17], [51.0, 51.7], [55.0, 56.25], [57.0, 57.59], [59.0, 60.15], [61.0, 61.18], [62.0, 79.42], [83.0, 83.39], [89.0, 88.99], [92.0, 96.6], [100.0, 101.65], [104.0, 105.56], [107.0, 107.3], [110.0, 114.22], [116.0, 119.01], [121.0, 121.19], [125.0, 125.73]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.6, 0.0, 0.0, 34.11, 55.25, 0.0, 0.0, 0.0, 0.0, 0.0, 61.27, 0.0, 0.0, 98.59, 0.0, 0.0, 0.0, 99.48, 61.57, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 17.82], ["moo", 15.05], ["grunt", 9.69]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.51, 0.93, 0.23, -0.25, 0.5, 0.46, 2.65, 1.1, 0.05, 7.18, 5.17, 0.7, 1.25, 0.59, 1.15, 0.18, 17.42, 0.39, -0.01, 4.6, 1.65, 1.56, 0.3, 4.22, 3.01, 0.19, 0.73]} \ No newline at end of file diff --git a/annotations_filtered/a3HOCIXroqQ_filtered.json b/annotations_filtered/a3HOCIXroqQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..661201bf13c906ef187c42f34134443229ca4f0c --- /dev/null +++ b/annotations_filtered/a3HOCIXroqQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.08], [13.0, 14.2], [19.0, 23.7], [27.0, 27.04], [34.0, 34.69], [37.0, 39.28], [40.0, 63.29], [65.0, 64.94], [65.0, 65.52], [67.0, 126.54]], "keep_status": [false, false, true, false, false, true, true, false, false, false], "silence_prob": [32.05, 0.0, 34.24, 0.0, 0.0, 29.76, 29.81, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["mains hum", 29.22], ["music", 21.11], ["hum", 19.91]], null, [["music", 20.85], ["speech", 18.62], ["throbbing", 17.01]], null, null, [["noise", 20.23], ["hum", 16.92], ["mains hum", 11.09]], [["vehicle", 21.13], ["music", 11.74], ["buzz", 11.25]], null, null, null], "duration": [2.08, 1.2, 4.7, 0.04, 0.69, 2.28, 23.29, -0.06, 0.52, 59.54]} \ No newline at end of file diff --git a/annotations_filtered/a3Xm0KpUYj4_filtered.json b/annotations_filtered/a3Xm0KpUYj4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e2ba4bce93bb3554e2903cf3de5feb1837cdae00 --- /dev/null +++ b/annotations_filtered/a3Xm0KpUYj4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.4], [11.0, 11.6], [14.0, 29.15], [31.0, 33.18], [36.0, 38.64], [40.0, 45.66], [47.0, 47.02], [48.0, 49.33], [50.0, 52.83]], "keep_status": [false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 28.51, 33.06, 32.56, 39.5, 0.0, 0.0, 36.1], "audiomae_on_audioset": [null, null, [["music", 35.34], ["hum", 24.56], ["throbbing", 24.16]], [["music", 29.16], ["synthesizer", 10.57], ["hum", 7.12]], [["music", 48.31], ["hum", 11.81], ["mains hum", 5.86]], [["speech", 55.42], ["hum", 20.14], ["mains hum", 7.45]], null, null, [["music", 65.82], ["bass guitar", 3.45], ["didgeridoo", 3.32]]], "duration": [0.4, 0.6, 15.15, 2.18, 2.64, 5.66, 0.02, 1.33, 2.83]} \ No newline at end of file diff --git a/annotations_filtered/a3bI7kbVBwM_filtered.json b/annotations_filtered/a3bI7kbVBwM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6090461df8b196d9ffa5d39d6573147470d6febd --- /dev/null +++ b/annotations_filtered/a3bI7kbVBwM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.06], [14.0, 15.2], [17.0, 17.78], [18.0, 22.47], [24.0, 29.62], [30.0, 31.94], [33.0, 35.24], [37.0, 44.58], [46.0, 47.34], [50.0, 64.47], [65.0, 70.48], [74.0, 75.56], [82.0, 94.19], [97.0, 100.57], [101.0, 118.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [30.36, 0.0, 0.0, 30.17, 29.78, 0.0, 29.83, 30.65, 0.0, 30.3, 31.21, 0.0, 29.97, 29.93, 30.22], "audiomae_on_audioset": [[["music", 64.4], ["throbbing", 7.64], ["electronic music", 4.49]], null, null, [["music", 79.91], ["throbbing", 4.67], ["electronic music", 3.1]], [["music", 77.63], ["electronic music", 3.75], ["techno", 2.7]], null, [["music", 73.6], ["sampler", 2.59], ["electronic music", 2.54]], [["music", 64.57], ["hum", 5.2], ["drum and bass", 3.68]], null, [["music", 92.31], ["funny music", 1.14], ["throbbing", 0.69]], [["music", 37.47], ["didgeridoo", 7.61], ["musical instrument", 4.85]], null, [["music", 85.85], ["roll", 2.42], ["rock and roll", 2.05]], [["music", 78.76], ["buzz", 1.91], ["electronic music", 1.58]], [["music", 94.63], ["psychedelic rock", 0.83], ["rock music", 0.67]]], "duration": [4.06, 1.2, 0.78, 4.47, 5.62, 1.94, 2.24, 7.58, 1.34, 14.47, 5.48, 1.56, 12.19, 3.57, 17.32]} \ No newline at end of file diff --git a/annotations_filtered/a469ezsg86A_filtered.json b/annotations_filtered/a469ezsg86A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8bceccc9ec11c76aae52bcff48a23ed5586741b --- /dev/null +++ b/annotations_filtered/a469ezsg86A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.82], [9.0, 8.88], [11.0, 12.83], [15.0, 15.8], [19.0, 19.97], [21.0, 26.54], [37.0, 50.43], [55.0, 55.63], [56.0, 57.37], [59.0, 60.0], [61.0, 61.11], [68.0, 68.05], [73.0, 72.99], [74.0, 74.49], [76.0, 76.44], [77.0, 86.58], [91.0, 93.39], [96.0, 96.04], [96.0, 105.07], [107.0, 109.0], [112.0, 119.21], [120.0, 121.61], [123.0, 140.16], [150.0, 150.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 71.29, 99.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.89, 100.0, 0.0, 59.33, 83.52, 65.67, 0.0, 32.26, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 39.23], ["throbbing", 28.2], ["mains hum", 13.9]], null], "duration": [0.82, -0.12, 1.83, 0.8, 0.97, 5.54, 13.43, 0.63, 1.37, 1.0, 0.11, 0.05, -0.01, 0.49, 0.44, 9.58, 2.39, 0.04, 9.07, 2.0, 7.21, 1.61, 17.16, 0.18]} \ No newline at end of file diff --git a/annotations_filtered/a46FsHMRPkc_filtered.json b/annotations_filtered/a46FsHMRPkc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c462a2171bf48a9d6bfd15475c0838dc462fe9de --- /dev/null +++ b/annotations_filtered/a46FsHMRPkc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 22.11], [23.0, 31.28], [36.0, 47.48], [52.0, 54.92], [59.0, 77.94], [79.0, 83.32], [84.0, 85.14], [96.0, 96.26], [100.0, 102.32], [113.0, 117.24], [118.0, 124.04]], "keep_status": [false, false, false, false, true, true, false, false, true, true, true], "silence_prob": [34.0, 33.64, 32.79, 33.0, 35.28, 30.13, 0.0, 0.0, 33.55, 30.4, 31.63], "audiomae_on_audioset": [[["music", 48.43], ["speech", 34.15], ["throbbing", 3.22]], [["throbbing", 40.2], ["hum", 36.72], ["music", 10.94]], [["music", 47.04], ["speech", 25.06], ["didgeridoo", 3.92]], [["speech", 46.67], ["music", 18.29], ["throbbing", 9.59]], [["music", 51.13], ["throbbing", 7.87], ["didgeridoo", 5.32]], [["hum", 22.39], ["mains hum", 22.38], ["music", 15.76]], null, null, [["music", 51.17], ["speech", 12.01], ["musical instrument", 2.31]], [["music", 38.96], ["hum", 9.61], ["throbbing", 9.46]], [["hum", 25.69], ["music", 16.72], ["throbbing", 13.49]]], "duration": [18.11, 8.28, 11.48, 2.92, 18.94, 4.32, 1.14, 0.26, 2.32, 4.24, 6.04]} \ No newline at end of file diff --git a/annotations_filtered/a46m8g3grB8_filtered.json b/annotations_filtered/a46m8g3grB8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d55aef3e825b7a6a6a0e39697849ab77f2edc94d --- /dev/null +++ b/annotations_filtered/a46m8g3grB8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 46.68], [51.0, 64.29], [65.0, 65.45], [66.0, 66.9], [79.0, 79.08], [80.0, 80.35], [81.0, 84.5], [85.0, 85.94], [86.0, 88.89], [93.0, 93.01], [95.0, 95.49], [100.0, 100.21], [102.0, 103.0], [105.0, 105.81], [106.0, 107.16], [108.0, 109.11], [114.0, 115.15], [116.0, 116.41], [117.0, 118.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.45, 52.74, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 62.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 63.83], ["fly, housefly", 3.57], ["livestock, farm animals, working animals", 3.39]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [21.68, 13.29, 0.45, 0.9, 0.08, 0.35, 3.5, 0.94, 2.89, 0.01, 0.49, 0.21, 1.0, 0.81, 1.16, 1.11, 1.15, 0.41, 1.98]} \ No newline at end of file diff --git a/annotations_filtered/a4EqbYUl7Rg_filtered.json b/annotations_filtered/a4EqbYUl7Rg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/a4EqbYUl7Rg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/a4OWkIrQUJw_filtered.json b/annotations_filtered/a4OWkIrQUJw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..77ae13e5f453f75b646d5ef6eefd16b630314ece --- /dev/null +++ b/annotations_filtered/a4OWkIrQUJw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.21], [7.0, 8.19], [9.0, 10.81], [13.0, 13.39], [14.0, 18.33], [25.0, 25.59], [33.0, 36.09], [40.0, 39.77], [40.0, 42.6], [44.0, 50.67], [52.0, 55.78], [57.0, 59.39], [63.0, 64.02], [64.0, 64.1], [64.0, 64.13], [65.0, 65.25], [66.0, 67.24], [68.0, 83.54], [85.0, 85.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [95.51, 0.0, 0.0, 0.0, 99.44, 0.0, 98.59, 0.0, 72.31, 91.81, 99.31, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.25, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.21, 1.19, 1.81, 0.39, 4.33, 0.59, 3.09, -0.23, 2.6, 6.67, 3.78, 2.39, 1.02, 0.1, 0.13, 0.25, 1.24, 15.54, 0.04]} \ No newline at end of file diff --git a/annotations_filtered/a4QlQy31HIk_filtered.json b/annotations_filtered/a4QlQy31HIk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba823fd3b7412076e7019e6485df56fe2ada96b9 --- /dev/null +++ b/annotations_filtered/a4QlQy31HIk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.28], [8.0, 14.93], [18.0, 28.48], [30.0, 31.97], [33.0, 63.54], [66.0, 96.26], [98.0, 101.12], [103.0, 128.22]], "keep_status": [false, true, true, false, false, false, true, true], "silence_prob": [0.0, 30.27, 30.07, 0.0, 0.0, 0.0, 39.55, 42.44], "audiomae_on_audioset": [null, [["speech", 27.5], ["music", 24.35], ["hum", 9.27]], [["music", 19.56], ["speech", 15.0], ["hum", 12.25]], null, null, null, [["hum", 24.97], ["mains hum", 22.91], ["music", 20.21]], [["noise", 24.48], ["hum", 16.54], ["music", 14.5]]], "duration": [0.28, 6.93, 10.48, 1.97, 30.54, 30.26, 3.12, 25.22]} \ No newline at end of file diff --git a/annotations_filtered/a4Td_W5dc1w_filtered.json b/annotations_filtered/a4Td_W5dc1w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0bbb02acd89f110b7d729fc95a7ad7eb59641687 --- /dev/null +++ b/annotations_filtered/a4Td_W5dc1w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.2], [8.0, 8.36], [10.0, 11.38], [19.0, 19.4], [23.0, 24.04], [24.0, 24.93], [26.0, 26.77], [31.0, 31.62], [35.0, 34.87], [35.0, 35.73], [36.0, 36.63], [37.0, 37.86], [41.0, 41.93], [44.0, 44.39], [51.0, 56.3], [58.0, 58.5], [59.0, 60.93], [62.0, 82.36], [86.0, 87.0], [91.0, 91.03], [93.0, 97.14], [100.0, 100.31], [108.0, 146.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.43, 0.0, 0.0, 32.04, 0.0, 0.0, 30.99, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.3], ["hum", 15.38], ["mains hum", 7.65]], null, null, [["music", 38.63], ["explosion", 10.49], ["burst, pop", 6.94]], null, null], "duration": [1.2, 0.36, 1.38, 0.4, 1.04, 0.93, 0.77, 0.62, -0.13, 0.73, 0.63, 0.86, 0.93, 0.39, 5.3, 0.5, 1.93, 20.36, 1.0, 0.03, 4.14, 0.31, 38.69]} \ No newline at end of file diff --git a/annotations_filtered/a4wb-xmYM50_filtered.json b/annotations_filtered/a4wb-xmYM50_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5a79a32a700b1690ac3df6f5beeadce566e95f7c --- /dev/null +++ b/annotations_filtered/a4wb-xmYM50_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.47], [9.0, 11.67], [15.0, 22.13], [23.0, 23.46], [26.0, 34.11], [38.0, 44.25], [45.0, 46.06], [49.0, 59.48], [63.0, 69.08]], "keep_status": [false, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 40.73, 35.24, 0.0, 36.3, 37.27, 0.0, 35.08, 40.88], "audiomae_on_audioset": [null, [["buzz", 56.53], ["hum", 12.33], ["mains hum", 6.05]], [["hum", 42.75], ["mains hum", 30.32], ["throbbing", 8.57]], null, [["hum", 35.12], ["speech", 17.07], ["throbbing", 14.89]], [["hum", 48.86], ["throbbing", 35.08], ["mains hum", 4.19]], null, [["hum", 30.38], ["throbbing", 23.71], ["speech", 10.64]], [["music", 77.9], ["buzz", 2.24], ["guitar", 2.01]]], "duration": [1.47, 2.67, 7.13, 0.46, 8.11, 6.25, 1.06, 10.48, 6.08]} \ No newline at end of file diff --git a/annotations_filtered/a51EYR5AeNk_filtered.json b/annotations_filtered/a51EYR5AeNk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..461e2e4a0ed9871dc4d564a5ad2984ac4717b1a3 --- /dev/null +++ b/annotations_filtered/a51EYR5AeNk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 43.12], [46.0, 68.45], [71.0, 71.14], [71.0, 78.63], [83.0, 84.86], [86.0, 101.33], [102.0, 103.42], [112.0, 113.43], [116.0, 116.58], [120.0, 120.93], [131.0, 133.64], [135.0, 136.41], [140.0, 142.33], [145.0, 149.47], [151.0, 152.95], [154.0, 154.06], [158.0, 159.19]], "keep_status": [true, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.93, 31.81, 0.0, 29.17, 0.0, 31.4, 0.0, 0.0, 0.0, 0.0, 96.29, 0.0, 84.07, 53.91, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 49.23], ["smash, crash", 11.94], ["buzz", 5.32]], [["music", 33.2], ["hum", 20.68], ["throbbing", 16.77]], null, [["hum", 17.99], ["music", 17.76], ["mains hum", 12.42]], null, [["speech", 29.18], ["music", 25.38], ["hum", 8.18]], null, null, null, null, null, null, null, null, null, null, null], "duration": [12.12, 22.45, 0.14, 7.63, 1.86, 15.33, 1.42, 1.43, 0.58, 0.93, 2.64, 1.41, 2.33, 4.47, 1.95, 0.06, 1.19]} \ No newline at end of file diff --git a/annotations_filtered/a5BtDmdw708_filtered.json b/annotations_filtered/a5BtDmdw708_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd6879b081d75579cdada7ea7f05db532179d1fe --- /dev/null +++ b/annotations_filtered/a5BtDmdw708_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.08], [4.0, 7.11], [8.0, 9.12], [11.0, 11.87], [21.0, 21.17], [24.0, 25.41], [26.0, 32.53], [40.0, 43.88], [44.0, 46.33], [47.0, 53.97], [54.0, 58.16]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [97.0, 99.94, 0.0, 0.0, 0.0, 0.0, 98.44, 86.27, 99.44, 38.78, 39.75], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 21.24], ["music", 14.23], ["fly, housefly", 7.52]], [["speech", 35.39], ["vehicle", 5.83], ["electric shaver, electric razor", 5.71]]], "duration": [2.08, 3.11, 1.12, 0.87, 0.17, 1.41, 6.53, 3.88, 2.33, 6.97, 4.16]} \ No newline at end of file diff --git a/annotations_filtered/a5PoLM_QBuo_filtered.json b/annotations_filtered/a5PoLM_QBuo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..21d647c987871bb613ca78be61bd9001fac6df71 --- /dev/null +++ b/annotations_filtered/a5PoLM_QBuo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.9], [8.0, 10.64], [13.0, 27.92], [31.0, 30.94], [35.0, 36.42], [38.0, 38.37], [39.0, 40.32], [41.0, 43.44], [45.0, 46.97], [47.0, 48.83], [49.0, 70.58], [73.0, 73.41], [74.0, 75.95], [77.0, 80.7], [81.0, 82.05], [84.0, 84.4], [85.0, 106.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 42.81, 0.0, 0.0, 0.0, 0.0, 99.91, 0.0, 0.0, 51.77, 0.0, 0.0, 50.71, 0.0, 0.0, 65.44], "audiomae_on_audioset": [null, null, [["speech", 61.24], ["firecracker", 16.51], ["explosion", 3.9]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.9, 2.64, 14.92, -0.06, 1.42, 0.37, 1.32, 2.44, 1.97, 1.83, 21.58, 0.41, 1.95, 3.7, 1.05, 0.4, 21.64]} \ No newline at end of file diff --git a/annotations_filtered/a5QBuJla5do_filtered.json b/annotations_filtered/a5QBuJla5do_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7708a45c12df7f58f91c76d76b1fecfd838e85cf --- /dev/null +++ b/annotations_filtered/a5QBuJla5do_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.3], [8.0, 21.41], [23.0, 26.11], [27.0, 29.39], [35.0, 38.53], [46.0, 46.55], [48.0, 50.57], [53.0, 58.63], [60.0, 64.23], [69.0, 69.97], [78.0, 86.58], [93.0, 92.89], [94.0, 99.27], [101.0, 100.95], [108.0, 112.95], [115.0, 120.75]], "keep_status": [false, true, false, false, true, false, true, false, true, false, false, false, false, false, true, true], "silence_prob": [54.5, 34.44, 34.38, 35.29, 33.27, 0.0, 37.88, 31.02, 35.54, 0.0, 33.09, 0.0, 30.71, 0.0, 30.46, 30.68], "audiomae_on_audioset": [null, [["hum", 25.05], ["whale vocalization", 24.84], ["mains hum", 11.16]], [["music", 62.95], ["synthesizer", 9.03], ["musical instrument", 7.64]], [["music", 67.34], ["musical instrument", 6.02], ["synthesizer", 4.92]], [["music", 43.61], ["speech", 12.42], ["boing", 3.03]], null, [["speech", 24.78], ["music", 24.15], ["moo", 8.08]], [["music", 64.75], ["theremin", 8.05], ["musical instrument", 5.76]], [["music", 24.1], ["shofar", 21.51], ["speech", 8.52]], null, [["music", 53.68], ["speech", 21.59], ["sidetone", 8.85]], null, [["music", 66.88], ["synthesizer", 6.28], ["musical instrument", 4.34]], null, [["music", 29.66], ["speech", 24.47], ["theremin", 12.86]], [["music", 37.47], ["speech", 18.05], ["hum", 4.14]]], "duration": [3.3, 13.41, 3.11, 2.39, 3.53, 0.55, 2.57, 5.63, 4.23, 0.97, 8.58, -0.11, 5.27, -0.05, 4.95, 5.75]} \ No newline at end of file diff --git a/annotations_filtered/a5WAyc-EaNc_filtered.json b/annotations_filtered/a5WAyc-EaNc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8b1802d0cb9c7fd2edee5443280e7105f977a23 --- /dev/null +++ b/annotations_filtered/a5WAyc-EaNc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 11.21], [12.0, 12.14], [12.0, 20.33], [21.0, 22.77], [23.0, 25.0], [26.0, 28.02], [30.0, 30.64], [32.0, 33.71], [35.0, 37.45], [41.0, 43.16], [44.0, 49.57], [52.0, 54.13], [56.0, 58.72], [60.0, 61.74], [62.0, 63.42], [67.0, 68.76], [70.0, 73.08]], "keep_status": [false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [37.97, 0.0, 39.33, 0.0, 39.14, 66.76, 0.0, 0.0, 69.74, 67.0, 59.86, 76.37, 39.18, 0.0, 0.0, 0.0, 80.46], "audiomae_on_audioset": [[["music", 49.36], ["theremin", 32.05], ["ambient music", 5.47]], null, [["music", 29.12], ["hum", 14.07], ["theremin", 9.74]], null, [["speech", 49.92], ["music", 11.27], ["hum", 4.7]], null, null, null, null, null, null, null, [["speech", 58.33], ["sidetone", 22.12], ["busy signal", 6.91]], null, null, null, null], "duration": [8.21, 0.14, 8.33, 1.77, 2.0, 2.02, 0.64, 1.71, 2.45, 2.16, 5.57, 2.13, 2.72, 1.74, 1.42, 1.76, 3.08]} \ No newline at end of file diff --git a/annotations_filtered/a6--cEjo3bY_filtered.json b/annotations_filtered/a6--cEjo3bY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9345711c347854aed3d1c0fb74433820141da379 --- /dev/null +++ b/annotations_filtered/a6--cEjo3bY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.78], [9.0, 8.77], [13.0, 15.97], [19.0, 20.11], [21.0, 21.59], [32.0, 32.14], [36.0, 36.42], [37.0, 37.96], [41.0, 44.52], [48.0, 48.9], [58.0, 63.95], [66.0, 67.51], [69.0, 71.05], [73.0, 73.26], [73.0, 74.24], [76.0, 76.91], [77.0, 80.38], [82.0, 83.54], [85.0, 87.17], [88.0, 89.13], [90.0, 92.23], [95.0, 96.92], [102.0, 111.75], [115.0, 115.4], [116.0, 117.19], [118.0, 123.5], [124.0, 123.57], [124.0, 124.78], [130.0, 132.22], [135.0, 147.31], [147.0, 173.84], [174.0, 175.58], [176.0, 177.69]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, true, false, false, true, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 42.44, 0.0, 0.0, 0.0, 0.0, 0.0, 53.16, 0.0, 88.28, 0.0, 73.06, 0.0, 0.0, 0.0, 42.28, 0.0, 48.1, 0.0, 91.13, 0.0, 38.12, 0.0, 0.0, 36.09, 0.0, 0.0, 98.19, 35.94, 31.67, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["cattle, bovinae", 26.2], ["livestock, farm animals, working animals", 18.55], ["moo", 13.92]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["creak", 31.23], ["noise", 11.59], ["mosquito", 7.08]], null, [["speech", 36.9], ["insect", 8.79], ["fly, housefly", 8.46]], null, null, null, [["throbbing", 16.94], ["noise", 16.05], ["whack, thwack", 10.06]], null, null, [["speech", 57.84], ["noise", 3.97], ["hum", 3.65]], null, null, null, [["speech", 47.81], ["sidetone", 7.89], ["fart", 7.02]], [["speech", 38.55], ["whack, thwack", 9.09], ["animal", 6.55]], null, null], "duration": [1.78, -0.23, 2.97, 1.11, 0.59, 0.14, 0.42, 0.96, 3.52, 0.9, 5.95, 1.51, 2.05, 0.26, 1.24, 0.91, 3.38, 1.54, 2.17, 1.13, 2.23, 1.92, 9.75, 0.4, 1.19, 5.5, -0.43, 0.78, 2.22, 12.31, 26.84, 1.58, 1.69]} \ No newline at end of file diff --git a/annotations_filtered/a66f39DMwtY_filtered.json b/annotations_filtered/a66f39DMwtY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b4b4fa425e22d46c7fb214228a5732602aef983a --- /dev/null +++ b/annotations_filtered/a66f39DMwtY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 30.94], [39.0, 43.6], [46.0, 46.23], [47.0, 47.85], [51.0, 51.19], [54.0, 54.7], [63.0, 73.25], [75.0, 75.63], [81.0, 81.21]], "keep_status": [false, true, false, false, false, false, true, false, false], "silence_prob": [38.04, 46.47, 0.0, 0.0, 0.0, 0.0, 40.92, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 43.9], ["music", 25.11], ["theremin", 3.47]], [["speech", 51.46], ["music", 10.16], ["sidetone", 7.42]], null, null, null, null, [["hum", 20.51], ["speech", 20.33], ["mains hum", 13.79]], null, null], "duration": [3.94, 4.6, 0.23, 0.85, 0.19, 0.7, 10.25, 0.63, 0.21]} \ No newline at end of file diff --git a/annotations_filtered/a6CsW4dCk_8_filtered.json b/annotations_filtered/a6CsW4dCk_8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ba4f9b3179aaeec3beb8bd3d381d168348cd478 --- /dev/null +++ b/annotations_filtered/a6CsW4dCk_8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.56], [7.0, 7.03], [8.0, 10.0], [16.0, 16.21], [18.0, 18.72], [19.0, 20.75], [30.0, 30.69], [36.0, 35.94], [37.0, 40.19], [42.0, 61.75], [74.0, 74.6], [75.0, 76.27], [82.0, 84.91], [95.0, 101.58], [107.0, 107.0], [112.0, 141.22], [142.0, 145.91]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [80.64, 0.0, 91.98, 0.0, 0.0, 0.0, 0.0, 0.0, 31.46, 40.34, 0.0, 0.0, 30.19, 30.15, 0.0, 32.56, 92.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["ocean", 8.95], ["speech", 8.36], ["cattle, bovinae", 7.04]], [["music", 66.06], ["mains hum", 5.13], ["noise", 3.89]], null, null, [["music", 59.54], ["speech", 12.16], ["didgeridoo", 4.02]], [["music", 70.03], ["whale vocalization", 4.46], ["foghorn", 2.93]], null, [["speech", 77.42], ["vehicle", 3.96], ["boat, water vehicle", 2.4]], null], "duration": [3.56, 0.03, 2.0, 0.21, 0.72, 1.75, 0.69, -0.06, 3.19, 19.75, 0.6, 1.27, 2.91, 6.58, 0.0, 29.22, 3.91]} \ No newline at end of file diff --git a/annotations_filtered/a6XtVMtUZI8_filtered.json b/annotations_filtered/a6XtVMtUZI8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea2fb8b7e03b57e20b816efb036d4a15b0837274 --- /dev/null +++ b/annotations_filtered/a6XtVMtUZI8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[42.0, 46.57], [47.0, 47.43], [51.0, 51.9], [53.0, 53.77], [55.0, 59.09], [61.0, 62.43], [63.0, 66.53], [67.0, 74.46], [75.0, 77.92], [79.0, 80.57], [81.0, 83.24], [86.0, 111.27], [112.0, 118.86], [120.0, 120.53], [122.0, 127.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.9, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 65.09, 86.09, 0.0, 96.04, 99.48, 100.0, 0.0, 97.33], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.57, 0.43, 0.9, 0.77, 4.09, 1.43, 3.53, 7.46, 2.92, 1.57, 2.24, 25.27, 6.86, 0.53, 5.16]} \ No newline at end of file diff --git a/annotations_filtered/a6cUudbbHl0_filtered.json b/annotations_filtered/a6cUudbbHl0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..832503368c5969dd02f8ed6a334343c4a28bd833 --- /dev/null +++ b/annotations_filtered/a6cUudbbHl0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.43], [6.0, 8.16], [10.0, 13.42], [14.0, 18.96], [20.0, 21.91], [24.0, 26.52], [32.0, 35.9], [40.0, 40.49], [42.0, 42.77], [44.0, 49.82], [54.0, 57.21], [59.0, 60.22], [61.0, 62.61], [65.0, 68.84], [69.0, 69.45], [69.0, 69.5], [70.0, 70.7], [76.0, 76.25], [79.0, 81.67], [84.0, 85.08], [94.0, 94.95], [97.0, 97.75], [99.0, 100.33], [103.0, 107.72], [108.0, 114.07], [115.0, 117.91], [119.0, 120.95], [123.0, 124.09], [125.0, 127.62], [130.0, 131.46], [132.0, 134.47], [136.0, 137.69], [140.0, 140.83], [142.0, 143.43], [148.0, 150.13], [151.0, 153.54], [157.0, 158.13], [159.0, 160.1], [161.0, 162.23], [165.0, 165.67], [167.0, 168.1]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [49.22, 44.07, 60.32, 42.58, 0.0, 52.33, 54.63, 0.0, 0.0, 55.46, 36.52, 0.0, 0.0, 31.99, 0.0, 0.0, 0.0, 0.0, 60.6, 0.0, 0.0, 0.0, 0.0, 61.57, 40.7, 31.77, 0.0, 0.0, 36.44, 0.0, 38.95, 0.0, 0.0, 0.0, 43.4, 46.54, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 48.35], ["electronic music", 9.73], ["synthesizer", 7.52]], [["music", 53.53], ["singing bowl", 26.36], ["ambient music", 5.01]], null, [["singing bowl", 28.24], ["music", 27.15], ["speech", 21.3]], null, null, null, null, null, null, [["sine wave", 39.03], ["chirp tone", 13.69], ["fire", 4.75]], null, null, [["music", 18.64], ["hum", 14.18], ["speech", 14.15]], null, null, null, null, null, null, null, null, null, null, [["music", 36.79], ["singing bowl", 33.59], ["speech", 6.61]], [["speech", 22.16], ["music", 10.02], ["thump, thud", 6.55]], null, null, [["music", 70.79], ["hum", 5.79], ["electronic music", 3.78]], null, [["music", 27.48], ["sine wave", 23.14], ["gong", 15.43]], null, null, null, [["music", 47.25], ["singing bowl", 21.38], ["ambient music", 4.26]], [["music", 62.75], ["musical instrument", 7.93], ["synthesizer", 4.96]], null, null, null, null, null], "duration": [2.43, 2.16, 3.42, 4.96, 1.91, 2.52, 3.9, 0.49, 0.77, 5.82, 3.21, 1.22, 1.61, 3.84, 0.45, 0.5, 0.7, 0.25, 2.67, 1.08, 0.95, 0.75, 1.33, 4.72, 6.07, 2.91, 1.95, 1.09, 2.62, 1.46, 2.47, 1.69, 0.83, 1.43, 2.13, 2.54, 1.13, 1.1, 1.23, 0.67, 1.1]} \ No newline at end of file diff --git a/annotations_filtered/a6mkbps0BmY_filtered.json b/annotations_filtered/a6mkbps0BmY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f9f9762eb70cc7983becf11be1774b17cce2cc4 --- /dev/null +++ b/annotations_filtered/a6mkbps0BmY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.77], [51.0, 51.6], [53.0, 54.11], [60.0, 60.44], [67.0, 68.27], [71.0, 72.81], [77.0, 77.58], [86.0, 86.09], [88.0, 89.21], [90.0, 90.75], [93.0, 93.09], [121.0, 121.22], [122.0, 123.09], [130.0, 129.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.77, 0.6, 1.11, 0.44, 1.27, 1.81, 0.58, 0.09, 1.21, 0.75, 0.09, 0.22, 1.09, -0.16]} \ No newline at end of file diff --git a/annotations_filtered/a6oC5iQB4u8_filtered.json b/annotations_filtered/a6oC5iQB4u8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48d4f1c87901dca9e2d1e8172cd2e20ca4f3201a --- /dev/null +++ b/annotations_filtered/a6oC5iQB4u8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 37.44], [41.0, 43.04], [45.0, 46.92], [47.0, 59.53], [60.0, 62.06], [63.0, 64.72], [67.0, 70.77], [72.0, 72.66], [75.0, 76.08], [77.0, 86.34], [96.0, 96.72], [97.0, 110.73], [113.0, 115.18], [116.0, 117.31], [119.0, 124.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.26, 96.17, 0.0, 99.73, 88.1, 0.0, 88.64, 0.0, 0.0, 82.97, 0.0, 99.84, 86.82, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.44, 2.04, 1.92, 12.53, 2.06, 1.72, 3.77, 0.66, 1.08, 9.34, 0.72, 13.73, 2.18, 1.31, 5.93]} \ No newline at end of file diff --git a/annotations_filtered/a72FDTElH9g_filtered.json b/annotations_filtered/a72FDTElH9g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e8678e16f77dee41748710660b7dd4499a777598 --- /dev/null +++ b/annotations_filtered/a72FDTElH9g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.83], [7.0, 9.14], [11.0, 11.42], [14.0, 15.33], [16.0, 18.6], [20.0, 21.29], [24.0, 24.38], [26.0, 26.28], [30.0, 30.18], [31.0, 32.12], [33.0, 33.61], [35.0, 34.91], [36.0, 37.93], [39.0, 44.47], [50.0, 51.71], [52.0, 136.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.8, 0.0, 0.0, 99.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.56, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.83, 2.14, 0.42, 1.33, 2.6, 1.29, 0.38, 0.28, 0.18, 1.12, 0.61, -0.09, 1.93, 5.47, 1.71, 84.34]} \ No newline at end of file diff --git a/annotations_filtered/a7K1xgoi_c4_filtered.json b/annotations_filtered/a7K1xgoi_c4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3539afe40fb84cb086e5fc809e69bdf1afed5acc --- /dev/null +++ b/annotations_filtered/a7K1xgoi_c4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 15.72], [17.0, 23.55], [26.0, 32.29], [37.0, 55.34], [58.0, 58.97], [62.0, 62.6], [64.0, 65.67], [72.0, 72.45]], "keep_status": [true, true, true, false, false, false, false, false], "silence_prob": [31.74, 33.25, 34.38, 32.68, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["whale vocalization", 32.88], ["eruption", 13.01], ["explosion", 5.35]], [["whale vocalization", 24.86], ["ocean", 6.15], ["boat, water vehicle", 5.71]], [["whale vocalization", 44.44], ["gurgling", 10.8], ["stomach rumble", 7.38]], [["whale vocalization", 85.03], ["music", 2.88], ["speech", 2.77]], null, null, null, null], "duration": [3.72, 6.55, 6.29, 18.34, 0.97, 0.6, 1.67, 0.45]} \ No newline at end of file diff --git a/annotations_filtered/a7XZaIy4a9k_filtered.json b/annotations_filtered/a7XZaIy4a9k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..959a773ef3b2caa4ec9c776e0fcf51d292faf1e2 --- /dev/null +++ b/annotations_filtered/a7XZaIy4a9k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.23], [7.0, 8.18], [12.0, 12.66], [15.0, 16.58], [18.0, 18.15], [18.0, 27.19], [28.0, 29.71], [31.0, 31.65], [33.0, 35.41], [38.0, 39.07], [40.0, 40.34], [41.0, 42.04], [43.0, 44.15], [48.0, 48.69], [50.0, 50.79], [51.0, 55.97], [57.0, 58.18], [59.0, 61.25], [62.0, 63.12], [66.0, 68.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 66.03, 0.0, 0.0, 83.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.97, 0.0, 66.76, 0.0, 74.13], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.23, 1.18, 0.66, 1.58, 0.15, 9.19, 1.71, 0.65, 2.41, 1.07, 0.34, 1.04, 1.15, 0.69, 0.79, 4.97, 1.18, 2.25, 1.12, 2.69]} \ No newline at end of file diff --git a/annotations_filtered/a7gZgEpgKiY_filtered.json b/annotations_filtered/a7gZgEpgKiY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d4d3b063238b140bc2add85aad99894bcc8e290 --- /dev/null +++ b/annotations_filtered/a7gZgEpgKiY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.88], [4.0, 4.78], [8.0, 8.78], [12.0, 23.6], [25.0, 26.11], [26.0, 28.24], [30.0, 29.79], [31.0, 35.06], [36.0, 62.5], [64.0, 67.8], [69.0, 73.23], [75.0, 79.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.54, 0.0, 65.32, 0.0, 96.66, 69.47, 92.48, 94.52, 53.4], "audiomae_on_audioset": [null, null, null, [["music", 54.8], ["speech", 10.19], ["fart", 6.48]], null, null, null, null, null, null, null, null], "duration": [-0.12, 0.78, 0.78, 11.6, 1.11, 2.24, -0.21, 4.06, 26.5, 3.8, 4.23, 4.14]} \ No newline at end of file diff --git a/annotations_filtered/a7qRJ9T9TPg_filtered.json b/annotations_filtered/a7qRJ9T9TPg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c8a19f92ce8c622ff44c5b2f40a9700fbae563b1 --- /dev/null +++ b/annotations_filtered/a7qRJ9T9TPg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 24.11], [28.0, 31.5], [35.0, 36.29], [37.0, 39.31], [42.0, 42.62], [44.0, 47.12], [51.0, 55.39], [59.0, 81.24], [93.0, 96.7], [104.0, 104.55], [113.0, 112.99], [118.0, 118.81], [119.0, 120.24]], "keep_status": [true, true, false, true, false, false, false, true, true, false, false, false, false], "silence_prob": [31.8, 33.24, 0.0, 33.83, 0.0, 33.18, 33.78, 32.2, 31.27, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 37.55], ["synthesizer", 9.81], ["speech", 9.02]], [["speech", 22.7], ["music", 20.68], ["vehicle", 4.96]], null, [["music", 62.8], ["foghorn", 2.4], ["musical instrument", 2.38]], null, [["music", 85.52], ["musical instrument", 1.75], ["hum", 1.75]], [["music", 55.28], ["synthesizer", 13.07], ["musical instrument", 4.61]], [["music", 21.48], ["theremin", 12.47], ["civil defense siren", 12.02]], [["music", 21.0], ["speech", 18.21], ["dog", 10.71]], null, null, null, null], "duration": [14.11, 3.5, 1.29, 2.31, 0.62, 3.12, 4.39, 22.24, 3.7, 0.55, -0.01, 0.81, 1.24]} \ No newline at end of file diff --git a/annotations_filtered/a7vAR-7YBWE_filtered.json b/annotations_filtered/a7vAR-7YBWE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bee2d3cbebfc3f6b79df7e1ae2fe052b8df9cec7 --- /dev/null +++ b/annotations_filtered/a7vAR-7YBWE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.67], [21.0, 22.3], [23.0, 23.62], [25.0, 25.79], [27.0, 29.39], [32.0, 35.19], [36.0, 35.85], [36.0, 40.36], [49.0, 49.57], [57.0, 57.77], [59.0, 63.15], [67.0, 67.83], [71.0, 72.74], [75.0, 81.87], [93.0, 93.06], [95.0, 96.38], [98.0, 104.58], [115.0, 115.87], [128.0, 129.05]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 64.86, 83.34, 0.0, 44.29, 0.0, 0.0, 55.18, 0.0, 0.0, 40.62, 0.0, 0.0, 36.72, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 27.72], ["music", 13.7], ["fly, housefly", 6.73]], null, null, null, null, null, [["music", 32.41], ["singing bowl", 11.96], ["synthesizer", 7.81]], null, null, [["speech", 31.39], ["mains hum", 14.2], ["music", 10.77]], null, null], "duration": [0.67, 1.3, 0.62, 0.79, 2.39, 3.19, -0.15, 4.36, 0.57, 0.77, 4.15, 0.83, 1.74, 6.87, 0.06, 1.38, 6.58, 0.87, 1.05]} \ No newline at end of file diff --git a/annotations_filtered/a81pNygdAXw_filtered.json b/annotations_filtered/a81pNygdAXw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5f7ac28193cf21b48cde6dfab51f17bf4f3d1328 --- /dev/null +++ b/annotations_filtered/a81pNygdAXw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 12.95], [13.0, 14.17], [15.0, 18.67], [20.0, 20.43], [23.0, 23.65], [27.0, 27.89], [29.0, 30.08], [32.0, 32.1], [33.0, 37.05], [40.0, 41.82], [44.0, 45.62], [48.0, 48.63], [52.0, 52.89], [56.0, 57.25], [62.0, 63.68], [65.0, 73.41], [75.0, 75.86], [77.0, 79.02], [82.0, 82.78], [84.0, 85.23], [86.0, 88.08], [91.0, 93.28], [95.0, 97.23], [99.0, 101.73], [103.0, 103.67], [105.0, 106.08], [109.0, 112.58]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [60.6, 0.0, 47.23, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 99.8, 79.07, 95.91, 99.68, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, [["cat", 7.72], ["hum", 6.7], ["inside, small room", 6.0]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.95, 1.17, 3.67, 0.43, 0.65, 0.89, 1.08, 0.1, 4.05, 1.82, 1.62, 0.63, 0.89, 1.25, 1.68, 8.41, 0.86, 2.02, 0.78, 1.23, 2.08, 2.28, 2.23, 2.73, 0.67, 1.08, 3.58]} \ No newline at end of file diff --git a/annotations_filtered/a861J6gxqmg_filtered.json b/annotations_filtered/a861J6gxqmg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ab79565cd12f202ef6ec048f2bc8e30a54390987 --- /dev/null +++ b/annotations_filtered/a861J6gxqmg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[39.0, 47.41], [48.0, 49.42], [53.0, 57.6], [60.0, 63.56], [65.0, 80.57], [88.0, 88.15], [89.0, 88.99], [91.0, 92.31], [94.0, 94.88], [97.0, 97.01], [101.0, 102.44], [103.0, 103.33], [105.0, 107.38], [111.0, 113.98], [115.0, 125.37]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.43, 0.0, 31.27, 88.28, 34.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.53, 100.0, 100.0], "audiomae_on_audioset": [[["music", 21.72], ["speech", 18.46], ["hum", 12.25]], null, [["music", 38.73], ["breaking", 13.78], ["hum", 9.81]], null, [["music", 41.94], ["didgeridoo", 39.46], ["gong", 2.77]], null, null, null, null, null, null, null, null, null, null], "duration": [8.41, 1.42, 4.6, 3.56, 15.57, 0.15, -0.01, 1.31, 0.88, 0.01, 1.44, 0.33, 2.38, 2.98, 10.37]} \ No newline at end of file diff --git a/annotations_filtered/a87b-bsz1Mg_filtered.json b/annotations_filtered/a87b-bsz1Mg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a000bf8c1a2dcfcc92ab82b380216f210d23ad3b --- /dev/null +++ b/annotations_filtered/a87b-bsz1Mg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.64], [14.0, 15.08], [16.0, 17.61], [20.0, 39.55], [42.0, 44.68], [48.0, 53.11], [54.0, 63.76], [66.0, 66.12], [67.0, 68.64], [70.0, 71.73], [74.0, 76.72], [80.0, 79.95], [86.0, 86.48], [90.0, 95.08], [102.0, 107.32], [108.0, 111.97], [113.0, 120.29], [123.0, 130.2], [133.0, 134.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [68.67, 0.0, 0.0, 79.59, 91.81, 92.97, 80.64, 0.0, 0.0, 0.0, 67.63, 0.0, 0.0, 94.22, 87.19, 56.4, 71.29, 92.64, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.64, 1.08, 1.61, 19.55, 2.68, 5.11, 9.76, 0.12, 1.64, 1.73, 2.72, -0.05, 0.48, 5.08, 5.32, 3.97, 7.29, 7.2, 1.13]} \ No newline at end of file diff --git a/annotations_filtered/a88BNDMlPSE_filtered.json b/annotations_filtered/a88BNDMlPSE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..54e6310e1cb4a549d07a65f2a12a7762be7a84bb --- /dev/null +++ b/annotations_filtered/a88BNDMlPSE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 32.21], [34.0, 38.16], [44.0, 45.3], [46.0, 46.23], [47.0, 59.54], [60.0, 60.27]], "keep_status": [true, true, false, false, false, false], "silence_prob": [35.49, 33.24, 0.0, 0.0, 30.0, 0.0], "audiomae_on_audioset": [[["speech", 26.62], ["coin (dropping)", 15.66], ["cowbell", 13.97]], [["music", 39.24], ["mains hum", 15.56], ["hum", 14.0]], null, null, [["music", 67.76], ["theremin", 3.66], ["musical instrument", 3.19]], null], "duration": [5.21, 4.16, 1.3, 0.23, 12.54, 0.27]} \ No newline at end of file diff --git a/annotations_filtered/a8EeFNXk1TE_filtered.json b/annotations_filtered/a8EeFNXk1TE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f05a214a8a3b7c1f44d2c4eed3346908a4e7b28 --- /dev/null +++ b/annotations_filtered/a8EeFNXk1TE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 10.72], [11.0, 12.38], [12.0, 12.41], [12.0, 12.45], [15.0, 15.38], [21.0, 21.9], [24.0, 25.42], [32.0, 38.74], [42.0, 46.26], [51.0, 51.48], [56.0, 58.38], [60.0, 60.29], [61.0, 62.36], [63.0, 64.34], [65.0, 67.46]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.18, 38.02, 0.0, 51.66, 0.0, 0.0, 0.0, 95.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 17.08], ["speech", 10.56], ["hum", 6.7]], [["speech", 53.59], ["noise", 5.6], ["sine wave", 3.77]], null, null, null, null, null, null], "duration": [-0.28, 1.38, 0.41, 0.45, 0.38, 0.9, 1.42, 6.74, 4.26, 0.48, 2.38, 0.29, 1.36, 1.34, 2.46]} \ No newline at end of file diff --git a/annotations_filtered/a8FA5zBHiFA_filtered.json b/annotations_filtered/a8FA5zBHiFA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..772ff811d6baee47af122be80f51cd8bf8c1452b --- /dev/null +++ b/annotations_filtered/a8FA5zBHiFA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.81], [16.0, 17.09], [19.0, 20.11], [23.0, 27.6], [30.0, 37.42], [39.0, 41.12], [44.0, 61.15], [63.0, 64.15], [64.0, 66.31], [66.0, 66.43], [68.0, 69.47], [70.0, 70.51], [72.0, 79.76], [80.0, 81.08], [82.0, 111.86], [114.0, 117.48], [118.0, 121.1], [123.0, 129.52], [131.0, 133.3], [135.0, 136.26], [139.0, 139.77], [141.0, 185.16], [186.0, 187.49], [188.0, 196.11], [197.0, 197.33], [199.0, 200.92]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 37.53, 42.17, 37.82, 34.69, 0.0, 31.65, 0.0, 0.0, 0.0, 42.51, 0.0, 31.79, 35.23, 36.36, 37.05, 48.39, 0.0, 0.0, 0.0, 0.0, 42.13, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["theremin", 84.21], ["music", 13.36], ["musical instrument", 0.47]], [["music", 42.58], ["theremin", 33.76], ["musical instrument", 4.15]], [["music", 29.24], ["theremin", 27.1], ["speech", 20.48]], [["speech", 38.87], ["music", 32.76], ["theremin", 8.4]], null, [["didgeridoo", 24.96], ["quack", 21.38], ["boing", 8.53]], null, null, null, [["music", 55.22], ["theremin", 18.22], ["didgeridoo", 6.33]], null, [["theremin", 71.39], ["music", 19.3], ["didgeridoo", 2.27]], [["music", 54.66], ["theremin", 31.04], ["musical instrument", 4.57]], [["theremin", 51.01], ["music", 36.08], ["musical instrument", 3.25]], [["theremin", 67.56], ["music", 22.18], ["musical instrument", 2.49]], [["theremin", 50.45], ["music", 39.32], ["musical instrument", 2.67]], null, null, null, null, [["didgeridoo", 45.74], ["music", 22.53], ["theremin", 8.65]], null, null], "duration": [1.81, 1.09, 1.11, 4.6, 7.42, 2.12, 17.15, 1.15, 2.31, 0.43, 1.47, 0.51, 7.76, 1.08, 29.86, 3.48, 3.1, 6.52, 2.3, 1.26, 0.77, 44.16, 1.49, 8.11, 0.33, 1.92]} \ No newline at end of file diff --git a/annotations_filtered/a8mImo0aNDo_filtered.json b/annotations_filtered/a8mImo0aNDo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1cec14281d1387111363fd02374ed1b6e0d74146 --- /dev/null +++ b/annotations_filtered/a8mImo0aNDo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.85], [8.0, 8.41], [12.0, 16.26], [18.0, 18.76], [23.0, 55.38], [57.0, 57.06], [61.0, 61.92], [62.0, 62.78], [65.0, 66.75], [69.0, 75.68], [82.0, 82.9], [87.0, 87.71], [90.0, 90.31], [92.0, 92.87], [95.0, 110.64], [113.0, 123.52], [125.0, 130.2], [130.0, 131.67], [133.0, 134.72], [136.0, 137.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 50.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.57, 0.0, 0.0, 0.0, 0.0, 29.79, 29.76, 28.68, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 68.61], ["throbbing", 12.75], ["hum", 2.82]], null, null, null, null, [["throbbing", 37.22], ["hum", 35.04], ["music", 14.72]], [["music", 53.99], ["hum", 7.72], ["mains hum", 7.44]], [["music", 46.43], ["speech", 18.79], ["throbbing", 3.54]], null, null, null], "duration": [0.85, 0.41, 4.26, 0.76, 32.38, 0.06, 0.92, 0.78, 1.75, 6.68, 0.9, 0.71, 0.31, 0.87, 15.64, 10.52, 5.2, 1.67, 1.72, 1.08]} \ No newline at end of file diff --git a/annotations_filtered/a8xs3O-NwsY_filtered.json b/annotations_filtered/a8xs3O-NwsY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7580d7789130f092f42a82fd66678c791b98d922 --- /dev/null +++ b/annotations_filtered/a8xs3O-NwsY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.22], [10.0, 10.54], [18.0, 19.72], [20.0, 21.32], [22.0, 25.98], [29.0, 42.43], [44.0, 45.94], [48.0, 67.17], [69.0, 73.11], [74.0, 101.98], [104.0, 115.03], [117.0, 117.73], [119.0, 118.86], [120.0, 121.64], [122.0, 125.36], [127.0, 129.81]], "keep_status": [false, false, false, false, false, false, false, true, true, true, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 86.09, 34.32, 0.0, 30.43, 29.15, 34.01, 46.57, 0.0, 0.0, 0.0, 52.74, 93.45], "audiomae_on_audioset": [null, null, null, null, null, [["music", 54.87], ["bathtub (filling or washing)", 8.49], ["drip", 6.88]], null, [["fly, housefly", 31.17], ["mains hum", 15.42], ["buzz", 13.68]], [["car", 12.77], ["vehicle", 10.04], ["speech", 7.32]], [["whale vocalization", 29.39], ["boat, water vehicle", 20.63], ["music", 16.79]], [["music", 36.73], ["didgeridoo", 17.2], ["musical instrument", 8.41]], null, null, null, null, null], "duration": [1.22, 0.54, 1.72, 1.32, 3.98, 13.43, 1.94, 19.17, 4.11, 27.98, 11.03, 0.73, -0.14, 1.64, 3.36, 2.81]} \ No newline at end of file diff --git a/annotations_filtered/a9biNJwX3OA_filtered.json b/annotations_filtered/a9biNJwX3OA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..855a9cee07c3dde755001e1ec3b1d6077d8f4eea --- /dev/null +++ b/annotations_filtered/a9biNJwX3OA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.43], [14.0, 18.01], [20.0, 20.58], [32.0, 32.63], [41.0, 42.82], [44.0, 44.81], [66.0, 66.83], [68.0, 68.96], [69.0, 69.85], [75.0, 78.48], [80.0, 81.36], [84.0, 86.19], [94.0, 97.33], [99.0, 99.57], [101.0, 102.12], [111.0, 111.87], [114.0, 115.92], [127.0, 127.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 42.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 99.97, 63.31, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["thunk", 35.93], ["speech", 32.35], ["whack, thwack", 13.55]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.43, 4.01, 0.58, 0.63, 1.82, 0.81, 0.83, 0.96, 0.85, 3.48, 1.36, 2.19, 3.33, 0.57, 1.12, 0.87, 1.92, 0.45]} \ No newline at end of file diff --git a/annotations_filtered/aAF6B3USip0_filtered.json b/annotations_filtered/aAF6B3USip0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..16905554ff6b88ee8c3e56c20e07b4a578204958 --- /dev/null +++ b/annotations_filtered/aAF6B3USip0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.76], [18.0, 18.49], [22.0, 25.76], [33.0, 33.17], [35.0, 35.53], [50.0, 51.06], [53.0, 53.74], [56.0, 57.27], [59.0, 59.81], [65.0, 77.28], [79.0, 81.11], [89.0, 90.12], [97.0, 97.75], [103.0, 104.08], [109.0, 111.0], [112.0, 112.82], [124.0, 124.71], [128.0, 129.03], [130.0, 130.65]], "keep_status": [false, false, true, false, false, false, false, false, false, true, true, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 29.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.65, 34.61, 0.0, 0.0, 0.0, 38.51, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["cattle, bovinae", 22.49], ["moo", 20.8], ["music", 17.13]], null, null, null, null, null, null, [["cattle, bovinae", 29.75], ["livestock, farm animals, working animals", 20.71], ["moo", 18.11]], [["music", 31.48], ["throbbing", 19.54], ["hum", 5.91]], null, null, null, [["music", 30.18], ["speech", 18.34], ["crowd", 9.48]], null, null, null, null], "duration": [0.76, 0.49, 3.76, 0.17, 0.53, 1.06, 0.74, 1.27, 0.81, 12.28, 2.11, 1.12, 0.75, 1.08, 2.0, 0.82, 0.71, 1.03, 0.65]} \ No newline at end of file diff --git a/annotations_filtered/aARaYjgm_rA_filtered.json b/annotations_filtered/aARaYjgm_rA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a086574674261a6be84471a5680813f839895ee3 --- /dev/null +++ b/annotations_filtered/aARaYjgm_rA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.42], [11.0, 11.1], [12.0, 20.76], [21.0, 22.82], [24.0, 50.95], [55.0, 59.49], [60.0, 60.96], [62.0, 66.26], [67.0, 68.52], [69.0, 71.47], [72.0, 129.19]], "keep_status": [false, false, true, false, true, true, false, true, false, true, false], "silence_prob": [0.0, 0.0, 37.44, 0.0, 31.86, 30.5, 0.0, 31.79, 0.0, 31.93, 0.0], "audiomae_on_audioset": [null, null, [["fly, housefly", 22.52], ["insect", 12.21], ["bee, wasp, etc.", 9.97]], null, [["speech", 16.44], ["outside, rural or natural", 8.24], ["livestock, farm animals, working animals", 7.87]], [["music", 28.15], ["noise", 27.68], ["cacophony", 11.03]], null, [["music", 35.02], ["speech", 8.76], ["frog", 4.05]], null, [["music", 30.5], ["cacophony", 10.39], ["speech", 10.08]], null], "duration": [1.42, 0.1, 8.76, 1.82, 26.95, 4.49, 0.96, 4.26, 1.52, 2.47, 57.19]} \ No newline at end of file diff --git a/annotations_filtered/aAWIZFqE6L4_filtered.json b/annotations_filtered/aAWIZFqE6L4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..008ee05ddb18c7781712b6059d8d66758c864c5f --- /dev/null +++ b/annotations_filtered/aAWIZFqE6L4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.98], [8.0, 22.59], [25.0, 25.69], [27.0, 29.73], [31.0, 31.35], [35.0, 35.92], [46.0, 45.71], [54.0, 53.91], [65.0, 65.82], [84.0, 85.11], [89.0, 89.61], [95.0, 98.22], [100.0, 105.36], [107.0, 107.57], [109.0, 110.03], [111.0, 112.87], [117.0, 118.27], [119.0, 119.74], [121.0, 121.19], [122.0, 122.45], [124.0, 126.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 31.49, 0.0, 33.32, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.4, 43.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.48], "audiomae_on_audioset": [null, [["music", 56.5], ["speech", 18.44], ["didgeridoo", 4.31]], null, [["music", 41.88], ["speech", 26.33], ["middle eastern music", 4.08]], null, null, null, null, null, null, null, [["speech", 46.82], ["music", 14.41], ["hum", 2.31]], [["fly, housefly", 37.37], ["insect", 24.65], ["bee, wasp, etc.", 13.15]], null, null, null, null, null, null, null, [["music", 51.72], ["didgeridoo", 19.84], ["musical instrument", 3.31]]], "duration": [0.98, 14.59, 0.69, 2.73, 0.35, 0.92, -0.29, -0.09, 0.82, 1.11, 0.61, 3.22, 5.36, 0.57, 1.03, 1.87, 1.27, 0.74, 0.19, 0.45, 2.33]} \ No newline at end of file diff --git a/annotations_filtered/aA_j4KpP0W0_filtered.json b/annotations_filtered/aA_j4KpP0W0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..11e284f4a70ea2b1b5279ef04f907bc61142f5c1 --- /dev/null +++ b/annotations_filtered/aA_j4KpP0W0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[57.0, 57.94], [60.0, 70.82], [71.0, 77.31], [78.0, 99.81], [102.0, 112.9], [116.0, 116.24], [117.0, 117.24], [119.0, 119.26], [120.0, 123.8], [125.0, 132.31], [136.0, 142.43], [143.0, 143.24], [144.0, 147.18], [147.0, 148.41], [153.0, 153.32], [158.0, 159.8], [160.0, 160.52], [161.0, 163.49], [164.0, 169.05], [169.0, 170.31], [171.0, 174.93], [175.0, 175.66], [176.0, 176.72], [178.0, 180.66], [187.0, 194.66], [196.0, 200.25], [200.0, 205.29], [206.0, 206.58], [207.0, 208.06], [209.0, 212.68], [218.0, 221.43], [234.0, 234.74], [236.0, 235.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 73.21, 46.61, 56.33, 59.51, 0.0, 0.0, 0.0, 73.21, 55.04, 58.81, 0.0, 48.74, 0.0, 0.0, 0.0, 0.0, 62.58, 62.37, 0.0, 62.37, 0.0, 0.0, 65.09, 60.98, 41.85, 69.2, 0.0, 0.0, 61.08, 67.63, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 60.89], ["cattle, bovinae", 7.61], ["livestock, farm animals, working animals", 7.29]], null, null, null, null, null, null, null, null, null, [["music", 48.29], ["speech", 9.06], ["musical instrument", 8.97]], null, null, null, null, null, null, null, null, null, null, null, null, [["thunk", 47.27], ["music", 40.97], ["guitar", 1.08]], null, null, null, null, null, null, null], "duration": [0.94, 10.82, 6.31, 21.81, 10.9, 0.24, 0.24, 0.26, 3.8, 7.31, 6.43, 0.24, 3.18, 1.41, 0.32, 1.8, 0.52, 2.49, 5.05, 1.31, 3.93, 0.66, 0.72, 2.66, 7.66, 4.25, 5.29, 0.58, 1.06, 3.68, 3.43, 0.74, -0.01]} \ No newline at end of file diff --git a/annotations_filtered/aAg3LPuwfJM_filtered.json b/annotations_filtered/aAg3LPuwfJM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0cb04009d94a0bf32c80f8b5bb736583de4ea56f --- /dev/null +++ b/annotations_filtered/aAg3LPuwfJM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[63.0, 80.64], [81.0, 81.75], [82.0, 92.15], [94.0, 120.38], [121.0, 121.69], [127.0, 134.55]], "keep_status": [false, false, true, true, false, false], "silence_prob": [31.52, 0.0, 30.88, 32.56, 0.0, 46.02], "audiomae_on_audioset": [[["hum", 60.07], ["throbbing", 20.3], ["music", 5.75]], null, [["music", 30.4], ["electric shaver, electric razor", 11.13], ["thunk", 10.71]], [["hum", 35.88], ["music", 9.58], ["mains hum", 7.5]], null, [["noise", 30.63], ["speech", 28.04], ["radio", 11.38]]], "duration": [17.64, 0.75, 10.15, 26.38, 0.69, 7.55]} \ No newline at end of file diff --git a/annotations_filtered/aAkF2Du59Qw_filtered.json b/annotations_filtered/aAkF2Du59Qw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a6c58564efde6b6bdea075cd3467c09b0e9ea871 --- /dev/null +++ b/annotations_filtered/aAkF2Du59Qw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.01], [9.0, 11.47], [16.0, 17.02], [31.0, 31.14], [33.0, 33.24], [37.0, 37.76], [40.0, 40.31], [49.0, 49.17], [50.0, 51.88], [55.0, 55.63], [60.0, 60.27], [60.0, 63.21], [67.0, 66.87], [75.0, 75.49], [87.0, 88.08], [89.0, 89.38], [90.0, 90.73], [94.0, 94.32], [95.0, 95.76], [100.0, 100.74], [124.0, 125.07], [126.0, 126.69], [127.0, 127.65], [133.0, 133.98], [137.0, 137.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.01, 2.47, 1.02, 0.14, 0.24, 0.76, 0.31, 0.17, 1.88, 0.63, 0.27, 3.21, -0.13, 0.49, 1.08, 0.38, 0.73, 0.32, 0.76, 0.74, 1.07, 0.69, 0.65, 0.98, 0.32]} \ No newline at end of file diff --git a/annotations_filtered/aB0ABzNHvAE_filtered.json b/annotations_filtered/aB0ABzNHvAE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9911472e4d172ffad9125296004e3f1b8f71ce1b --- /dev/null +++ b/annotations_filtered/aB0ABzNHvAE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.09], [7.0, 7.65], [10.0, 17.07], [20.0, 22.94], [25.0, 25.71], [28.0, 30.48], [33.0, 35.6], [37.0, 44.0], [47.0, 48.84], [54.0, 55.09], [57.0, 70.5], [72.0, 72.4], [74.0, 77.55], [79.0, 81.46], [82.0, 82.8], [87.0, 88.42], [92.0, 94.2], [97.0, 103.33], [105.0, 107.92], [114.0, 115.59], [117.0, 117.91], [119.0, 123.08], [124.0, 125.0], [126.0, 129.57], [132.0, 150.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 65.91, 62.47, 0.0, 63.31, 63.53, 51.71, 0.0, 0.0, 59.77, 0.0, 89.19, 94.37, 0.0, 0.0, 94.66, 95.78, 95.37, 0.0, 0.0, 77.53, 0.0, 61.67, 72.9], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.09, 0.65, 7.07, 2.94, 0.71, 2.48, 2.6, 7.0, 1.84, 1.09, 13.5, 0.4, 3.55, 2.46, 0.8, 1.42, 2.2, 6.33, 2.92, 1.59, 0.91, 4.08, 1.0, 3.57, 18.94]} \ No newline at end of file diff --git a/annotations_filtered/aBADjCeFnuU_filtered.json b/annotations_filtered/aBADjCeFnuU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..caa4c8890df973b1ed1571ed8b2bb53dd35b2620 --- /dev/null +++ b/annotations_filtered/aBADjCeFnuU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.89], [16.0, 16.6], [21.0, 20.83], [32.0, 33.42], [51.0, 51.9], [59.0, 59.76], [87.0, 91.27], [110.0, 110.42], [118.0, 117.96], [122.0, 124.38], [135.0, 135.78], [163.0, 165.82], [168.0, 167.93], [171.0, 172.57], [177.0, 179.69], [222.0, 224.48], [228.0, 233.59], [235.0, 237.66], [238.0, 238.03]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.25, 0.0, 0.0, 79.41, 0.0, 63.96, 0.0, 0.0, 63.1, 44.87, 45.18, 36.57, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["cattle, bovinae", 21.73], ["livestock, farm animals, working animals", 17.28], ["moo", 12.27]], null, null, null, null, null, null, null, null, [["grunt", 36.84], ["wild animals", 9.45], ["roaring cats (lions, tigers)", 6.72]], [["snicker", 17.78], ["whimper", 13.87], ["chuckle, chortle", 13.65]], [["sheep", 35.49], ["bleat", 29.91], ["livestock, farm animals, working animals", 6.59]], null], "duration": [0.89, 0.6, -0.17, 1.42, 0.9, 0.76, 4.27, 0.42, -0.04, 2.38, 0.78, 2.82, -0.07, 1.57, 2.69, 2.48, 5.59, 2.66, 0.03]} \ No newline at end of file diff --git a/annotations_filtered/aBgs1Kxh9nM_filtered.json b/annotations_filtered/aBgs1Kxh9nM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a71013ebea048b44dbedc1181e1e25d215b22171 --- /dev/null +++ b/annotations_filtered/aBgs1Kxh9nM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.59], [16.0, 15.63], [17.0, 17.17], [18.0, 22.22], [24.0, 31.21], [32.0, 32.39], [33.0, 33.62], [36.0, 35.97], [37.0, 38.15], [41.0, 41.72], [43.0, 43.23], [44.0, 44.17], [47.0, 47.53], [49.0, 49.69], [52.0, 52.62], [53.0, 53.84], [57.0, 57.03], [58.0, 58.67], [62.0, 61.87], [65.0, 65.38], [75.0, 75.81], [78.0, 78.24], [84.0, 86.41], [88.0, 90.96], [106.0, 105.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 78.38, 93.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.59, -0.37, 0.17, 4.22, 7.21, 0.39, 0.62, -0.03, 1.15, 0.72, 0.23, 0.17, 0.53, 0.69, 0.62, 0.84, 0.03, 0.67, -0.13, 0.38, 0.81, 0.24, 2.41, 2.96, -0.1]} \ No newline at end of file diff --git a/annotations_filtered/aBpwrORhKWU_filtered.json b/annotations_filtered/aBpwrORhKWU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f0697fc2ea9060463b713195d3e5c016a13867fa --- /dev/null +++ b/annotations_filtered/aBpwrORhKWU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[57.0, 63.59], [68.0, 68.57], [71.0, 70.78], [72.0, 74.31], [76.0, 77.84], [79.0, 81.67], [83.0, 83.25], [85.0, 85.55], [87.0, 89.73], [90.0, 94.71], [98.0, 98.69], [99.0, 105.7], [107.0, 108.43], [112.0, 112.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [81.53, 0.0, 0.0, 71.87, 0.0, 77.7, 0.0, 0.0, 84.62, 66.76, 0.0, 46.75, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 83.8], ["ambient music", 1.59], ["synthesizer", 1.57]], null, null], "duration": [6.59, 0.57, -0.22, 2.31, 1.84, 2.67, 0.25, 0.55, 2.73, 4.71, 0.69, 6.7, 1.43, 0.7]} \ No newline at end of file diff --git a/annotations_filtered/aBxlJkcHDSM_filtered.json b/annotations_filtered/aBxlJkcHDSM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..57ec44f7b43b8e43f3bcf0cc5ebafb3f667651e4 --- /dev/null +++ b/annotations_filtered/aBxlJkcHDSM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.61], [4.0, 5.44], [7.0, 8.68], [12.0, 13.29], [15.0, 96.09], [97.0, 98.52], [101.0, 101.14], [103.0, 139.97], [141.0, 141.59], [143.0, 155.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 57.15], ["didgeridoo", 21.86], ["grunt", 14.46]]], "duration": [0.61, 1.44, 1.68, 1.29, 81.09, 1.52, 0.14, 36.97, 0.59, 12.9]} \ No newline at end of file diff --git a/annotations_filtered/aCEjVC3Dtn8_filtered.json b/annotations_filtered/aCEjVC3Dtn8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..152f06183c3481da86b4a253b5aa6f65251d6c00 --- /dev/null +++ b/annotations_filtered/aCEjVC3Dtn8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.06], [20.0, 20.29], [22.0, 23.31], [46.0, 53.86], [60.0, 60.78], [63.0, 63.86], [71.0, 73.08], [74.0, 102.68], [104.0, 105.16], [107.0, 108.67], [111.0, 114.49], [116.0, 126.06]], "keep_status": [false, false, false, true, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 41.7, 0.0, 0.0, 39.47, 29.68, 0.0, 0.0, 33.77, 50.56], "audiomae_on_audioset": [null, null, null, [["fly, housefly", 26.91], ["insect", 17.49], ["speech", 15.71]], null, null, [["cattle, bovinae", 34.32], ["moo", 30.48], ["livestock, farm animals, working animals", 11.36]], [["speech", 64.48], ["music", 13.2], ["outside, urban or manmade", 1.4]], null, null, [["vehicle", 36.17], ["aircraft", 18.37], ["music", 8.71]], null], "duration": [1.06, 0.29, 1.31, 7.86, 0.78, 0.86, 2.08, 28.68, 1.16, 1.67, 3.49, 10.06]} \ No newline at end of file diff --git a/annotations_filtered/aCaTMqs_Qsc_filtered.json b/annotations_filtered/aCaTMqs_Qsc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..65b1f3a25f64f26bd7ab47fc54f4cececfb9ea9a --- /dev/null +++ b/annotations_filtered/aCaTMqs_Qsc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.29], [6.0, 6.64], [12.0, 13.09], [14.0, 14.5], [19.0, 19.7], [21.0, 22.6], [24.0, 25.84], [34.0, 34.53], [38.0, 42.74], [43.0, 46.94], [49.0, 49.76], [51.0, 51.56], [53.0, 55.26], [59.0, 58.63], [59.0, 58.68], [67.0, 68.49], [70.0, 69.84], [72.0, 72.64], [74.0, 74.19], [82.0, 82.93], [88.0, 88.48], [96.0, 95.93], [97.0, 97.21], [104.0, 107.06], [111.0, 111.62], [117.0, 118.45], [121.0, 121.69], [123.0, 124.19], [125.0, 126.03], [127.0, 128.07], [134.0, 135.35], [138.0, 138.87], [139.0, 140.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.53, 72.01, 0.0, 0.0, 86.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.29, 0.64, 1.09, 0.5, 0.7, 1.6, 1.84, 0.53, 4.74, 3.94, 0.76, 0.56, 2.26, -0.37, -0.32, 1.49, -0.16, 0.64, 0.19, 0.93, 0.48, -0.07, 0.21, 3.06, 0.62, 1.45, 0.69, 1.19, 1.03, 1.07, 1.35, 0.87, 1.32]} \ No newline at end of file diff --git a/annotations_filtered/aClqNJOXy-w_filtered.json b/annotations_filtered/aClqNJOXy-w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a25dbcfac64ee15093ad2d5f70d16a5d99f2ded9 --- /dev/null +++ b/annotations_filtered/aClqNJOXy-w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 9.75], [14.0, 29.49], [30.0, 31.78], [32.0, 33.57], [34.0, 35.45], [36.0, 59.04], [61.0, 78.21], [83.0, 84.3], [84.0, 84.33], [86.0, 86.97], [89.0, 124.93]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [41.54, 35.17, 0.0, 0.0, 0.0, 33.71, 33.72, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["synthesizer", 10.87], ["throbbing", 9.26], ["music", 9.03]], [["music", 71.63], ["musical instrument", 6.96], ["synthesizer", 6.53]], null, null, null, [["music", 79.46], ["musical instrument", 4.67], ["didgeridoo", 2.72]], [["music", 87.46], ["musical instrument", 2.43], ["synthesizer", 2.29]], null, null, null, null], "duration": [6.75, 15.49, 1.78, 1.57, 1.45, 23.04, 17.21, 1.3, 0.33, 0.97, 35.93]} \ No newline at end of file diff --git a/annotations_filtered/aCqhUO76MTU_filtered.json b/annotations_filtered/aCqhUO76MTU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b01e5b2f361d1487b4785bd2c92d1b1a3bcef3f9 --- /dev/null +++ b/annotations_filtered/aCqhUO76MTU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.14], [17.0, 17.47], [20.0, 21.78], [29.0, 29.69], [38.0, 38.69], [41.0, 56.91], [58.0, 58.89], [68.0, 69.15], [85.0, 85.5], [88.0, 88.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 36.75, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["fly, housefly", 43.36], ["insect", 29.16], ["bee, wasp, etc.", 21.09]], null, null, null, null], "duration": [1.14, 0.47, 1.78, 0.69, 0.69, 15.91, 0.89, 1.15, 0.5, 0.33]} \ No newline at end of file diff --git a/annotations_filtered/aD4ZPXHAVCA_filtered.json b/annotations_filtered/aD4ZPXHAVCA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d7d837ddb7218560cd2c7b219f4bcbfaa6e2ce20 --- /dev/null +++ b/annotations_filtered/aD4ZPXHAVCA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.83], [8.0, 8.01], [8.0, 10.62], [14.0, 14.71], [16.0, 17.04], [18.0, 19.48], [22.0, 28.31], [29.0, 30.89], [33.0, 34.26], [35.0, 35.48], [37.0, 37.4], [45.0, 45.6], [49.0, 50.18], [54.0, 54.04], [56.0, 56.0], [57.0, 64.49], [71.0, 88.2], [93.0, 98.78], [101.0, 107.3], [114.0, 114.69], [116.0, 116.34], [118.0, 118.02], [122.0, 122.82], [125.0, 126.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 85.72, 0.0, 0.0, 0.0, 57.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.35, 29.69, 29.2, 29.62, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 28.63], ["frog", 15.2], ["croak", 14.39]], [["music", 53.96], ["saxophone", 11.21], ["singing", 7.08]], [["music", 87.59], ["music of latin america", 3.27], ["clarinet", 1.44]], [["livestock, farm animals, working animals", 38.08], ["moo", 25.42], ["cattle, bovinae", 21.81]], null, null, null, null, null], "duration": [0.83, 0.01, 2.62, 0.71, 1.04, 1.48, 6.31, 1.89, 1.26, 0.48, 0.4, 0.6, 1.18, 0.04, 0.0, 7.49, 17.2, 5.78, 6.3, 0.69, 0.34, 0.02, 0.82, 1.89]} \ No newline at end of file diff --git a/annotations_filtered/aDFJMSlmxBg_filtered.json b/annotations_filtered/aDFJMSlmxBg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7725adb167828ecf48baf7fb0dc458538e4295db --- /dev/null +++ b/annotations_filtered/aDFJMSlmxBg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.0], [7.0, 7.42], [22.0, 22.5], [23.0, 23.75], [52.0, 54.04], [58.0, 58.14], [59.0, 60.02]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 37.2, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 33.82], ["whale vocalization", 21.3], ["hum", 15.08]], null, null], "duration": [0.0, 0.42, 0.5, 0.75, 2.04, 0.14, 1.02]} \ No newline at end of file diff --git a/annotations_filtered/aDJJBMXiwiI_filtered.json b/annotations_filtered/aDJJBMXiwiI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..549ebc9d9f62135ab18ae3b5331700a1823cc457 --- /dev/null +++ b/annotations_filtered/aDJJBMXiwiI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 24.41], [26.0, 29.67], [33.0, 33.72], [35.0, 108.5], [111.0, 158.79], [160.0, 162.99], [165.0, 167.1], [169.0, 170.95], [172.0, 173.26]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [99.93, 98.59, 0.0, 0.0, 0.0, 95.23, 83.52, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [21.41, 3.67, 0.72, 73.5, 47.79, 2.99, 2.1, 1.95, 1.26]} \ No newline at end of file diff --git a/annotations_filtered/aDJgv1iARPg_filtered.json b/annotations_filtered/aDJgv1iARPg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c0c19aba39d56c0114062dec44b8360fa5bbd42 --- /dev/null +++ b/annotations_filtered/aDJgv1iARPg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.44], [23.0, 22.84], [29.0, 29.71], [31.0, 31.02], [42.0, 43.78], [46.0, 47.07], [67.0, 67.29], [84.0, 84.96], [109.0, 112.89], [114.0, 116.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.36, 59.77], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.44, -0.16, 0.71, 0.02, 1.78, 1.07, 0.29, 0.96, 3.89, 2.16]} \ No newline at end of file diff --git a/annotations_filtered/aDU5CcINqyI_filtered.json b/annotations_filtered/aDU5CcINqyI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1ed9c3f7f22048b7221f80fb14fbed1f5edc925e --- /dev/null +++ b/annotations_filtered/aDU5CcINqyI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 31.21], [32.0, 36.85], [62.0, 61.89], [64.0, 66.77], [67.0, 77.63], [80.0, 102.96], [105.0, 105.14], [107.0, 107.96], [112.0, 113.32], [114.0, 139.65], [146.0, 151.71], [154.0, 154.77], [156.0, 156.29], [159.0, 164.15], [165.0, 166.06], [169.0, 173.47], [175.0, 175.1]], "keep_status": [false, false, false, true, true, true, false, false, false, true, true, false, false, true, false, true, false], "silence_prob": [31.47, 32.39, 0.0, 36.74, 35.37, 35.34, 0.0, 0.0, 0.0, 29.8, 29.9, 0.0, 0.0, 38.23, 0.0, 40.38, 0.0], "audiomae_on_audioset": [[["music", 57.49], ["hum", 8.86], ["mains hum", 7.33]], [["music", 69.99], ["synthesizer", 4.79], ["musical instrument", 4.61]], null, [["speech", 39.56], ["fly, housefly", 8.49], ["didgeridoo", 5.01]], [["didgeridoo", 29.83], ["music", 24.9], ["throbbing", 13.43]], [["music", 36.62], ["throbbing", 24.9], ["synthesizer", 6.93]], null, null, null, [["music", 29.68], ["whack, thwack", 19.23], ["smash, crash", 15.18]], [["speech", 57.73], ["music", 6.98], ["buzz", 4.26]], null, null, [["speech", 27.67], ["music", 12.09], ["animal", 8.88]], null, [["speech", 22.4], ["music", 18.05], ["didgeridoo", 4.71]], null], "duration": [27.21, 4.85, -0.11, 2.77, 10.63, 22.96, 0.14, 0.96, 1.32, 25.65, 5.71, 0.77, 0.29, 5.15, 1.06, 4.47, 0.1]} \ No newline at end of file diff --git a/annotations_filtered/aDUZ8IC6wco_filtered.json b/annotations_filtered/aDUZ8IC6wco_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e3c3f813cb0840e10c85566d79ae243a7d930da --- /dev/null +++ b/annotations_filtered/aDUZ8IC6wco_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 18.44], [20.0, 24.36], [31.0, 33.29], [38.0, 38.03], [42.0, 42.58], [49.0, 49.47], [53.0, 53.35], [54.0, 55.14], [56.0, 57.1], [61.0, 61.15], [63.0, 64.59], [66.0, 66.72], [71.0, 71.79], [77.0, 77.63], [80.0, 80.1], [83.0, 83.81], [85.0, 85.35], [88.0, 89.26], [91.0, 92.8], [93.0, 93.33], [94.0, 94.07], [98.0, 97.9], [103.0, 103.5], [108.0, 108.26], [109.0, 110.02], [118.0, 119.2], [124.0, 124.5], [128.0, 128.48]], "keep_status": [true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.63, 44.9, 48.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 17.6], ["music", 15.78], ["horse", 3.9]], [["music", 39.75], ["didgeridoo", 8.23], ["speech", 7.19]], [["speech", 53.36], ["busy signal", 6.31], ["chirp tone", 3.18]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.44, 4.36, 2.29, 0.03, 0.58, 0.47, 0.35, 1.14, 1.1, 0.15, 1.59, 0.72, 0.79, 0.63, 0.1, 0.81, 0.35, 1.26, 1.8, 0.33, 0.07, -0.1, 0.5, 0.26, 1.02, 1.2, 0.5, 0.48]} \ No newline at end of file diff --git a/annotations_filtered/aDZSH05DM_c_filtered.json b/annotations_filtered/aDZSH05DM_c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..780603d026bbec3e8e096e8d39761063be5e2f1a --- /dev/null +++ b/annotations_filtered/aDZSH05DM_c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.96], [7.0, 8.53], [9.0, 47.53], [48.0, 48.63], [49.0, 50.43], [51.0, 53.11], [54.0, 56.94], [58.0, 76.45], [78.0, 78.04], [78.0, 81.21], [84.0, 85.04], [86.0, 92.87], [93.0, 98.88], [101.0, 101.14], [101.0, 101.87], [102.0, 102.95], [105.0, 105.58], [108.0, 111.06], [113.0, 113.64], [114.0, 115.18], [116.0, 116.83], [118.0, 121.12], [123.0, 123.65], [124.0, 126.06], [127.0, 153.23], [155.0, 160.08], [161.0, 161.81], [164.0, 173.67], [176.0, 175.95]], "keep_status": [false, false, false, false, false, true, false, true, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [83.16, 0.0, 0.0, 0.0, 0.0, 35.94, 34.28, 45.62, 0.0, 38.79, 0.0, 38.78, 34.98, 0.0, 0.0, 0.0, 0.0, 37.61, 0.0, 0.0, 0.0, 39.28, 0.0, 37.89, 34.3, 40.02, 0.0, 29.37, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 44.18], ["rumble", 6.09], ["mains hum", 5.96]], [["music", 54.8], ["electronic music", 13.87], ["ambient music", 5.67]], [["rumble", 19.61], ["music", 19.1], ["hum", 17.1]], null, [["throbbing", 23.92], ["cattle, bovinae", 18.13], ["livestock, farm animals, working animals", 9.88]], null, [["hum", 37.82], ["throbbing", 22.21], ["speech", 14.95]], [["music", 52.72], ["hum", 17.82], ["throbbing", 13.14]], null, null, null, null, [["music", 53.08], ["throbbing", 8.26], ["hum", 7.44]], null, null, null, [["music", 53.16], ["hum", 16.65], ["throbbing", 14.57]], null, [["music", 58.93], ["hum", 12.37], ["throbbing", 10.59]], [["hum", 40.82], ["throbbing", 28.27], ["music", 13.53]], [["music", 26.72], ["sine wave", 20.37], ["sonar", 13.07]], null, [["hum", 43.63], ["throbbing", 24.97], ["mains hum", 19.35]], null], "duration": [2.96, 1.53, 38.53, 0.63, 1.43, 2.11, 2.94, 18.45, 0.04, 3.21, 1.04, 6.87, 5.88, 0.14, 0.87, 0.95, 0.58, 3.06, 0.64, 1.18, 0.83, 3.12, 0.65, 2.06, 26.23, 5.08, 0.81, 9.67, -0.05]} \ No newline at end of file diff --git a/annotations_filtered/aDcfm_9GTyU_filtered.json b/annotations_filtered/aDcfm_9GTyU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..104ecc079ddd3aba39b726305090fe5397b2a161 --- /dev/null +++ b/annotations_filtered/aDcfm_9GTyU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 18.42], [21.0, 24.14], [29.0, 29.69], [30.0, 34.94], [36.0, 37.45], [38.0, 46.87]], "keep_status": [true, false, false, true, false, true], "silence_prob": [42.79, 33.6, 0.0, 33.41, 0.0, 31.73], "audiomae_on_audioset": [[["speech", 24.08], ["music", 12.77], ["wind instrument, woodwind instrument", 5.12]], [["theremin", 50.07], ["music", 33.2], ["musical instrument", 2.4]], null, [["music", 47.94], ["theremin", 7.41], ["trombone", 6.53]], null, [["whack, thwack", 39.31], ["speech", 8.2], ["breaking", 4.87]]], "duration": [2.42, 3.14, 0.69, 4.94, 1.45, 8.87]} \ No newline at end of file diff --git a/annotations_filtered/aDdBoZOylmo_filtered.json b/annotations_filtered/aDdBoZOylmo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f736dfcc8d4bf2d8eef2dc1172f169d506018d54 --- /dev/null +++ b/annotations_filtered/aDdBoZOylmo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 18.44], [19.0, 25.3], [28.0, 29.02], [30.0, 31.4], [33.0, 38.13], [39.0, 47.12], [53.0, 54.03], [55.0, 56.51], [58.0, 60.17], [63.0, 64.23], [68.0, 69.53], [73.0, 75.44], [79.0, 84.28], [86.0, 95.69], [98.0, 107.65], [110.0, 116.48], [119.0, 127.55], [128.0, 127.65], [137.0, 137.62], [143.0, 153.06]], "keep_status": [false, true, false, false, true, true, false, false, true, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [35.51, 37.27, 0.0, 0.0, 33.32, 31.41, 0.0, 0.0, 32.73, 0.0, 0.0, 32.6, 32.22, 29.57, 29.55, 31.62, 29.48, 0.0, 0.0, 29.55], "audiomae_on_audioset": [[["music", 43.94], ["speech", 24.76], ["singing bowl", 8.75]], [["music", 50.38], ["musical instrument", 8.4], ["synthesizer", 6.84]], null, null, [["music", 46.1], ["didgeridoo", 17.28], ["speech", 6.48]], [["music", 53.53], ["theremin", 6.3], ["ambient music", 4.98]], null, null, [["music", 33.89], ["theremin", 7.38], ["cello", 5.66]], null, null, [["music", 30.06], ["theremin", 13.44], ["hum", 10.6]], [["music", 57.39], ["theremin", 12.87], ["synthesizer", 7.46]], [["music", 35.57], ["hum", 20.56], ["mains hum", 15.55]], [["mains hum", 32.33], ["hum", 27.65], ["music", 24.19]], [["music", 66.0], ["ambient music", 6.43], ["theremin", 5.69]], [["music", 57.4], ["theremin", 13.76], ["hum", 5.49]], null, null, [["hum", 37.26], ["mains hum", 35.67], ["music", 12.19]]], "duration": [3.44, 6.3, 1.02, 1.4, 5.13, 8.12, 1.03, 1.51, 2.17, 1.23, 1.53, 2.44, 5.28, 9.69, 9.65, 6.48, 8.55, -0.35, 0.62, 10.06]} \ No newline at end of file diff --git a/annotations_filtered/aDm4L7gjYNs_filtered.json b/annotations_filtered/aDm4L7gjYNs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b8453fe68335368be921cc89c98015b11317950a --- /dev/null +++ b/annotations_filtered/aDm4L7gjYNs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.05], [8.0, 9.44], [18.0, 19.03], [23.0, 24.73], [34.0, 34.69], [36.0, 39.18], [40.0, 41.74], [42.0, 51.09], [52.0, 53.99], [55.0, 58.89], [60.0, 60.86], [62.0, 80.1], [82.0, 84.92], [87.0, 87.39], [87.0, 89.61], [90.0, 93.12], [99.0, 101.11], [113.0, 133.74], [135.0, 135.4], [136.0, 136.16], [137.0, 138.32], [139.0, 139.75], [145.0, 145.83], [148.0, 148.85], [155.0, 162.28], [165.0, 169.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [74.44, 0.0, 0.0, 0.0, 0.0, 58.98, 0.0, 37.07, 0.0, 63.1, 0.0, 30.72, 32.0, 0.0, 32.29, 35.55, 45.49, 31.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.45, 35.91], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 69.66], ["synthesizer", 5.77], ["didgeridoo", 5.6]], null, null, null, [["music", 34.91], ["hum", 28.75], ["mains hum", 13.56]], [["music", 66.55], ["electronic music", 8.37], ["synthesizer", 7.45]], null, [["music", 38.87], ["didgeridoo", 33.23], ["theremin", 5.4]], [["music", 49.56], ["didgeridoo", 17.59], ["musical instrument", 12.98]], [["music", 64.86], ["didgeridoo", 12.19], ["musical instrument", 7.95]], [["music", 79.81], ["musical instrument", 3.1], ["synthesizer", 1.74]], null, null, null, null, null, null, [["music", 51.95], ["theremin", 15.73], ["musical instrument", 4.92]], [["music", 46.07], ["speech", 27.76], ["quack", 5.04]]], "duration": [3.05, 1.44, 1.03, 1.73, 0.69, 3.18, 1.74, 9.09, 1.99, 3.89, 0.86, 18.1, 2.92, 0.39, 2.61, 3.12, 2.11, 20.74, 0.4, 0.16, 1.32, 0.75, 0.83, 0.85, 7.28, 4.21]} \ No newline at end of file diff --git a/annotations_filtered/aDq_JsN2Y6c_filtered.json b/annotations_filtered/aDq_JsN2Y6c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c743836398ce014ec5947ab899f8d039869fa15 --- /dev/null +++ b/annotations_filtered/aDq_JsN2Y6c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.78], [10.0, 10.23], [13.0, 12.85], [13.0, 14.08], [14.0, 15.28], [17.0, 17.95], [21.0, 21.39], [25.0, 26.11], [27.0, 28.49], [33.0, 34.97], [37.0, 36.91], [38.0, 38.89], [42.0, 43.78], [48.0, 54.45], [56.0, 61.4], [64.0, 65.38], [66.0, 67.46], [70.0, 69.94], [71.0, 78.31], [80.0, 80.97], [81.0, 85.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.98, 58.89, 0.0, 0.0, 0.0, 58.05, 0.0, 47.62], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 39.55], ["speech", 20.71], ["sidetone", 12.46]], null, null, null, null, null, null, [["speech", 46.79], ["music", 14.78], ["hum", 4.11]]], "duration": [0.78, 0.23, -0.15, 1.08, 1.28, 0.95, 0.39, 1.11, 1.49, 1.97, -0.09, 0.89, 1.78, 6.45, 5.4, 1.38, 1.46, -0.06, 7.31, 0.97, 4.41]} \ No newline at end of file diff --git a/annotations_filtered/aDrR7riBeLA_filtered.json b/annotations_filtered/aDrR7riBeLA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c66c1cb5bbbbcd4e9283df0b8dcdcf389451b84 --- /dev/null +++ b/annotations_filtered/aDrR7riBeLA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 26.11], [28.0, 51.44], [52.0, 54.26], [55.0, 57.59], [60.0, 59.91], [62.0, 64.29], [65.0, 67.42], [68.0, 78.85], [80.0, 84.4], [85.0, 87.37], [88.0, 90.27], [91.0, 91.86], [92.0, 94.05], [95.0, 99.23], [100.0, 101.43], [102.0, 106.91], [107.0, 111.35], [112.0, 112.11], [112.0, 113.58], [116.0, 118.42], [119.0, 125.85], [126.0, 128.83], [129.0, 131.18], [131.0, 133.83], [136.0, 138.86], [139.0, 140.59], [141.0, 141.44], [143.0, 143.29], [144.0, 148.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.99, 100.0, 99.95, 100.0, 0.0, 99.92, 98.27, 100.0, 100.0, 99.99, 100.0, 0.0, 97.92, 100.0, 0.0, 100.0, 98.1, 0.0, 0.0, 100.0, 100.0, 67.0, 99.88, 100.0, 100.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.11, 23.44, 2.26, 2.59, -0.09, 2.29, 2.42, 10.85, 4.4, 2.37, 2.27, 0.86, 2.05, 4.23, 1.43, 4.91, 4.35, 0.11, 1.58, 2.42, 6.85, 2.83, 2.18, 2.83, 2.86, 1.59, 0.44, 0.29, 4.2]} \ No newline at end of file diff --git a/annotations_filtered/aDvjCbdyEHw_filtered.json b/annotations_filtered/aDvjCbdyEHw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca2b909f8972676f7e158ba126b75bd240fcb33d --- /dev/null +++ b/annotations_filtered/aDvjCbdyEHw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.28], [14.0, 14.55], [15.0, 16.29], [19.0, 19.06], [20.0, 21.52], [23.0, 22.91], [24.0, 24.21], [30.0, 30.2], [66.0, 66.46], [72.0, 72.84], [96.0, 96.43], [102.0, 101.97], [105.0, 106.08], [119.0, 118.77], [137.0, 143.67], [146.0, 149.99], [151.0, 159.16], [164.0, 171.34], [174.0, 179.04], [179.0, 181.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.56, 33.19, 30.37, 30.23, 30.29, 32.62], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 69.65], ["sidetone", 5.69], ["synthesizer", 4.67]], [["music", 86.91], ["drum machine", 3.28], ["sampler", 2.11]], [["music", 79.89], ["fly, housefly", 4.88], ["insect", 1.52]], [["music", 85.53], ["electronic music", 3.55], ["throbbing", 2.7]], [["music", 78.23], ["electronic music", 5.27], ["drum machine", 3.9]], [["music", 61.26], ["boing", 5.14], ["electronic music", 4.95]]], "duration": [0.28, 0.55, 1.29, 0.06, 1.52, -0.09, 0.21, 0.2, 0.46, 0.84, 0.43, -0.03, 1.08, -0.23, 6.67, 3.99, 8.16, 7.34, 5.04, 2.18]} \ No newline at end of file diff --git a/annotations_filtered/aE4h5rX9u3U_filtered.json b/annotations_filtered/aE4h5rX9u3U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..444eb48f93540ca4a435a2a63c050196fb5aee2b --- /dev/null +++ b/annotations_filtered/aE4h5rX9u3U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 15.23], [16.0, 38.77], [39.0, 114.89], [115.0, 115.5]], "keep_status": [false, true, false, false], "silence_prob": [49.22, 30.27, 0.0, 0.0], "audiomae_on_audioset": [[["music", 70.91], ["musical instrument", 6.42], ["synthesizer", 4.28]], [["music", 15.39], ["speech", 14.71], ["explosion", 9.43]], null, null], "duration": [14.23, 22.77, 75.89, 0.5]} \ No newline at end of file diff --git a/annotations_filtered/aEBLrCGhTVM_filtered.json b/annotations_filtered/aEBLrCGhTVM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2428d68ae0073c07c879a3b1c4fb04a880ece7ce --- /dev/null +++ b/annotations_filtered/aEBLrCGhTVM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.84], [3.0, 2.89], [3.0, 3.5], [4.0, 6.99], [13.0, 13.29], [19.0, 29.05], [30.0, 30.79], [37.0, 44.88], [50.0, 59.58], [80.0, 83.84], [85.0, 88.57], [89.0, 100.82], [102.0, 104.3], [108.0, 108.38], [109.0, 109.63], [111.0, 120.34], [122.0, 122.76]], "keep_status": [false, false, false, false, false, false, false, true, false, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 33.15, 0.0, 33.38, 0.0, 33.83, 34.01, 34.1, 31.87, 34.39, 58.81, 0.0, 0.0, 35.23, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 76.89], ["music", 5.91], ["sidetone", 3.09]], null, [["speech", 58.21], ["whack, thwack", 10.71], ["groan", 4.74]], null, [["speech", 40.48], ["whack, thwack", 10.63], ["fart", 10.4]], [["speech", 53.44], ["grunt", 17.75], ["groan", 9.68]], [["speech", 56.76], ["fart", 10.57], ["sidetone", 8.78]], [["moo", 21.73], ["speech", 20.7], ["cattle, bovinae", 18.56]], [["speech", 29.65], ["cattle, bovinae", 11.32], ["livestock, farm animals, working animals", 10.9]], null, null, null, [["speech", 49.37], ["fart", 18.33], ["groan", 2.36]], null], "duration": [-0.16, -0.11, 0.5, 2.99, 0.29, 10.05, 0.79, 7.88, 9.58, 3.84, 3.57, 11.82, 2.3, 0.38, 0.63, 9.34, 0.76]} \ No newline at end of file diff --git a/annotations_filtered/aEG9dwOsAAg_filtered.json b/annotations_filtered/aEG9dwOsAAg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e22013af76387e1d9070c3831049d492d8820cfa --- /dev/null +++ b/annotations_filtered/aEG9dwOsAAg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.38], [9.0, 10.54], [12.0, 12.97], [14.0, 14.74], [16.0, 17.51], [25.0, 26.15], [28.0, 30.33], [37.0, 39.85], [47.0, 47.63], [50.0, 50.53], [64.0, 63.86], [98.0, 103.17], [104.0, 109.86], [116.0, 115.96], [118.0, 118.62], [119.0, 120.04], [121.0, 128.46], [129.0, 129.12], [130.0, 130.0], [132.0, 134.74], [135.0, 135.97], [137.0, 139.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, true, false, false], "silence_prob": [100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 92.64, 0.0, 0.0, 0.0, 32.68, 29.69, 0.0, 0.0, 0.0, 32.46, 0.0, 0.0, 43.1, 0.0, 59.77], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 40.91], ["speech", 24.01], ["sidetone", 15.84]], [["music", 41.37], ["speech", 13.66], ["explosion", 7.83]], null, null, null, [["speech", 34.54], ["music", 19.07], ["sidetone", 11.57]], null, null, [["speech", 23.07], ["music", 15.53], ["sidetone", 8.72]], null, null], "duration": [2.38, 1.54, 0.97, 0.74, 1.51, 1.15, 2.33, 2.85, 0.63, 0.53, -0.14, 5.17, 5.86, -0.04, 0.62, 1.04, 7.46, 0.12, 0.0, 2.74, 0.97, 2.45]} \ No newline at end of file diff --git a/annotations_filtered/aEIaR1nlEoo_filtered.json b/annotations_filtered/aEIaR1nlEoo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fbbbfd3e2bc2df5fd4e3766fdb5bd1901d59c2c7 --- /dev/null +++ b/annotations_filtered/aEIaR1nlEoo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.45], [15.0, 20.09], [25.0, 25.76], [28.0, 31.29], [33.0, 33.86], [41.0, 42.74], [44.0, 45.13], [45.0, 45.87], [48.0, 48.03], [49.0, 49.92], [51.0, 59.83], [63.0, 64.35], [69.0, 69.13], [72.0, 72.57], [77.0, 77.67]], "keep_status": [false, true, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 32.49, 0.0, 58.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.16, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 25.18], ["mains hum", 17.45], ["car", 8.78]], null, null, null, null, null, null, null, null, [["speech", 27.75], ["hum", 14.53], ["mains hum", 5.45]], null, null, null, null], "duration": [1.45, 5.09, 0.76, 3.29, 0.86, 1.74, 1.13, 0.87, 0.03, 0.92, 8.83, 1.35, 0.13, 0.57, 0.67]} \ No newline at end of file diff --git a/annotations_filtered/aESwFtEWnpM_filtered.json b/annotations_filtered/aESwFtEWnpM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a7a980c23e5fde37f7f30d957648c6f461f51f67 --- /dev/null +++ b/annotations_filtered/aESwFtEWnpM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 19.53], [24.0, 24.07], [26.0, 45.64], [48.0, 69.47], [70.0, 72.28], [78.0, 78.14], [83.0, 83.86], [91.0, 92.82], [96.0, 96.08], [104.0, 104.21]], "keep_status": [true, false, false, true, true, false, false, false, false, false], "silence_prob": [32.32, 0.0, 32.57, 34.58, 49.59, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 44.35], ["mosquito", 13.43], ["synthesizer", 5.68]], null, [["music", 50.74], ["drum machine", 13.07], ["speech", 7.43]], [["music", 41.45], ["drum machine", 7.03], ["didgeridoo", 6.41]], [["music", 38.12], ["speech", 16.89], ["drum machine", 5.87]], null, null, null, null, null], "duration": [2.53, 0.07, 19.64, 21.47, 2.28, 0.14, 0.86, 1.82, 0.08, 0.21]} \ No newline at end of file diff --git a/annotations_filtered/aEfAFo99jEs_filtered.json b/annotations_filtered/aEfAFo99jEs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a316b2d9bb4c6a0819ec5ba828b6e61621d2350 --- /dev/null +++ b/annotations_filtered/aEfAFo99jEs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.31], [7.0, 12.16], [13.0, 21.78], [23.0, 25.25], [26.0, 34.35], [36.0, 56.81], [58.0, 65.64], [67.0, 70.77], [72.0, 73.45], [75.0, 78.46], [81.0, 94.22], [96.0, 97.56], [104.0, 104.63], [105.0, 106.66], [108.0, 110.13], [114.0, 120.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 94.95, 61.97, 90.43, 61.97, 84.62, 90.43, 95.64, 0.0, 81.89, 79.59, 0.0, 0.0, 0.0, 97.43, 87.55], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.31, 5.16, 8.78, 2.25, 8.35, 20.81, 7.64, 3.77, 1.45, 3.46, 13.22, 1.56, 0.63, 1.66, 2.13, 6.72]} \ No newline at end of file diff --git a/annotations_filtered/aEpa21af2j4_filtered.json b/annotations_filtered/aEpa21af2j4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..12cda741f82d47101887083bc3da6519725a81d5 --- /dev/null +++ b/annotations_filtered/aEpa21af2j4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.61], [7.0, 8.19], [9.0, 9.81], [14.0, 14.5], [15.0, 15.57], [16.0, 17.47], [18.0, 18.74], [30.0, 30.69], [32.0, 37.56], [39.0, 40.14], [41.0, 48.74], [52.0, 65.53], [67.0, 97.6], [98.0, 126.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.08, 0.0, 99.99, 36.72, 0.0, 33.85], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["animal", 27.48], ["fart", 6.59], ["livestock, farm animals, working animals", 4.11]], null, [["music", 39.28], ["didgeridoo", 20.03], ["livestock, farm animals, working animals", 4.21]]], "duration": [0.61, 1.19, 0.81, 0.5, 0.57, 1.47, 0.74, 0.69, 5.56, 1.14, 7.74, 13.53, 30.6, 28.45]} \ No newline at end of file diff --git a/annotations_filtered/aErChTKF6u4_filtered.json b/annotations_filtered/aErChTKF6u4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..daee08e7782594d4c02188a7e59ea04f6900662e --- /dev/null +++ b/annotations_filtered/aErChTKF6u4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.75], [5.0, 15.65], [16.0, 27.13], [30.0, 31.83], [33.0, 33.62], [35.0, 41.01], [42.0, 47.29], [49.0, 50.58], [51.0, 52.98], [55.0, 60.18], [62.0, 63.31], [64.0, 65.4], [67.0, 68.18], [69.0, 69.67], [71.0, 71.15], [73.0, 77.89], [78.0, 80.0], [80.0, 82.36], [83.0, 90.27], [92.0, 92.84], [95.0, 99.4], [100.0, 102.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 99.91, 0.0, 0.0, 74.6, 100.0, 0.0, 0.0, 99.85, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 99.96, 100.0, 0.0, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.75, 10.65, 11.13, 1.83, 0.62, 6.01, 5.29, 1.58, 1.98, 5.18, 1.31, 1.4, 1.18, 0.67, 0.15, 4.89, 2.0, 2.36, 7.27, 0.84, 4.4, 2.05]} \ No newline at end of file diff --git a/annotations_filtered/aF3BXL1cQYY_filtered.json b/annotations_filtered/aF3BXL1cQYY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eddca3b2d2a140372052417b6f49e7e6faa61e60 --- /dev/null +++ b/annotations_filtered/aF3BXL1cQYY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.61], [20.0, 45.91], [46.0, 96.85], [98.0, 117.71], [122.0, 123.01], [127.0, 127.85], [131.0, 131.73]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 30.06, 0.0, 30.11, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 77.9], ["didgeridoo", 5.02], ["musical instrument", 3.07]], null, [["music", 65.31], ["didgeridoo", 14.11], ["speech", 4.53]], null, null, null], "duration": [0.61, 25.91, 50.85, 19.71, 1.01, 0.85, 0.73]} \ No newline at end of file diff --git a/annotations_filtered/aF3x3Bad2Wk_filtered.json b/annotations_filtered/aF3x3Bad2Wk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..641483683858e8a1c2a3601d3b3f9bdc8412271f --- /dev/null +++ b/annotations_filtered/aF3x3Bad2Wk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.99], [9.0, 9.27], [10.0, 10.56], [11.0, 15.84], [28.0, 28.8], [31.0, 32.93], [33.0, 34.18], [35.0, 37.88], [38.0, 38.33], [38.0, 43.21], [43.0, 53.96], [61.0, 66.82], [72.0, 72.87], [74.0, 76.65], [78.0, 80.57], [82.0, 84.3], [85.0, 89.06], [90.0, 93.88], [96.0, 96.16], [97.0, 103.1], [104.0, 108.67], [109.0, 109.75], [112.0, 112.62], [113.0, 114.12], [119.0, 119.33], [121.0, 121.49], [131.0, 140.58], [146.0, 147.56], [149.0, 150.28], [156.0, 156.91], [158.0, 163.22], [165.0, 165.52], [168.0, 168.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 61.18, 0.0, 0.0, 0.0, 38.86, 0.0, 39.96, 48.35, 31.48, 0.0, 76.37, 94.22, 62.99, 57.81, 50.81, 0.0, 48.48, 48.35, 0.0, 0.0, 0.0, 0.0, 0.0, 35.39, 0.0, 0.0, 0.0, 35.25, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 35.31], ["speech", 31.5], ["guitar", 6.09]], null, [["music", 61.73], ["speech", 19.93], ["echo", 3.23]], [["speech", 85.93], ["fart", 3.88], ["sidetone", 0.82]], [["speech", 37.56], ["fart", 11.11], ["music", 5.12]], null, null, null, null, null, null, null, [["music", 63.18], ["throbbing", 12.21], ["synthesizer", 3.66]], [["music", 43.6], ["speech", 10.11], ["throbbing", 6.67]], null, null, null, null, null, [["music", 59.81], ["speech", 14.16], ["didgeridoo", 5.66]], null, null, null, [["music", 29.35], ["musical instrument", 12.54], ["brass instrument", 9.64]], null, null], "duration": [0.99, 0.27, 0.56, 4.84, 0.8, 1.93, 1.18, 2.88, 0.33, 5.21, 10.96, 5.82, 0.87, 2.65, 2.57, 2.3, 4.06, 3.88, 0.16, 6.1, 4.67, 0.75, 0.62, 1.12, 0.33, 0.49, 9.58, 1.56, 1.28, 0.91, 5.22, 0.52, 0.1]} \ No newline at end of file diff --git a/annotations_filtered/aF4En8CIaNk_filtered.json b/annotations_filtered/aF4En8CIaNk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56b03913990d8df74a51e9de3db4d1e35db1b49a --- /dev/null +++ b/annotations_filtered/aF4En8CIaNk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.63], [24.0, 24.04], [26.0, 26.27], [30.0, 32.02]], "keep_status": [false, false, false, false], "silence_prob": [29.78, 0.0, 0.0, 30.62], "audiomae_on_audioset": [[["music", 49.38], ["throbbing", 15.8], ["hum", 5.3]], null, null, [["music", 65.96], ["throbbing", 2.3], ["musical instrument", 2.15]]], "duration": [3.63, 0.04, 0.27, 2.02]} \ No newline at end of file diff --git a/annotations_filtered/aFDFSGAIrxs_filtered.json b/annotations_filtered/aFDFSGAIrxs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8d7a91a8c34fcafe638a3c7a4e38b4100c3eaebd --- /dev/null +++ b/annotations_filtered/aFDFSGAIrxs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[70.0, 70.48], [72.0, 72.0], [73.0, 73.57], [75.0, 75.59], [77.0, 77.23], [79.0, 82.44], [84.0, 84.25], [85.0, 85.85], [87.0, 87.62], [89.0, 89.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 57.17, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.48, 0.0, 0.57, 0.59, 0.23, 3.44, 0.25, 0.85, 0.62, 0.43]} \ No newline at end of file diff --git a/annotations_filtered/aF_Ijr621tM_filtered.json b/annotations_filtered/aF_Ijr621tM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..579732b86c66ecd11643c98cd09a33697b199543 --- /dev/null +++ b/annotations_filtered/aF_Ijr621tM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.64], [14.0, 14.45], [19.0, 19.7], [21.0, 22.32], [25.0, 24.81], [25.0, 25.03], [30.0, 30.37], [32.0, 37.02], [38.0, 41.77], [43.0, 44.05], [45.0, 46.31], [47.0, 48.17], [52.0, 52.35], [56.0, 57.67], [59.0, 60.22], [61.0, 68.1], [69.0, 70.19], [72.0, 73.16], [76.0, 76.77], [78.0, 78.36], [80.0, 81.3], [82.0, 84.25], [87.0, 87.81], [89.0, 91.29], [92.0, 95.34], [98.0, 120.34], [123.0, 123.89], [125.0, 125.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.9, 37.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.29, 0.0, 0.0, 0.0, 0.0, 0.0, 60.7, 0.0, 35.98, 64.29, 31.72, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 29.5], ["mains hum", 25.26], ["hum", 18.85]], [["music", 54.32], ["scary music", 27.72], ["foghorn", 3.81]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 61.24], ["groan", 9.48], ["sound effect", 3.74]], null, [["throbbing", 35.48], ["hum", 26.41], ["music", 21.04]], null, null], "duration": [0.64, 0.45, 0.7, 1.32, -0.19, 0.03, 0.37, 5.02, 3.77, 1.05, 1.31, 1.17, 0.35, 1.67, 1.22, 7.1, 1.19, 1.16, 0.77, 0.36, 1.3, 2.25, 0.81, 2.29, 3.34, 22.34, 0.89, 0.46]} \ No newline at end of file diff --git a/annotations_filtered/aFnS18LM8Ws_filtered.json b/annotations_filtered/aFnS18LM8Ws_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8496630361b1e4f799153d6acb135bc6d489cc90 --- /dev/null +++ b/annotations_filtered/aFnS18LM8Ws_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 35.19], [37.0, 46.28], [46.0, 50.41], [53.0, 53.87], [57.0, 59.04], [61.0, 61.77], [63.0, 64.84], [73.0, 75.05], [76.0, 147.48], [149.0, 151.63], [159.0, 160.1], [161.0, 161.82], [162.0, 173.1], [176.0, 175.98], [177.0, 177.74], [178.0, 184.57]], "keep_status": [true, true, true, false, true, false, false, true, false, false, false, false, true, false, false, true], "silence_prob": [34.65, 30.72, 33.69, 0.0, 36.22, 0.0, 0.0, 29.15, 0.0, 30.0, 0.0, 0.0, 29.67, 0.0, 0.0, 31.5], "audiomae_on_audioset": [[["speech", 24.97], ["music", 24.48], ["fart", 8.96]], [["speech", 35.3], ["music", 16.81], ["buzz", 8.21]], [["speech", 49.76], ["music", 12.95], ["whale vocalization", 6.78]], null, [["music", 36.95], ["hum", 7.79], ["throbbing", 4.71]], null, null, [["zipper (clothing)", 14.07], ["smash, crash", 11.9], ["whack, thwack", 11.68]], null, [["cattle, bovinae", 45.47], ["livestock, farm animals, working animals", 29.54], ["moo", 24.19]], null, null, [["speech", 19.61], ["music", 11.99], ["sidetone", 7.4]], null, null, [["music", 30.93], ["buzz", 11.51], ["didgeridoo", 8.24]]], "duration": [3.19, 9.28, 4.41, 0.87, 2.04, 0.77, 1.84, 2.05, 71.48, 2.63, 1.1, 0.82, 11.1, -0.02, 0.74, 6.57]} \ No newline at end of file diff --git a/annotations_filtered/aFqlaPLvkw8_filtered.json b/annotations_filtered/aFqlaPLvkw8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d13dd236a5cf6a52ee59ea7d123ac3b8bbee1550 --- /dev/null +++ b/annotations_filtered/aFqlaPLvkw8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.93], [11.0, 18.77], [20.0, 20.55], [22.0, 22.71], [27.0, 34.1], [35.0, 38.38], [39.0, 41.13], [42.0, 42.8], [43.0, 44.56], [45.0, 47.21], [48.0, 49.15], [50.0, 50.35], [51.0, 51.97], [53.0, 53.06], [54.0, 54.53], [55.0, 56.46], [59.0, 76.05], [79.0, 85.9], [87.0, 87.52], [90.0, 96.15], [99.0, 100.47], [102.0, 102.56], [103.0, 103.52], [104.0, 106.02], [106.0, 106.59], [115.0, 118.39], [120.0, 130.82], [138.0, 138.99], [140.0, 140.64], [142.0, 143.18], [145.0, 145.64], [147.0, 147.8], [153.0, 154.03], [157.0, 157.57], [159.0, 159.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 98.99, 0.0, 0.0, 99.99, 100.0, 100.0, 0.0, 0.0, 99.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.98, 59.15, 0.0, 82.97, 0.0, 0.0, 0.0, 71.87, 0.0, 42.24, 29.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 24.63], ["insect", 15.83], ["bee, wasp, etc.", 10.81]], null, null, null, null, null, null, null, null, [["music", 40.2], ["speech", 8.15], ["theremin", 6.74]], [["music", 36.01], ["speech", 16.26], ["foghorn", 5.11]], null, null, null, null, null, null, null, null], "duration": [0.93, 7.77, 0.55, 0.71, 7.1, 3.38, 2.13, 0.8, 1.56, 2.21, 1.15, 0.35, 0.97, 0.06, 0.53, 1.46, 17.05, 6.9, 0.52, 6.15, 1.47, 0.56, 0.52, 2.02, 0.59, 3.39, 10.82, 0.99, 0.64, 1.18, 0.64, 0.8, 1.03, 0.57, 0.54]} \ No newline at end of file diff --git a/annotations_filtered/aG3Oc5TNd-Y_filtered.json b/annotations_filtered/aG3Oc5TNd-Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..329bf8b8e7a5cca918ce33ad353861dc899883c7 --- /dev/null +++ b/annotations_filtered/aG3Oc5TNd-Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.17], [2.0, 2.24], [2.0, 2.27], [2.0, 10.47], [17.0, 29.66], [33.0, 36.32], [46.0, 47.55], [51.0, 51.14], [52.0, 58.45], [77.0, 77.79], [79.0, 93.46], [95.0, 96.47], [96.0, 96.5], [98.0, 97.88], [98.0, 107.03], [112.0, 112.35], [113.0, 113.1], [114.0, 113.75], [115.0, 140.44]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 28.29, 29.49, 45.08, 0.0, 0.0, 30.3, 0.0, 59.07, 0.0, 0.0, 0.0, 29.26, 0.0, 0.0, 0.0, 36.11], "audiomae_on_audioset": [null, null, null, [["music", 60.43], ["musical instrument", 11.1], ["didgeridoo", 5.28]], [["music", 80.59], ["synthetic singing", 2.78], ["singing", 2.19]], [["boing", 56.1], ["echo", 14.74], ["synthesizer", 5.32]], null, null, [["music", 28.3], ["crowd", 17.34], ["speech", 14.99]], null, null, null, null, null, [["cattle, bovinae", 41.66], ["moo", 27.56], ["livestock, farm animals, working animals", 19.74]], null, null, null, [["music", 26.17], ["speech", 19.46], ["hum", 7.26]]], "duration": [0.17, 0.24, 0.27, 8.47, 12.66, 3.32, 1.55, 0.14, 6.45, 0.79, 14.46, 1.47, 0.5, -0.12, 9.03, 0.35, 0.1, -0.25, 25.44]} \ No newline at end of file diff --git a/annotations_filtered/aG55Y-zpxyo_filtered.json b/annotations_filtered/aG55Y-zpxyo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..76805fd821ceb5b92f4beb22cbcd5f7e69a30706 --- /dev/null +++ b/annotations_filtered/aG55Y-zpxyo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.25], [14.0, 20.31], [22.0, 22.52], [23.0, 27.01], [27.0, 29.12], [29.0, 30.06], [47.0, 47.87], [56.0, 56.54], [60.0, 60.39], [74.0, 87.03], [88.0, 92.48], [93.0, 93.65], [98.0, 99.18], [100.0, 101.66]], "keep_status": [false, false, false, false, true, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 33.71, 0.0, 34.14, 33.98, 0.0, 0.0, 0.0, 0.0, 30.77, 30.54, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 69.98], ["musical instrument", 5.29], ["speech", 2.84]], null, [["music", 61.67], ["speech", 15.76], ["musical instrument", 5.36]], [["music", 27.79], ["speech", 16.95], ["musical instrument", 4.81]], null, null, null, null, [["music", 69.75], ["musical instrument", 5.34], ["guitar", 4.33]], [["music", 53.27], ["musical instrument", 10.46], ["guitar", 6.02]], null, null, null], "duration": [1.25, 6.31, 0.52, 4.01, 2.12, 1.06, 0.87, 0.54, 0.39, 13.03, 4.48, 0.65, 1.18, 1.66]} \ No newline at end of file diff --git a/annotations_filtered/aG8bSNpEGoE_filtered.json b/annotations_filtered/aG8bSNpEGoE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..83f9b1d1f536e697fb607771ae60ba79a0167414 --- /dev/null +++ b/annotations_filtered/aG8bSNpEGoE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.69], [19.0, 19.03], [25.0, 25.83], [31.0, 34.08], [56.0, 56.93], [73.0, 77.99], [80.0, 80.5], [83.0, 86.14], [95.0, 95.69], [101.0, 104.57], [110.0, 111.57], [115.0, 115.2], [126.0, 126.49], [140.0, 147.19]], "keep_status": [false, false, false, true, false, false, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 34.9, 0.0, 32.6, 0.0, 35.25, 0.0, 32.96, 0.0, 0.0, 0.0, 30.95], "audiomae_on_audioset": [null, null, null, [["music", 61.27], ["musical instrument", 4.43], ["synthesizer", 3.63]], null, [["music", 66.0], ["boing", 3.39], ["musical instrument", 1.79]], null, [["music", 52.05], ["hum", 5.92], ["throbbing", 3.96]], null, [["music", 56.88], ["singing", 6.96], ["bass guitar", 2.67]], null, null, null, [["music", 77.17], ["musical instrument", 5.31], ["guitar", 2.64]]], "duration": [1.69, 0.03, 0.83, 3.08, 0.93, 4.99, 0.5, 3.14, 0.69, 3.57, 1.57, 0.2, 0.49, 7.19]} \ No newline at end of file diff --git a/annotations_filtered/aGAInDBQOoE_filtered.json b/annotations_filtered/aGAInDBQOoE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9eb471c37224d89aa2f27ed0a908b02b5e9d21f6 --- /dev/null +++ b/annotations_filtered/aGAInDBQOoE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.11], [3.0, 6.1], [7.0, 12.48], [13.0, 14.98], [17.0, 18.74], [20.0, 27.4], [28.0, 30.33], [33.0, 34.01], [37.0, 39.26], [44.0, 45.57], [50.0, 53.49], [54.0, 57.11], [59.0, 61.94], [64.0, 72.17], [75.0, 81.6], [83.0, 85.92], [88.0, 98.76], [101.0, 104.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 65.67, 53.34, 0.0, 0.0, 78.72, 64.75, 0.0, 85.35, 0.0, 73.82, 70.02, 56.33, 88.46, 86.27, 60.89, 35.55, 33.86], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 70.78], ["theremin", 6.66], ["ambient music", 6.19]], [["music", 58.33], ["theremin", 13.28], ["ambient music", 3.09]]], "duration": [0.11, 3.1, 5.48, 1.98, 1.74, 7.4, 2.33, 1.01, 2.26, 1.57, 3.49, 3.11, 2.94, 8.17, 6.6, 2.92, 10.76, 3.58]} \ No newline at end of file diff --git a/annotations_filtered/aGMiaQISzq0_filtered.json b/annotations_filtered/aGMiaQISzq0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..79c722ce40a0ca0f2a3cc037cbf220d2d82fa889 --- /dev/null +++ b/annotations_filtered/aGMiaQISzq0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.97], [10.0, 10.98], [11.0, 40.07], [41.0, 42.23], [43.0, 44.22], [45.0, 47.33], [49.0, 50.65], [52.0, 52.79], [55.0, 56.78], [58.0, 59.04]], "keep_status": [false, false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 28.19, 0.0, 0.0, 47.05, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["sidetone", 17.37], ["hum", 16.04], ["speech", 14.25]], null, null, [["music", 22.64], ["speech", 14.81], ["foghorn", 13.32]], null, null, null, null], "duration": [0.97, 0.98, 29.07, 1.23, 1.22, 2.33, 1.65, 0.79, 1.78, 1.04]} \ No newline at end of file diff --git a/annotations_filtered/aGcvpWAhP6I_filtered.json b/annotations_filtered/aGcvpWAhP6I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e4c51996ce3440401ae509f192601f85b98931b2 --- /dev/null +++ b/annotations_filtered/aGcvpWAhP6I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.1], [5.0, 6.88], [8.0, 9.12], [10.0, 10.0], [13.0, 13.36], [17.0, 17.17], [34.0, 34.59], [36.0, 36.36], [37.0, 37.52], [38.0, 38.38], [44.0, 45.37], [47.0, 47.34], [49.0, 51.07], [52.0, 53.33], [54.0, 54.48], [55.0, 56.0], [59.0, 59.73], [70.0, 70.63], [79.0, 79.39], [85.0, 85.51], [93.0, 93.39], [123.0, 122.93], [126.0, 127.36], [135.0, 135.65], [156.0, 155.82], [157.0, 160.93], [162.0, 162.45], [165.0, 165.13], [165.0, 166.31], [167.0, 168.12], [175.0, 175.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.84, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 71.3], ["hum", 5.15], ["throbbing", 2.84]], null, null, null, null, null], "duration": [1.1, 1.88, 1.12, 0.0, 0.36, 0.17, 0.59, 0.36, 0.52, 0.38, 1.37, 0.34, 2.07, 1.33, 0.48, 1.0, 0.73, 0.63, 0.39, 0.51, 0.39, -0.07, 1.36, 0.65, -0.18, 3.93, 0.45, 0.13, 1.31, 1.12, 0.04]} \ No newline at end of file diff --git a/annotations_filtered/aHI-JX6Q3Xk_filtered.json b/annotations_filtered/aHI-JX6Q3Xk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/aHI-JX6Q3Xk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/aHJKwOGb7MI_filtered.json b/annotations_filtered/aHJKwOGb7MI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fbd462dc6d1809fe5f5bd5f603c3c05dc240f051 --- /dev/null +++ b/annotations_filtered/aHJKwOGb7MI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.94], [5.0, 45.66], [49.0, 48.81], [50.0, 76.99], [79.0, 80.27], [81.0, 81.75], [83.0, 84.55], [85.0, 87.2], [89.0, 90.51], [94.0, 95.12], [97.0, 98.0], [99.0, 99.54], [100.0, 101.12], [102.0, 104.13], [105.0, 105.9], [108.0, 112.29], [114.0, 114.37], [116.0, 116.41]], "keep_status": [false, false, false, true, false, false, false, true, false, false, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 39.25, 0.0, 0.0, 0.0, 36.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.59, 0.0, 34.93, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["white noise", 15.06], ["radio", 13.12], ["mains hum", 11.33]], null, null, null, [["sidetone", 31.59], ["radio", 20.95], ["speech", 15.44]], null, null, null, null, null, [["noise", 29.97], ["white noise", 11.85], ["hum", 9.04]], null, [["sidetone", 27.62], ["radio", 24.33], ["white noise", 11.56]], null, null], "duration": [0.94, 40.66, -0.19, 26.99, 1.27, 0.75, 1.55, 2.2, 1.51, 1.12, 1.0, 0.54, 1.12, 2.13, 0.9, 4.29, 0.37, 0.41]} \ No newline at end of file diff --git a/annotations_filtered/aHM8kYwl1R4_filtered.json b/annotations_filtered/aHM8kYwl1R4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..676b4669cb4d23337fcfea019abf76d1400a457e --- /dev/null +++ b/annotations_filtered/aHM8kYwl1R4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.63], [7.0, 8.02], [9.0, 12.18], [13.0, 18.64], [21.0, 23.26], [24.0, 24.61], [25.0, 24.98], [27.0, 28.0], [31.0, 34.38], [36.0, 36.54], [37.0, 39.51], [40.0, 39.55], [40.0, 39.6], [40.0, 39.65], [40.0, 39.72], [40.0, 39.78], [41.0, 44.73], [45.0, 45.62], [46.0, 48.93], [51.0, 50.97]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 33.89, 62.58, 56.63, 0.0, 0.0, 0.0, 44.93, 0.0, 39.89, 0.0, 0.0, 0.0, 0.0, 0.0, 52.92, 0.0, 52.33, 0.0], "audiomae_on_audioset": [null, null, [["speech", 75.51], ["radio", 10.97], ["telephone", 1.11]], null, null, null, null, null, [["speech", 19.78], ["hum", 13.49], ["mains hum", 10.45]], null, [["speech", 75.2], ["radio", 7.93], ["telephone", 5.04]], null, null, null, null, null, null, null, null, null], "duration": [0.63, 1.02, 3.18, 5.64, 2.26, 0.61, -0.02, 1.0, 3.38, 0.54, 2.51, -0.45, -0.4, -0.35, -0.28, -0.22, 3.73, 0.62, 2.93, -0.03]} \ No newline at end of file diff --git a/annotations_filtered/aHQQs4D3krU_filtered.json b/annotations_filtered/aHQQs4D3krU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..184ab8e54cfd75e2edb5fd449a8465c5ca0fcffe --- /dev/null +++ b/annotations_filtered/aHQQs4D3krU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.97], [28.0, 29.66], [31.0, 32.05], [34.0, 35.19], [38.0, 39.11], [40.0, 41.1], [42.0, 44.32], [46.0, 54.14], [56.0, 56.62], [63.0, 64.39], [73.0, 73.94], [78.0, 80.47], [84.0, 84.03], [94.0, 94.63], [96.0, 96.5], [99.0, 100.77], [101.0, 103.37], [105.0, 105.44], [106.0, 106.69], [108.0, 117.27], [124.0, 124.73], [129.0, 131.5], [132.0, 132.58]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.15, 29.75, 0.0, 0.0, 0.0, 29.25, 0.0, 0.0, 0.0, 0.0, 36.81, 0.0, 0.0, 34.94, 0.0, 31.63, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["livestock, farm animals, working animals", 50.24], ["cattle, bovinae", 22.97], ["moo", 20.48]], [["music", 28.65], ["hum", 22.87], ["throbbing", 17.03]], null, null, null, [["music", 28.6], ["speech", 13.44], ["moo", 7.92]], null, null, null, null, [["music", 39.1], ["throbbing", 10.76], ["speech", 9.52]], null, null, [["music", 78.33], ["speech", 6.7], ["electronic music", 1.73]], null, [["music", 75.65], ["yodeling", 3.29], ["middle eastern music", 1.02]], null], "duration": [0.97, 1.66, 1.05, 1.19, 1.11, 1.1, 2.32, 8.14, 0.62, 1.39, 0.94, 2.47, 0.03, 0.63, 0.5, 1.77, 2.37, 0.44, 0.69, 9.27, 0.73, 2.5, 0.58]} \ No newline at end of file diff --git a/annotations_filtered/aHV7IUgaCy8_filtered.json b/annotations_filtered/aHV7IUgaCy8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e22ce3d14ae6accc7ed44910e7bc223b698bc0b --- /dev/null +++ b/annotations_filtered/aHV7IUgaCy8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.85], [11.0, 11.33], [17.0, 18.35], [20.0, 22.62], [23.0, 23.92], [25.0, 33.15], [35.0, 98.02], [99.0, 100.09], [100.0, 101.26], [102.0, 102.51], [103.0, 104.01], [105.0, 104.87], [106.0, 108.94], [111.0, 130.0], [130.0, 130.32], [131.0, 130.87], [133.0, 135.19], [136.0, 136.76], [138.0, 142.52], [145.0, 193.41], [195.0, 196.32], [197.0, 197.46], [204.0, 213.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 91.64, 0.0, 36.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.76, 33.63, 0.0, 0.0, 35.59, 0.0, 33.32, 0.0, 0.0, 0.0, 34.4], "audiomae_on_audioset": [null, null, null, null, null, [["music", 52.53], ["speech", 14.07], ["throbbing", 5.04]], null, null, null, null, null, null, null, [["music", 77.27], ["didgeridoo", 3.26], ["fart", 3.0]], null, null, [["music", 64.58], ["video game music", 4.17], ["throbbing", 1.67]], null, [["music", 24.44], ["cattle, bovinae", 21.75], ["livestock, farm animals, working animals", 12.8]], null, null, null, [["music", 43.47], ["speech", 24.98], ["musical instrument", 3.04]]], "duration": [1.85, 0.33, 1.35, 2.62, 0.92, 8.15, 63.02, 1.09, 1.26, 0.51, 1.01, -0.13, 2.94, 19.0, 0.32, -0.13, 2.19, 0.76, 4.52, 48.41, 1.32, 0.46, 9.17]} \ No newline at end of file diff --git a/annotations_filtered/aIZsVuaUWB4_filtered.json b/annotations_filtered/aIZsVuaUWB4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d60c3c22257577dec737c6dcd9e89e309af14901 --- /dev/null +++ b/annotations_filtered/aIZsVuaUWB4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 46.06], [48.0, 48.15], [49.0, 135.6], [139.0, 140.0], [141.0, 158.94]], "keep_status": [true, false, false, false, false], "silence_prob": [39.99, 0.0, 0.0, 0.0, 37.78], "audiomae_on_audioset": [[["music", 50.5], ["animal", 8.52], ["speech", 6.55]], null, null, null, [["livestock, farm animals, working animals", 30.59], ["cattle, bovinae", 22.27], ["moo", 20.89]]], "duration": [14.06, 0.15, 86.6, 1.0, 17.94]} \ No newline at end of file diff --git a/annotations_filtered/aIau-DQHI3Y_filtered.json b/annotations_filtered/aIau-DQHI3Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3dce8f2739588d6e7959cbb1e23e73a536087219 --- /dev/null +++ b/annotations_filtered/aIau-DQHI3Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 29.56], [30.0, 31.53], [58.0, 59.58], [74.0, 74.85], [78.0, 79.08], [80.0, 85.36], [98.0, 106.32], [122.0, 125.96]], "keep_status": [false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 33.24, 33.6, 42.35], "audiomae_on_audioset": [null, null, null, null, null, [["livestock, farm animals, working animals", 23.56], ["cattle, bovinae", 20.36], ["moo", 16.5]], [["music", 50.11], ["speech", 24.11], ["musical instrument", 3.55]], [["music", 42.49], ["speech", 7.92], ["guitar", 7.4]]], "duration": [0.56, 1.53, 1.58, 0.85, 1.08, 5.36, 8.32, 3.96]} \ No newline at end of file diff --git a/annotations_filtered/aIm1ZGm03WA_filtered.json b/annotations_filtered/aIm1ZGm03WA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..03c257efac8b7f2ffa89c9a8606d4807e4d2ca68 --- /dev/null +++ b/annotations_filtered/aIm1ZGm03WA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.71], [8.0, 7.97], [11.0, 12.24], [15.0, 15.23], [19.0, 19.33], [22.0, 22.52], [31.0, 33.2], [34.0, 34.18], [37.0, 37.98], [41.0, 42.35], [50.0, 50.55], [55.0, 55.11], [85.0, 89.41], [93.0, 93.72], [100.0, 101.26], [107.0, 107.97], [129.0, 129.2], [138.0, 139.02], [142.0, 142.84], [148.0, 148.88], [150.0, 151.43], [158.0, 159.02], [159.0, 160.27], [161.0, 161.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.29, 0.0, 0.0, 0.0, 0.0, 0.0, 64.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.71, -0.03, 1.24, 0.23, 0.33, 0.52, 2.2, 0.18, 0.98, 1.35, 0.55, 0.11, 4.41, 0.72, 1.26, 0.97, 0.2, 1.02, 0.84, 0.88, 1.43, 1.02, 1.27, 0.97]} \ No newline at end of file diff --git a/annotations_filtered/aJ67Fz1Jf6E_filtered.json b/annotations_filtered/aJ67Fz1Jf6E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..088bacc6694c543a45ca8840fbeddb6d0770d5f5 --- /dev/null +++ b/annotations_filtered/aJ67Fz1Jf6E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.89], [4.0, 6.1], [8.0, 9.46], [11.0, 13.17], [15.0, 15.36], [21.0, 23.25], [29.0, 31.55], [33.0, 38.94], [41.0, 41.28], [46.0, 48.47], [52.0, 56.13], [57.0, 58.13], [59.0, 60.76], [61.0, 61.55], [63.0, 64.0], [67.0, 67.36]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 45.88, 0.0, 60.6, 0.0, 52.92, 36.77, 47.66, 0.0, 49.13, 52.05, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 35.44], ["music", 29.12], ["shuffling cards", 14.62]], null, null, null, null, [["music", 54.63], ["scratch", 2.15], ["inside, small room", 2.12]], [["music", 85.33], ["soundtrack music", 4.18], ["scary music", 2.55]], null, [["zipper (clothing)", 71.12], ["music", 10.46], ["throbbing", 8.32]], null, null, null, null, null, null], "duration": [1.89, 2.1, 1.46, 2.17, 0.36, 2.25, 2.55, 5.94, 0.28, 2.47, 4.13, 1.13, 1.76, 0.55, 1.0, 0.36]} \ No newline at end of file diff --git a/annotations_filtered/aJ7NA4hNNc0_filtered.json b/annotations_filtered/aJ7NA4hNNc0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e2d5110ca984e32d5421a8e35cd8a8c345e3972 --- /dev/null +++ b/annotations_filtered/aJ7NA4hNNc0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.69], [12.0, 12.46], [14.0, 13.73], [15.0, 16.33], [17.0, 17.39], [18.0, 24.22], [25.0, 26.08], [28.0, 28.43], [30.0, 33.29], [34.0, 34.35], [38.0, 38.43], [39.0, 40.02], [41.0, 41.62], [42.0, 46.8], [47.0, 47.58], [48.0, 47.66], [49.0, 49.82], [51.0, 53.0], [53.0, 61.38], [62.0, 63.48], [65.0, 65.58], [67.0, 68.71], [69.0, 69.7], [71.0, 72.66], [73.0, 76.54], [79.0, 80.1], [81.0, 88.33], [89.0, 93.16], [98.0, 98.1], [99.0, 114.59], [120.0, 121.83], [122.0, 123.57], [124.0, 124.39], [125.0, 129.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [97.33, 0.0, 0.0, 0.0, 0.0, 97.64, 0.0, 0.0, 87.19, 0.0, 0.0, 0.0, 0.0, 79.59, 0.0, 0.0, 0.0, 91.98, 55.67, 0.0, 0.0, 0.0, 0.0, 0.0, 45.24, 0.0, 92.8, 90.78, 0.0, 68.67, 0.0, 0.0, 0.0, 99.96], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 64.04], ["speech", 5.52], ["animal", 4.63]], null, null, null, null, null, null, null, null, null], "duration": [3.69, 0.46, -0.27, 1.33, 0.39, 6.22, 1.08, 0.43, 3.29, 0.35, 0.43, 1.02, 0.62, 4.8, 0.58, -0.34, 0.82, 2.0, 8.38, 1.48, 0.58, 1.71, 0.7, 1.66, 3.54, 1.1, 7.33, 4.16, 0.1, 15.59, 1.83, 1.57, 0.39, 4.84]} \ No newline at end of file diff --git a/annotations_filtered/aJCCUdK7PiU_filtered.json b/annotations_filtered/aJCCUdK7PiU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3825489e6f89b420253464a8c442b2a52be22602 --- /dev/null +++ b/annotations_filtered/aJCCUdK7PiU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 24.87], [26.0, 28.31], [30.0, 29.93], [30.0, 37.98], [39.0, 48.36], [50.0, 50.5], [51.0, 52.05], [53.0, 53.6], [55.0, 74.61], [78.0, 78.49], [79.0, 83.51], [85.0, 85.41], [87.0, 87.84], [90.0, 91.05], [92.0, 91.81], [92.0, 93.21], [97.0, 97.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 54.56, 0.0, 55.18, 76.7, 0.0, 0.0, 0.0, 42.22, 0.0, 75.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 90.34], ["theremin", 1.21], ["soundtrack music", 1.12]], null, null, null, null, null, null, null, null], "duration": [-0.13, 2.31, -0.07, 7.98, 9.36, 0.5, 1.05, 0.6, 19.61, 0.49, 4.51, 0.41, 0.84, 1.05, -0.19, 1.21, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/aJHRyOrRnQk_filtered.json b/annotations_filtered/aJHRyOrRnQk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2ccfaaceef64a8cc2a97065e59e92a3405c85f3 --- /dev/null +++ b/annotations_filtered/aJHRyOrRnQk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 16.34], [18.0, 18.35], [19.0, 21.27], [22.0, 27.97], [29.0, 29.79], [31.0, 31.43], [33.0, 33.57], [37.0, 37.52], [38.0, 38.99], [39.0, 87.13], [92.0, 152.15], [153.0, 160.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [73.82, 0.0, 62.58, 90.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.91], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 45.82], ["music", 9.85], ["throbbing", 3.64]]], "duration": [6.34, 0.35, 2.27, 5.97, 0.79, 0.43, 0.57, 0.52, 0.99, 48.13, 60.15, 7.29]} \ No newline at end of file diff --git a/annotations_filtered/aJVHnyq7Nz8_filtered.json b/annotations_filtered/aJVHnyq7Nz8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a188da8bb59ee1f1e720f677e3bc5b0d13455dd7 --- /dev/null +++ b/annotations_filtered/aJVHnyq7Nz8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.18], [13.0, 14.12], [15.0, 16.14], [20.0, 21.3], [23.0, 23.94], [25.0, 25.62], [27.0, 29.78], [34.0, 35.14], [37.0, 43.09]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.15, 0.0, 60.05], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [1.18, 1.12, 1.14, 1.3, 0.94, 0.62, 2.78, 1.14, 6.09]} \ No newline at end of file diff --git a/annotations_filtered/aJY0vUsHL9Y_filtered.json b/annotations_filtered/aJY0vUsHL9Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b3a2bd86f8d34e395902db1c401a87780e7d7aa --- /dev/null +++ b/annotations_filtered/aJY0vUsHL9Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.73], [9.0, 9.04], [37.0, 46.03], [47.0, 47.44], [50.0, 49.69], [55.0, 56.17], [62.0, 63.14], [66.0, 67.29], [70.0, 70.04], [76.0, 78.16], [80.0, 81.87], [92.0, 92.65], [94.0, 95.17], [97.0, 97.82], [100.0, 103.22], [104.0, 105.11], [105.0, 106.73], [112.0, 112.43], [114.0, 115.28], [118.0, 118.34], [123.0, 123.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.73, 0.04, 9.03, 0.44, -0.31, 1.17, 1.14, 1.29, 0.04, 2.16, 1.87, 0.65, 1.17, 0.82, 3.22, 1.11, 1.73, 0.43, 1.28, 0.34, 0.23]} \ No newline at end of file diff --git a/annotations_filtered/aJZL2uoPRZg_filtered.json b/annotations_filtered/aJZL2uoPRZg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..61a009632d6ae4aa17d776562dcdd3bd44cbe57f --- /dev/null +++ b/annotations_filtered/aJZL2uoPRZg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.05], [6.0, 6.51], [11.0, 11.89], [14.0, 14.18], [15.0, 15.4], [18.0, 19.23], [22.0, 22.84], [24.0, 24.73], [25.0, 26.25], [27.0, 27.67], [32.0, 32.59], [35.0, 38.5], [39.0, 41.71], [45.0, 47.73], [50.0, 51.54], [52.0, 55.02], [57.0, 59.98], [61.0, 64.32], [65.0, 65.97], [69.0, 70.43], [72.0, 78.83], [82.0, 90.21], [92.0, 92.43], [92.0, 92.48], [95.0, 96.11], [97.0, 97.7], [101.0, 101.97], [106.0, 106.76], [108.0, 108.18], [110.0, 111.4], [112.0, 114.05], [119.0, 134.7], [140.0, 140.8], [143.0, 146.64], [152.0, 156.86], [159.0, 159.85], [160.0, 164.42], [165.0, 166.97], [167.0, 167.91], [169.0, 173.1], [175.0, 176.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.54, 80.11, 97.22, 0.0, 62.78, 97.83, 63.42, 0.0, 0.0, 30.81, 30.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.77, 30.43, 0.0, 53.28, 84.43, 0.0, 59.07, 0.0, 0.0, 88.1, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 77.46], ["throbbing", 9.39], ["electronic music", 3.75]], [["music", 72.91], ["electronic music", 6.42], ["throbbing", 6.11]], null, null, null, null, null, null, null, null, [["music", 55.74], ["throbbing", 6.77], ["electronic music", 6.75]], [["music", 52.87], ["throbbing", 12.14], ["electronic music", 6.06]], null, null, null, null, null, null, null, null, null], "duration": [1.05, 0.51, 0.89, 0.18, 0.4, 1.23, 0.84, 0.73, 1.25, 0.67, 0.59, 3.5, 2.71, 2.73, 1.54, 3.02, 2.98, 3.32, 0.97, 1.43, 6.83, 8.21, 0.43, 0.48, 1.11, 0.7, 0.97, 0.76, 0.18, 1.4, 2.05, 15.7, 0.8, 3.64, 4.86, 0.85, 4.42, 1.97, 0.91, 4.1, 1.15]} \ No newline at end of file diff --git a/annotations_filtered/aJ_NWmLawAM_filtered.json b/annotations_filtered/aJ_NWmLawAM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5000d07bae3d7eb003970af5f5de3408989a9bc3 --- /dev/null +++ b/annotations_filtered/aJ_NWmLawAM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.72], [10.0, 13.76], [16.0, 17.05], [17.0, 19.21], [21.0, 23.33], [26.0, 28.05], [29.0, 31.67], [33.0, 33.45], [35.0, 41.99], [43.0, 45.94], [48.0, 48.1]], "keep_status": [true, false, false, true, true, true, true, false, true, false, false], "silence_prob": [35.72, 35.77, 0.0, 31.85, 33.86, 31.17, 35.86, 0.0, 36.05, 38.94, 0.0], "audiomae_on_audioset": [[["music", 49.57], ["hum", 8.55], ["mains hum", 6.42]], [["hum", 43.76], ["mains hum", 32.86], ["music", 5.87]], null, [["fly, housefly", 14.0], ["mains hum", 13.8], ["speech", 12.65]], [["hum", 24.7], ["mains hum", 10.35], ["music", 10.26]], [["mains hum", 37.43], ["hum", 15.18], ["buzz", 7.16]], [["mains hum", 9.56], ["hum", 9.38], ["music", 6.24]], null, [["music", 32.0], ["hum", 12.08], ["speech", 8.98]], [["hum", 42.04], ["mains hum", 26.21], ["throbbing", 6.28]], null], "duration": [3.72, 3.76, 1.05, 2.21, 2.33, 2.05, 2.67, 0.45, 6.99, 2.94, 0.1]} \ No newline at end of file diff --git a/annotations_filtered/aJgS31WWIG8_filtered.json b/annotations_filtered/aJgS31WWIG8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c03921ecc74d00c7f416d49d805074a288f1c464 --- /dev/null +++ b/annotations_filtered/aJgS31WWIG8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.35], [21.0, 77.5], [78.0, 80.0], [82.0, 83.35]], "keep_status": [false, false, true, false], "silence_prob": [0.0, 0.0, 43.28, 0.0], "audiomae_on_audioset": [null, null, [["chirp tone", 14.2], ["music", 12.79], ["synthesizer", 7.37]], null], "duration": [0.35, 56.5, 2.0, 1.35]} \ No newline at end of file diff --git a/annotations_filtered/aJh1RC2Z474_filtered.json b/annotations_filtered/aJh1RC2Z474_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9222b94dc9981ce7d911d12f191ec1757e2108fe --- /dev/null +++ b/annotations_filtered/aJh1RC2Z474_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.04], [17.0, 17.47], [23.0, 22.64], [24.0, 24.43], [44.0, 45.72], [47.0, 47.83], [51.0, 51.09], [56.0, 56.94], [60.0, 60.79], [62.0, 65.04], [66.0, 67.83], [76.0, 76.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.65, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.04, 0.47, -0.36, 0.43, 1.72, 0.83, 0.09, 0.94, 0.79, 3.04, 1.83, 0.59]} \ No newline at end of file diff --git a/annotations_filtered/aJhtBJETQF8_filtered.json b/annotations_filtered/aJhtBJETQF8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..81b14e1dae85a2cd3db2e9ed717307a343613458 --- /dev/null +++ b/annotations_filtered/aJhtBJETQF8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 14.1], [22.0, 22.49], [24.0, 24.22], [29.0, 32.73], [36.0, 36.24], [38.0, 45.49], [50.0, 49.81], [61.0, 61.45], [62.0, 62.68], [64.0, 64.61], [72.0, 72.5], [75.0, 76.6], [78.0, 78.36], [82.0, 82.58], [83.0, 83.64], [86.0, 86.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 51.39, 0.0, 69.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.1, 0.49, 0.22, 3.73, 0.24, 7.49, -0.19, 0.45, 0.68, 0.61, 0.5, 1.6, 0.36, 0.58, 0.64, 0.32]} \ No newline at end of file diff --git a/annotations_filtered/aJoVRUNmqIY_filtered.json b/annotations_filtered/aJoVRUNmqIY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5cbd226a23ef8054b77a0b6fde0bfdc040df47eb --- /dev/null +++ b/annotations_filtered/aJoVRUNmqIY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.25], [5.0, 4.95], [8.0, 8.04], [10.0, 11.18], [13.0, 13.47], [16.0, 20.36], [21.0, 24.09], [25.0, 29.69], [31.0, 31.82], [39.0, 39.65], [52.0, 51.78], [56.0, 57.06], [68.0, 69.01], [73.0, 74.06], [76.0, 77.57], [80.0, 80.65], [86.0, 88.3], [89.0, 99.6], [100.0, 101.28], [104.0, 104.57], [105.0, 115.23], [116.0, 116.85], [123.0, 131.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 99.99, 61.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 100.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.25, -0.05, 0.04, 1.18, 0.47, 4.36, 3.09, 4.69, 0.82, 0.65, -0.22, 1.06, 1.01, 1.06, 1.57, 0.65, 2.3, 10.6, 1.28, 0.57, 10.23, 0.85, 8.95]} \ No newline at end of file diff --git a/annotations_filtered/aK1r7tBWnro_filtered.json b/annotations_filtered/aK1r7tBWnro_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6e2d77af83299e14f64fefcac9cbbb472e697984 --- /dev/null +++ b/annotations_filtered/aK1r7tBWnro_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.8], [10.0, 13.07], [15.0, 21.09], [22.0, 26.25], [28.0, 29.73], [32.0, 34.42], [36.0, 44.32], [45.0, 86.71]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [100.0, 40.52, 100.0, 100.0, 0.0, 100.0, 54.3, 0.0], "audiomae_on_audioset": [null, [["sine wave", 59.48], ["speech", 10.11], ["dial tone", 7.67]], null, null, null, null, null, null], "duration": [2.8, 3.07, 6.09, 4.25, 1.73, 2.42, 8.32, 41.71]} \ No newline at end of file diff --git a/annotations_filtered/aKE0S2gCOfc_filtered.json b/annotations_filtered/aKE0S2gCOfc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70a2f479883eb642036ae82ef802ad80f7e379e0 --- /dev/null +++ b/annotations_filtered/aKE0S2gCOfc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.15], [10.0, 52.76], [55.0, 54.94], [57.0, 56.71], [60.0, 64.0], [68.0, 95.0], [96.0, 95.94], [99.0, 114.08], [115.0, 121.05], [124.0, 131.43], [132.0, 133.24], [137.0, 136.98], [137.0, 143.16], [147.0, 172.2], [173.0, 173.85], [174.0, 173.89]], "keep_status": [false, false, false, false, false, false, false, true, true, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 33.41, 30.75, 0.0, 31.05, 34.11, 31.35, 0.0, 0.0, 31.86, 32.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 62.53], ["throbbing", 11.21], ["hum", 8.22]], [["music", 40.8], ["hum", 24.21], ["mains hum", 16.66]], null, [["hum", 19.45], ["speech", 17.58], ["throbbing", 11.47]], [["speech", 26.3], ["hum", 14.69], ["mains hum", 13.73]], [["hum", 24.23], ["mains hum", 19.37], ["speech", 13.41]], null, null, [["speech", 53.16], ["music", 13.72], ["hum", 5.04]], [["hum", 35.58], ["throbbing", 17.01], ["music", 14.35]], null, null], "duration": [1.15, 42.76, -0.06, -0.29, 4.0, 27.0, -0.06, 15.08, 6.05, 7.43, 1.24, -0.02, 6.16, 25.2, 0.85, -0.11]} \ No newline at end of file diff --git a/annotations_filtered/aKIM6q3awws_filtered.json b/annotations_filtered/aKIM6q3awws_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f5bd53c0ca057828bcb476c674460f94e59b3397 --- /dev/null +++ b/annotations_filtered/aKIM6q3awws_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.1], [9.0, 9.88], [12.0, 12.8], [15.0, 14.91], [23.0, 24.26], [39.0, 41.25], [42.0, 42.2], [47.0, 49.72], [50.0, 51.71], [53.0, 56.52], [58.0, 62.14], [62.0, 63.63], [65.0, 65.87], [67.0, 68.32], [70.0, 71.27], [75.0, 77.57], [78.0, 79.49], [81.0, 85.9], [86.0, 87.49], [90.0, 91.71], [95.0, 96.18], [99.0, 99.37], [101.0, 101.43], [103.0, 107.18], [108.0, 109.04], [112.0, 116.95], [118.0, 118.99], [126.0, 126.54], [128.0, 128.29], [131.0, 142.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.87, 0.0, 84.43, 0.0, 99.95, 99.92, 0.0, 0.0, 0.0, 0.0, 53.97, 0.0, 79.24, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 99.21, 0.0, 0.0, 0.0, 95.09], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.1, 0.88, 0.8, -0.09, 1.26, 2.25, 0.2, 2.72, 1.71, 3.52, 4.14, 1.63, 0.87, 1.32, 1.27, 2.57, 1.49, 4.9, 1.49, 1.71, 1.18, 0.37, 0.43, 4.18, 1.04, 4.95, 0.99, 0.54, 0.29, 11.59]} \ No newline at end of file diff --git a/annotations_filtered/aKOmGhBOJZI_filtered.json b/annotations_filtered/aKOmGhBOJZI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7698de606bb98790e6530961016881ec60e4d553 --- /dev/null +++ b/annotations_filtered/aKOmGhBOJZI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.63], [8.0, 12.55], [14.0, 13.93], [25.0, 25.54], [39.0, 40.29], [41.0, 41.37], [43.0, 43.04], [45.0, 47.19], [48.0, 65.8], [72.0, 72.98], [75.0, 74.9], [75.0, 77.3], [78.0, 78.29], [80.0, 81.57], [83.0, 84.54], [86.0, 86.61], [98.0, 98.51], [104.0, 106.27]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 82.43, 0.0, 0.0, 0.0, 0.0, 0.0, 97.64, 31.44, 0.0, 0.0, 40.41, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 24.6], ["animal", 14.3], ["synthesizer", 4.73]], null, null, [["fart", 47.77], ["noise", 9.36], ["creak", 7.04]], null, null, null, null, null, null], "duration": [0.63, 4.55, -0.07, 0.54, 1.29, 0.37, 0.04, 2.19, 17.8, 0.98, -0.1, 2.3, 0.29, 1.57, 1.54, 0.61, 0.51, 2.27]} \ No newline at end of file diff --git a/annotations_filtered/aKUcMTQgl5E_filtered.json b/annotations_filtered/aKUcMTQgl5E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c2d02ab596a2f28d13dd8c787323ad3eed35fb1 --- /dev/null +++ b/annotations_filtered/aKUcMTQgl5E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.42], [4.0, 4.14], [8.0, 11.87], [13.0, 13.24], [16.0, 16.38], [18.0, 18.62], [21.0, 21.46], [22.0, 22.81], [23.0, 23.65], [33.0, 33.32], [34.0, 33.91], [39.0, 40.05], [41.0, 41.91], [43.0, 45.3], [46.0, 50.09], [51.0, 51.75], [58.0, 60.4], [61.0, 62.75], [70.0, 70.33], [76.0, 76.47], [77.0, 77.67], [79.0, 78.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 58.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.89, 54.7, 0.0, 94.07, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 60.01], ["sidetone", 21.52], ["echo", 3.74]], null, null, null, null, null, null, null, null], "duration": [0.42, 0.14, 3.87, 0.24, 0.38, 0.62, 0.46, 0.81, 0.65, 0.32, -0.09, 1.05, 0.91, 2.3, 4.09, 0.75, 2.4, 1.75, 0.33, 0.47, 0.67, -0.12]} \ No newline at end of file diff --git a/annotations_filtered/aKgha2AsDNc_filtered.json b/annotations_filtered/aKgha2AsDNc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..982c3ab0c88f23deb7782caccaaac334c7f441ba --- /dev/null +++ b/annotations_filtered/aKgha2AsDNc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.97], [9.0, 9.39], [12.0, 13.51], [18.0, 18.94], [23.0, 24.41], [30.0, 35.53], [40.0, 40.8], [47.0, 47.73], [51.0, 50.8], [53.0, 54.75], [62.0, 66.28], [68.0, 70.6], [75.0, 77.36], [79.0, 81.26], [82.0, 82.73], [86.0, 87.89], [89.0, 92.47], [93.0, 93.95], [100.0, 100.58], [104.0, 104.21], [107.0, 107.82], [112.0, 113.1], [118.0, 119.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 98.36, 0.0, 0.0, 0.0, 0.0, 99.85, 67.63, 99.8, 99.85, 0.0, 0.0, 99.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.97, 0.39, 1.51, 0.94, 1.41, 5.53, 0.8, 0.73, -0.2, 1.75, 4.28, 2.6, 2.36, 2.26, 0.73, 1.89, 3.47, 0.95, 0.58, 0.21, 0.82, 1.1, 1.72]} \ No newline at end of file diff --git a/annotations_filtered/aKnvOP-1U00_filtered.json b/annotations_filtered/aKnvOP-1U00_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b986cb1792d2e407a2c1be5842ff276e5d80c2dd --- /dev/null +++ b/annotations_filtered/aKnvOP-1U00_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.16], [8.0, 9.27], [10.0, 10.27], [11.0, 11.84], [20.0, 20.56], [22.0, 22.03], [25.0, 25.88], [30.0, 31.26], [32.0, 32.95], [34.0, 35.07], [40.0, 40.05], [48.0, 48.3], [51.0, 52.69], [55.0, 55.36], [56.0, 56.78], [58.0, 57.99], [60.0, 60.54], [63.0, 63.42], [65.0, 65.55], [70.0, 70.06], [81.0, 82.27], [86.0, 86.59], [91.0, 92.15], [95.0, 96.85], [99.0, 106.83], [108.0, 108.46], [112.0, 114.35], [116.0, 117.98], [118.0, 119.13], [121.0, 121.71], [123.0, 123.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.62, 0.0, 98.59, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.16, 1.27, 0.27, 0.84, 0.56, 0.03, 0.88, 1.26, 0.95, 1.07, 0.05, 0.3, 1.69, 0.36, 0.78, -0.01, 0.54, 0.42, 0.55, 0.06, 1.27, 0.59, 1.15, 1.85, 7.83, 0.46, 2.35, 1.98, 1.13, 0.71, 0.92]} \ No newline at end of file diff --git a/annotations_filtered/aKojFoPzQoQ_filtered.json b/annotations_filtered/aKojFoPzQoQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0202d0dc418f4df306f630069bc1ba1cb5840e97 --- /dev/null +++ b/annotations_filtered/aKojFoPzQoQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.43], [5.0, 13.54], [14.0, 21.22], [36.0, 41.74], [45.0, 45.52], [48.0, 52.52], [54.0, 53.86], [66.0, 66.18], [67.0, 67.19], [70.0, 69.92], [72.0, 73.13], [73.0, 74.29], [74.0, 74.48], [76.0, 116.48], [118.0, 119.47], [122.0, 125.47], [127.0, 127.67], [128.0, 128.82], [129.0, 130.05]], "keep_status": [false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 48.14, 29.59, 39.64, 0.0, 59.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.18, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 70.68], ["musical instrument", 4.9], ["guitar", 4.62]], [["fly, housefly", 32.25], ["insect", 12.67], ["speech", 12.3]], [["music", 23.57], ["speech", 12.83], ["throbbing", 9.72]], null, null, null, null, null, null, null, null, null, null, null, [["whale vocalization", 22.3], ["music", 16.78], ["hum", 5.8]], null, null, null], "duration": [0.43, 8.54, 7.22, 5.74, 0.52, 4.52, -0.14, 0.18, 0.19, -0.08, 1.13, 1.29, 0.48, 40.48, 1.47, 3.47, 0.67, 0.82, 1.05]} \ No newline at end of file diff --git a/annotations_filtered/aKtrjeCFCAg_filtered.json b/annotations_filtered/aKtrjeCFCAg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b2b91bfb215aa4d97228cf474e3e6001df6a88fb --- /dev/null +++ b/annotations_filtered/aKtrjeCFCAg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.39], [10.0, 10.74], [23.0, 29.03], [31.0, 32.27], [33.0, 52.39], [59.0, 59.53], [62.0, 63.09], [70.0, 73.41], [78.0, 78.31], [86.0, 86.86], [89.0, 89.21], [89.0, 89.4], [89.0, 91.52], [96.0, 95.94], [103.0, 103.57], [107.0, 108.36], [117.0, 118.2], [120.0, 119.99], [121.0, 122.23], [131.0, 132.22], [135.0, 136.59], [138.0, 138.4], [139.0, 139.77], [142.0, 143.67], [159.0, 159.12], [165.0, 171.14], [172.0, 172.99], [174.0, 174.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 64.63, 0.0, 34.0, 0.0, 0.0, 53.4, 0.0, 0.0, 0.0, 0.0, 34.06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.04, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 71.48], ["speech", 15.43], ["hum", 1.77]], null, null, null, null, null, null, null, [["whale vocalization", 26.28], ["roaring cats (lions, tigers)", 9.41], ["speech", 8.33]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.39, 0.74, 6.03, 1.27, 19.39, 0.53, 1.09, 3.41, 0.31, 0.86, 0.21, 0.4, 2.52, -0.06, 0.57, 1.36, 1.2, -0.01, 1.23, 1.22, 1.59, 0.4, 0.77, 1.67, 0.12, 6.14, 0.99, 0.83]} \ No newline at end of file diff --git a/annotations_filtered/aL4dQo8iBLo_filtered.json b/annotations_filtered/aL4dQo8iBLo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c3c642e5e440b9e6454aab99ecd41f7a906fe80 --- /dev/null +++ b/annotations_filtered/aL4dQo8iBLo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.01], [15.0, 15.3], [16.0, 49.96], [79.0, 81.57], [82.0, 83.52], [89.0, 89.72], [95.0, 96.92], [101.0, 106.19], [109.0, 118.71], [120.0, 120.38]], "keep_status": [false, false, false, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 33.31, 0.0, 0.0, 0.0, 28.98, 29.72, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 33.5], ["hum", 12.59], ["mains hum", 7.78]], null, null, null, [["music", 30.14], ["throbbing", 25.92], ["speech", 13.64]], [["mains hum", 60.81], ["hum", 35.71], ["throbbing", 2.97]], null], "duration": [1.01, 0.3, 33.96, 2.57, 1.52, 0.72, 1.92, 5.19, 9.71, 0.38]} \ No newline at end of file diff --git a/annotations_filtered/aLDrW2AXClk_filtered.json b/annotations_filtered/aLDrW2AXClk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7af42ad08adeb595641bcc5f7bdf65a1b7900dbc --- /dev/null +++ b/annotations_filtered/aLDrW2AXClk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.99], [6.0, 6.49], [11.0, 11.79], [14.0, 18.49], [21.0, 21.36], [25.0, 32.14], [34.0, 35.68], [43.0, 43.83], [46.0, 47.26], [57.0, 56.73], [58.0, 58.4], [63.0, 63.24], [67.0, 68.05], [70.0, 95.57], [96.0, 97.44], [99.0, 100.95], [102.0, 104.45], [104.0, 104.57], [105.0, 105.68], [115.0, 116.41], [121.0, 121.63], [122.0, 131.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 90.43, 0.0, 88.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.17, 0.0, 0.0, 39.41, 0.0, 0.0, 0.0, 0.0, 52.56], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["boing", 58.11], ["speech", 18.81], ["sidetone", 9.51]], null, null, null, null, null], "duration": [0.99, 0.49, 0.79, 4.49, 0.36, 7.14, 1.68, 0.83, 1.26, -0.27, 0.4, 0.24, 1.05, 25.57, 1.44, 1.95, 2.45, 0.57, 0.68, 1.41, 0.63, 9.7]} \ No newline at end of file diff --git a/annotations_filtered/aL_6-dQCzwg_filtered.json b/annotations_filtered/aL_6-dQCzwg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..825210b6dba41e5bb7baaba93b3b99d5e1167491 --- /dev/null +++ b/annotations_filtered/aL_6-dQCzwg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 42.77], [44.0, 64.15], [64.0, 73.2], [78.0, 80.59], [82.0, 83.1], [84.0, 110.54], [113.0, 114.08], [115.0, 124.28], [127.0, 127.43]], "keep_status": [false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 53.59, 53.53, 41.78, 0.0, 34.49, 0.0, 36.89, 0.0], "audiomae_on_audioset": [null, null, null, [["singing bowl", 47.0], ["music", 14.82], ["speech", 9.61]], null, [["music", 57.06], ["wind instrument, woodwind instrument", 7.11], ["clarinet", 5.61]], null, [["music", 73.27], ["clarinet", 3.86], ["saxophone", 2.76]], null], "duration": [31.77, 20.15, 9.2, 2.59, 1.1, 26.54, 1.08, 9.28, 0.43]} \ No newline at end of file diff --git a/annotations_filtered/aMQysPMcE4M_filtered.json b/annotations_filtered/aMQysPMcE4M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6aab1f04ee4c8fd26fa6aa9d5e36344039c85247 --- /dev/null +++ b/annotations_filtered/aMQysPMcE4M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.61], [13.0, 13.36], [15.0, 18.72], [19.0, 18.82], [19.0, 20.68], [21.0, 21.49], [25.0, 27.94], [29.0, 29.2], [32.0, 32.54], [33.0, 39.09], [40.0, 52.68], [55.0, 60.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 31.12, 0.0, 0.0, 0.0, 68.54, 0.0, 0.0, 37.39, 38.74, 46.36], "audiomae_on_audioset": [null, null, [["music", 57.39], ["speech", 25.92], ["domestic animals, pets", 2.21]], null, null, null, null, null, null, [["speech", 61.74], ["telephone", 11.66], ["hum", 3.63]], [["burping, eructation", 12.19], ["mechanisms", 10.49], ["music", 8.08]], [["speech", 57.78], ["hum", 16.78], ["whale vocalization", 5.21]]], "duration": [0.61, 0.36, 3.72, -0.18, 1.68, 0.49, 2.94, 0.2, 0.54, 6.09, 12.68, 5.22]} \ No newline at end of file diff --git a/annotations_filtered/aN0alpNLQak_filtered.json b/annotations_filtered/aN0alpNLQak_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b65963612f351f9a8b038b00152de3df92faab5c --- /dev/null +++ b/annotations_filtered/aN0alpNLQak_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 18.99], [20.0, 20.44], [21.0, 21.91], [22.0, 27.89], [28.0, 168.93], [181.0, 180.84]], "keep_status": [false, false, false, false, false, false], "silence_prob": [76.7, 0.0, 0.0, 74.76, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [17.99, 0.44, 0.91, 5.89, 140.93, -0.16]} \ No newline at end of file diff --git a/annotations_filtered/aNDj-H1jxV0_filtered.json b/annotations_filtered/aNDj-H1jxV0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d0684ca8b1b556551f9e670652cb3a270ba74161 --- /dev/null +++ b/annotations_filtered/aNDj-H1jxV0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.42], [23.0, 26.82], [29.0, 30.05], [31.0, 32.49], [37.0, 38.92], [47.0, 52.41], [53.0, 54.21], [68.0, 68.23], [78.0, 78.43], [81.0, 80.77], [82.0, 83.73], [85.0, 89.33], [90.0, 91.57], [102.0, 103.4], [105.0, 105.61], [107.0, 108.5], [111.0, 111.25], [115.0, 115.82], [121.0, 122.23], [130.0, 130.08], [135.0, 135.85], [136.0, 136.43], [139.0, 140.73], [144.0, 144.36], [147.0, 148.05], [151.0, 151.51], [154.0, 154.99], [160.0, 159.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 91.64, 0.0, 0.0, 0.0, 84.25, 0.0, 0.0, 0.0, 0.0, 0.0, 96.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.42, 3.82, 1.05, 1.49, 1.92, 5.41, 1.21, 0.23, 0.43, -0.23, 1.73, 4.33, 1.57, 1.4, 0.61, 1.5, 0.25, 0.82, 1.23, 0.08, 0.85, 0.43, 1.73, 0.36, 1.05, 0.51, 0.99, -0.07]} \ No newline at end of file diff --git a/annotations_filtered/aNOmTuwnGYg_filtered.json b/annotations_filtered/aNOmTuwnGYg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..78e26e713d2255eb0f7aefadf5aff4f79a207d9b --- /dev/null +++ b/annotations_filtered/aNOmTuwnGYg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.2], [12.0, 12.7], [14.0, 15.82], [17.0, 17.93], [19.0, 28.78], [30.0, 37.49], [38.0, 40.88], [42.0, 44.86], [46.0, 50.14], [51.0, 54.16], [55.0, 95.98], [97.0, 104.33], [105.0, 106.84], [108.0, 110.62], [111.0, 113.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 78.04, 77.7, 49.97, 78.38, 77.2, 53.4, 0.0, 88.64, 0.0, 68.93, 43.58], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 46.09], ["hum", 16.06], ["sine wave", 14.93]], null, null, null, null, null, null, null, [["whale vocalization", 21.87], ["animal", 14.41], ["domestic animals, pets", 8.32]]], "duration": [1.2, 0.7, 1.82, 0.93, 9.78, 7.49, 2.88, 2.86, 4.14, 3.16, 40.98, 7.33, 1.84, 2.62, 2.43]} \ No newline at end of file diff --git a/annotations_filtered/aNQL0s6v8nI_filtered.json b/annotations_filtered/aNQL0s6v8nI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2281a6d90eb32b2c45e8803a2156eac7bba48b9b --- /dev/null +++ b/annotations_filtered/aNQL0s6v8nI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 29.66], [36.0, 37.67], [45.0, 65.97], [67.0, 68.03], [69.0, 69.6], [74.0, 75.22], [76.0, 79.61], [81.0, 82.07], [86.0, 86.19], [89.0, 89.51], [93.0, 93.21], [95.0, 95.57], [102.0, 102.39], [104.0, 104.58], [106.0, 107.13], [113.0, 114.98], [118.0, 118.81], [120.0, 120.92], [125.0, 125.44], [125.0, 125.56], [126.0, 129.0], [144.0, 145.07], [145.0, 146.33], [148.0, 149.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [35.22, 0.0, 60.14, 0.0, 0.0, 0.0, 96.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.97, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 42.68], ["music", 37.68], ["didgeridoo", 6.13]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.66, 1.67, 20.97, 1.03, 0.6, 1.22, 3.61, 1.07, 0.19, 0.51, 0.21, 0.57, 0.39, 0.58, 1.13, 1.98, 0.81, 0.92, 0.44, 0.56, 3.0, 1.07, 1.33, 1.59]} \ No newline at end of file diff --git a/annotations_filtered/aNR8SIVnHTY_filtered.json b/annotations_filtered/aNR8SIVnHTY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bc53b5e272f5c32d8cbb089116ee8770a8299815 --- /dev/null +++ b/annotations_filtered/aNR8SIVnHTY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.21], [4.0, 7.82], [9.0, 9.1], [12.0, 12.92], [17.0, 27.41], [28.0, 62.65], [63.0, 64.02], [64.0, 66.16], [67.0, 69.45], [70.0, 72.54], [73.0, 73.77], [75.0, 76.2], [83.0, 82.85], [85.0, 86.44], [88.0, 88.59], [95.0, 95.13], [96.0, 98.25], [99.0, 100.65], [101.0, 121.0]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.73, 0.0, 0.0, 83.52, 0.0, 0.0, 46.94, 52.51, 33.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.66, 0.0, 54.56], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 58.53], ["speech", 7.8], ["musical instrument", 5.59]], null, [["speech", 23.39], ["music", 16.22], ["livestock, farm animals, working animals", 10.78]], null, null, null, null, null, null, [["moo", 36.09], ["cattle, bovinae", 31.62], ["livestock, farm animals, working animals", 17.53]], null, null], "duration": [1.21, 3.82, 0.1, 0.92, 10.41, 34.65, 1.02, 2.16, 2.45, 2.54, 0.77, 1.2, -0.15, 1.44, 0.59, 0.13, 2.25, 1.65, 20.0]} \ No newline at end of file diff --git a/annotations_filtered/aNUs1A_sUCc_filtered.json b/annotations_filtered/aNUs1A_sUCc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1e3330a1737f22eba122c3d2843baffdb49acb1 --- /dev/null +++ b/annotations_filtered/aNUs1A_sUCc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[67.0, 74.43], [77.0, 77.68], [80.0, 79.96], [83.0, 85.83], [88.0, 89.68], [94.0, 97.51], [100.0, 104.63], [107.0, 108.46], [111.0, 113.14], [114.0, 114.61], [118.0, 119.21]], "keep_status": [true, false, false, false, false, false, false, false, true, false, false], "silence_prob": [36.43, 0.0, 0.0, 45.52, 0.0, 72.31, 75.23, 0.0, 42.76, 0.0, 0.0], "audiomae_on_audioset": [[["music", 51.03], ["speech", 10.38], ["fly, housefly", 2.95]], null, null, [["music", 33.56], ["whale vocalization", 31.39], ["wild animals", 7.73]], null, null, null, null, [["music", 30.96], ["musical instrument", 4.36], ["didgeridoo", 4.21]], null, null], "duration": [7.43, 0.68, -0.04, 2.83, 1.68, 3.51, 4.63, 1.46, 2.14, 0.61, 1.21]} \ No newline at end of file diff --git a/annotations_filtered/aNbtnYXp9-k_filtered.json b/annotations_filtered/aNbtnYXp9-k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2311a2050fb21a5f89a5a0f2faf437316ea22944 --- /dev/null +++ b/annotations_filtered/aNbtnYXp9-k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.97], [6.0, 6.84], [9.0, 9.9], [12.0, 15.18], [23.0, 23.06], [25.0, 25.25], [38.0, 38.5], [39.0, 38.64], [51.0, 55.39], [56.0, 64.15], [70.0, 72.0], [74.0, 77.75], [80.0, 81.85], [98.0, 98.34], [105.0, 104.79], [109.0, 112.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [86.09, 0.0, 0.0, 67.63, 0.0, 0.0, 0.0, 0.0, 33.13, 32.48, 35.14, 32.18, 0.0, 0.0, 0.0, 35.74], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 58.42], ["speech", 8.64], ["electronic music", 7.48]], [["music", 42.57], ["throbbing", 24.67], ["speech", 11.44]], [["music", 60.06], ["synthesizer", 8.88], ["musical instrument", 6.24]], [["music", 68.28], ["speech", 9.11], ["electronic music", 6.26]], null, null, null, [["music", 67.63], ["sidetone", 12.73], ["drum machine", 2.45]]], "duration": [2.97, 0.84, 0.9, 3.18, 0.06, 0.25, 0.5, -0.36, 4.39, 8.15, 2.0, 3.75, 1.85, 0.34, -0.21, 3.7]} \ No newline at end of file diff --git a/annotations_filtered/aOAgGeW7abs_filtered.json b/annotations_filtered/aOAgGeW7abs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92121a4caf6d96a6d8b7557d6984b52feecff55a --- /dev/null +++ b/annotations_filtered/aOAgGeW7abs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.47], [4.0, 4.55], [5.0, 6.07], [7.0, 7.67], [10.0, 10.47], [11.0, 11.85], [12.0, 13.04], [17.0, 16.71], [32.0, 32.56], [35.0, 35.9], [46.0, 45.81], [46.0, 46.79], [48.0, 47.93], [49.0, 48.88], [53.0, 53.13], [55.0, 55.16], [56.0, 56.27], [57.0, 58.6], [59.0, 60.07], [61.0, 61.77], [63.0, 64.02], [67.0, 67.19], [68.0, 68.13], [72.0, 72.22], [73.0, 73.11], [74.0, 73.89], [81.0, 81.48], [82.0, 82.43], [83.0, 83.98], [85.0, 86.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.47, 0.55, 1.07, 0.67, 0.47, 0.85, 1.04, -0.29, 0.56, 0.9, -0.19, 0.79, -0.07, -0.12, 0.13, 0.16, 0.27, 1.6, 1.07, 0.77, 1.02, 0.19, 0.13, 0.22, 0.11, -0.11, 0.48, 0.43, 0.98, 1.24]} \ No newline at end of file diff --git a/annotations_filtered/aOX72bZr_LA_filtered.json b/annotations_filtered/aOX72bZr_LA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe70b89c45eac42df523f74fc79a369a5a9fca3c --- /dev/null +++ b/annotations_filtered/aOX72bZr_LA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.61], [9.0, 10.71], [14.0, 14.84], [19.0, 20.04], [26.0, 26.43], [36.0, 36.29], [37.0, 38.38], [40.0, 41.2], [42.0, 44.66], [47.0, 47.88], [67.0, 72.42], [73.0, 74.38], [78.0, 78.95], [91.0, 91.23], [92.0, 94.32], [98.0, 98.49], [101.0, 102.88], [105.0, 111.84], [113.0, 116.95], [120.0, 121.02], [123.0, 123.57], [125.0, 126.79], [128.0, 130.08], [133.0, 135.01], [135.0, 136.76], [137.0, 138.27], [139.0, 144.09], [145.0, 146.35], [148.0, 149.82], [152.0, 195.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.43, 0.0, 71.57, 0.0, 0.0, 0.0, 79.94, 0.0, 0.0, 67.63, 64.63, 0.0, 0.0, 0.0, 54.97, 54.5, 0.0, 0.0, 52.98, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.61, 1.71, 0.84, 1.04, 0.43, 0.29, 1.38, 1.2, 2.66, 0.88, 5.42, 1.38, 0.95, 0.23, 2.32, 0.49, 1.88, 6.84, 3.95, 1.02, 0.57, 1.79, 2.08, 2.01, 1.76, 1.27, 5.09, 1.35, 1.82, 43.02]} \ No newline at end of file diff --git a/annotations_filtered/aOg9IcxuV2g_filtered.json b/annotations_filtered/aOg9IcxuV2g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f4a0e6d05fede4a3cbc1525d3e95d53d8b407d08 --- /dev/null +++ b/annotations_filtered/aOg9IcxuV2g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.37], [8.0, 8.28], [10.0, 10.44], [12.0, 12.61], [14.0, 14.69], [16.0, 17.44], [19.0, 19.38], [23.0, 23.5], [25.0, 26.13], [31.0, 31.33], [33.0, 33.42], [34.0, 35.41], [40.0, 40.91], [42.0, 45.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.95], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 31.01], ["mains hum", 20.57], ["hum", 7.97]]], "duration": [0.37, 0.28, 0.44, 0.61, 0.69, 1.44, 0.38, 0.5, 1.13, 0.33, 0.42, 1.41, 0.91, 3.45]} \ No newline at end of file diff --git a/annotations_filtered/aP1FZToPFxA_filtered.json b/annotations_filtered/aP1FZToPFxA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e737d4e32e376b8df7dd8cc332373e5b1c8e9a19 --- /dev/null +++ b/annotations_filtered/aP1FZToPFxA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.01], [5.0, 5.83], [7.0, 9.44], [10.0, 37.52], [38.0, 39.83], [41.0, 41.23], [43.0, 44.39], [46.0, 47.09], [52.0, 52.03], [54.0, 53.92], [55.0, 55.16], [60.0, 60.32], [71.0, 72.77], [73.0, 74.21], [75.0, 76.71], [78.0, 78.63], [80.0, 80.49], [82.0, 85.68], [87.0, 87.49], [89.0, 89.36], [90.0, 90.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 57.09, 37.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.76, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 88.4], ["whimper", 2.01], ["hum", 1.53]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.01, 0.83, 2.44, 27.52, 1.83, 0.23, 1.39, 1.09, 0.03, -0.08, 0.16, 0.32, 1.77, 1.21, 1.71, 0.63, 0.49, 3.68, 0.49, 0.36, 0.86]} \ No newline at end of file diff --git a/annotations_filtered/aP7GTu8tbvQ_filtered.json b/annotations_filtered/aP7GTu8tbvQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb71893cd1b4b49aad16f7bb0c294a0f0d485937 --- /dev/null +++ b/annotations_filtered/aP7GTu8tbvQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.44], [8.0, 9.15], [15.0, 16.14], [19.0, 19.38], [21.0, 22.76], [26.0, 26.15], [28.0, 28.7], [31.0, 31.83], [40.0, 43.07], [45.0, 46.62], [47.0, 48.37], [51.0, 52.3], [55.0, 58.89], [60.0, 64.39], [66.0, 66.51], [67.0, 68.15], [68.0, 68.82], [70.0, 70.34], [75.0, 75.63], [78.0, 80.54], [88.0, 88.33], [91.0, 90.85], [93.0, 93.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false], "silence_prob": [36.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.56, 0.0, 0.0, 0.0, 48.56, 38.49, 0.0, 0.0, 0.0, 0.0, 0.0, 36.38, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["snicker", 42.1], ["chuckle, chortle", 24.18], ["laughter", 10.02]], null, null, null, null, null, null, null, null, null, null, null, [["music", 79.4], ["musical instrument", 3.56], ["brass instrument", 2.76]], [["music", 42.5], ["synthesizer", 15.44], ["didgeridoo", 10.01]], null, null, null, null, null, [["laughter", 18.7], ["baby laughter", 16.47], ["snicker", 12.45]], null, null, null], "duration": [2.44, 1.15, 1.14, 0.38, 1.76, 0.15, 0.7, 0.83, 3.07, 1.62, 1.37, 1.3, 3.89, 4.39, 0.51, 1.15, 0.82, 0.34, 0.63, 2.54, 0.33, -0.15, 0.95]} \ No newline at end of file diff --git a/annotations_filtered/aPElaYUCTmA_filtered.json b/annotations_filtered/aPElaYUCTmA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..47bd1c1610de7dba0c36321c1727a44ec9f06e00 --- /dev/null +++ b/annotations_filtered/aPElaYUCTmA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.04], [0.0, 2.22], [6.0, 7.57], [9.0, 8.99], [10.0, 12.5], [14.0, 14.74], [16.0, 15.9], [21.0, 22.6], [28.0, 28.95], [33.0, 34.72], [38.0, 38.82], [40.0, 42.31], [43.0, 62.68], [63.0, 63.73], [64.0, 71.22], [75.0, 75.3], [75.0, 91.94], [98.0, 97.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.31, 0.0, 0.0, 99.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.7, 35.83, 0.0, 36.52, 0.0, 39.94, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 47.47], ["theremin", 23.2], ["synthesizer", 6.32]], null, [["theremin", 90.47], ["music", 6.64], ["musical instrument", 0.46]], null, [["music", 43.84], ["brass instrument", 18.54], ["trombone", 11.65]], null], "duration": [0.04, 2.22, 1.57, -0.01, 2.5, 0.74, -0.1, 1.6, 0.95, 1.72, 0.82, 2.31, 19.68, 0.73, 7.22, 0.3, 16.94, -0.15]} \ No newline at end of file diff --git a/annotations_filtered/aPFbf954LJ0_filtered.json b/annotations_filtered/aPFbf954LJ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a906a67d4aaf7402c41f466ac7d8a4f2740d450 --- /dev/null +++ b/annotations_filtered/aPFbf954LJ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 35.95], [59.0, 58.97], [72.0, 72.49], [78.0, 78.36], [82.0, 82.34], [103.0, 103.57], [105.0, 106.1], [125.0, 125.73], [133.0, 133.62]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [-0.05, -0.03, 0.49, 0.36, 0.34, 0.57, 1.1, 0.73, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/aPPMHA65HIg_filtered.json b/annotations_filtered/aPPMHA65HIg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..769e0e6ca12cd1eaed2c066b9c31ca8c05c1ac6c --- /dev/null +++ b/annotations_filtered/aPPMHA65HIg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.26], [12.0, 13.9], [15.0, 15.65], [16.0, 16.53], [17.0, 17.76], [19.0, 21.22], [23.0, 25.22], [26.0, 27.4], [29.0, 32.36], [33.0, 36.36], [38.0, 39.92], [41.0, 48.56], [50.0, 59.31], [60.0, 70.93], [73.0, 88.8], [91.0, 95.88], [96.0, 98.1], [99.0, 105.36], [107.0, 121.51], [124.0, 127.94]], "keep_status": [false, false, false, false, false, true, true, false, false, true, false, false, false, false, false, true, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 34.41, 36.44, 0.0, 37.57, 37.84, 0.0, 37.61, 36.63, 38.62, 36.59, 35.32, 36.4, 36.71, 32.48, 31.42], "audiomae_on_audioset": [null, null, null, null, null, [["music", 35.64], ["hum", 18.51], ["mains hum", 11.31]], [["music", 44.23], ["scary music", 11.84], ["rumble", 2.63]], null, [["music", 75.61], ["ambient music", 3.14], ["electronic music", 3.01]], [["hum", 31.41], ["music", 21.47], ["ambient music", 9.18]], null, [["mains hum", 42.16], ["hum", 38.45], ["music", 6.79]], [["music", 39.7], ["speech", 22.58], ["scary music", 10.07]], [["music", 71.54], ["scary music", 8.55], ["ambient music", 4.99]], [["music", 65.5], ["scary music", 14.36], ["ambient music", 4.9]], [["music", 23.21], ["mains hum", 12.78], ["hum", 12.46]], [["speech", 21.87], ["music", 20.63], ["hum", 9.34]], [["music", 63.13], ["hum", 8.67], ["gong", 3.12]], [["music", 80.24], ["hum", 3.94], ["didgeridoo", 2.3]], [["music", 46.5], ["musical instrument", 7.3], ["brass instrument", 5.97]]], "duration": [0.26, 1.9, 0.65, 0.53, 0.76, 2.22, 2.22, 1.4, 3.36, 3.36, 1.92, 7.56, 9.31, 10.93, 15.8, 4.88, 2.1, 6.36, 14.51, 3.94]} \ No newline at end of file diff --git a/annotations_filtered/aPQcQ4IhHNE_filtered.json b/annotations_filtered/aPQcQ4IhHNE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..579057547f6993958bedf65fb79e474a1c6f3687 --- /dev/null +++ b/annotations_filtered/aPQcQ4IhHNE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 43.56], [46.0, 76.2], [76.0, 87.44], [89.0, 105.04]], "keep_status": [false, false, true, true], "silence_prob": [0.0, 0.0, 36.27, 36.11], "audiomae_on_audioset": [null, null, [["music", 27.36], ["buzz", 12.41], ["hum", 8.15]], [["music", 25.67], ["buzz", 22.5], ["breaking", 12.59]]], "duration": [30.56, 30.2, 11.44, 16.04]} \ No newline at end of file diff --git a/annotations_filtered/aPUaHUwJJk8_filtered.json b/annotations_filtered/aPUaHUwJJk8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..90551e3901056b20cb4750d14ade1faab5003028 --- /dev/null +++ b/annotations_filtered/aPUaHUwJJk8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 72.23], [74.0, 96.87], [98.0, 99.01], [100.0, 105.24], [108.0, 109.41], [112.0, 113.31], [114.0, 113.85], [114.0, 114.32], [117.0, 117.37], [119.0, 119.4], [124.0, 145.27]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.44, 0.0, 32.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.69], "audiomae_on_audioset": [null, [["music", 55.09], ["hum", 12.1], ["throbbing", 10.45]], null, [["speech", 30.07], ["music", 23.7], ["gunshot, gunfire", 9.03]], null, null, null, null, null, null, [["hum", 37.68], ["mains hum", 21.17], ["throbbing", 14.7]]], "duration": [48.23, 22.87, 1.01, 5.24, 1.41, 1.31, -0.15, 0.32, 0.37, 0.4, 21.27]} \ No newline at end of file diff --git a/annotations_filtered/aPdLYN69cfE_filtered.json b/annotations_filtered/aPdLYN69cfE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ffee9e0e1f6fbc91e829115dc4948dbbd089223e --- /dev/null +++ b/annotations_filtered/aPdLYN69cfE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.96], [4.0, 5.16], [6.0, 6.51], [7.0, 11.23], [12.0, 13.15], [23.0, 23.28], [24.0, 37.72], [43.0, 46.52], [47.0, 95.89], [97.0, 105.63], [106.0, 129.95], [131.0, 169.94]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [44.26, 0.0, 0.0, 31.11, 0.0, 0.0, 35.62, 36.2, 0.0, 47.27, 28.78, 0.0], "audiomae_on_audioset": [[["hum", 20.14], ["mains hum", 18.81], ["music", 17.3]], null, null, [["speech", 80.25], ["music", 3.65], ["whale vocalization", 3.32]], null, null, [["music", 60.66], ["sonar", 10.43], ["electronic music", 5.52]], [["music", 74.16], ["musical instrument", 5.42], ["synthesizer", 3.02]], null, [["music", 57.63], ["electronic music", 7.72], ["synthesizer", 7.11]], [["speech", 41.52], ["music", 20.43], ["mains hum", 6.68]], null], "duration": [2.96, 1.16, 0.51, 4.23, 1.15, 0.28, 13.72, 3.52, 48.89, 8.63, 23.95, 38.94]} \ No newline at end of file diff --git a/annotations_filtered/aPdxMGV1Y28_filtered.json b/annotations_filtered/aPdxMGV1Y28_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..71ec11589db79c1753e32bbd7edf29a1b9a4f8a5 --- /dev/null +++ b/annotations_filtered/aPdxMGV1Y28_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 27.67], [29.0, 31.04], [33.0, 34.75], [36.0, 38.45], [40.0, 46.04], [47.0, 49.74], [51.0, 52.89], [54.0, 56.12], [58.0, 58.77], [60.0, 64.1], [65.0, 66.16], [67.0, 70.29], [71.0, 77.16], [78.0, 88.06], [94.0, 120.01], [121.0, 120.95], [122.0, 122.79], [125.0, 127.09], [128.0, 136.44], [137.0, 137.19], [137.0, 140.53], [144.0, 161.74]], "keep_status": [false, true, false, true, true, true, false, true, false, false, false, true, true, true, true, false, false, true, true, false, false, true], "silence_prob": [0.0, 37.74, 0.0, 41.85, 43.18, 40.41, 0.0, 37.69, 0.0, 37.31, 0.0, 33.94, 34.85, 33.87, 29.43, 0.0, 0.0, 29.56, 31.44, 0.0, 28.45, 28.21], "audiomae_on_audioset": [null, [["gong", 22.83], ["music", 17.86], ["ambient music", 13.36]], null, [["music", 48.18], ["sonar", 9.31], ["ambient music", 7.76]], [["music", 45.62], ["crow", 5.26], ["caw", 4.68]], [["quack", 14.71], ["frog", 14.35], ["gong", 7.53]], null, [["music", 44.52], ["gong", 7.37], ["electronic music", 6.53]], null, [["music", 39.21], ["gong", 27.89], ["electronic music", 10.2]], null, [["caw", 23.13], ["music", 15.49], ["crow", 14.59]], [["speech", 33.39], ["caw", 13.13], ["crow", 5.93]], [["music", 34.13], ["caw", 17.17], ["crow", 11.18]], [["hum", 21.27], ["mains hum", 19.81], ["music", 18.5]], null, null, [["music", 33.18], ["theremin", 21.75], ["civil defense siren", 6.99]], [["music", 25.47], ["whack, thwack", 14.32], ["hum", 6.85]], null, [["groan", 64.43], ["music", 14.2], ["grunt", 9.72]], [["music", 38.78], ["buzz", 6.77], ["outside, rural or natural", 3.89]]], "duration": [1.67, 2.04, 1.75, 2.45, 6.04, 2.74, 1.89, 2.12, 0.77, 4.1, 1.16, 3.29, 6.16, 10.06, 26.01, -0.05, 0.79, 2.09, 8.44, 0.19, 3.53, 17.74]} \ No newline at end of file diff --git a/annotations_filtered/aPeZmPcpiu8_filtered.json b/annotations_filtered/aPeZmPcpiu8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3842cbc150ad777b384da900b9be9a273da0882 --- /dev/null +++ b/annotations_filtered/aPeZmPcpiu8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 28.0], [29.0, 30.13], [31.0, 31.45], [36.0, 39.02], [40.0, 40.64], [42.0, 42.84], [60.0, 63.17], [66.0, 68.99], [72.0, 73.06], [74.0, 74.33], [76.0, 76.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.59, 0.0, 0.0, 99.68, 0.0, 0.0, 93.6, 94.07, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [2.0, 1.13, 0.45, 3.02, 0.64, 0.84, 3.17, 2.99, 1.06, 0.33, 0.54]} \ No newline at end of file diff --git a/annotations_filtered/aPrURpNEtkg_filtered.json b/annotations_filtered/aPrURpNEtkg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..54bda67362221afc313a3a9cabcc888920ef971d --- /dev/null +++ b/annotations_filtered/aPrURpNEtkg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.99], [4.0, 5.05], [6.0, 7.28], [27.0, 28.58], [29.0, 29.4], [32.0, 32.36], [70.0, 70.44], [76.0, 76.35], [78.0, 78.04]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.99, 1.05, 1.28, 1.58, 0.4, 0.36, 0.44, 0.35, 0.04]} \ No newline at end of file diff --git a/annotations_filtered/aPvptS4t6RA_filtered.json b/annotations_filtered/aPvptS4t6RA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..280e9e64cdd7f936d5dabca54b1520eb8443314b --- /dev/null +++ b/annotations_filtered/aPvptS4t6RA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.59], [17.0, 17.56], [36.0, 36.8], [40.0, 41.42], [49.0, 49.08], [59.0, 59.66], [61.0, 62.65], [66.0, 67.86], [68.0, 67.96], [68.0, 68.01], [68.0, 68.23], [68.0, 68.98], [69.0, 69.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.59, 0.56, 0.8, 1.42, 0.08, 0.66, 1.65, 1.86, -0.04, 0.01, 0.23, 0.98, 0.82]} \ No newline at end of file diff --git a/annotations_filtered/aQ5PyaHQWVA_filtered.json b/annotations_filtered/aQ5PyaHQWVA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e7ceacb86d6a1721ad84aa59743be356a6b6fa51 --- /dev/null +++ b/annotations_filtered/aQ5PyaHQWVA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.63], [16.0, 16.23], [29.0, 29.24], [35.0, 35.26], [37.0, 37.52], [44.0, 46.28], [47.0, 54.21], [55.0, 57.45], [58.0, 61.69], [63.0, 71.73], [73.0, 74.26], [76.0, 77.68], [79.0, 79.24], [82.0, 82.97], [87.0, 88.01], [90.0, 90.91], [93.0, 93.43], [96.0, 97.17]], "keep_status": [false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 36.3, 39.41, 62.07, 58.13, 30.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 44.62], ["hum", 14.23], ["sidetone", 10.12]], [["speech", 20.1], ["hum", 14.95], ["vehicle", 6.19]], null, null, [["music", 44.9], ["didgeridoo", 14.75], ["theremin", 10.77]], null, null, null, null, null, null, null, null], "duration": [1.63, 0.23, 0.24, 0.26, 0.52, 2.28, 7.21, 2.45, 3.69, 8.73, 1.26, 1.68, 0.24, 0.97, 1.01, 0.91, 0.43, 1.17]} \ No newline at end of file diff --git a/annotations_filtered/aQHOzbF0qH0_filtered.json b/annotations_filtered/aQHOzbF0qH0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..415375b048e3345588a49d3e842ceab58929dd88 --- /dev/null +++ b/annotations_filtered/aQHOzbF0qH0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 25.56], [34.0, 35.7], [36.0, 39.29], [40.0, 41.82], [43.0, 43.29], [45.0, 45.0], [46.0, 46.11], [47.0, 47.58], [48.0, 48.09], [51.0, 53.11], [60.0, 62.26], [72.0, 72.01], [82.0, 83.93], [93.0, 95.22], [100.0, 102.68], [109.0, 109.26], [113.0, 114.57], [129.0, 130.49]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.55, 0.0, 80.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.7, 51.12, 0.0, 0.0, 54.56, 66.63, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["explosion", 22.67], ["whack, thwack", 10.86], ["burst, pop", 8.78]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.56, 1.7, 3.29, 1.82, 0.29, 0.0, 0.11, 0.58, 0.09, 2.11, 2.26, 0.01, 1.93, 2.22, 2.68, 0.26, 1.57, 1.49]} \ No newline at end of file diff --git a/annotations_filtered/aQQsBjOrNMY_filtered.json b/annotations_filtered/aQQsBjOrNMY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e49a854fb1a4dd60fe39dcccad4b50301adfb0dd --- /dev/null +++ b/annotations_filtered/aQQsBjOrNMY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.12], [39.0, 38.79], [39.0, 39.93], [44.0, 44.15], [45.0, 46.5], [53.0, 107.89], [109.0, 112.45], [114.0, 116.48]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 99.96], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.12, -0.21, 0.93, 0.15, 1.5, 54.89, 3.45, 2.48]} \ No newline at end of file diff --git a/annotations_filtered/aQRjyav-x8o_filtered.json b/annotations_filtered/aQRjyav-x8o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dc0a2bd28ef77d2fd9f76a3f2dc7610a8ef98ceb --- /dev/null +++ b/annotations_filtered/aQRjyav-x8o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.72], [9.0, 9.51], [10.0, 13.15], [19.0, 19.67], [20.0, 20.56], [23.0, 22.99], [36.0, 36.42], [69.0, 69.65], [72.0, 76.79]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 66.03, 0.0, 0.0, 0.0, 0.0, 0.0, 45.02], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 61.02], ["speech", 7.15], ["frog", 6.39]]], "duration": [0.72, 0.51, 3.15, 0.67, 0.56, -0.01, 0.42, 0.65, 4.79]} \ No newline at end of file diff --git a/annotations_filtered/aQqAUXKn7t4_filtered.json b/annotations_filtered/aQqAUXKn7t4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..392faab964b2b5d358ba70ecef62430ca8cb325a --- /dev/null +++ b/annotations_filtered/aQqAUXKn7t4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.69], [10.0, 10.27], [14.0, 14.45], [16.0, 21.15], [23.0, 28.51], [32.0, 32.21], [36.0, 37.15], [39.0, 38.74], [39.0, 39.61], [41.0, 41.0], [51.0, 54.19], [57.0, 59.37], [60.0, 60.42], [61.0, 63.41], [64.0, 137.37], [143.0, 149.01], [150.0, 150.89], [151.0, 152.51], [153.0, 154.85], [161.0, 161.94], [179.0, 179.63], [180.0, 181.25], [187.0, 187.96], [196.0, 200.06]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.68, 32.85, 0.0, 0.0, 0.0, 0.0, 0.0, 40.75, 40.88, 0.0, 38.66, 0.0, 39.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, [["hum", 25.61], ["mains hum", 25.19], ["music", 17.3]], [["fly, housefly", 45.56], ["insect", 21.52], ["bee, wasp, etc.", 9.31]], null, null, null, null, null, [["cattle, bovinae", 33.28], ["livestock, farm animals, working animals", 25.41], ["moo", 21.42]], [["fly, housefly", 37.91], ["insect", 22.83], ["mosquito", 15.14]], null, [["moo", 45.39], ["cattle, bovinae", 30.6], ["livestock, farm animals, working animals", 16.78]], null, [["fly, housefly", 27.8], ["insect", 14.23], ["speech", 8.29]], null, null, null, null, null, null, null, null], "duration": [0.69, 0.27, 0.45, 5.15, 5.51, 0.21, 1.15, -0.26, 0.61, 0.0, 3.19, 2.37, 0.42, 2.41, 73.37, 6.01, 0.89, 1.51, 1.85, 0.94, 0.63, 1.25, 0.96, 4.06]} \ No newline at end of file diff --git a/annotations_filtered/aRM2YcGpmxg_filtered.json b/annotations_filtered/aRM2YcGpmxg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e33f17c1e3ff451060016553162658889bd432e --- /dev/null +++ b/annotations_filtered/aRM2YcGpmxg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.86], [4.0, 4.97], [8.0, 10.13], [11.0, 12.87], [14.0, 16.33], [17.0, 31.41], [34.0, 74.14], [80.0, 80.82], [88.0, 89.26], [90.0, 90.88], [95.0, 96.01], [99.0, 111.33], [113.0, 117.09], [118.0, 118.89], [120.0, 121.44], [123.0, 128.07]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 40.36, 0.0, 73.51, 31.74, 0.0, 0.0, 0.0, 0.0, 0.0, 32.43, 40.16, 0.0, 0.0, 39.49], "audiomae_on_audioset": [null, null, [["whale vocalization", 48.64], ["hum", 14.62], ["sidetone", 7.66]], null, null, [["music", 34.75], ["door", 14.81], ["crushing", 2.88]], null, null, null, null, null, [["sheep", 29.58], ["livestock, farm animals, working animals", 27.12], ["bleat", 10.06]], [["creak", 64.33], ["mechanisms", 19.5], ["speech", 2.71]], null, null, [["finger snapping", 23.19], ["hum", 12.24], ["sonar", 9.85]]], "duration": [-0.14, 0.97, 2.13, 1.87, 2.33, 14.41, 40.14, 0.82, 1.26, 0.88, 1.01, 12.33, 4.09, 0.89, 1.44, 5.07]} \ No newline at end of file diff --git a/annotations_filtered/aRPInpAD3_o_filtered.json b/annotations_filtered/aRPInpAD3_o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed1f5f5c475e4b1224492859bdca1011bd223957 --- /dev/null +++ b/annotations_filtered/aRPInpAD3_o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.36], [2.0, 2.96], [3.0, 4.23], [31.0, 33.34], [53.0, 69.77], [71.0, 84.79], [90.0, 89.68], [109.0, 109.49], [116.0, 116.31], [117.0, 116.72], [121.0, 126.15], [130.0, 129.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.99, 33.15, 30.43, 0.0, 0.0, 0.0, 0.0, 36.59, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 76.53], ["electronic music", 5.17], ["throbbing", 3.5]], [["music", 38.35], ["speech", 25.9], ["didgeridoo", 10.25]], null, null, null, null, [["music", 77.4], ["fart", 2.55], ["boing", 1.79]], null], "duration": [0.36, 0.96, 1.23, 2.34, 16.77, 13.79, -0.32, 0.49, 0.31, -0.28, 5.15, -0.04]} \ No newline at end of file diff --git a/annotations_filtered/aRav_8OWESA_filtered.json b/annotations_filtered/aRav_8OWESA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b6d2905eff05e22a14479e7f8f5ad4cb439be193 --- /dev/null +++ b/annotations_filtered/aRav_8OWESA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.75], [5.0, 6.69], [9.0, 9.63], [17.0, 18.82], [29.0, 33.15], [34.0, 34.28], [38.0, 39.18], [48.0, 51.29], [57.0, 57.99], [60.0, 71.1], [79.0, 80.57], [93.0, 93.38], [95.0, 95.18], [96.0, 97.38], [100.0, 102.24], [106.0, 107.38], [115.0, 115.96], [121.0, 124.06], [124.0, 124.8], [126.0, 127.45], [129.0, 130.99], [134.0, 135.19], [138.0, 138.48], [139.0, 141.37], [146.0, 146.65]], "keep_status": [true, false, false, false, true, false, false, true, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false], "silence_prob": [32.56, 0.0, 0.0, 0.0, 31.66, 0.0, 0.0, 32.11, 0.0, 31.64, 0.0, 0.0, 0.0, 0.0, 36.32, 0.0, 0.0, 32.38, 0.0, 0.0, 0.0, 0.0, 0.0, 36.38, 0.0], "audiomae_on_audioset": [[["mosquito", 26.43], ["fly, housefly", 13.68], ["insect", 11.59]], null, null, null, [["music", 44.53], ["speech", 14.13], ["boing", 6.44]], null, null, [["music", 28.03], ["speech", 24.75], ["theremin", 6.97]], null, [["fly, housefly", 27.13], ["insect", 15.42], ["moo", 11.24]], null, null, null, null, [["music", 30.06], ["echo", 10.08], ["reverberation", 8.47]], null, null, [["moo", 36.13], ["cattle, bovinae", 25.46], ["livestock, farm animals, working animals", 12.56]], null, null, null, null, null, [["music", 55.22], ["guitar", 6.88], ["musical instrument", 6.07]], null], "duration": [2.75, 1.69, 0.63, 1.82, 4.15, 0.28, 1.18, 3.29, 0.99, 11.1, 1.57, 0.38, 0.18, 1.38, 2.24, 1.38, 0.96, 3.06, 0.8, 1.45, 1.99, 1.19, 0.48, 2.37, 0.65]} \ No newline at end of file diff --git a/annotations_filtered/aRcxYPkFjh4_filtered.json b/annotations_filtered/aRcxYPkFjh4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41bf1a0281085e1f80cc9c1954db89bb8b250a27 --- /dev/null +++ b/annotations_filtered/aRcxYPkFjh4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.7], [9.0, 10.3], [13.0, 14.08], [17.0, 16.73], [31.0, 32.05], [38.0, 37.83], [38.0, 39.92], [42.0, 43.73]], "keep_status": [true, false, false, false, false, false, false, false], "silence_prob": [37.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["marimba, xylophone", 20.46], ["glockenspiel", 17.63], ["mallet percussion", 14.48]], null, null, null, null, null, null, null], "duration": [3.7, 1.3, 1.08, -0.27, 1.05, -0.17, 1.92, 1.73]} \ No newline at end of file diff --git a/annotations_filtered/aRgUxpmvZpc_filtered.json b/annotations_filtered/aRgUxpmvZpc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c761199a8172c207fa7b2d563f4141c1b6edfcea --- /dev/null +++ b/annotations_filtered/aRgUxpmvZpc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.39], [10.0, 10.81], [12.0, 13.86], [23.0, 24.34], [26.0, 25.76], [34.0, 35.36]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.39, 0.81, 1.86, 1.34, -0.24, 1.36]} \ No newline at end of file diff --git a/annotations_filtered/aRmaCLDJ8Xk_filtered.json b/annotations_filtered/aRmaCLDJ8Xk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c4faf4623e5a27b30b96ddaaa69e0a77c89d0a3c --- /dev/null +++ b/annotations_filtered/aRmaCLDJ8Xk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 17.29], [24.0, 23.87], [26.0, 30.89], [35.0, 73.25], [76.0, 79.74], [82.0, 97.34], [103.0, 140.17], [141.0, 144.26], [156.0, 161.03], [164.0, 176.32]], "keep_status": [true, false, false, false, true, true, false, true, true, true], "silence_prob": [30.87, 0.0, 38.16, 0.0, 30.1, 33.45, 0.0, 28.71, 30.83, 33.24], "audiomae_on_audioset": [[["music", 33.51], ["speech", 31.6], ["hum", 4.66]], null, [["music", 68.53], ["synthesizer", 11.65], ["sampler", 2.8]], null, [["music", 42.01], ["synthesizer", 6.89], ["electronic music", 5.74]], [["music", 44.18], ["hum", 7.8], ["didgeridoo", 7.73]], null, [["white noise", 10.8], ["hum", 10.14], ["music", 9.9]], [["buzz", 18.63], ["noise", 17.84], ["hum", 12.71]], [["hum", 36.1], ["music", 20.43], ["throbbing", 10.75]]], "duration": [16.29, -0.13, 4.89, 38.25, 3.74, 15.34, 37.17, 3.26, 5.03, 12.32]} \ No newline at end of file diff --git a/annotations_filtered/aSUmLsp97mE_filtered.json b/annotations_filtered/aSUmLsp97mE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3c0f17749af38dae24bf50841f59baeacd1e4353 --- /dev/null +++ b/annotations_filtered/aSUmLsp97mE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 16.19], [18.0, 24.6], [25.0, 29.88], [32.0, 32.54], [33.0, 33.59], [34.0, 34.64], [37.0, 40.56], [43.0, 44.47], [45.0, 47.7], [52.0, 52.24], [53.0, 53.84], [55.0, 55.92], [57.0, 59.58], [67.0, 66.87], [67.0, 68.89], [72.0, 72.03], [73.0, 73.95], [77.0, 77.53], [79.0, 79.88], [81.0, 81.72], [83.0, 90.14], [92.0, 92.3]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, true, false], "silence_prob": [37.84, 55.25, 60.6, 0.0, 0.0, 0.0, 93.91, 0.0, 43.66, 0.0, 0.0, 0.0, 35.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.7, 0.0], "audiomae_on_audioset": [[["music", 52.8], ["didgeridoo", 17.58], ["synthesizer", 5.87]], null, null, null, null, null, null, null, [["baby laughter", 16.98], ["fart", 8.6], ["frog", 7.55]], null, null, null, [["speech", 29.12], ["radio", 19.72], ["frog", 14.21]], null, null, null, null, null, null, null, [["animal", 26.41], ["speech", 17.4], ["livestock, farm animals, working animals", 11.34]], null], "duration": [13.19, 6.6, 4.88, 0.54, 0.59, 0.64, 3.56, 1.47, 2.7, 0.24, 0.84, 0.92, 2.58, -0.13, 1.89, 0.03, 0.95, 0.53, 0.88, 0.72, 7.14, 0.3]} \ No newline at end of file diff --git a/annotations_filtered/aSajnx9QK-0_filtered.json b/annotations_filtered/aSajnx9QK-0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a62e4b024215da840ca0b009efa83a8d1f696716 --- /dev/null +++ b/annotations_filtered/aSajnx9QK-0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 15.3], [16.0, 16.92], [19.0, 20.14], [22.0, 23.13], [24.0, 27.62], [29.0, 29.57], [32.0, 32.76], [34.0, 35.16], [43.0, 44.05], [46.0, 46.14], [48.0, 50.53], [51.0, 51.7], [53.0, 56.25], [58.0, 58.95], [60.0, 64.0], [67.0, 75.22], [76.0, 89.95], [91.0, 91.54], [113.0, 114.67], [115.0, 115.84], [117.0, 117.73], [120.0, 120.7], [124.0, 125.78], [127.0, 128.87], [131.0, 131.06], [132.0, 135.97], [138.0, 138.84], [142.0, 144.51], [145.0, 147.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [57.81, 0.0, 0.0, 0.0, 57.89, 0.0, 0.0, 0.0, 0.0, 0.0, 50.76, 0.0, 39.22, 0.0, 36.79, 33.69, 33.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.51, 0.0, 71.0, 70.16], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 19.16], ["speech", 12.72], ["music", 11.68]], null, [["speech", 36.2], ["buzz", 14.19], ["sidetone", 10.06]], [["speech", 79.59], ["cattle, bovinae", 3.07], ["livestock, farm animals, working animals", 2.22]], [["hum", 27.01], ["mains hum", 26.91], ["speech", 19.55]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [11.3, 0.92, 1.14, 1.13, 3.62, 0.57, 0.76, 1.16, 1.05, 0.14, 2.53, 0.7, 3.25, 0.95, 4.0, 8.22, 13.95, 0.54, 1.67, 0.84, 0.73, 0.7, 1.78, 1.87, 0.06, 3.97, 0.84, 2.51, 2.36]} \ No newline at end of file diff --git a/annotations_filtered/aSsFjcw8R3Y_filtered.json b/annotations_filtered/aSsFjcw8R3Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bc2f447d145260181f589257627cb77234a4b38f --- /dev/null +++ b/annotations_filtered/aSsFjcw8R3Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 16.93], [19.0, 26.23], [29.0, 29.71], [32.0, 32.49], [34.0, 34.23], [35.0, 36.41], [38.0, 39.77], [42.0, 64.27], [65.0, 64.91], [70.0, 69.89], [71.0, 73.48], [74.0, 76.86], [78.0, 78.22], [81.0, 81.35], [84.0, 84.47], [88.0, 88.53], [91.0, 91.76], [93.0, 93.97], [95.0, 96.01], [111.0, 111.28], [114.0, 114.05], [122.0, 122.03], [122.0, 122.08], [122.0, 122.47], [123.0, 122.57], [123.0, 123.2], [125.0, 125.91], [129.0, 128.76]], "keep_status": [true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.05, 30.16, 0.0, 0.0, 0.0, 0.0, 0.0, 31.59, 0.0, 0.0, 98.73, 62.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 44.22], ["speech", 17.04], ["throbbing", 6.09]], [["throbbing", 40.04], ["hum", 28.65], ["music", 21.99]], null, null, null, null, null, [["music", 52.81], ["throbbing", 7.24], ["speech", 5.74]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [15.93, 7.23, 0.71, 0.49, 0.23, 1.41, 1.77, 22.27, -0.09, -0.11, 2.48, 2.86, 0.22, 0.35, 0.47, 0.53, 0.76, 0.97, 1.01, 0.28, 0.05, 0.03, 0.08, 0.47, -0.43, 0.2, 0.91, -0.24]} \ No newline at end of file diff --git a/annotations_filtered/aSwH4lpuKE8_filtered.json b/annotations_filtered/aSwH4lpuKE8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4d5ac4b1f1b60431d040ec93cfacf7707dcaa8fe --- /dev/null +++ b/annotations_filtered/aSwH4lpuKE8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.63], [11.0, 12.66], [25.0, 26.03], [28.0, 28.21], [37.0, 38.65], [53.0, 54.19], [56.0, 56.3], [63.0, 65.53], [66.0, 67.69]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.27, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.63, 1.66, 1.03, 0.21, 1.65, 1.19, 0.3, 2.53, 1.69]} \ No newline at end of file diff --git a/annotations_filtered/aSwi8mzc1gA_filtered.json b/annotations_filtered/aSwi8mzc1gA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c214bd1c7a42199f94d1c2049ec06efdc75c05a --- /dev/null +++ b/annotations_filtered/aSwi8mzc1gA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.02], [3.0, 14.4], [15.0, 15.85], [17.0, 17.27], [18.0, 18.79], [20.0, 21.05], [22.0, 22.23], [27.0, 29.84], [32.0, 33.0], [36.0, 36.56], [37.0, 39.83], [40.0, 41.77], [46.0, 46.16], [48.0, 47.9], [50.0, 51.76], [53.0, 53.38], [55.0, 57.57], [59.0, 58.89], [59.0, 59.75], [63.0, 76.99], [79.0, 81.08], [85.0, 85.78], [86.0, 87.42], [93.0, 93.53], [94.0, 94.05], [94.0, 95.59], [97.0, 97.92], [99.0, 99.2], [99.0, 99.67], [103.0, 102.9], [106.0, 105.71], [109.0, 109.54], [110.0, 111.28], [112.0, 115.86], [121.0, 122.44], [124.0, 131.08], [134.0, 133.62], [135.0, 148.61], [150.0, 150.47], [153.0, 155.01], [157.0, 156.84], [159.0, 159.66], [165.0, 165.64], [166.0, 166.58], [169.0, 170.31], [173.0, 173.7], [176.0, 178.61], [179.0, 180.32], [181.0, 181.52], [182.0, 182.26], [183.0, 183.36], [187.0, 189.23], [193.0, 196.74], [197.0, 198.32], [199.0, 203.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 80.29, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 97.43, 0.0, 0.0, 0.0, 0.0, 0.0, 93.91, 0.0, 0.0, 92.64, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.59, 0.0, 85.9, 0.0, 50.66, 0.0, 39.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.25, 0.0, 0.0, 0.0, 0.0, 68.41, 75.23, 0.0, 60.23], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["noise", 19.05], ["chirp tone", 17.56], ["sine wave", 16.09]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.02, 11.4, 0.85, 0.27, 0.79, 1.05, 0.23, 2.84, 1.0, 0.56, 2.83, 1.77, 0.16, -0.1, 1.76, 0.38, 2.57, -0.11, 0.75, 13.99, 2.08, 0.78, 1.42, 0.53, 0.05, 1.59, 0.92, 0.2, 0.67, -0.1, -0.29, 0.54, 1.28, 3.86, 1.44, 7.08, -0.38, 13.61, 0.47, 2.01, -0.16, 0.66, 0.64, 0.58, 1.31, 0.7, 2.61, 1.32, 0.52, 0.26, 0.36, 2.23, 3.74, 1.32, 4.96]} \ No newline at end of file diff --git a/annotations_filtered/aSxScp7zUpY_filtered.json b/annotations_filtered/aSxScp7zUpY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56bd521843de6015e138374f049871f2b2538a84 --- /dev/null +++ b/annotations_filtered/aSxScp7zUpY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 13.69], [20.0, 23.4], [24.0, 33.0], [33.0, 33.44], [36.0, 43.85], [46.0, 47.68], [51.0, 55.61], [57.0, 71.39], [72.0, 87.98], [91.0, 98.2], [105.0, 159.44], [163.0, 163.65]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [30.47, 32.31, 31.31, 0.0, 30.83, 0.0, 29.41, 30.3, 30.57, 34.4, 0.0, 0.0], "audiomae_on_audioset": [[["music", 50.43], ["throbbing", 11.65], ["vehicle", 8.02]], [["music", 49.11], ["electronic music", 10.76], ["dubstep", 4.67]], [["music", 53.33], ["vehicle", 6.48], ["siren", 5.46]], null, [["music", 61.82], ["car", 5.37], ["vehicle", 4.43]], null, [["music", 66.07], ["musical instrument", 5.4], ["cacophony", 5.22]], [["music", 70.3], ["speech", 8.1], ["throbbing", 5.26]], [["music", 64.05], ["throbbing", 8.15], ["electronic music", 3.82]], [["music", 77.61], ["hum", 3.56], ["synthesizer", 3.53]], null, null], "duration": [6.69, 3.4, 9.0, 0.44, 7.85, 1.68, 4.61, 14.39, 15.98, 7.2, 54.44, 0.65]} \ No newline at end of file diff --git a/annotations_filtered/aTPdWYo9zhQ_filtered.json b/annotations_filtered/aTPdWYo9zhQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6b18b04821bea12604ccfb592fe88f5061d6feb --- /dev/null +++ b/annotations_filtered/aTPdWYo9zhQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.45], [7.0, 13.2], [16.0, 17.29], [20.0, 20.61], [28.0, 30.54], [40.0, 46.23], [49.0, 51.58], [57.0, 61.87], [65.0, 71.1], [73.0, 83.05], [85.0, 85.67], [87.0, 88.48], [89.0, 99.15], [101.0, 101.12], [105.0, 107.28], [108.0, 111.43], [113.0, 115.86]], "keep_status": [true, false, false, false, true, false, false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [29.01, 30.05, 0.0, 0.0, 37.52, 29.72, 33.56, 31.35, 29.75, 30.81, 0.0, 0.0, 30.58, 0.0, 31.38, 38.23, 28.97], "audiomae_on_audioset": [[["music", 25.79], ["throbbing", 15.25], ["hum", 5.97]], [["music", 47.74], ["hum", 17.86], ["throbbing", 8.18]], null, null, [["music", 40.98], ["noise", 14.94], ["cacophony", 5.03]], [["hum", 37.46], ["throbbing", 32.1], ["music", 14.82]], [["music", 48.98], ["mains hum", 18.13], ["speech", 13.24]], [["music", 80.15], ["synthesizer", 3.89], ["musical instrument", 3.89]], [["speech", 54.51], ["music", 26.62], ["synthesizer", 3.12]], [["music", 61.99], ["synthesizer", 8.03], ["speech", 4.43]], null, null, [["music", 81.66], ["throbbing", 2.53], ["hum", 2.24]], null, [["music", 51.18], ["theremin", 6.45], ["musical instrument", 4.35]], [["music", 47.27], ["didgeridoo", 11.88], ["speech", 7.51]], [["music", 64.66], ["musical instrument", 7.39], ["guitar", 2.7]]], "duration": [2.45, 6.2, 1.29, 0.61, 2.54, 6.23, 2.58, 4.87, 6.1, 10.05, 0.67, 1.48, 10.15, 0.12, 2.28, 3.43, 2.86]} \ No newline at end of file diff --git a/annotations_filtered/aTSa6E4_Zgs_filtered.json b/annotations_filtered/aTSa6E4_Zgs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c5eae597a09e2f6165e08de4640f7934dca5ba07 --- /dev/null +++ b/annotations_filtered/aTSa6E4_Zgs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 39.93], [41.0, 43.23], [44.0, 46.5], [47.0, 48.36], [50.0, 53.15], [54.0, 55.46], [57.0, 58.89], [59.0, 67.83], [69.0, 72.79], [81.0, 81.31], [85.0, 86.76], [88.0, 89.04], [89.0, 93.39], [94.0, 110.96], [113.0, 113.07], [116.0, 116.38]], "keep_status": [false, true, true, false, true, false, false, true, true, false, false, false, true, true, false, false], "silence_prob": [31.46, 33.75, 33.01, 0.0, 31.17, 0.0, 0.0, 32.51, 31.58, 0.0, 0.0, 0.0, 30.81, 29.95, 0.0, 0.0], "audiomae_on_audioset": [[["cattle, bovinae", 34.89], ["moo", 20.95], ["livestock, farm animals, working animals", 19.99]], [["speech", 24.73], ["music", 12.01], ["mains hum", 6.82]], [["speech", 26.27], ["vehicle", 24.13], ["car", 6.2]], null, [["music", 11.94], ["vehicle", 10.3], ["car", 7.9]], null, null, [["music", 37.05], ["theremin", 6.13], ["synthesizer", 4.42]], [["music", 50.65], ["mains hum", 6.57], ["electronic music", 6.11]], null, null, null, [["music", 31.14], ["speech", 12.86], ["synthesizer", 6.16]], [["livestock, farm animals, working animals", 30.77], ["cattle, bovinae", 6.72], ["hum", 6.38]], null, null], "duration": [7.93, 2.23, 2.5, 1.36, 3.15, 1.46, 1.89, 8.83, 3.79, 0.31, 1.76, 1.04, 4.39, 16.96, 0.07, 0.38]} \ No newline at end of file diff --git a/annotations_filtered/aTTbCJmc3Cg_filtered.json b/annotations_filtered/aTTbCJmc3Cg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9a9ff6ab7caad902f2fce2bff0c140bf72546e36 --- /dev/null +++ b/annotations_filtered/aTTbCJmc3Cg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.95], [9.0, 10.57], [12.0, 12.38], [14.0, 16.75], [17.0, 17.81], [18.0, 19.13], [21.0, 22.0], [24.0, 24.83], [27.0, 28.27], [30.0, 31.75], [33.0, 33.47], [37.0, 37.59], [39.0, 40.96], [43.0, 45.99], [48.0, 50.19], [53.0, 54.01], [56.0, 56.98], [58.0, 58.95], [61.0, 62.33], [65.0, 65.5], [67.0, 68.17], [72.0, 72.89], [74.0, 74.8], [82.0, 82.61], [85.0, 86.24], [88.0, 88.35], [91.0, 91.79], [95.0, 95.54], [98.0, 103.49], [106.0, 107.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.95, 1.57, 0.38, 2.75, 0.81, 1.13, 1.0, 0.83, 1.27, 1.75, 0.47, 0.59, 1.96, 2.99, 2.19, 1.01, 0.98, 0.95, 1.33, 0.5, 1.17, 0.89, 0.8, 0.61, 1.24, 0.35, 0.79, 0.54, 5.49, 1.77]} \ No newline at end of file diff --git a/annotations_filtered/aTaX_L7msxs_filtered.json b/annotations_filtered/aTaX_L7msxs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a08802423cf82dc6dc5153ce285060c9485adca5 --- /dev/null +++ b/annotations_filtered/aTaX_L7msxs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.26], [5.0, 6.59], [8.0, 8.99], [15.0, 16.17], [18.0, 18.86], [20.0, 20.41], [54.0, 55.38], [60.0, 60.15], [62.0, 62.24], [66.0, 65.96], [70.0, 71.49], [72.0, 72.52], [75.0, 75.02], [81.0, 81.08], [83.0, 91.44], [92.0, 92.16], [93.0, 93.82], [95.0, 94.93], [95.0, 95.49], [98.0, 97.98], [99.0, 101.95], [105.0, 105.92], [107.0, 107.74], [110.0, 111.27], [112.0, 112.58], [116.0, 116.38], [117.0, 117.32], [120.0, 119.94], [121.0, 122.3], [127.0, 128.29], [130.0, 130.65], [134.0, 134.38], [139.0, 139.56], [140.0, 141.84], [150.0, 149.99], [150.0, 150.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [68.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.09, 0.0, 0.0, 0.0, 0.0, 0.0, 33.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 35.55], ["frog", 13.31], ["animal", 7.39]], null, null, null, null, null, [["theremin", 17.32], ["whistling", 15.03], ["music", 12.61]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.26, 1.59, 0.99, 1.17, 0.86, 0.41, 1.38, 0.15, 0.24, -0.04, 1.49, 0.52, 0.02, 0.08, 8.44, 0.16, 0.82, -0.07, 0.49, -0.02, 2.95, 0.92, 0.74, 1.27, 0.58, 0.38, 0.32, -0.06, 1.3, 1.29, 0.65, 0.38, 0.56, 1.84, -0.01, 0.3]} \ No newline at end of file diff --git a/annotations_filtered/aTc9vNCS8vo_filtered.json b/annotations_filtered/aTc9vNCS8vo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..46c90e90d64b7866fc8edf0ea50b2f42da63cc36 --- /dev/null +++ b/annotations_filtered/aTc9vNCS8vo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.43], [8.0, 9.56], [12.0, 12.87], [15.0, 14.96], [28.0, 33.44], [33.0, 33.51], [34.0, 34.33], [46.0, 51.93], [53.0, 56.24], [62.0, 80.86], [82.0, 84.13], [85.0, 86.37], [87.0, 86.75], [88.0, 88.69], [90.0, 91.1], [94.0, 94.69], [97.0, 101.01], [108.0, 109.07], [109.0, 110.71], [111.0, 119.97], [121.0, 129.25], [130.0, 131.73], [134.0, 134.01], [136.0, 137.13], [137.0, 137.42], [140.0, 140.19], [141.0, 142.99], [146.0, 145.76], [149.0, 153.15], [153.0, 155.9], [156.0, 157.98], [159.0, 159.48], [160.0, 160.84], [163.0, 163.56], [165.0, 165.62], [170.0, 171.8], [174.0, 176.39], [179.0, 179.83], [181.0, 181.03], [182.0, 182.53], [183.0, 183.88], [185.0, 185.62]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [93.45, 0.0, 0.0, 0.0, 34.35, 0.0, 0.0, 46.19, 34.0, 39.28, 80.82, 0.0, 0.0, 0.0, 0.0, 0.0, 96.42, 0.0, 0.0, 99.71, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.09, 66.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.83, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 87.01], ["radio", 5.9], ["sidetone", 3.03]], null, null, [["speech", 67.64], ["music", 5.34], ["animal", 1.76]], [["speech", 61.69], ["dog", 4.51], ["animal", 3.51]], [["speech", 55.21], ["telephone", 20.57], ["dial tone", 7.2]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["animal", 15.01], ["livestock, farm animals, working animals", 12.77], ["wild animals", 10.08]], null, null, null, null, null], "duration": [2.43, 1.56, 0.87, -0.04, 5.44, 0.51, 0.33, 5.93, 3.24, 18.86, 2.13, 1.37, -0.25, 0.69, 1.1, 0.69, 4.01, 1.07, 1.71, 8.97, 8.25, 1.73, 0.01, 1.13, 0.42, 0.19, 1.99, -0.24, 4.15, 2.9, 1.98, 0.48, 0.84, 0.56, 0.62, 1.8, 2.39, 0.83, 0.03, 0.53, 0.88, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/aTsjwO97Aow_filtered.json b/annotations_filtered/aTsjwO97Aow_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2674060cb8a6f69c597e290d8e8d8d2f5e42fade --- /dev/null +++ b/annotations_filtered/aTsjwO97Aow_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.72], [11.0, 12.01], [16.0, 15.79], [22.0, 50.31], [52.0, 52.49], [54.0, 53.79], [60.0, 60.35], [61.0, 61.77], [63.0, 63.54], [71.0, 72.6], [74.0, 73.9], [74.0, 77.63], [78.0, 78.48], [79.0, 84.21], [85.0, 86.34], [88.0, 88.35], [90.0, 97.12], [105.0, 105.92], [108.0, 109.75], [110.0, 113.49], [115.0, 116.85], [121.0, 122.89], [131.0, 131.45]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 42.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.91, 0.0, 33.55, 0.0, 0.0, 38.46, 0.0, 0.0, 58.81, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 44.67], ["music", 8.18], ["hum", 7.14]], null, null, null, null, null, null, null, [["speech", 67.27], ["thunk", 12.61], ["thump, thud", 2.58]], null, [["speech", 76.41], ["gunshot, gunfire", 4.15], ["explosion", 4.14]], null, null, [["speech", 81.25], ["explosion", 1.62], ["firecracker", 1.32]], null, null, null, null, null, null], "duration": [0.72, 1.01, -0.21, 28.31, 0.49, -0.21, 0.35, 0.77, 0.54, 1.6, -0.1, 3.63, 0.48, 5.21, 1.34, 0.35, 7.12, 0.92, 1.75, 3.49, 1.85, 1.89, 0.45]} \ No newline at end of file diff --git a/annotations_filtered/aTxu-zthTgs_filtered.json b/annotations_filtered/aTxu-zthTgs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d66192ae7bb17ee9176d1a4378df83d6d790b178 --- /dev/null +++ b/annotations_filtered/aTxu-zthTgs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 13.95], [16.0, 27.97], [31.0, 42.16], [42.0, 69.25], [71.0, 83.44]], "keep_status": [true, false, true, true, false], "silence_prob": [31.3, 31.48, 32.33, 32.89, 34.45], "audiomae_on_audioset": [[["motorcycle", 14.65], ["vehicle", 11.89], ["fly, housefly", 10.91]], [["music", 40.4], ["throbbing", 20.49], ["hum", 14.15]], [["music", 19.5], ["hum", 18.48], ["vehicle", 12.51]], [["music", 27.25], ["vehicle", 18.3], ["speech", 9.19]], [["music", 79.5], ["speech", 3.93], ["brass instrument", 1.76]]], "duration": [5.95, 11.97, 11.16, 27.25, 12.44]} \ No newline at end of file diff --git a/annotations_filtered/aU-Qp-5TsB4_filtered.json b/annotations_filtered/aU-Qp-5TsB4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f35fe6f93e39fac149ab83f8c3be3eccea308e8b --- /dev/null +++ b/annotations_filtered/aU-Qp-5TsB4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.59], [5.0, 6.32], [7.0, 8.07], [10.0, 10.52], [13.0, 14.15], [15.0, 16.26], [18.0, 19.35], [22.0, 22.76], [24.0, 24.22], [25.0, 27.99], [36.0, 38.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.86, 99.52], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [1.59, 1.32, 1.07, 0.52, 1.15, 1.26, 1.35, 0.76, 0.22, 2.99, 2.43]} \ No newline at end of file diff --git a/annotations_filtered/aU9RYKxkRJk_filtered.json b/annotations_filtered/aU9RYKxkRJk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b509256f7ff304a3e1eb35a443e833b751645e50 --- /dev/null +++ b/annotations_filtered/aU9RYKxkRJk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.16], [9.0, 9.49], [11.0, 11.89], [13.0, 13.91], [16.0, 16.83], [19.0, 20.73], [21.0, 21.3], [24.0, 26.35], [30.0, 31.08], [31.0, 33.59], [36.0, 36.68], [38.0, 39.7], [41.0, 42.7], [47.0, 48.17], [50.0, 51.07], [52.0, 52.89], [55.0, 55.27], [57.0, 57.21], [58.0, 58.5], [60.0, 61.79], [65.0, 67.61], [69.0, 69.77], [70.0, 72.17], [73.0, 75.79], [77.0, 78.7], [80.0, 81.38], [83.0, 83.67], [85.0, 85.65], [87.0, 89.02], [92.0, 98.58], [99.0, 101.71], [103.0, 103.1], [107.0, 110.19], [112.0, 112.43], [115.0, 115.06], [117.0, 117.29], [119.0, 119.82], [121.0, 122.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.52, 0.0, 97.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.9, 0.0, 97.92, 99.31, 0.0, 0.0, 0.0, 0.0, 90.95, 82.97, 81.35, 0.0, 92.8, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.16, 0.49, 0.89, 0.91, 0.83, 1.73, 0.3, 2.35, 1.08, 2.59, 0.68, 1.7, 1.7, 1.17, 1.07, 0.89, 0.27, 0.21, 0.5, 1.79, 2.61, 0.77, 2.17, 2.79, 1.7, 1.38, 0.67, 0.65, 2.02, 6.58, 2.71, 0.1, 3.19, 0.43, 0.06, 0.29, 0.82, 1.17]} \ No newline at end of file diff --git a/annotations_filtered/aUAVPdrvwoA_filtered.json b/annotations_filtered/aUAVPdrvwoA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..df0908d69943f7c6063c5f62deda72afa8657b74 --- /dev/null +++ b/annotations_filtered/aUAVPdrvwoA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.18], [7.0, 8.16], [9.0, 9.73], [11.0, 14.07], [14.0, 15.16], [16.0, 18.71], [21.0, 21.59], [25.0, 25.93], [27.0, 27.31], [29.0, 37.4], [40.0, 40.8], [42.0, 43.58], [44.0, 46.16], [47.0, 47.49], [52.0, 53.57], [59.0, 59.46], [62.0, 65.79], [66.0, 66.18], [81.0, 85.9], [90.0, 92.26], [96.0, 97.6], [100.0, 100.74]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, true, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 36.62, 0.0, 40.29, 0.0, 0.0, 0.0, 46.83, 0.0, 0.0, 34.04, 0.0, 0.0, 0.0, 30.98, 0.0, 31.72, 47.86, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 24.05], ["speech", 19.61], ["hum", 10.24]], null, [["gong", 35.21], ["music", 25.62], ["singing bowl", 11.46]], null, null, null, [["music", 48.22], ["gong", 16.39], ["singing bowl", 11.27]], null, null, [["music", 35.85], ["speech", 21.82], ["whale vocalization", 5.54]], null, null, null, [["music", 25.54], ["mains hum", 23.02], ["hum", 16.88]], null, [["music", 43.06], ["didgeridoo", 9.96], ["buzz", 8.68]], [["animal", 26.42], ["music", 11.48], ["livestock, farm animals, working animals", 5.25]], null, null], "duration": [0.18, 1.16, 0.73, 3.07, 1.16, 2.71, 0.59, 0.93, 0.31, 8.4, 0.8, 1.58, 2.16, 0.49, 1.57, 0.46, 3.79, 0.18, 4.9, 2.26, 1.6, 0.74]} \ No newline at end of file diff --git a/annotations_filtered/aUCNlDzsDH0_filtered.json b/annotations_filtered/aUCNlDzsDH0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1c23ef7b5359e1dbc01f733957c4899b698f3f25 --- /dev/null +++ b/annotations_filtered/aUCNlDzsDH0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.0], [6.0, 8.82], [10.0, 11.89], [14.0, 20.61], [24.0, 25.42], [28.0, 29.25], [31.0, 31.08], [32.0, 33.42], [37.0, 37.76], [39.0, 39.6], [40.0, 40.58], [42.0, 42.13], [43.0, 44.0], [48.0, 48.1], [50.0, 49.69], [51.0, 52.83], [54.0, 55.51], [56.0, 62.33], [63.0, 65.26], [68.0, 76.86], [78.0, 78.49], [81.0, 86.86], [87.0, 94.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [45.98, 47.16, 0.0, 39.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.76, 53.47, 40.54, 0.0, 42.02, 42.06], "audiomae_on_audioset": [[["music", 65.67], ["musical instrument", 4.64], ["didgeridoo", 3.09]], [["music", 47.68], ["didgeridoo", 14.74], ["speech", 12.92]], null, [["music", 49.47], ["theremin", 15.5], ["synthesizer", 5.82]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 60.93], ["musical instrument", 6.1], ["synthesizer", 5.27]], null, [["music", 38.55], ["synthesizer", 13.66], ["fart", 8.63]], null, [["music", 55.4], ["synthesizer", 9.14], ["musical instrument", 8.19]], [["music", 56.69], ["didgeridoo", 11.16], ["effects unit", 4.15]]], "duration": [3.0, 2.82, 1.89, 6.61, 1.42, 1.25, 0.08, 1.42, 0.76, 0.6, 0.58, 0.13, 1.0, 0.1, -0.31, 1.83, 1.51, 6.33, 2.26, 8.86, 0.49, 5.86, 7.19]} \ No newline at end of file diff --git a/annotations_filtered/aUIjcrHyvHU_filtered.json b/annotations_filtered/aUIjcrHyvHU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9fae6175b273f3643208226b09e3bd33247db6e5 --- /dev/null +++ b/annotations_filtered/aUIjcrHyvHU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.38], [25.0, 25.69], [30.0, 30.59], [44.0, 43.77], [62.0, 62.5], [78.0, 79.02], [85.0, 86.61], [90.0, 90.78]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [1.38, 0.69, 0.59, -0.23, 0.5, 1.02, 1.61, 0.78]} \ No newline at end of file diff --git a/annotations_filtered/aUNq34kNR0M_filtered.json b/annotations_filtered/aUNq34kNR0M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..55f06c89b2ee2c9b8dc2a115dd26df2f1dbf5e2a --- /dev/null +++ b/annotations_filtered/aUNq34kNR0M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.58], [28.0, 28.44], [43.0, 45.17]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 53.34], "audiomae_on_audioset": [null, null, null], "duration": [0.58, 0.44, 2.17]} \ No newline at end of file diff --git a/annotations_filtered/aURe7hHL-Dw_filtered.json b/annotations_filtered/aURe7hHL-Dw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ef70531c4f97d7a18b390ed3b53f387413fa12d --- /dev/null +++ b/annotations_filtered/aURe7hHL-Dw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.81], [18.0, 18.35], [23.0, 23.36], [28.0, 28.98], [30.0, 32.78], [33.0, 33.96], [35.0, 35.61], [39.0, 40.71], [41.0, 42.69], [43.0, 48.22], [49.0, 49.27], [50.0, 51.34], [52.0, 54.26], [55.0, 58.36], [63.0, 64.29], [65.0, 66.04], [69.0, 69.67], [75.0, 78.58]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 39.35, 0.0, 0.0, 0.0, 0.0, 38.0, 0.0, 0.0, 69.34, 50.71, 0.0, 0.0, 0.0, 46.75], "audiomae_on_audioset": [null, null, null, null, [["music", 31.02], ["thunk", 25.6], ["breaking", 15.17]], null, null, null, null, [["telephone", 41.51], ["telephone bell ringing", 15.28], ["speech", 12.47]], null, null, null, null, null, null, null, [["sine wave", 32.75], ["chirp tone", 12.9], ["busy signal", 9.04]]], "duration": [1.81, 0.35, 0.36, 0.98, 2.78, 0.96, 0.61, 1.71, 1.69, 5.22, 0.27, 1.34, 2.26, 3.36, 1.29, 1.04, 0.67, 3.58]} \ No newline at end of file diff --git a/annotations_filtered/aUWOzyo-Kec_filtered.json b/annotations_filtered/aUWOzyo-Kec_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8b49e4ca58873f99e7bb432e9e714daea4860c7f --- /dev/null +++ b/annotations_filtered/aUWOzyo-Kec_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [2.0, 2.79], [6.0, 6.61], [9.0, 10.27], [13.0, 13.26], [23.0, 26.5], [28.0, 29.12], [32.0, 32.7], [43.0, 43.66], [45.0, 45.91], [46.0, 51.14], [54.0, 55.86], [57.0, 61.05], [64.0, 64.22], [65.0, 65.4], [68.0, 67.76], [71.0, 72.4], [73.0, 73.74], [75.0, 76.08], [79.0, 79.74], [80.0, 81.18], [82.0, 86.63], [91.0, 91.71], [93.0, 93.93], [96.0, 100.79], [106.0, 107.55], [112.0, 112.08], [114.0, 115.45], [116.0, 124.41], [126.0, 126.35], [127.0, 128.55], [129.0, 130.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 94.22, 0.0, 0.0, 0.0, 0.0, 41.05, 0.0, 35.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.91, 0.0, 0.0, 35.08, 0.0, 0.0, 0.0, 90.95, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 55.11], ["sidetone", 6.07], ["music", 4.92]], null, [["speech", 76.31], ["music", 5.44], ["fart", 4.16]], null, null, null, null, null, null, null, null, [["whale vocalization", 31.13], ["music", 24.7], ["speech", 13.28]], null, null, [["speech", 63.32], ["boing", 11.5], ["thunk", 5.54]], null, null, null, null, null, null, null], "duration": [0.5, 0.79, 0.61, 1.27, 0.26, 3.5, 1.12, 0.7, 0.66, 0.91, 5.14, 1.86, 4.05, 0.22, 0.4, -0.24, 1.4, 0.74, 1.08, 0.74, 1.18, 4.63, 0.71, 0.93, 4.79, 1.55, 0.08, 1.45, 8.41, 0.35, 1.55, 1.49]} \ No newline at end of file diff --git a/annotations_filtered/aUdbjoT_DPQ_filtered.json b/annotations_filtered/aUdbjoT_DPQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..026d3399ba96537db67c1229df857b5adc82b9ea --- /dev/null +++ b/annotations_filtered/aUdbjoT_DPQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.55], [5.0, 33.22], [34.0, 35.46], [36.0, 36.42], [38.0, 46.2], [47.0, 52.88], [54.0, 66.14], [66.0, 66.8], [67.0, 91.52], [92.0, 92.92], [97.0, 97.88], [99.0, 101.04], [102.0, 121.12], [121.0, 121.15], [121.0, 121.24], [121.0, 121.29], [123.0, 124.24], [127.0, 127.77], [144.0, 145.4]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 54.5, 0.0, 0.0, 36.1, 37.73, 32.88, 0.0, 35.28, 0.0, 0.0, 32.89, 30.69, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 43.66], ["hum", 8.62], ["mains hum", 6.7]], [["music", 75.34], ["musical instrument", 3.31], ["electronic music", 1.84]], [["music", 79.36], ["musical instrument", 2.4], ["didgeridoo", 2.26]], null, [["music", 71.57], ["speech", 14.31], ["synthesizer", 1.64]], null, null, [["didgeridoo", 35.86], ["music", 25.2], ["musical instrument", 8.74]], [["music", 81.45], ["didgeridoo", 3.49], ["musical instrument", 3.1]], null, null, null, null, null, null], "duration": [0.55, 28.22, 1.46, 0.42, 8.2, 5.88, 12.14, 0.8, 24.52, 0.92, 0.88, 2.04, 19.12, 0.15, 0.24, 0.29, 1.24, 0.77, 1.4]} \ No newline at end of file diff --git a/annotations_filtered/aVCOzbRPapo_filtered.json b/annotations_filtered/aVCOzbRPapo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f14e4dc90eb9549240b40a1a76c8287b01396960 --- /dev/null +++ b/annotations_filtered/aVCOzbRPapo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.97], [13.0, 22.96], [23.0, 24.65], [25.0, 43.71], [50.0, 63.21], [65.0, 73.03], [74.0, 74.8], [76.0, 80.0], [81.0, 81.36], [84.0, 85.92], [86.0, 90.49], [92.0, 94.98], [96.0, 96.72], [97.0, 97.11], [98.0, 98.14], [99.0, 99.32], [100.0, 100.48], [101.0, 108.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 64.41, 0.0, 66.76, 98.1, 98.1, 0.0, 30.31, 0.0, 0.0, 30.23, 29.89, 0.0, 0.0, 0.0, 0.0, 0.0, 30.88], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["didgeridoo", 34.91], ["speech", 26.15], ["music", 9.89]], null, null, [["mains hum", 31.98], ["hum", 22.63], ["speech", 15.46]], [["speech", 55.38], ["didgeridoo", 13.06], ["music", 9.32]], null, null, null, null, null, [["music", 18.21], ["whale vocalization", 13.74], ["grunt", 3.92]]], "duration": [0.97, 9.96, 1.65, 18.71, 13.21, 8.03, 0.8, 4.0, 0.36, 1.92, 4.49, 2.98, 0.72, 0.11, 0.14, 0.32, 0.48, 7.92]} \ No newline at end of file diff --git a/annotations_filtered/aVHgGXnna94_filtered.json b/annotations_filtered/aVHgGXnna94_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f9b7a1b200628116928bef5708b5c6bfc62408c --- /dev/null +++ b/annotations_filtered/aVHgGXnna94_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.25], [24.0, 24.8], [26.0, 26.6], [31.0, 36.21], [38.0, 38.64], [39.0, 39.63], [40.0, 40.74], [42.0, 46.38], [50.0, 53.42], [56.0, 58.14], [60.0, 61.11], [65.0, 72.39], [73.0, 74.76], [77.0, 89.51], [93.0, 105.93], [112.0, 112.4], [115.0, 130.98], [133.0, 151.16], [152.0, 155.29], [159.0, 159.21], [160.0, 161.35], [162.0, 164.93], [166.0, 167.78], [169.0, 170.23], [171.0, 176.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 37.16, 0.0, 0.0, 0.0, 73.21, 74.92, 56.63, 0.0, 31.9, 0.0, 31.09, 31.17, 0.0, 31.75, 30.43, 100.0, 0.0, 0.0, 39.78, 0.0, 0.0, 74.44], "audiomae_on_audioset": [null, null, null, [["music", 47.85], ["musical instrument", 15.49], ["synthesizer", 8.54]], null, null, null, null, null, null, null, [["mains hum", 31.07], ["hum", 27.78], ["music", 10.02]], null, [["music", 67.1], ["hum", 6.6], ["throbbing", 4.32]], [["music", 86.88], ["musical instrument", 2.6], ["scary music", 1.57]], null, [["music", 79.9], ["musical instrument", 4.12], ["didgeridoo", 2.76]], [["music", 69.67], ["theremin", 3.21], ["brass instrument", 3.01]], null, null, null, [["speech", 68.82], ["sidetone", 5.06], ["hum", 3.68]], null, null, null], "duration": [0.25, 0.8, 0.6, 5.21, 0.64, 0.63, 0.74, 4.38, 3.42, 2.14, 1.11, 7.39, 1.76, 12.51, 12.93, 0.4, 15.98, 18.16, 3.29, 0.21, 1.35, 2.93, 1.78, 1.23, 5.44]} \ No newline at end of file diff --git a/annotations_filtered/aW3-E3My-kc_filtered.json b/annotations_filtered/aW3-E3My-kc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d7617753746995143795f422e67960333cdcbcaa --- /dev/null +++ b/annotations_filtered/aW3-E3My-kc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 24.68], [28.0, 32.95], [34.0, 34.96], [37.0, 37.05], [38.0, 37.99], [38.0, 38.04], [38.0, 40.22], [45.0, 46.31], [51.0, 51.8], [53.0, 57.94], [59.0, 59.8], [64.0, 82.27], [91.0, 93.23], [97.0, 99.66], [102.0, 104.72], [120.0, 120.11], [123.0, 122.99], [125.0, 126.74], [128.0, 133.79], [141.0, 141.93], [142.0, 142.67], [143.0, 143.13], [152.0, 154.53], [159.0, 161.5], [169.0, 171.32], [177.0, 177.67], [178.0, 177.72], [178.0, 179.39]], "keep_status": [true, true, false, false, false, false, true, false, false, true, false, true, true, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false], "silence_prob": [28.78, 28.88, 0.0, 0.0, 0.0, 0.0, 29.41, 0.0, 0.0, 29.34, 0.0, 28.79, 29.85, 29.53, 29.56, 0.0, 0.0, 0.0, 29.08, 0.0, 0.0, 0.0, 29.29, 28.47, 28.7, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["creak", 21.97], ["throbbing", 19.36], ["music", 13.03]], [["hum", 25.95], ["throbbing", 25.17], ["music", 11.46]], null, null, null, null, [["music", 24.4], ["speech", 20.83], ["didgeridoo", 3.92]], null, null, [["music", 55.51], ["throbbing", 7.76], ["didgeridoo", 3.47]], null, [["speech", 28.06], ["music", 21.21], ["whack, thwack", 16.31]], [["throbbing", 19.33], ["music", 18.76], ["beatboxing", 7.25]], [["didgeridoo", 71.14], ["music", 14.71], ["musical instrument", 2.34]], [["music", 48.17], ["beatboxing", 17.26], ["didgeridoo", 12.36]], null, null, null, [["speech", 46.1], ["music", 19.35], ["throbbing", 3.51]], null, null, null, [["cattle, bovinae", 21.38], ["music", 9.92], ["throbbing", 9.26]], [["music", 55.03], ["speech", 14.92], ["electronic music", 6.59]], [["speech", 37.66], ["music", 31.67], ["explosion", 5.51]], null, null, null], "duration": [2.68, 4.95, 0.96, 0.05, -0.01, 0.04, 2.22, 1.31, 0.8, 4.94, 0.8, 18.27, 2.23, 2.66, 2.72, 0.11, -0.01, 1.74, 5.79, 0.93, 0.67, 0.13, 2.53, 2.5, 2.32, 0.67, -0.28, 1.39]} \ No newline at end of file diff --git a/annotations_filtered/aW4tjKzDEDU_filtered.json b/annotations_filtered/aW4tjKzDEDU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b5c344c0e58a546fdb8099ca73fb445aced0057c --- /dev/null +++ b/annotations_filtered/aW4tjKzDEDU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.39], [2.0, 3.2], [5.0, 5.21], [7.0, 11.28], [12.0, 13.44], [15.0, 16.75], [19.0, 19.97], [23.0, 28.51], [30.0, 31.55], [33.0, 33.37], [36.0, 36.86], [39.0, 38.96], [40.0, 40.22], [43.0, 46.11], [47.0, 48.46], [51.0, 51.41], [52.0, 52.74], [54.0, 54.94], [56.0, 56.08], [57.0, 58.83], [61.0, 61.57], [67.0, 67.58], [70.0, 75.15], [76.0, 79.39], [81.0, 85.19], [87.0, 86.86], [92.0, 94.24], [103.0, 106.05], [118.0, 117.73], [142.0, 141.96], [146.0, 150.9], [152.0, 154.47], [156.0, 157.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 98.86, 0.0, 0.0, 0.0, 56.63, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.96, 100.0, 0.0, 51.23, 54.97, 0.0, 0.0, 37.57, 77.2, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 29.48], ["speech", 25.81], ["fart", 8.11]], null, null], "duration": [0.39, 1.2, 0.21, 4.28, 1.44, 1.75, 0.97, 5.51, 1.55, 0.37, 0.86, -0.04, 0.22, 3.11, 1.46, 0.41, 0.74, 0.94, 0.08, 1.83, 0.57, 0.58, 5.15, 3.39, 4.19, -0.14, 2.24, 3.05, -0.27, -0.04, 4.9, 2.47, 1.03]} \ No newline at end of file diff --git a/annotations_filtered/aW4x-PAnrO8_filtered.json b/annotations_filtered/aW4x-PAnrO8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..27ea29d07194f86e320e25b343a1920ff386faea --- /dev/null +++ b/annotations_filtered/aW4x-PAnrO8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.69], [4.0, 3.86], [5.0, 5.1], [6.0, 7.65], [8.0, 9.66], [16.0, 21.39], [22.0, 23.23], [24.0, 24.98], [28.0, 29.29], [30.0, 37.44], [38.0, 39.68], [42.0, 42.69], [45.0, 46.4], [47.0, 48.84], [49.0, 50.6], [51.0, 52.49], [54.0, 55.63], [56.0, 58.18], [60.0, 59.81], [61.0, 61.64], [63.0, 64.59], [71.0, 76.81], [78.0, 79.07], [80.0, 84.0], [85.0, 85.68], [88.0, 89.46], [95.0, 95.57], [100.0, 101.46], [104.0, 104.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 71.87, 0.0, 0.0, 0.0, 99.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.54, 0.0, 0.0, 0.0, 67.51, 0.0, 51.82, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.69, -0.14, 0.1, 1.65, 1.66, 5.39, 1.23, 0.98, 1.29, 7.44, 1.68, 0.69, 1.4, 1.84, 1.6, 1.49, 1.63, 2.18, -0.19, 0.64, 1.59, 5.81, 1.07, 4.0, 0.68, 1.46, 0.57, 1.46, 0.16]} \ No newline at end of file diff --git a/annotations_filtered/aWIcfkvKj9Q_filtered.json b/annotations_filtered/aWIcfkvKj9Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8f8fb51ec74fa2ca843ba5022e04a6837b2ea849 --- /dev/null +++ b/annotations_filtered/aWIcfkvKj9Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.23], [5.0, 10.45], [11.0, 12.45], [13.0, 15.01], [16.0, 21.24], [22.0, 22.92], [24.0, 24.39], [25.0, 29.25], [31.0, 33.96], [35.0, 36.44], [37.0, 38.04], [40.0, 41.49], [43.0, 52.2], [53.0, 53.45], [55.0, 55.83], [56.0, 57.03], [60.0, 60.72], [61.0, 63.21], [64.0, 66.85], [68.0, 70.04], [70.0, 78.02], [78.0, 80.74], [82.0, 85.83], [87.0, 87.45], [88.0, 88.4], [89.0, 90.32], [91.0, 100.79], [102.0, 102.17], [110.0, 110.29], [111.0, 114.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [97.33, 100.0, 0.0, 93.76, 100.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 100.0, 100.0, 100.0, 100.0, 0.0, 0.0, 0.0, 99.71, 0.0, 0.0, 99.71], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.23, 5.45, 1.45, 2.01, 5.24, 0.92, 0.39, 4.25, 2.96, 1.44, 1.04, 1.49, 9.2, 0.45, 0.83, 1.03, 0.72, 2.21, 2.85, 2.04, 8.02, 2.74, 3.83, 0.45, 0.4, 1.32, 9.79, 0.17, 0.29, 3.62]} \ No newline at end of file diff --git a/annotations_filtered/aWLRULhIyCE_filtered.json b/annotations_filtered/aWLRULhIyCE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..644eb0c3414838f881e3cb28eee26308eba984ce --- /dev/null +++ b/annotations_filtered/aWLRULhIyCE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.86], [5.0, 5.78], [7.0, 6.94], [7.0, 8.34], [9.0, 11.53], [13.0, 12.85], [13.0, 14.08], [17.0, 17.9], [19.0, 31.24], [32.0, 34.1], [36.0, 36.42], [38.0, 38.55], [41.0, 41.2], [42.0, 42.42], [45.0, 45.94], [47.0, 47.68], [49.0, 50.31], [53.0, 53.43], [61.0, 61.35], [63.0, 64.05], [65.0, 65.57], [67.0, 68.2], [72.0, 72.39], [73.0, 74.85], [77.0, 77.99], [79.0, 80.35], [84.0, 84.91], [87.0, 87.69], [91.0, 91.18], [93.0, 94.27], [97.0, 96.62], [101.0, 107.77], [108.0, 108.18], [110.0, 111.23], [114.0, 114.91], [116.0, 117.98], [121.0, 121.51], [123.0, 126.55], [127.0, 129.49], [130.0, 131.7], [132.0, 133.03], [134.0, 138.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 99.99, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.38, 0.0, 0.0, 0.0, 0.0, 0.0, 97.83, 90.08, 0.0, 0.0, 94.66], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 41.64], ["speech", 23.85], ["theremin", 9.4]], null, null, null, null, null, null, null, null, null, null], "duration": [0.86, 0.78, -0.06, 1.34, 2.53, -0.15, 1.08, 0.9, 12.24, 2.1, 0.42, 0.55, 0.2, 0.42, 0.94, 0.68, 1.31, 0.43, 0.35, 1.05, 0.57, 1.2, 0.39, 1.85, 0.99, 1.35, 0.91, 0.69, 0.18, 1.27, -0.38, 6.77, 0.18, 1.23, 0.91, 1.98, 0.51, 3.55, 2.49, 1.7, 1.03, 4.08]} \ No newline at end of file diff --git a/annotations_filtered/aW_qXKNDWtU_filtered.json b/annotations_filtered/aW_qXKNDWtU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b57f429d4f048a70b9fd981e93fbb400dd890251 --- /dev/null +++ b/annotations_filtered/aW_qXKNDWtU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.07], [9.0, 10.22], [13.0, 18.37], [21.0, 22.49], [28.0, 28.73], [38.0, 38.43], [39.0, 47.73], [51.0, 50.97], [52.0, 53.45], [55.0, 56.56], [58.0, 59.19], [61.0, 61.87], [63.0, 66.87], [72.0, 72.5], [73.0, 80.27], [84.0, 84.67], [88.0, 88.32], [92.0, 92.25], [96.0, 95.67], [96.0, 98.44], [101.0, 104.43], [106.0, 108.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 98.86, 0.0, 0.0, 0.0, 96.17, 0.0, 0.0, 0.0, 0.0, 0.0, 89.36, 0.0, 87.0, 0.0, 0.0, 0.0, 0.0, 85.54, 82.97, 76.86], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.07, 1.22, 5.37, 1.49, 0.73, 0.43, 8.73, -0.03, 1.45, 1.56, 1.19, 0.87, 3.87, 0.5, 7.27, 0.67, 0.32, 0.25, -0.33, 2.44, 3.43, 2.87]} \ No newline at end of file diff --git a/annotations_filtered/aWinsyIVC3E_filtered.json b/annotations_filtered/aWinsyIVC3E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..34e2ad323c7b711a608223ef539961e3e49226ec --- /dev/null +++ b/annotations_filtered/aWinsyIVC3E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 42.08], [44.0, 53.92], [55.0, 61.64], [64.0, 65.75], [68.0, 102.37], [103.0, 103.03]], "keep_status": [false, false, true, false, false, false], "silence_prob": [0.0, 31.15, 34.11, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 34.73], ["animal", 22.16], ["music", 14.08]], [["music", 29.82], ["horse", 17.4], ["neigh, whinny", 15.88]], null, null, null], "duration": [1.08, 9.92, 6.64, 1.75, 34.37, 0.03]} \ No newline at end of file diff --git a/annotations_filtered/aWjBDI02kSE_filtered.json b/annotations_filtered/aWjBDI02kSE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dda3f6ee0c55b8ce4f3117f6a8babf0d9cfdc2ce --- /dev/null +++ b/annotations_filtered/aWjBDI02kSE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[94.0, 126.5], [129.0, 136.63], [138.0, 163.44], [164.0, 164.51], [169.0, 172.66], [175.0, 174.9], [180.0, 180.6], [188.0, 189.6], [192.0, 192.27]], "keep_status": [false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 29.91, 29.36, 0.0, 34.47, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 35.08], ["throbbing", 22.95], ["hum", 13.93]], [["music", 61.81], ["cacophony", 5.93], ["musical instrument", 2.81]], null, [["thunk", 44.64], ["speech", 16.6], ["music", 7.59]], null, null, null, null], "duration": [32.5, 7.63, 25.44, 0.51, 3.66, -0.1, 0.6, 1.6, 0.27]} \ No newline at end of file diff --git a/annotations_filtered/aWyYZ3-8oAM_filtered.json b/annotations_filtered/aWyYZ3-8oAM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb5bed0206d81f4fe5b9788325641f66fb863534 --- /dev/null +++ b/annotations_filtered/aWyYZ3-8oAM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 11.53], [12.0, 13.71], [20.0, 20.58], [22.0, 25.03], [27.0, 28.07], [29.0, 30.89], [34.0, 34.5], [35.0, 55.36], [58.0, 72.54], [73.0, 78.14], [81.0, 88.15], [89.0, 93.09], [96.0, 106.95], [110.0, 116.13], [117.0, 119.37], [119.0, 119.47], [120.0, 119.85]], "keep_status": [false, false, false, true, false, false, false, false, true, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 39.37, 0.0, 0.0, 0.0, 30.63, 31.11, 30.63, 31.93, 32.31, 29.21, 46.33, 40.9, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 36.76], ["throbbing", 20.74], ["sidetone", 12.38]], null, null, null, [["music", 79.38], ["throbbing", 3.1], ["hum", 2.8]], [["music", 55.39], ["throbbing", 5.86], ["hum", 5.04]], [["mains hum", 43.51], ["hum", 31.61], ["music", 7.55]], [["throbbing", 34.36], ["music", 29.62], ["hum", 13.99]], [["fly, housefly", 61.49], ["insect", 24.9], ["mosquito", 6.03]], [["buzz", 42.25], ["music", 19.31], ["hum", 5.57]], [["sidetone", 37.98], ["hum", 18.6], ["mains hum", 17.19]], [["sidetone", 47.87], ["speech", 27.8], ["music", 14.11]], null, null], "duration": [-0.47, 1.71, 0.58, 3.03, 1.07, 1.89, 0.5, 20.36, 14.54, 5.14, 7.15, 4.09, 10.95, 6.13, 2.37, 0.47, -0.15]} \ No newline at end of file diff --git a/annotations_filtered/aX9m-xzauMw_filtered.json b/annotations_filtered/aX9m-xzauMw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2431dbd2e502cb492cb425e3e9812cbc058a4316 --- /dev/null +++ b/annotations_filtered/aX9m-xzauMw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.51], [7.0, 29.76], [31.0, 33.42], [51.0, 52.29], [61.0, 61.13], [67.0, 67.53], [78.0, 80.55], [88.0, 88.79], [90.0, 91.0], [97.0, 98.2], [99.0, 99.37], [105.0, 105.7], [108.0, 108.36], [109.0, 112.58], [114.0, 114.67]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [31.48, 29.83, 32.56, 0.0, 0.0, 0.0, 75.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.01, 0.0], "audiomae_on_audioset": [[["music", 65.47], ["theremin", 5.26], ["musical instrument", 3.88]], [["music", 46.23], ["speech", 18.14], ["fly, housefly", 4.52]], [["music", 40.33], ["speech", 24.53], ["thunk", 5.69]], null, null, null, null, null, null, null, null, null, null, [["speech", 12.99], ["animal", 10.86], ["fart", 9.73]], null], "duration": [2.51, 22.76, 2.42, 1.29, 0.13, 0.53, 2.55, 0.79, 1.0, 1.2, 0.37, 0.7, 0.36, 3.58, 0.67]} \ No newline at end of file diff --git a/annotations_filtered/aXbf3X56rGM_filtered.json b/annotations_filtered/aXbf3X56rGM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a34bf312b0b49801de25a3ccdea0e7dc9a27a1f8 --- /dev/null +++ b/annotations_filtered/aXbf3X56rGM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.54], [4.0, 5.59], [8.0, 9.22], [10.0, 11.89], [15.0, 17.79], [19.0, 21.44], [23.0, 23.48], [25.0, 26.89], [31.0, 31.45], [34.0, 34.53], [41.0, 41.57], [47.0, 47.97], [58.0, 58.14], [60.0, 61.8], [62.0, 63.02], [66.0, 66.41], [68.0, 69.08], [70.0, 71.63], [82.0, 83.73], [86.0, 86.39], [92.0, 93.02], [96.0, 96.4], [101.0, 102.51], [104.0, 106.25], [107.0, 107.79], [110.0, 112.28], [114.0, 115.06], [116.0, 117.75], [118.0, 119.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 100.0, 99.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.82, 0.0, 98.59, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.54, 1.59, 1.22, 1.89, 2.79, 2.44, 0.48, 1.89, 0.45, 0.53, 0.57, 0.97, 0.14, 1.8, 1.02, 0.41, 1.08, 1.63, 1.73, 0.39, 1.02, 0.4, 1.51, 2.25, 0.79, 2.28, 1.06, 1.75, 1.04]} \ No newline at end of file diff --git a/annotations_filtered/aY6ZwMZqaBk_filtered.json b/annotations_filtered/aY6ZwMZqaBk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b8102dd1be7e47d2f20710e0361fdb15d24847cf --- /dev/null +++ b/annotations_filtered/aY6ZwMZqaBk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 19.11], [22.0, 22.13], [29.0, 31.13], [35.0, 37.44], [40.0, 39.75], [46.0, 50.94], [59.0, 64.23], [74.0, 78.76], [86.0, 86.53], [90.0, 91.39], [94.0, 96.3], [98.0, 99.67], [101.0, 101.16], [103.0, 102.84], [113.0, 120.43], [121.0, 124.97], [128.0, 129.12], [131.0, 131.03], [132.0, 135.57], [137.0, 150.63], [152.0, 155.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 100.0, 0.0, 100.0, 100.0, 40.09, 0.0, 0.0, 67.38, 0.0, 0.0, 0.0, 44.2, 66.88, 0.0, 0.0, 98.8, 86.09, 91.81], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 70.67], ["bouncing", 12.58], ["thunk", 5.97]], null, null, null, null, null, null, [["speech", 72.43], ["sidetone", 8.26], ["whimper", 4.93]], null, null, null, null, null, null], "duration": [1.11, 0.13, 2.13, 2.44, -0.25, 4.94, 5.23, 4.76, 0.53, 1.39, 2.3, 1.67, 0.16, -0.16, 7.43, 3.97, 1.12, 0.03, 3.57, 13.63, 3.63]} \ No newline at end of file diff --git a/annotations_filtered/aYBTp7dH_XE_filtered.json b/annotations_filtered/aYBTp7dH_XE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..83b1c0290dd9978398d880de4192a703860d3745 --- /dev/null +++ b/annotations_filtered/aYBTp7dH_XE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 63.14], [66.0, 71.44], [72.0, 77.72], [80.0, 100.41], [104.0, 105.81], [108.0, 116.33]], "keep_status": [false, true, true, true, false, true], "silence_prob": [0.0, 35.33, 36.66, 41.14, 0.0, 34.99], "audiomae_on_audioset": [null, [["music", 28.58], ["speech", 15.96], ["cattle, bovinae", 10.65]], [["music", 43.92], ["speech", 14.96], ["mains hum", 9.59]], [["music", 16.15], ["hum", 15.85], ["speech", 13.61]], null, [["hum", 25.24], ["mains hum", 18.14], ["music", 17.32]]], "duration": [38.14, 5.44, 5.72, 20.41, 1.81, 8.33]} \ No newline at end of file diff --git a/annotations_filtered/aYSdnLgl-FQ_filtered.json b/annotations_filtered/aYSdnLgl-FQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..57a6841d3d53c1fecafd7a17e2e8a4cb3a0c334c --- /dev/null +++ b/annotations_filtered/aYSdnLgl-FQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.08], [4.0, 6.47], [8.0, 10.22], [13.0, 13.9], [18.0, 18.98], [26.0, 26.0], [28.0, 31.24], [35.0, 38.6], [39.0, 41.81], [46.0, 47.14], [48.0, 49.92], [52.0, 56.12], [59.0, 59.98], [64.0, 66.28], [68.0, 68.12], [69.0, 79.19], [80.0, 81.68], [87.0, 119.7], [121.0, 123.72], [126.0, 152.19], [155.0, 156.56], [158.0, 159.53], [161.0, 165.65], [166.0, 165.69], [171.0, 171.37], [174.0, 174.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 32.92, 53.34, 0.0, 0.0, 0.0, 80.11, 82.07, 57.97, 0.0, 0.0, 50.26, 0.0, 35.8, 0.0, 29.7, 0.0, 0.0, 32.24, 28.93, 0.0, 0.0, 38.47, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 39.4], ["music", 25.71], ["musical instrument", 5.48]], null, null, null, null, null, null, null, null, null, null, null, [["music", 12.56], ["guitar", 12.11], ["clang", 10.13]], null, [["thunk", 38.04], ["speech", 33.1], ["whack, thwack", 8.53]], null, null, [["music", 26.94], ["didgeridoo", 7.52], ["throat clearing", 5.98]], [["breaking", 27.99], ["music", 25.3], ["whack, thwack", 15.48]], null, null, [["speech", 40.66], ["music", 23.02], ["sonar", 8.77]], null, null, null], "duration": [0.08, 2.47, 2.22, 0.9, 0.98, 0.0, 3.24, 3.6, 2.81, 1.14, 1.92, 4.12, 0.98, 2.28, 0.12, 10.19, 1.68, 32.7, 2.72, 26.19, 1.56, 1.53, 4.65, -0.31, 0.37, 0.29]} \ No newline at end of file diff --git a/annotations_filtered/aYbNb8eaTCY_filtered.json b/annotations_filtered/aYbNb8eaTCY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb602ef9b985d73f55b8fb8ab0bc83961183b9a8 --- /dev/null +++ b/annotations_filtered/aYbNb8eaTCY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.53], [18.0, 19.8], [23.0, 24.73], [25.0, 26.35], [29.0, 29.88], [31.0, 36.56], [39.0, 52.42], [54.0, 62.14], [63.0, 64.08], [65.0, 67.1], [69.0, 69.5], [71.0, 81.97], [84.0, 97.71], [103.0, 104.26], [106.0, 108.04]], "keep_status": [false, false, false, false, false, false, false, true, false, true, false, true, false, false, true], "silence_prob": [62.78, 0.0, 0.0, 0.0, 0.0, 57.01, 45.75, 37.68, 0.0, 39.09, 0.0, 34.37, 31.44, 0.0, 34.1], "audiomae_on_audioset": [null, null, null, null, null, null, [["thunk", 55.4], ["music", 21.73], ["theremin", 7.31]], [["hum", 21.43], ["fire", 16.85], ["speech", 10.53]], null, [["speech", 22.43], ["mains hum", 7.81], ["hum", 7.23]], null, [["music", 46.67], ["theremin", 11.25], ["musical instrument", 6.46]], [["theremin", 32.0], ["music", 27.11], ["hum", 20.95]], null, [["music", 44.05], ["theremin", 10.76], ["whale vocalization", 5.63]]], "duration": [2.53, 1.8, 1.73, 1.35, 0.88, 5.56, 13.42, 8.14, 1.08, 2.1, 0.5, 10.97, 13.71, 1.26, 2.04]} \ No newline at end of file diff --git a/annotations_filtered/aYuatR0B8Uc_filtered.json b/annotations_filtered/aYuatR0B8Uc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..10e462909c82c50f79390dda9159d6c39e4cf79e --- /dev/null +++ b/annotations_filtered/aYuatR0B8Uc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.48], [6.0, 6.62], [7.0, 9.86], [11.0, 11.92], [14.0, 14.23], [15.0, 20.17], [21.0, 21.83], [27.0, 27.23], [28.0, 28.58], [30.0, 31.5], [34.0, 35.55], [37.0, 38.08], [39.0, 45.39], [49.0, 49.32], [57.0, 57.4], [70.0, 69.7], [72.0, 72.55], [74.0, 75.37], [76.0, 76.89], [78.0, 82.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [81.35, 0.0, 97.33, 0.0, 0.0, 99.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.1], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.48, 0.62, 2.86, 0.92, 0.23, 5.17, 0.83, 0.23, 0.58, 1.5, 1.55, 1.08, 6.39, 0.32, 0.4, -0.3, 0.55, 1.37, 0.89, 4.56]} \ No newline at end of file diff --git a/annotations_filtered/aYzPUa-6BLE_filtered.json b/annotations_filtered/aYzPUa-6BLE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8caf72af93d7716ec50f2e42619bcb73a97b619b --- /dev/null +++ b/annotations_filtered/aYzPUa-6BLE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 15.36], [17.0, 25.27], [27.0, 67.12], [70.0, 74.8], [80.0, 97.92], [98.0, 98.42], [98.0, 111.79]], "keep_status": [false, true, false, true, true, false, true], "silence_prob": [31.41, 31.07, 0.0, 35.12, 29.63, 0.0, 32.83], "audiomae_on_audioset": [[["music", 60.65], ["speech", 10.58], ["throbbing", 3.4]], [["music", 17.75], ["noise", 11.25], ["synthesizer", 8.07]], null, [["music", 20.82], ["mains hum", 13.14], ["hum", 11.75]], [["music", 47.28], ["vehicle", 8.72], ["car", 6.89]], null, [["music", 34.67], ["effects unit", 9.41], ["synthesizer", 5.8]]], "duration": [12.36, 8.27, 40.12, 4.8, 17.92, 0.42, 13.79]} \ No newline at end of file diff --git a/annotations_filtered/aZJG26fSy94_filtered.json b/annotations_filtered/aZJG26fSy94_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c4662b14ff23655d5c000b6b6781ae71a02d3470 --- /dev/null +++ b/annotations_filtered/aZJG26fSy94_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.76], [12.0, 12.9], [17.0, 18.1], [24.0, 23.9], [24.0, 27.9], [28.0, 32.39], [38.0, 37.86], [61.0, 66.51], [87.0, 92.23], [104.0, 104.19], [109.0, 114.76]], "keep_status": [false, false, false, false, true, true, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.73, 38.03, 0.0, 30.42, 31.45, 0.0, 32.91], "audiomae_on_audioset": [null, null, null, null, [["whale vocalization", 26.27], ["livestock, farm animals, working animals", 20.47], ["moo", 14.31]], [["drip", 9.13], ["whale vocalization", 8.05], ["music", 8.03]], null, [["rumble", 18.34], ["explosion", 10.26], ["speech", 7.66]], [["music", 22.71], ["hum", 8.77], ["explosion", 7.72]], null, [["sheep", 66.97], ["bleat", 11.9], ["animal", 5.96]]], "duration": [1.76, 0.9, 1.1, -0.1, 3.9, 4.39, -0.14, 5.51, 5.23, 0.19, 5.76]} \ No newline at end of file diff --git a/annotations_filtered/aZbGlkGWiZc_filtered.json b/annotations_filtered/aZbGlkGWiZc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5cbe64509533afc70f775ce89ac66e9ce08bbd6b --- /dev/null +++ b/annotations_filtered/aZbGlkGWiZc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.68], [7.0, 7.84], [9.0, 9.29], [17.0, 18.27], [19.0, 21.05], [21.0, 32.85], [34.0, 35.14], [36.0, 36.22], [37.0, 40.41], [42.0, 44.36], [47.0, 69.92], [72.0, 101.88], [104.0, 104.92], [109.0, 110.52], [113.0, 123.84]], "keep_status": [false, false, false, false, true, true, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.47, 29.59, 0.0, 0.0, 44.69, 38.83, 29.77, 29.38, 0.0, 0.0, 32.15], "audiomae_on_audioset": [null, null, null, null, [["music", 39.73], ["speech", 12.02], ["house music", 7.49]], [["music", 44.43], ["throbbing", 13.38], ["hum", 6.68]], null, null, [["music", 82.6], ["synthesizer", 3.57], ["musical instrument", 1.76]], [["music", 80.08], ["synthesizer", 7.28], ["musical instrument", 5.65]], [["music", 70.45], ["house music", 6.22], ["electronic dance music", 5.63]], [["music", 40.48], ["speech", 7.79], ["electronic music", 6.53]], null, null, [["sidetone", 31.79], ["music", 25.18], ["speech", 9.28]]], "duration": [0.68, 0.84, 0.29, 1.27, 2.05, 11.85, 1.14, 0.22, 3.41, 2.36, 22.92, 29.88, 0.92, 1.52, 10.84]} \ No newline at end of file diff --git a/annotations_filtered/aZe77wShCbE_filtered.json b/annotations_filtered/aZe77wShCbE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..000f74b50f4dc85f67a757313087330f81629ff6 --- /dev/null +++ b/annotations_filtered/aZe77wShCbE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 50.45], [51.0, 51.48], [54.0, 54.19], [56.0, 56.52], [58.0, 60.79], [66.0, 66.88], [68.0, 79.79], [82.0, 83.0], [83.0, 83.66], [85.0, 86.19], [86.0, 87.27], [88.0, 94.22], [97.0, 97.55], [98.0, 104.68], [106.0, 105.95], [106.0, 116.41], [118.0, 119.45], [124.0, 123.79]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [29.82, 0.0, 0.0, 0.0, 40.88, 0.0, 31.69, 0.0, 0.0, 0.0, 0.0, 33.09, 0.0, 29.33, 0.0, 49.4, 0.0, 0.0], "audiomae_on_audioset": [[["music", 77.42], ["musical instrument", 3.22], ["angry music", 2.63]], null, null, null, [["music", 63.9], ["synthesizer", 8.5], ["speech", 3.72]], null, [["mains hum", 23.17], ["music", 23.14], ["hum", 21.83]], null, null, null, null, [["music", 66.9], ["synthesizer", 12.09], ["musical instrument", 10.05]], null, [["music", 73.08], ["theremin", 3.51], ["musical instrument", 2.58]], null, [["music", 40.01], ["ambient music", 9.83], ["singing bowl", 6.94]], null, null], "duration": [22.45, 0.48, 0.19, 0.52, 2.79, 0.88, 11.79, 1.0, 0.66, 1.19, 1.27, 6.22, 0.55, 6.68, -0.05, 10.41, 1.45, -0.21]} \ No newline at end of file diff --git a/annotations_filtered/aZiDvfhRpz4_filtered.json b/annotations_filtered/aZiDvfhRpz4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9244263890bfeb27cc5723ccdc175abd50f6db25 --- /dev/null +++ b/annotations_filtered/aZiDvfhRpz4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 68.72]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [65.72]} \ No newline at end of file diff --git a/annotations_filtered/a_4TTRfXkgk_filtered.json b/annotations_filtered/a_4TTRfXkgk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b8033b530d81db1ac581283747cb93a9ad66cb88 --- /dev/null +++ b/annotations_filtered/a_4TTRfXkgk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.51], [16.0, 17.12], [19.0, 18.86], [21.0, 21.25], [22.0, 22.71], [24.0, 24.38], [28.0, 29.17], [30.0, 32.43], [40.0, 42.11], [42.0, 43.83], [46.0, 47.48], [48.0, 49.11], [53.0, 53.94], [55.0, 55.17], [58.0, 58.9], [60.0, 60.24], [62.0, 64.93], [65.0, 65.94], [67.0, 68.07], [70.0, 70.56], [73.0, 74.43], [75.0, 77.19], [81.0, 83.3], [88.0, 89.23], [91.0, 95.49], [96.0, 99.81], [103.0, 108.03], [110.0, 112.97], [114.0, 115.05], [116.0, 128.58]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, true, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.83, 37.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.23, 0.0, 0.0, 0.0, 0.0, 77.2, 35.37, 0.0, 36.94, 37.11, 42.17, 38.88, 0.0, 37.69], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["civil defense siren", 13.84], ["vehicle", 12.25], ["car", 6.04]], [["artillery fire", 23.12], ["speech", 17.25], ["whip", 10.27]], null, null, null, null, null, null, null, [["animal", 16.14], ["skateboard", 15.28], ["mosquito", 5.3]], null, null, null, null, null, [["music", 19.82], ["theremin", 12.51], ["scary music", 4.58]], null, [["mains hum", 29.01], ["hum", 15.8], ["speech", 11.83]], [["speech", 27.92], ["music", 16.97], ["musical instrument", 6.39]], [["cattle, bovinae", 32.64], ["livestock, farm animals, working animals", 31.33], ["moo", 29.79]], [["moo", 29.73], ["cattle, bovinae", 25.38], ["livestock, farm animals, working animals", 21.89]], null, [["music", 33.71], ["speech", 20.05], ["theremin", 6.65]]], "duration": [1.51, 1.12, -0.14, 0.25, 0.71, 0.38, 1.17, 2.43, 2.11, 1.83, 1.48, 1.11, 0.94, 0.17, 0.9, 0.24, 2.93, 0.94, 1.07, 0.56, 1.43, 2.19, 2.3, 1.23, 4.49, 3.81, 5.03, 2.97, 1.05, 12.58]} \ No newline at end of file diff --git a/annotations_filtered/a_6tguZWgmU_filtered.json b/annotations_filtered/a_6tguZWgmU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8fb69ba8152c9de3a62d8b6f69832ecd26855654 --- /dev/null +++ b/annotations_filtered/a_6tguZWgmU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[44.0, 58.21], [60.0, 59.56], [61.0, 64.99], [67.0, 81.31], [88.0, 119.94]], "keep_status": [false, false, true, false, false], "silence_prob": [29.59, 0.0, 29.24, 29.57, 0.0], "audiomae_on_audioset": [[["music", 70.04], ["boing", 4.28], ["synthesizer", 2.97]], null, [["vehicle", 29.84], ["skidding", 18.43], ["car", 17.65]], [["music", 72.49], ["synthesizer", 6.95], ["sound effect", 2.73]], null], "duration": [14.21, -0.44, 3.99, 14.31, 31.94]} \ No newline at end of file diff --git a/annotations_filtered/a_9dO9k2TPQ_filtered.json b/annotations_filtered/a_9dO9k2TPQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/a_9dO9k2TPQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/a_DO8nd7FeA_filtered.json b/annotations_filtered/a_DO8nd7FeA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2967988ee3ba931d891ece6a83a5e310248072db --- /dev/null +++ b/annotations_filtered/a_DO8nd7FeA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 38.31], [45.0, 51.36], [53.0, 54.46], [56.0, 66.99], [68.0, 73.52], [78.0, 93.61], [96.0, 102.39], [108.0, 110.74], [112.0, 123.45], [124.0, 124.44]], "keep_status": [false, true, false, true, true, false, false, false, true, false], "silence_prob": [0.0, 35.71, 0.0, 32.69, 33.53, 38.84, 58.64, 86.45, 45.82, 0.0], "audiomae_on_audioset": [null, [["music", 26.47], ["throbbing", 21.53], ["speech", 16.53]], null, [["speech", 29.1], ["music", 25.92], ["foghorn", 6.71]], [["music", 45.01], ["speech", 21.14], ["hum", 3.83]], [["livestock, farm animals, working animals", 62.77], ["cattle, bovinae", 20.18], ["moo", 16.42]], null, null, [["electric shaver, electric razor", 23.74], ["buzz", 17.1], ["hum", 8.32]], null], "duration": [36.31, 6.36, 1.46, 10.99, 5.52, 15.61, 6.39, 2.74, 11.45, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/a_DkEkfAO4s_filtered.json b/annotations_filtered/a_DkEkfAO4s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..67b2bdc3e9ab36cd6a834c247340a4a2bd4cbf16 --- /dev/null +++ b/annotations_filtered/a_DkEkfAO4s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 19.52], [23.0, 24.02], [25.0, 25.71], [28.0, 27.82], [29.0, 30.03], [31.0, 31.19], [32.0, 39.95], [42.0, 48.47], [55.0, 56.86], [59.0, 59.05], [64.0, 66.09], [75.0, 80.06], [86.0, 86.97], [89.0, 89.85], [94.0, 94.63], [98.0, 104.26], [108.0, 109.29], [123.0, 122.91], [127.0, 127.9], [134.0, 134.28], [136.0, 138.48], [145.0, 145.05], [152.0, 151.73], [159.0, 159.53], [161.0, 162.11], [174.0, 174.02], [176.0, 175.69], [178.0, 180.0], [186.0, 187.68], [199.0, 198.75], [199.0, 201.07], [206.0, 206.46], [213.0, 213.7], [227.0, 228.01], [233.0, 233.58]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.44, 0.0, 0.0, 0.0, 0.0, 0.0, 29.99, 35.01, 0.0, 0.0, 62.17, 31.54, 0.0, 0.0, 0.0, 52.27, 0.0, 0.0, 0.0, 0.0, 35.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.36, 0.0, 0.0, 73.36, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 32.83], ["smash, crash", 28.59], ["breaking", 21.74]], null, null, null, null, null, [["sidetone", 23.93], ["buzz", 16.45], ["hum", 8.65]], [["explosion", 18.79], ["speech", 16.59], ["hum", 8.63]], null, null, null, [["music", 19.4], ["roar", 13.37], ["animal", 5.28]], null, null, null, null, null, null, null, null, [["moo", 27.98], ["cattle, bovinae", 25.55], ["livestock, farm animals, working animals", 24.51]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.52, 1.02, 0.71, -0.18, 1.03, 0.19, 7.95, 6.47, 1.86, 0.05, 2.09, 5.06, 0.97, 0.85, 0.63, 6.26, 1.29, -0.09, 0.9, 0.28, 2.48, 0.05, -0.27, 0.53, 1.11, 0.02, -0.31, 2.0, 1.68, -0.25, 2.07, 0.46, 0.7, 1.01, 0.58]} \ No newline at end of file diff --git a/annotations_filtered/a_UjNi8M_bw_filtered.json b/annotations_filtered/a_UjNi8M_bw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d27df93c13c5537627bbab80a20950df10c1382b --- /dev/null +++ b/annotations_filtered/a_UjNi8M_bw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.18], [10.0, 13.71], [16.0, 16.97], [18.0, 48.95], [50.0, 95.99], [101.0, 100.89]], "keep_status": [true, false, false, false, false, false], "silence_prob": [29.07, 29.33, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["breaking", 32.84], ["music", 26.8], ["whack, thwack", 7.45]], [["mains hum", 44.12], ["hum", 30.82], ["music", 5.83]], null, null, null, null], "duration": [2.18, 3.71, 0.97, 30.95, 45.99, -0.11]} \ No newline at end of file diff --git a/annotations_filtered/a_VIjZa76jI_filtered.json b/annotations_filtered/a_VIjZa76jI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..78330095a29ba96be26b1d8db5c6db96de3533bd --- /dev/null +++ b/annotations_filtered/a_VIjZa76jI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 31.31], [36.0, 36.9], [41.0, 41.67], [46.0, 46.53], [48.0, 53.77], [56.0, 56.66], [57.0, 71.07], [72.0, 73.82]], "keep_status": [false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 29.33, 0.0, 30.39, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 43.03], ["speech", 24.2], ["crowd", 5.67]], null, [["music", 35.71], ["speech", 27.93], ["throbbing", 5.01]], null], "duration": [0.31, 0.9, 0.67, 0.53, 5.77, 0.66, 14.07, 1.82]} \ No newline at end of file diff --git a/annotations_filtered/a_aZ01raOoI_filtered.json b/annotations_filtered/a_aZ01raOoI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18a4c94fa32f7035dd14250f2cba2fe57e8b23b4 --- /dev/null +++ b/annotations_filtered/a_aZ01raOoI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.45], [11.0, 11.96], [15.0, 18.37], [35.0, 35.45], [41.0, 44.34], [46.0, 46.16], [53.0, 52.89], [58.0, 58.18], [68.0, 68.1], [80.0, 80.45], [85.0, 85.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 38.2, 0.0, 54.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 78.75], ["boing", 4.71], ["didgeridoo", 4.24]], null, null, null, null, null, null, null, null], "duration": [0.45, 0.96, 3.37, 0.45, 3.34, 0.16, -0.11, 0.18, 0.1, 0.45, 0.92]} \ No newline at end of file diff --git a/annotations_filtered/a_hsjTExzbw_filtered.json b/annotations_filtered/a_hsjTExzbw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a15b41f6fcc7cb88fc7f5e4f98f43f680b2253b --- /dev/null +++ b/annotations_filtered/a_hsjTExzbw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 24.53], [26.0, 26.65], [32.0, 32.64], [36.0, 35.92], [38.0, 47.49], [51.0, 51.17], [61.0, 65.13], [67.0, 86.7], [90.0, 117.85]], "keep_status": [false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.85, 0.0, 33.84, 31.26, 30.51], "audiomae_on_audioset": [null, null, null, null, [["music", 53.29], ["hum", 8.59], ["mains hum", 5.07]], null, [["music", 49.46], ["hum", 22.76], ["throbbing", 16.54]], [["music", 60.21], ["speech", 6.51], ["hum", 3.76]], [["music", 72.24], ["speech", 3.8], ["electronic music", 1.9]]], "duration": [0.53, 0.65, 0.64, -0.08, 9.49, 0.17, 4.13, 19.7, 27.85]} \ No newline at end of file diff --git a/annotations_filtered/a_i-mCZH5bo_filtered.json b/annotations_filtered/a_i-mCZH5bo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9013d87bf1a70bbb5b7e017ec3d63c702e388a0 --- /dev/null +++ b/annotations_filtered/a_i-mCZH5bo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 16.39], [17.0, 25.81], [32.0, 50.87], [54.0, 67.15], [68.0, 69.31], [72.0, 77.94], [85.0, 98.61], [99.0, 100.26], [101.0, 123.23], [126.0, 134.18], [135.0, 138.0]], "keep_status": [true, false, false, true, false, true, true, false, true, false, false], "silence_prob": [31.15, 32.87, 33.85, 32.82, 0.0, 34.41, 31.52, 0.0, 31.96, 33.98, 100.0], "audiomae_on_audioset": [[["hum", 21.12], ["music", 14.96], ["mains hum", 14.53]], [["throbbing", 53.8], ["hum", 29.68], ["mains hum", 9.18]], [["music", 66.69], ["electronic music", 7.16], ["throbbing", 5.55]], [["music", 47.66], ["hum", 9.57], ["mains hum", 9.08]], null, [["speech", 46.59], ["music", 16.05], ["fly, housefly", 5.13]], [["hum", 28.19], ["music", 22.9], ["mains hum", 13.96]], null, [["livestock, farm animals, working animals", 29.37], ["cattle, bovinae", 16.86], ["music", 11.02]], [["clang", 36.59], ["ding", 31.71], ["single-lens reflex camera", 8.69]], null], "duration": [16.39, 8.81, 18.87, 13.15, 1.31, 5.94, 13.61, 1.26, 22.23, 8.18, 3.0]} \ No newline at end of file diff --git a/annotations_filtered/a_iEYXLXbjY_filtered.json b/annotations_filtered/a_iEYXLXbjY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e564551477ea60276bbdc4654c3ec0a17450112f --- /dev/null +++ b/annotations_filtered/a_iEYXLXbjY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.32], [4.0, 4.9], [10.0, 12.45], [16.0, 16.23], [19.0, 19.72], [20.0, 20.87], [22.0, 22.71], [23.0, 24.9], [27.0, 27.5], [30.0, 30.84], [36.0, 38.35], [40.0, 50.57], [52.0, 53.23], [54.0, 56.88], [61.0, 61.94], [73.0, 79.29], [81.0, 86.9], [88.0, 88.26], [93.0, 93.93], [94.0, 96.63], [100.0, 101.21], [102.0, 103.94], [107.0, 134.45], [136.0, 136.95], [145.0, 146.06], [147.0, 147.29], [150.0, 150.48], [154.0, 154.28]], "keep_status": [false, false, true, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 37.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.4, 31.65, 0.0, 56.03, 0.0, 99.99, 46.33, 0.0, 0.0, 44.26, 0.0, 0.0, 30.36, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["moo", 29.82], ["cattle, bovinae", 18.95], ["livestock, farm animals, working animals", 5.51]], null, null, null, null, null, null, null, [["music", 10.19], ["moo", 6.83], ["speech", 6.06]], [["whack, thwack", 35.76], ["speech", 21.1], ["fly, housefly", 6.6]], null, null, null, null, [["music", 54.21], ["thunk", 16.41], ["hum", 2.83]], null, null, [["speech", 28.19], ["music", 19.66], ["gong", 12.71]], null, null, [["music", 79.43], ["psychedelic rock", 3.76], ["punk rock", 1.9]], null, null, null, null, null], "duration": [0.32, 0.9, 2.45, 0.23, 0.72, 0.87, 0.71, 1.9, 0.5, 0.84, 2.35, 10.57, 1.23, 2.88, 0.94, 6.29, 5.9, 0.26, 0.93, 2.63, 1.21, 1.94, 27.45, 0.95, 1.06, 0.29, 0.48, 0.28]} \ No newline at end of file diff --git a/annotations_filtered/a_z4IuxAqpE_filtered.json b/annotations_filtered/a_z4IuxAqpE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ff09052a871d6de4ad1501f450da3dd740922479 --- /dev/null +++ b/annotations_filtered/a_z4IuxAqpE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.75], [3.0, 8.24], [9.0, 26.1], [28.0, 28.43], [29.0, 29.83], [32.0, 31.94], [32.0, 45.08], [46.0, 118.56], [124.0, 125.66], [132.0, 131.97], [134.0, 135.08], [135.0, 135.63], [136.0, 141.03], [147.0, 157.17], [159.0, 160.93]], "keep_status": [false, false, true, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 55.6, 35.13, 0.0, 0.0, 0.0, 33.85, 0.0, 0.0, 0.0, 0.0, 0.0, 32.01, 30.58, 0.0], "audiomae_on_audioset": [null, null, [["music", 38.15], ["speech", 21.93], ["hum", 5.33]], null, null, null, [["speech", 29.41], ["livestock, farm animals, working animals", 10.48], ["cattle, bovinae", 8.16]], null, null, null, null, null, [["speech", 72.3], ["music", 10.6], ["explosion", 1.78]], [["speech", 71.76], ["music", 7.11], ["hum", 2.69]], null], "duration": [-0.25, 5.24, 17.1, 0.43, 0.83, -0.06, 13.08, 72.56, 1.66, -0.03, 1.08, 0.63, 5.03, 10.17, 1.93]} \ No newline at end of file diff --git a/annotations_filtered/aa0NlkF7Rug_filtered.json b/annotations_filtered/aa0NlkF7Rug_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97eae174bd75a070cf43fbdf7bdc903afcfa09e6 --- /dev/null +++ b/annotations_filtered/aa0NlkF7Rug_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.94], [1.0, 1.07], [1.0, 17.71], [20.0, 28.93], [29.0, 29.94], [30.0, 50.06], [54.0, 66.82], [68.0, 92.4], [96.0, 98.47]], "keep_status": [false, false, true, true, false, true, true, true, true], "silence_prob": [0.0, 0.0, 35.41, 33.53, 0.0, 30.0, 29.58, 30.73, 29.67], "audiomae_on_audioset": [null, null, [["electric shaver, electric razor", 35.41], ["noise", 13.26], ["speech", 9.92]], [["livestock, farm animals, working animals", 22.35], ["whale vocalization", 13.21], ["cattle, bovinae", 11.57]], null, [["music", 17.58], ["speech", 16.68], ["didgeridoo", 14.11]], [["speech", 40.88], ["knock", 10.72], ["music", 10.49]], [["speech", 46.44], ["music", 9.06], ["animal", 7.33]], [["fly, housefly", 30.73], ["insect", 17.58], ["bee, wasp, etc.", 11.53]]], "duration": [-0.06, 0.07, 16.71, 8.93, 0.94, 20.06, 12.82, 24.4, 2.47]} \ No newline at end of file diff --git a/annotations_filtered/aa2agiADM04_filtered.json b/annotations_filtered/aa2agiADM04_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..47f9db8eee70a2209bd92a3ec02c57a5637ebfa7 --- /dev/null +++ b/annotations_filtered/aa2agiADM04_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.25], [13.0, 13.36], [14.0, 15.42], [17.0, 18.54], [21.0, 21.68], [25.0, 32.21], [35.0, 47.22], [49.0, 49.74], [51.0, 82.7], [83.0, 83.94], [85.0, 87.94], [95.0, 95.77], [96.0, 98.59], [99.0, 101.48], [103.0, 103.71], [104.0, 110.66], [112.0, 116.77], [119.0, 136.04], [137.0, 137.69], [144.0, 150.45], [154.0, 154.38], [158.0, 167.61]], "keep_status": [false, false, false, false, false, true, false, false, false, false, true, false, false, true, false, false, true, true, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 29.2, 30.15, 0.0, 0.0, 0.0, 33.12, 0.0, 34.03, 37.06, 0.0, 29.02, 32.82, 29.06, 0.0, 29.78, 0.0, 29.26], "audiomae_on_audioset": [null, null, null, null, null, [["bow-wow", 24.76], ["animal", 23.47], ["rumble", 9.06]], [["hum", 47.09], ["throbbing", 36.05], ["music", 7.94]], null, null, null, [["fireworks", 12.82], ["explosion", 11.61], ["throbbing", 8.72]], null, [["speech", 63.31], ["rumble", 17.7], ["music", 2.92]], [["music", 26.29], ["hum", 19.01], ["ambient music", 10.12]], null, [["speech", 65.81], ["breaking", 9.94], ["music", 7.63]], [["hum", 39.71], ["throbbing", 23.48], ["mains hum", 6.11]], [["speech", 14.63], ["breaking", 14.24], ["glass", 9.12]], null, [["speech", 38.71], ["hum", 20.01], ["throbbing", 5.42]], null, [["hum", 33.41], ["speech", 31.79], ["throbbing", 11.88]]], "duration": [0.25, 0.36, 1.42, 1.54, 0.68, 7.21, 12.22, 0.74, 31.7, 0.94, 2.94, 0.77, 2.59, 2.48, 0.71, 6.66, 4.77, 17.04, 0.69, 6.45, 0.38, 9.61]} \ No newline at end of file diff --git a/annotations_filtered/aaGlVyyFOl0_filtered.json b/annotations_filtered/aaGlVyyFOl0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..91f8e79358b2371f0d10fadd5d3c940d1829c8c4 --- /dev/null +++ b/annotations_filtered/aaGlVyyFOl0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.15], [13.0, 14.0], [25.0, 26.54], [27.0, 27.33], [28.0, 28.34], [38.0, 44.85], [46.0, 48.12], [49.0, 52.24], [56.0, 57.5], [60.0, 60.61], [63.0, 63.66], [66.0, 67.73], [69.0, 70.82], [72.0, 73.28], [77.0, 78.83], [80.0, 81.89], [83.0, 84.0], [87.0, 88.25], [90.0, 91.2], [92.0, 93.23], [95.0, 95.55], [96.0, 97.23], [98.0, 97.6], [98.0, 97.63], [98.0, 102.3], [103.0, 103.55], [108.0, 108.55], [112.0, 115.28], [117.0, 118.62], [120.0, 120.51], [121.0, 121.78], [124.0, 126.57]], "keep_status": [false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 39.86, 44.01, 86.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.33, 0.0, 0.0, 47.31, 0.0, 0.0, 0.0, 99.4], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 20.79], ["screaming", 10.88], ["whack, thwack", 9.49]], [["speech", 37.78], ["sidetone", 11.85], ["frog", 3.39]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 76.64], ["speech", 9.26], ["bee, wasp, etc.", 2.36]], null, null, [["music", 43.2], ["hum", 10.75], ["ambient music", 5.09]], null, null, null, null], "duration": [0.15, 1.0, 1.54, 0.33, 0.34, 6.85, 2.12, 3.24, 1.5, 0.61, 0.66, 1.73, 1.82, 1.28, 1.83, 1.89, 1.0, 1.25, 1.2, 1.23, 0.55, 1.23, -0.4, -0.37, 4.3, 0.55, 0.55, 3.28, 1.62, 0.51, 0.78, 2.57]} \ No newline at end of file diff --git a/annotations_filtered/aaU-KRx8Zc8_filtered.json b/annotations_filtered/aaU-KRx8Zc8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..07b46383c4d95614fa514917cf234383e3608070 --- /dev/null +++ b/annotations_filtered/aaU-KRx8Zc8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.78], [8.0, 35.11], [36.0, 39.58], [41.0, 41.79], [42.0, 47.29], [52.0, 52.0], [54.0, 57.48], [60.0, 60.89], [64.0, 72.12], [73.0, 79.3], [81.0, 81.08], [83.0, 86.27], [88.0, 97.16], [98.0, 99.47], [100.0, 100.94], [103.0, 106.96], [108.0, 108.89]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 29.81, 33.53, 0.0, 33.16, 0.0, 38.14, 0.0, 30.08, 33.4, 0.0, 35.04, 31.21, 0.0, 0.0, 48.44, 0.0], "audiomae_on_audioset": [null, [["music", 25.68], ["vehicle", 24.59], ["car", 15.36]], [["speech", 41.36], ["music", 33.53], ["electronic music", 3.22]], null, [["music", 58.85], ["electronic music", 5.87], ["throbbing", 5.37]], null, [["music", 57.41], ["speech", 8.6], ["electronic music", 4.44]], null, [["music", 70.07], ["speech", 8.03], ["sidetone", 2.94]], [["hum", 28.32], ["music", 27.25], ["mains hum", 15.37]], null, [["hum", 28.32], ["music", 24.58], ["mains hum", 19.41]], [["hum", 37.45], ["throbbing", 32.12], ["mains hum", 12.87]], null, null, [["music", 63.43], ["musical instrument", 5.92], ["electronic music", 3.95]], null], "duration": [1.78, 27.11, 3.58, 0.79, 5.29, 0.0, 3.48, 0.89, 8.12, 6.3, 0.08, 3.27, 9.16, 1.47, 0.94, 3.96, 0.89]} \ No newline at end of file diff --git a/annotations_filtered/aaaIdkgVahY_filtered.json b/annotations_filtered/aaaIdkgVahY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..26883293752a87eacb6d7690dc944ed07ec84011 --- /dev/null +++ b/annotations_filtered/aaaIdkgVahY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 27.67], [30.0, 31.68], [33.0, 35.02], [36.0, 35.85], [38.0, 39.07], [40.0, 40.2], [43.0, 45.62], [47.0, 48.64], [49.0, 58.43], [65.0, 65.5], [66.0, 68.76], [71.0, 71.59], [72.0, 81.45], [83.0, 84.62], [86.0, 88.91], [89.0, 99.93], [103.0, 106.41]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 43.98, 0.0, 0.0, 0.0, 50.91, 0.0, 46.68, 0.0, 84.8, 0.0, 99.4, 0.0, 99.85, 99.98, 87.92], "audiomae_on_audioset": [null, null, [["music", 38.11], ["speech", 28.92], ["synthesizer", 4.11]], null, null, null, null, null, [["speech", 11.1], ["music", 10.41], ["thunk", 5.58]], null, null, null, null, null, null, null, null], "duration": [0.67, 1.68, 2.02, -0.15, 1.07, 0.2, 2.62, 1.64, 9.43, 0.5, 2.76, 0.59, 9.45, 1.62, 2.91, 10.93, 3.41]} \ No newline at end of file diff --git a/annotations_filtered/aak6BqNR150_filtered.json b/annotations_filtered/aak6BqNR150_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9bc8fd7791554715f004b570d7ca72a475b6fe3b --- /dev/null +++ b/annotations_filtered/aak6BqNR150_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.66], [18.0, 18.49], [19.0, 20.68], [22.0, 22.81], [31.0, 32.71], [44.0, 44.69], [47.0, 48.66], [52.0, 52.56], [62.0, 62.77], [72.0, 72.49], [82.0, 86.1], [93.0, 94.34], [100.0, 117.59], [126.0, 126.2], [135.0, 140.73], [141.0, 141.13], [153.0, 153.96], [163.0, 163.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.99, 0.0, 31.53, 0.0, 30.55, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["thunk", 41.42], ["music", 26.83], ["fly, housefly", 4.54]], null, [["music", 65.1], ["synthesizer", 7.41], ["musical instrument", 4.9]], null, [["moo", 26.67], ["cattle, bovinae", 21.96], ["groan", 9.72]], null, null, null], "duration": [1.66, 0.49, 1.68, 0.81, 1.71, 0.69, 1.66, 0.56, 0.77, 0.49, 4.1, 1.34, 17.59, 0.2, 5.73, 0.13, 0.96, 0.36]} \ No newline at end of file diff --git a/annotations_filtered/aazXc06Oycs_filtered.json b/annotations_filtered/aazXc06Oycs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c698cac7e4df8e2582eebb8f9564b342afcb1b35 --- /dev/null +++ b/annotations_filtered/aazXc06Oycs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.08], [3.0, 5.59], [24.0, 24.85], [34.0, 33.57], [42.0, 43.28], [46.0, 47.58], [49.0, 50.18], [60.0, 62.18], [74.0, 76.96], [78.0, 79.68], [83.0, 83.49], [102.0, 105.07], [107.0, 108.41], [122.0, 122.77], [123.0, 123.72], [128.0, 128.44], [132.0, 133.74], [135.0, 143.26], [149.0, 151.38], [153.0, 152.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 97.33, 0.0, 0.0, 0.0, 0.0, 0.0, 99.87, 93.29, 0.0, 0.0, 99.16, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 96.89, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.08, 2.59, 0.85, -0.43, 1.28, 1.58, 1.18, 2.18, 2.96, 1.68, 0.49, 3.07, 1.41, 0.77, 0.72, 0.44, 1.74, 8.26, 2.38, -0.05]} \ No newline at end of file diff --git a/annotations_filtered/ab4MM9cHidM_filtered.json b/annotations_filtered/ab4MM9cHidM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e202f25e1c77b71d6aebbe355ad3d812634f8d4d --- /dev/null +++ b/annotations_filtered/ab4MM9cHidM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.07], [3.0, 3.59], [4.0, 7.64], [10.0, 11.55], [13.0, 14.72], [15.0, 16.65], [18.0, 25.61], [30.0, 32.95], [34.0, 38.15], [38.0, 38.72], [39.0, 38.96], [39.0, 39.31], [44.0, 43.85], [47.0, 47.83], [51.0, 51.58], [53.0, 54.57], [66.0, 68.12], [70.0, 71.1], [75.0, 75.09], [79.0, 81.57], [85.0, 86.31], [87.0, 88.6], [89.0, 90.85], [94.0, 97.19], [100.0, 128.97], [131.0, 133.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 52.05, 0.0, 0.0, 0.0, 67.63, 60.05, 33.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.51, 0.0, 0.0, 98.51, 0.0, 0.0, 0.0, 74.76, 79.41, 64.63], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 58.08], ["sidetone", 16.77], ["radio", 11.0]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.07, 0.59, 3.64, 1.55, 1.72, 1.65, 7.61, 2.95, 4.15, 0.72, -0.04, 0.31, -0.15, 0.83, 0.58, 1.57, 2.12, 1.1, 0.09, 2.57, 1.31, 1.6, 1.85, 3.19, 28.97, 2.64]} \ No newline at end of file diff --git a/annotations_filtered/abTZPgqiEto_filtered.json b/annotations_filtered/abTZPgqiEto_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1206f041d85bf9eee083a7744cff8126d021defe --- /dev/null +++ b/annotations_filtered/abTZPgqiEto_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[85.0, 133.25]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [48.25]} \ No newline at end of file diff --git a/annotations_filtered/abXL2HrEjyE_filtered.json b/annotations_filtered/abXL2HrEjyE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..601c4cc270155fdb30db78da6fd9359ae33889a5 --- /dev/null +++ b/annotations_filtered/abXL2HrEjyE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 21.73], [23.0, 23.26], [25.0, 51.26], [53.0, 74.95], [79.0, 126.45]], "keep_status": [false, false, true, true, false], "silence_prob": [0.0, 0.0, 34.75, 29.95, 0.0], "audiomae_on_audioset": [null, null, [["hum", 13.45], ["eruption", 8.12], ["animal", 7.03]], [["animal", 37.85], ["horse", 6.6], ["music", 5.31]], null], "duration": [1.73, 0.26, 26.26, 21.95, 47.45]} \ No newline at end of file diff --git a/annotations_filtered/abgTPYfdbOE_filtered.json b/annotations_filtered/abgTPYfdbOE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec048553218ca79e829b6168ef6d4e2b814b7a96 --- /dev/null +++ b/annotations_filtered/abgTPYfdbOE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.7], [13.0, 21.47], [24.0, 25.78], [26.0, 28.61], [30.0, 30.52], [33.0, 34.01], [37.0, 37.57], [38.0, 39.61], [40.0, 45.05], [55.0, 55.7], [59.0, 59.7], [61.0, 64.18], [66.0, 67.66], [69.0, 70.17], [71.0, 72.42], [74.0, 76.0], [77.0, 91.32], [95.0, 99.86], [100.0, 111.87], [112.0, 113.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.99, 99.21, 0.0, 82.43, 0.0, 0.0, 0.0, 0.0, 99.71, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0, 100.0, 100.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.7, 8.47, 1.78, 2.61, 0.52, 1.01, 0.57, 1.61, 5.05, 0.7, 0.7, 3.18, 1.66, 1.17, 1.42, 2.0, 14.32, 4.86, 11.87, 1.83]} \ No newline at end of file diff --git a/annotations_filtered/abhF5CFFW4s_filtered.json b/annotations_filtered/abhF5CFFW4s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..35bf88cf2a24298a229f4962d0c337551f9447e6 --- /dev/null +++ b/annotations_filtered/abhF5CFFW4s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.56], [4.0, 6.76], [8.0, 9.37], [10.0, 11.48], [16.0, 17.37], [20.0, 21.2], [23.0, 27.18], [29.0, 45.91], [47.0, 49.98], [52.0, 54.3], [55.0, 61.82], [63.0, 65.82], [67.0, 68.44], [70.0, 70.66], [71.0, 72.55], [74.0, 94.0], [96.0, 98.14], [101.0, 100.84], [102.0, 115.79], [119.0, 127.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 79.94, 0.0, 0.0, 0.0, 0.0, 87.74, 91.13, 99.44, 63.21, 64.86, 99.4, 0.0, 0.0, 0.0, 69.34, 35.92, 0.0, 39.54, 36.6], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["noise", 58.88], ["speech", 14.0], ["music", 4.72]], null, [["speech", 57.24], ["cattle, bovinae", 5.05], ["livestock, farm animals, working animals", 4.9]], [["whack, thwack", 43.24], ["speech", 7.68], ["fart", 7.16]]], "duration": [1.56, 2.76, 1.37, 1.48, 1.37, 1.2, 4.18, 16.91, 2.98, 2.3, 6.82, 2.82, 1.44, 0.66, 1.55, 20.0, 2.14, -0.16, 13.79, 8.2]} \ No newline at end of file diff --git a/annotations_filtered/ac7D9kcETUg_filtered.json b/annotations_filtered/ac7D9kcETUg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..547b14215a8fca1f5fd6d935643f486b38a54005 --- /dev/null +++ b/annotations_filtered/ac7D9kcETUg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.16], [7.0, 8.48], [10.0, 10.72], [19.0, 59.36], [60.0, 76.11], [87.0, 90.86]], "keep_status": [false, false, false, false, true, true], "silence_prob": [57.4, 0.0, 0.0, 0.0, 41.62, 34.85], "audiomae_on_audioset": [null, null, null, null, [["whale vocalization", 24.83], ["speech", 18.66], ["music", 17.85]], [["speech", 49.55], ["fireworks", 4.56], ["explosion", 3.34]]], "duration": [2.16, 1.48, 0.72, 40.36, 16.11, 3.86]} \ No newline at end of file diff --git a/annotations_filtered/ac9w0rKTRPM_filtered.json b/annotations_filtered/ac9w0rKTRPM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..822e1b9e09bd8d375d4a8261b4f88a5a26c6a37c --- /dev/null +++ b/annotations_filtered/ac9w0rKTRPM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.54], [4.0, 4.28], [7.0, 8.88], [10.0, 10.99], [12.0, 16.55], [17.0, 21.24], [24.0, 25.27]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 81.53, 64.07, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [0.54, 0.28, 1.88, 0.99, 4.55, 4.24, 1.27]} \ No newline at end of file diff --git a/annotations_filtered/acO1g9PEIBM_filtered.json b/annotations_filtered/acO1g9PEIBM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..581391c0dc716d6a9882caeb8edd4fff98ee8f9c --- /dev/null +++ b/annotations_filtered/acO1g9PEIBM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.68], [18.0, 106.78], [111.0, 112.56], [114.0, 114.22]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [0.68, 88.78, 1.56, 0.22]} \ No newline at end of file diff --git a/annotations_filtered/acZDS8WDtHs_filtered.json b/annotations_filtered/acZDS8WDtHs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb22d128a04ee709f1c265f76b0d6c213ba95584 --- /dev/null +++ b/annotations_filtered/acZDS8WDtHs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[68.0, 68.28], [72.0, 81.31], [83.0, 86.95], [88.0, 88.57], [89.0, 92.3], [94.0, 99.17], [101.0, 107.13], [109.0, 117.95], [118.0, 118.08]], "keep_status": [false, true, false, false, true, true, true, true, false], "silence_prob": [0.0, 40.31, 38.9, 0.0, 34.66, 29.37, 29.65, 29.3, 0.0], "audiomae_on_audioset": [null, [["hum", 22.44], ["speech", 19.08], ["mains hum", 8.79]], [["hum", 51.65], ["mains hum", 9.63], ["throbbing", 8.91]], null, [["speech", 32.87], ["mains hum", 11.21], ["music", 10.81]], [["music", 44.68], ["speech", 9.43], ["musical instrument", 3.51]], [["music", 25.83], ["frog", 10.92], ["electric shaver, electric razor", 5.93]], [["music", 37.94], ["speech", 9.15], ["groan", 7.94]], null], "duration": [0.28, 9.31, 3.95, 0.57, 3.3, 5.17, 6.13, 8.95, 0.08]} \ No newline at end of file diff --git a/annotations_filtered/acnUb2KcgdU_filtered.json b/annotations_filtered/acnUb2KcgdU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eda2be243623409943cc6b1a6db7a2008d0101fc --- /dev/null +++ b/annotations_filtered/acnUb2KcgdU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 14.62], [19.0, 19.65], [22.0, 23.95], [28.0, 32.7], [34.0, 34.97], [36.0, 38.37], [39.0, 40.81], [47.0, 52.35], [56.0, 87.94], [99.0, 99.89], [107.0, 110.57], [112.0, 112.6], [115.0, 120.46]], "keep_status": [true, false, false, true, false, true, false, true, false, false, true, false, true], "silence_prob": [34.98, 0.0, 0.0, 32.37, 0.0, 42.81, 0.0, 32.61, 0.0, 0.0, 29.9, 0.0, 30.17], "audiomae_on_audioset": [[["hum", 43.3], ["mains hum", 13.25], ["electric shaver, electric razor", 9.66]], null, null, [["electric shaver, electric razor", 21.84], ["mains hum", 17.31], ["hum", 16.16]], null, [["speech", 11.54], ["vehicle", 8.13], ["whale vocalization", 6.56]], null, [["speech", 21.68], ["mains hum", 21.3], ["hum", 21.22]], null, null, [["mains hum", 38.88], ["hum", 13.46], ["speech", 9.49]], null, [["livestock, farm animals, working animals", 35.77], ["cattle, bovinae", 18.17], ["moo", 15.19]]], "duration": [9.62, 0.65, 1.95, 4.7, 0.97, 2.37, 1.81, 5.35, 31.94, 0.89, 3.57, 0.6, 5.46]} \ No newline at end of file diff --git a/annotations_filtered/acs2qgkCHvw_filtered.json b/annotations_filtered/acs2qgkCHvw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a4e4d28bd6ab343a0bce2a14a21a0930ecfe3eb --- /dev/null +++ b/annotations_filtered/acs2qgkCHvw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.31], [21.0, 22.87], [26.0, 32.75], [61.0, 61.47], [63.0, 63.37], [71.0, 78.95]], "keep_status": [false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 48.61, 0.0, 0.0, 54.63], "audiomae_on_audioset": [null, null, [["fly, housefly", 27.23], ["fart", 16.79], ["speech", 12.62]], null, null, null], "duration": [0.31, 1.87, 6.75, 0.47, 0.37, 7.95]} \ No newline at end of file diff --git a/annotations_filtered/ad65spfln8w_filtered.json b/annotations_filtered/ad65spfln8w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f6c3f80d658feb2148641ba1bd1be812d9dc2232 --- /dev/null +++ b/annotations_filtered/ad65spfln8w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.34], [3.0, 150.42], [153.0, 153.28], [153.0, 156.63], [164.0, 164.46]], "keep_status": [false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 35.31, 0.0], "audiomae_on_audioset": [null, null, null, [["moo", 24.31], ["music", 20.95], ["cattle, bovinae", 14.55]], null], "duration": [0.34, 147.42, 0.28, 3.63, 0.46]} \ No newline at end of file diff --git a/annotations_filtered/adFRKm9ezw4_filtered.json b/annotations_filtered/adFRKm9ezw4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5360d5e14e6592c94dbb197e90dcf64c0cda73ef --- /dev/null +++ b/annotations_filtered/adFRKm9ezw4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[61.0, 67.42], [72.0, 74.01], [78.0, 81.19], [82.0, 82.29], [86.0, 87.42], [90.0, 91.86], [95.0, 96.47], [99.0, 102.95], [106.0, 107.32], [108.0, 118.12], [122.0, 142.52], [148.0, 148.59], [153.0, 156.44], [161.0, 180.18]], "keep_status": [false, false, false, false, false, false, false, true, false, false, true, false, true, true], "silence_prob": [83.34, 74.76, 74.76, 0.0, 0.0, 0.0, 0.0, 39.78, 0.0, 32.58, 31.0, 0.0, 29.46, 33.06], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 48.89], ["theremin", 13.17], ["synthesizer", 6.17]], null, [["music", 50.55], ["theremin", 22.91], ["buzz", 2.57]], [["music", 13.35], ["hum", 10.61], ["gong", 9.27]], null, [["foghorn", 28.78], ["music", 11.82], ["reverberation", 6.55]], [["music", 34.54], ["sound effect", 5.68], ["insect", 5.19]]], "duration": [6.42, 2.01, 3.19, 0.29, 1.42, 1.86, 1.47, 3.95, 1.32, 10.12, 20.52, 0.59, 3.44, 19.18]} \ No newline at end of file diff --git a/annotations_filtered/adOO9YXZ9Ys_filtered.json b/annotations_filtered/adOO9YXZ9Ys_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..51f15e29985866c6d45de209cb82909664deca36 --- /dev/null +++ b/annotations_filtered/adOO9YXZ9Ys_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.14], [13.0, 16.44], [22.0, 23.25], [26.0, 62.18], [66.0, 146.31], [148.0, 154.94], [155.0, 155.16]], "keep_status": [true, false, false, false, false, false, false], "silence_prob": [48.35, 49.97, 0.0, 0.0, 0.0, 65.2, 0.0], "audiomae_on_audioset": [[["throbbing", 30.57], ["run", 14.4], ["heart sounds, heartbeat", 12.16]], [["speech", 30.32], ["clip-clop", 27.48], ["horse", 26.44]], null, null, null, null, null], "duration": [3.14, 3.44, 1.25, 36.18, 80.31, 6.94, 0.16]} \ No newline at end of file diff --git a/annotations_filtered/adatkf9XY44_filtered.json b/annotations_filtered/adatkf9XY44_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..80680f9213b3e76199bdeab8c65f33e3b6e74776 --- /dev/null +++ b/annotations_filtered/adatkf9XY44_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.47], [9.0, 10.94], [24.0, 24.92], [27.0, 26.62], [27.0, 28.19], [35.0, 36.0], [39.0, 40.54], [44.0, 44.15], [48.0, 58.31], [59.0, 61.05], [62.0, 67.93], [69.0, 95.27], [102.0, 107.67], [108.0, 110.13], [112.0, 113.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.72, 99.93, 52.68, 28.83, 35.78, 39.72, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 23.42], ["whack, thwack", 12.98], ["artillery fire", 11.29]], [["fly, housefly", 67.84], ["insect", 10.35], ["mosquito", 5.99]], [["speech", 37.39], ["sidetone", 26.62], ["telephone", 15.76]], null], "duration": [0.47, 1.94, 0.92, -0.38, 1.19, 1.0, 1.54, 0.15, 10.31, 2.05, 5.93, 26.27, 5.67, 2.13, 1.86]} \ No newline at end of file diff --git a/annotations_filtered/adjuOPzkpw4_filtered.json b/annotations_filtered/adjuOPzkpw4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92b71aa54383e1c0193c78c6661b17774be76e1d --- /dev/null +++ b/annotations_filtered/adjuOPzkpw4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 27.55], [28.0, 29.67], [30.0, 31.43], [34.0, 34.2], [37.0, 40.74], [42.0, 43.95], [45.0, 66.39], [72.0, 78.04], [87.0, 89.23], [91.0, 92.18], [95.0, 96.5], [106.0, 108.46], [110.0, 111.47], [113.0, 114.37], [123.0, 123.7], [127.0, 128.46], [132.0, 134.0], [135.0, 139.72], [145.0, 151.38], [152.0, 152.61], [153.0, 159.07], [173.0, 174.34], [176.0, 177.55], [181.0, 182.51], [188.0, 191.62]], "keep_status": [false, false, false, false, true, false, true, false, true, false, false, false, false, false, false, false, true, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.91, 0.0, 32.85, 34.67, 40.47, 0.0, 0.0, 34.57, 0.0, 0.0, 0.0, 0.0, 36.01, 41.85, 38.56, 0.0, 37.01, 0.0, 0.0, 0.0, 95.51], "audiomae_on_audioset": [null, null, null, null, [["music", 38.16], ["hum", 13.07], ["throbbing", 8.35]], null, [["speech", 28.36], ["music", 23.21], ["hum", 8.74]], [["music", 48.8], ["moo", 10.86], ["cattle, bovinae", 10.4]], [["music", 37.83], ["throbbing", 11.93], ["hum", 10.73]], null, null, [["music", 69.85], ["speech", 5.88], ["boom", 1.73]], null, null, null, null, [["explosion", 19.77], ["hum", 13.79], ["eruption", 10.46]], [["speech", 67.22], ["rowboat, canoe, kayak", 8.0], ["boat, water vehicle", 4.42]], [["speech", 48.49], ["vehicle", 5.1], ["hum", 5.02]], null, [["speech", 30.34], ["animal", 5.76], ["honk", 4.74]], null, null, null, null], "duration": [1.55, 1.67, 1.43, 0.2, 3.74, 1.95, 21.39, 6.04, 2.23, 1.18, 1.5, 2.46, 1.47, 1.37, 0.7, 1.46, 2.0, 4.72, 6.38, 0.61, 6.07, 1.34, 1.55, 1.51, 3.62]} \ No newline at end of file diff --git a/annotations_filtered/adxwpSdHj90_filtered.json b/annotations_filtered/adxwpSdHj90_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..810ae234695a3217947e88507e4c86c434bbb0ac --- /dev/null +++ b/annotations_filtered/adxwpSdHj90_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.97], [4.0, 4.6], [6.0, 6.74], [12.0, 13.47], [14.0, 17.09], [20.0, 20.7], [30.0, 31.09], [38.0, 38.04], [43.0, 42.97], [44.0, 44.15], [45.0, 46.53], [52.0, 53.15], [55.0, 56.46], [57.0, 61.37], [63.0, 62.94], [78.0, 80.23], [86.0, 88.59], [89.0, 89.19], [90.0, 90.81], [94.0, 94.58], [95.0, 99.76], [115.0, 114.59], [133.0, 134.03], [139.0, 139.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 60.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.48, 0.0, 72.6, 36.69, 0.0, 0.0, 0.0, 31.06, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 48.41], ["neigh, whinny", 26.89], ["horse", 9.34]], null, null, null, [["speech", 89.93], ["music", 2.74], ["synthesizer", 0.72]], null, null, null], "duration": [0.97, 0.6, 0.74, 1.47, 3.09, 0.7, 1.09, 0.04, -0.03, 0.15, 1.53, 1.15, 1.46, 4.37, -0.06, 2.23, 2.59, 0.19, 0.81, 0.58, 4.76, -0.41, 1.03, 0.5]} \ No newline at end of file diff --git a/annotations_filtered/ae-cYVuxBKI_filtered.json b/annotations_filtered/ae-cYVuxBKI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..85971bf459de59d9547bea2d81385f7065edd90e --- /dev/null +++ b/annotations_filtered/ae-cYVuxBKI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.29], [10.0, 9.75], [11.0, 19.25], [20.0, 38.8], [43.0, 58.09], [58.0, 58.45], [58.0, 126.08]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [99.88, 0.0, 58.47, 32.05, 35.46, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 62.8], ["smash, crash", 10.79], ["whack, thwack", 5.2]], [["speech", 35.66], ["music", 33.81], ["fart", 9.94]], null, null], "duration": [2.29, -0.25, 8.25, 18.8, 15.09, 0.45, 68.08]} \ No newline at end of file diff --git a/annotations_filtered/aeF3Q6eTU5k_filtered.json b/annotations_filtered/aeF3Q6eTU5k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6a4694280fdacc71f9722e94e7454310fe3d4986 --- /dev/null +++ b/annotations_filtered/aeF3Q6eTU5k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 11.96], [15.0, 16.12], [18.0, 18.77], [21.0, 21.29], [25.0, 26.99], [29.0, 40.2], [41.0, 41.44], [45.0, 45.1], [46.0, 46.67], [50.0, 59.43], [61.0, 72.3], [74.0, 77.01], [77.0, 80.84], [83.0, 84.89], [93.0, 93.7], [94.0, 95.81], [103.0, 104.21], [106.0, 106.96], [107.0, 112.02]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, true], "silence_prob": [60.42, 0.0, 0.0, 0.0, 0.0, 45.82, 0.0, 0.0, 0.0, 44.69, 35.22, 85.72, 77.03, 0.0, 0.0, 0.0, 0.0, 0.0, 38.27], "audiomae_on_audioset": [null, null, null, null, null, [["music", 59.82], ["theremin", 8.41], ["didgeridoo", 5.01]], null, null, null, [["music", 46.27], ["speech", 16.87], ["whack, thwack", 6.84]], [["speech", 18.59], ["music", 12.6], ["cattle, bovinae", 11.41]], null, null, null, null, null, null, null, [["music", 28.9], ["boing", 28.26], ["speech", 7.9]]], "duration": [4.96, 1.12, 0.77, 0.29, 1.99, 11.2, 0.44, 0.1, 0.67, 9.43, 11.3, 3.01, 3.84, 1.89, 0.7, 1.81, 1.21, 0.96, 5.02]} \ No newline at end of file diff --git a/annotations_filtered/aecYY1vUiDU_filtered.json b/annotations_filtered/aecYY1vUiDU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1301bd2b39dbebfbfcf91fd212c4728c14903b1d --- /dev/null +++ b/annotations_filtered/aecYY1vUiDU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.75], [6.0, 10.15], [18.0, 18.5], [47.0, 48.83], [57.0, 57.28], [66.0, 67.39], [68.0, 68.27], [86.0, 87.56], [88.0, 95.25], [103.0, 104.01], [115.0, 115.23], [133.0, 132.9], [136.0, 136.66], [149.0, 150.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 58.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.15, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.75, 4.15, 0.5, 1.83, 0.28, 1.39, 0.27, 1.56, 7.25, 1.01, 0.23, -0.1, 0.66, 1.92]} \ No newline at end of file diff --git a/annotations_filtered/aeneVqyoBTo_filtered.json b/annotations_filtered/aeneVqyoBTo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9d01ce48eb215770bafadf3d1b10aaa7cf81d72 --- /dev/null +++ b/annotations_filtered/aeneVqyoBTo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.39], [8.0, 9.0], [11.0, 11.43], [14.0, 18.13], [20.0, 22.13], [23.0, 25.3], [27.0, 27.65], [28.0, 55.41], [55.0, 55.49], [56.0, 55.75], [56.0, 62.26]], "keep_status": [false, false, false, false, true, true, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 30.88, 32.46, 35.01, 0.0, 30.57, 0.0, 0.0, 30.32], "audiomae_on_audioset": [null, null, null, [["music", 48.78], ["musical instrument", 18.24], ["synthesizer", 7.78]], [["noise", 13.83], ["hum", 11.64], ["music", 8.51]], [["mains hum", 14.64], ["hum", 13.96], ["music", 8.43]], null, [["speech", 24.04], ["sidetone", 12.2], ["hum", 10.29]], null, null, [["music", 26.31], ["hum", 14.96], ["mains hum", 12.04]]], "duration": [0.39, 1.0, 0.43, 4.13, 2.13, 2.3, 0.65, 27.41, 0.49, -0.25, 6.26]} \ No newline at end of file diff --git a/annotations_filtered/af1gSplQfPU_filtered.json b/annotations_filtered/af1gSplQfPU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eff0eb76fd4d3dc214ffd6222250191bad78eab0 --- /dev/null +++ b/annotations_filtered/af1gSplQfPU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 32.97], [36.0, 40.04], [43.0, 55.09], [57.0, 63.1], [64.0, 73.4], [75.0, 78.48], [79.0, 79.34], [81.0, 83.98], [86.0, 89.31], [90.0, 90.46], [91.0, 91.71], [93.0, 92.85]], "keep_status": [false, true, true, false, true, false, false, true, false, false, false, false], "silence_prob": [29.57, 29.05, 29.12, 29.44, 30.71, 42.84, 0.0, 31.04, 52.27, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 71.15], ["boing", 7.66], ["burst, pop", 1.58]], [["music", 55.11], ["boing", 6.13], ["speech", 3.37]], [["groan", 34.9], ["music", 18.99], ["cattle, bovinae", 5.12]], [["music", 44.84], ["boing", 22.49], ["speech", 3.55]], [["throbbing", 20.69], ["music", 8.72], ["hum", 8.26]], [["speech", 67.16], ["sidetone", 7.05], ["radio", 4.27]], null, [["speech", 27.48], ["animal", 16.57], ["cattle, bovinae", 12.1]], null, null, null, null], "duration": [10.97, 4.04, 12.09, 6.1, 9.4, 3.48, 0.34, 2.98, 3.31, 0.46, 0.71, -0.15]} \ No newline at end of file diff --git a/annotations_filtered/afBwkWnwlD0_filtered.json b/annotations_filtered/afBwkWnwlD0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..55ee9d1106b088fb247b5929ec01de30ebd133aa --- /dev/null +++ b/annotations_filtered/afBwkWnwlD0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.29], [7.0, 8.06], [10.0, 10.61], [12.0, 12.82], [14.0, 15.01], [18.0, 17.9], [19.0, 20.82], [23.0, 24.95], [27.0, 28.0], [29.0, 30.91], [35.0, 35.58], [36.0, 37.4], [40.0, 40.54], [45.0, 46.16], [47.0, 48.64], [53.0, 53.97], [58.0, 58.04], [60.0, 60.88], [62.0, 62.97], [66.0, 65.91], [68.0, 68.54], [71.0, 73.97], [76.0, 77.82], [80.0, 81.45], [83.0, 84.21], [90.0, 91.91], [96.0, 97.31], [102.0, 108.92], [110.0, 111.57], [113.0, 113.73], [115.0, 115.67], [116.0, 117.9], [121.0, 124.29], [126.0, 128.26], [132.0, 135.23], [138.0, 139.56], [140.0, 141.35], [142.0, 143.43], [146.0, 146.82], [153.0, 154.55], [156.0, 156.3], [162.0, 165.62], [166.0, 168.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.87, 0.0, 0.0, 0.0, 0.0, 0.0, 99.8, 0.0, 0.0, 0.0, 0.0, 70.86, 63.64, 58.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.19, 45.59], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 66.68], ["music", 8.9], ["singing bowl", 3.17]]], "duration": [0.29, 1.06, 0.61, 0.82, 1.01, -0.1, 1.82, 1.95, 1.0, 1.91, 0.58, 1.4, 0.54, 1.16, 1.64, 0.97, 0.04, 0.88, 0.97, -0.09, 0.54, 2.97, 1.82, 1.45, 1.21, 1.91, 1.31, 6.92, 1.57, 0.73, 0.67, 1.9, 3.29, 2.26, 3.23, 1.56, 1.35, 1.43, 0.82, 1.55, 0.3, 3.62, 2.32]} \ No newline at end of file diff --git a/annotations_filtered/afW8dxL3qZM_filtered.json b/annotations_filtered/afW8dxL3qZM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e596280c8459840a9a88c7ebc83509ddd324d5b --- /dev/null +++ b/annotations_filtered/afW8dxL3qZM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.54], [6.0, 7.43], [9.0, 9.53], [12.0, 18.1], [21.0, 22.49], [23.0, 23.38], [25.0, 25.34], [27.0, 35.56], [36.0, 37.03], [41.0, 53.06], [55.0, 55.95], [57.0, 64.02], [64.0, 66.21], [67.0, 68.89], [70.0, 71.59], [72.0, 73.26], [75.0, 76.35], [78.0, 82.38], [88.0, 88.1], [104.0, 105.83], [107.0, 110.83], [112.0, 114.88], [115.0, 117.12], [118.0, 123.7], [125.0, 128.33]], "keep_status": [false, false, false, false, false, false, false, true, false, true, false, true, true, false, false, false, false, false, false, false, true, true, true, true, true], "silence_prob": [0.0, 0.0, 0.0, 58.98, 0.0, 0.0, 0.0, 31.14, 0.0, 33.44, 0.0, 32.84, 35.42, 0.0, 0.0, 0.0, 0.0, 44.69, 0.0, 0.0, 39.12, 38.71, 34.57, 44.66, 34.05], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["hum", 21.29], ["mains hum", 16.24], ["animal", 4.86]], null, [["speech", 22.65], ["hum", 15.91], ["music", 9.1]], null, [["hum", 36.97], ["whale vocalization", 19.06], ["mains hum", 12.12]], [["livestock, farm animals, working animals", 20.08], ["whale vocalization", 18.09], ["music", 14.1]], null, null, null, null, [["music", 61.84], ["hum", 8.47], ["theremin", 2.22]], null, null, [["music", 22.38], ["gong", 19.87], ["hum", 9.52]], [["music", 21.55], ["speech", 21.14], ["singing bowl", 13.44]], [["whale vocalization", 29.24], ["music", 14.18], ["speech", 12.3]], [["music", 31.71], ["electronic music", 9.75], ["whale vocalization", 8.66]], [["music", 35.86], ["singing bowl", 13.85], ["electronic music", 11.35]]], "duration": [0.54, 1.43, 0.53, 6.1, 1.49, 0.38, 0.34, 8.56, 1.03, 12.06, 0.95, 7.02, 2.21, 1.89, 1.59, 1.26, 1.35, 4.38, 0.1, 1.83, 3.83, 2.88, 2.12, 5.7, 3.33]} \ No newline at end of file diff --git a/annotations_filtered/af_J2e4r328_filtered.json b/annotations_filtered/af_J2e4r328_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bdc4f6889abfcd621ceee2cd2d9ffa9aaaf9d952 --- /dev/null +++ b/annotations_filtered/af_J2e4r328_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.95], [9.0, 13.44], [15.0, 15.58], [16.0, 24.22], [26.0, 26.1], [34.0, 35.29], [48.0, 48.25], [53.0, 53.76], [59.0, 60.42], [70.0, 71.19], [73.0, 73.36], [81.0, 80.64], [82.0, 87.81], [88.0, 97.9], [101.0, 102.02], [102.0, 102.42], [106.0, 107.3]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 33.06, 0.0, 32.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.13, 30.79, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 54.59], ["throbbing", 12.59], ["didgeridoo", 5.45]], null, [["music", 49.59], ["hum", 8.08], ["mains hum", 7.55]], null, null, null, null, null, null, null, null, [["music", 29.98], ["brass instrument", 13.31], ["speech", 12.69]], [["music", 46.09], ["speech", 29.7], ["electronic music", 3.71]], null, null, null], "duration": [1.95, 4.44, 0.58, 8.22, 0.1, 1.29, 0.25, 0.76, 1.42, 1.19, 0.36, -0.36, 5.81, 9.9, 1.02, 0.42, 1.3]} \ No newline at end of file diff --git a/annotations_filtered/afnlOjES53Y_filtered.json b/annotations_filtered/afnlOjES53Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..36492e184c05d12bcad7a91e1173cf066f7c1659 --- /dev/null +++ b/annotations_filtered/afnlOjES53Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.96], [6.0, 10.47], [11.0, 17.59], [23.0, 24.51], [28.0, 35.45], [41.0, 41.91], [44.0, 45.76], [46.0, 48.12], [54.0, 54.53], [56.0, 56.91], [60.0, 60.59], [61.0, 61.67], [63.0, 75.44], [79.0, 80.47], [86.0, 89.92], [91.0, 91.52], [92.0, 94.63], [95.0, 96.16], [106.0, 107.03], [108.0, 109.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 55.67, 48.69, 0.0, 44.01, 0.0, 0.0, 39.31, 0.0, 0.0, 0.0, 0.0, 44.81, 0.0, 48.91, 0.0, 42.88, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["hum", 46.96], ["throbbing", 30.35], ["mains hum", 11.82]], null, [["sidetone", 37.91], ["hum", 25.29], ["mains hum", 11.08]], null, null, [["hum", 39.81], ["mains hum", 37.22], ["speech", 3.16]], null, null, null, null, [["hum", 46.24], ["mains hum", 23.96], ["squish", 5.3]], null, [["hum", 38.23], ["throbbing", 33.54], ["heart sounds, heartbeat", 5.75]], null, [["mains hum", 17.03], ["hum", 16.9], ["speech", 14.46]], null, null, null], "duration": [0.96, 4.47, 6.59, 1.51, 7.45, 0.91, 1.76, 2.12, 0.53, 0.91, 0.59, 0.67, 12.44, 1.47, 3.92, 0.52, 2.63, 1.16, 1.03, 1.68]} \ No newline at end of file diff --git a/annotations_filtered/ag14Ao_xO4c_filtered.json b/annotations_filtered/ag14Ao_xO4c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3585044019ef91e436a2fc4221f9803553396fbb --- /dev/null +++ b/annotations_filtered/ag14Ao_xO4c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.78], [8.0, 8.67], [10.0, 10.1], [11.0, 11.37], [12.0, 13.04], [14.0, 15.3], [19.0, 20.41], [24.0, 24.68], [26.0, 29.24], [30.0, 31.85], [33.0, 35.63], [36.0, 38.92], [39.0, 40.42], [41.0, 43.11], [45.0, 46.57], [47.0, 48.15], [52.0, 56.52], [58.0, 58.95], [60.0, 66.55], [71.0, 72.55], [74.0, 75.47], [77.0, 78.22], [80.0, 80.38], [86.0, 85.92], [87.0, 87.76], [92.0, 91.88], [95.0, 95.44], [96.0, 96.21], [100.0, 100.09], [100.0, 100.23], [101.0, 101.22], [102.0, 103.37], [107.0, 108.21], [111.0, 111.64], [118.0, 119.84], [123.0, 125.12], [128.0, 128.39], [133.0, 133.57], [144.0, 145.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 99.71, 97.64, 0.0, 87.92, 0.0, 0.0, 100.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.78, 0.67, 0.1, 0.37, 1.04, 1.3, 1.41, 0.68, 3.24, 1.85, 2.63, 2.92, 1.42, 2.11, 1.57, 1.15, 4.52, 0.95, 6.55, 1.55, 1.47, 1.22, 0.38, -0.08, 0.76, -0.12, 0.44, 0.21, 0.09, 0.23, 0.22, 1.37, 1.21, 0.64, 1.84, 2.12, 0.39, 0.57, 1.45]} \ No newline at end of file diff --git a/annotations_filtered/ag2wbvh5VDs_filtered.json b/annotations_filtered/ag2wbvh5VDs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e6dac6caedc300ff9814d4db7102c419c48af821 --- /dev/null +++ b/annotations_filtered/ag2wbvh5VDs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.12], [6.0, 9.21], [11.0, 28.29], [35.0, 66.16], [72.0, 72.01], [77.0, 90.07], [91.0, 104.14], [105.0, 106.12], [110.0, 115.03], [116.0, 119.65], [121.0, 122.17], [132.0, 132.26], [139.0, 139.5]], "keep_status": [true, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [36.56, 35.34, 30.66, 0.0, 0.0, 29.03, 28.48, 0.0, 36.7, 38.11, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 49.2], ["whale vocalization", 11.01], ["theremin", 7.37]], [["music", 52.49], ["musical instrument", 5.59], ["throbbing", 4.16]], [["music", 42.82], ["synthesizer", 13.48], ["cacophony", 6.42]], null, null, [["music", 73.12], ["hum", 7.95], ["throbbing", 3.79]], [["music", 51.98], ["speech", 14.78], ["throbbing", 7.59]], null, [["music", 51.07], ["hum", 15.12], ["throbbing", 12.77]], [["music", 67.45], ["throbbing", 4.42], ["electronic music", 4.38]], null, null, null], "duration": [3.12, 3.21, 17.29, 31.16, 0.01, 13.07, 13.14, 1.12, 5.03, 3.65, 1.17, 0.26, 0.5]} \ No newline at end of file diff --git a/annotations_filtered/agrpQQWiX48_filtered.json b/annotations_filtered/agrpQQWiX48_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..47aa3fed46c9498f368c92502ac933f08859087b --- /dev/null +++ b/annotations_filtered/agrpQQWiX48_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.34], [10.0, 10.27], [19.0, 23.99], [24.0, 47.85], [48.0, 48.36], [49.0, 54.58], [56.0, 59.85], [62.0, 65.7], [66.0, 68.23], [71.0, 71.78], [73.0, 73.84], [79.0, 80.11], [82.0, 82.19], [83.0, 89.36], [91.0, 93.33], [97.0, 97.7], [101.0, 101.58], [122.0, 121.96], [123.0, 124.5], [129.0, 129.74], [131.0, 130.72], [135.0, 135.63], [141.0, 140.58], [144.0, 144.66], [151.0, 152.09], [153.0, 160.78], [164.0, 165.99], [167.0, 168.69], [169.0, 169.87]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 73.97, 80.11, 0.0, 48.23, 69.47, 89.72, 99.76, 0.0, 0.0, 0.0, 0.0, 84.8, 75.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.6, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 58.68], ["theremin", 3.36], ["musical instrument", 3.1]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 36.47], ["speech", 12.24], ["fart", 11.49]], null, null, null], "duration": [1.34, 0.27, 4.99, 23.85, 0.36, 5.58, 3.85, 3.7, 2.23, 0.78, 0.84, 1.11, 0.19, 6.36, 2.33, 0.7, 0.58, -0.04, 1.5, 0.74, -0.28, 0.63, -0.42, 0.66, 1.09, 7.78, 1.99, 1.69, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/ah-M2AYI4Ac_filtered.json b/annotations_filtered/ah-M2AYI4Ac_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95ca31a362bb9eff7382829b320f736054ee267c --- /dev/null +++ b/annotations_filtered/ah-M2AYI4Ac_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[42.0, 43.53], [45.0, 46.6], [48.0, 50.57], [51.0, 62.38], [65.0, 67.24], [69.0, 75.44], [76.0, 76.82], [78.0, 78.49], [80.0, 81.21], [83.0, 83.17], [83.0, 84.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 71.14, 56.78, 82.43, 35.42, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 48.27], ["theremin", 23.49], ["synthesizer", 6.81]], null, null, null, null, null], "duration": [1.53, 1.6, 2.57, 11.38, 2.24, 6.44, 0.82, 0.49, 1.21, 0.17, 1.27]} \ No newline at end of file diff --git a/annotations_filtered/ah6TYuJ1iQg_filtered.json b/annotations_filtered/ah6TYuJ1iQg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/ah6TYuJ1iQg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/ah7mS9H_TOM_filtered.json b/annotations_filtered/ah7mS9H_TOM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ecc6a350faef79fed68f5e7cdb19b0da934e05a --- /dev/null +++ b/annotations_filtered/ah7mS9H_TOM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.51], [6.0, 7.13], [10.0, 11.4], [14.0, 14.59], [25.0, 25.83], [27.0, 27.67], [37.0, 37.29], [38.0, 38.18], [46.0, 48.84], [60.0, 60.25], [66.0, 66.5], [68.0, 69.7], [71.0, 73.08], [75.0, 78.54], [82.0, 83.79], [91.0, 91.84], [97.0, 97.8], [100.0, 102.1], [104.0, 113.53], [117.0, 117.02], [121.0, 120.9], [121.0, 122.82], [126.0, 130.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.71, 0.0, 0.0, 0.0, 41.54, 51.55, 0.0, 0.0, 0.0, 81.53, 95.09, 0.0, 0.0, 0.0, 90.78], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 61.72], ["didgeridoo", 10.65], ["hum", 5.13]], null, null, null, null, null, null, null, null, null, null], "duration": [0.51, 1.13, 1.4, 0.59, 0.83, 0.67, 0.29, 0.18, 2.84, 0.25, 0.5, 1.7, 2.08, 3.54, 1.79, 0.84, 0.8, 2.1, 9.53, 0.02, -0.1, 1.82, 4.59]} \ No newline at end of file diff --git a/annotations_filtered/ahCOQjOPTZw_filtered.json b/annotations_filtered/ahCOQjOPTZw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8b6eb25e002efa1281cd62a701c8833ac2618100 --- /dev/null +++ b/annotations_filtered/ahCOQjOPTZw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.0], [5.0, 6.29], [7.0, 9.36], [10.0, 32.02], [35.0, 46.79], [48.0, 54.08], [55.0, 69.94], [71.0, 74.48], [75.0, 85.89], [87.0, 138.48], [141.0, 142.13], [143.0, 151.46], [152.0, 152.85], [153.0, 153.93], [155.0, 163.49], [166.0, 170.95]], "keep_status": [false, false, false, false, false, true, true, true, true, false, false, false, false, false, true, true], "silence_prob": [64.97, 0.0, 79.59, 30.23, 30.49, 29.91, 28.58, 36.48, 34.19, 0.0, 0.0, 34.14, 0.0, 0.0, 34.85, 37.19], "audiomae_on_audioset": [null, null, null, [["didgeridoo", 42.19], ["music", 31.17], ["speech", 4.04]], [["music", 53.75], ["speech", 28.93], ["electronic music", 3.39]], [["music", 34.44], ["didgeridoo", 24.76], ["hum", 5.79]], [["music", 33.95], ["throbbing", 14.01], ["hum", 13.72]], [["music", 47.84], ["theremin", 6.98], ["whack, thwack", 5.36]], [["music", 26.75], ["speech", 13.86], ["dog", 5.0]], null, null, [["music", 50.55], ["didgeridoo", 19.02], ["musical instrument", 7.41]], null, null, [["music", 36.96], ["didgeridoo", 10.51], ["singing bowl", 9.74]], [["music", 49.94], ["synthesizer", 9.18], ["hum", 6.12]]], "duration": [2.0, 1.29, 2.36, 22.02, 11.79, 6.08, 14.94, 3.48, 10.89, 51.48, 1.13, 8.46, 0.85, 0.93, 8.49, 4.95]} \ No newline at end of file diff --git a/annotations_filtered/ahCg__rBh1Q_filtered.json b/annotations_filtered/ahCg__rBh1Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..867f971b73b147a15be19548658410d749c485b9 --- /dev/null +++ b/annotations_filtered/ahCg__rBh1Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 27.04], [29.0, 40.39], [43.0, 66.63], [70.0, 83.98], [88.0, 88.48], [93.0, 93.88], [97.0, 98.0], [100.0, 105.34], [108.0, 155.01], [156.0, 156.0]], "keep_status": [false, false, false, false, false, false, false, true, false, false], "silence_prob": [30.48, 30.44, 29.87, 36.02, 0.0, 0.0, 0.0, 31.6, 0.0, 0.0], "audiomae_on_audioset": [[["music", 74.07], ["didgeridoo", 2.83], ["musical instrument", 2.72]], [["music", 39.39], ["throbbing", 24.17], ["hum", 8.94]], [["music", 63.28], ["speech", 5.86], ["throbbing", 4.64]], [["hum", 46.5], ["music", 18.04], ["mains hum", 17.01]], null, null, null, [["music", 31.04], ["throbbing", 16.76], ["speech", 15.52]], null, null], "duration": [18.04, 11.39, 23.63, 13.98, 0.48, 0.88, 1.0, 5.34, 47.01, 0.0]} \ No newline at end of file diff --git a/annotations_filtered/ahP1JZwHSh8_filtered.json b/annotations_filtered/ahP1JZwHSh8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c07fd3a72ae73a2ffad2e82dcc6f066be37c81d1 --- /dev/null +++ b/annotations_filtered/ahP1JZwHSh8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.95], [12.0, 43.24], [46.0, 50.13], [52.0, 52.44], [52.0, 57.42], [58.0, 62.94], [64.0, 68.27], [69.0, 77.45], [79.0, 84.11], [87.0, 106.76], [113.0, 113.85], [116.0, 117.12], [128.0, 128.61], [130.0, 130.08]], "keep_status": [true, false, false, false, false, true, true, false, true, true, false, false, false, false], "silence_prob": [35.39, 0.0, 30.52, 0.0, 39.12, 31.95, 33.45, 32.74, 33.72, 30.95, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 41.39], ["foghorn", 13.24], ["fly, housefly", 6.72]], null, [["music", 60.37], ["smash, crash", 7.14], ["speech", 3.74]], null, [["speech", 61.22], ["music", 14.11], ["hum", 2.95]], [["mains hum", 28.85], ["hum", 21.25], ["music", 13.78]], [["speech", 27.7], ["hum", 19.09], ["rumble", 9.16]], [["speech", 56.11], ["hum", 9.88], ["music", 7.3]], [["speech", 27.23], ["music", 16.59], ["hum", 11.21]], [["fly, housefly", 14.61], ["hum", 11.83], ["music", 9.85]], null, null, null, null], "duration": [3.95, 31.24, 4.13, 0.44, 5.42, 4.94, 4.27, 8.45, 5.11, 19.76, 0.85, 1.12, 0.61, 0.08]} \ No newline at end of file diff --git a/annotations_filtered/ah_Egywb780_filtered.json b/annotations_filtered/ah_Egywb780_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..500b2109aeb4aef41779e029e03f2264aca09883 --- /dev/null +++ b/annotations_filtered/ah_Egywb780_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 22.32], [25.0, 30.28], [31.0, 57.35], [58.0, 60.27], [66.0, 68.37], [69.0, 72.57], [74.0, 75.71], [77.0, 78.33], [79.0, 80.45], [82.0, 88.06], [89.0, 96.55], [100.0, 101.61], [103.0, 105.17], [106.0, 108.46], [110.0, 112.92], [114.0, 121.24], [122.0, 127.23], [128.0, 130.22], [131.0, 134.11], [137.0, 139.89], [141.0, 146.13], [147.0, 147.97], [150.0, 161.35], [162.0, 164.1], [166.0, 166.36], [167.0, 168.84], [171.0, 173.37], [175.0, 177.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [71.29, 99.36, 61.37, 99.94, 99.87, 92.15, 0.0, 0.0, 0.0, 98.44, 99.87, 0.0, 99.94, 99.98, 95.51, 93.91, 99.56, 100.0, 90.95, 96.66, 98.36, 0.0, 87.0, 92.48, 0.0, 0.0, 55.74, 95.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.32, 5.28, 26.35, 2.27, 2.37, 3.57, 1.71, 1.33, 1.45, 6.06, 7.55, 1.61, 2.17, 2.46, 2.92, 7.24, 5.23, 2.22, 3.11, 2.89, 5.13, 0.97, 11.35, 2.1, 0.36, 1.84, 2.37, 2.38]} \ No newline at end of file diff --git a/annotations_filtered/ahkwQhQZWG8_filtered.json b/annotations_filtered/ahkwQhQZWG8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a447d37f514c090c3e9604174c80d9fcf5f93bd9 --- /dev/null +++ b/annotations_filtered/ahkwQhQZWG8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.08], [4.0, 5.37], [7.0, 7.99], [10.0, 12.11], [14.0, 14.99], [17.0, 17.74], [25.0, 28.02], [31.0, 32.39], [33.0, 35.45], [38.0, 39.18], [41.0, 44.19], [47.0, 52.3], [53.0, 52.95], [53.0, 58.83], [63.0, 64.83], [65.0, 67.44], [69.0, 71.54], [75.0, 76.62], [79.0, 80.86], [82.0, 87.94], [93.0, 100.57], [101.0, 108.01], [111.0, 111.37], [113.0, 113.75], [116.0, 122.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, true, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 95.64, 0.0, 0.0, 50.02, 0.0, 70.16, 0.0, 46.79, 37.47, 0.0, 34.47, 0.0, 33.47, 40.52, 0.0, 0.0, 35.42, 31.1, 30.46, 0.0, 0.0, 31.35], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 33.84], ["hum", 9.41], ["speech", 7.1]], [["music", 37.2], ["didgeridoo", 34.25], ["musical instrument", 5.39]], null, [["music", 53.25], ["musical instrument", 6.89], ["speech", 6.73]], null, [["speech", 24.41], ["music", 12.57], ["effects unit", 10.87]], [["speech", 41.54], ["music", 33.66], ["hum", 3.04]], null, null, [["foghorn", 39.47], ["music", 24.87], ["musical instrument", 6.32]], [["music", 45.56], ["speech", 6.88], ["mains hum", 5.71]], [["music", 53.29], ["foghorn", 14.6], ["speech", 6.28]], null, null, [["music", 40.32], ["buzz", 10.95], ["didgeridoo", 7.66]]], "duration": [0.08, 1.37, 0.99, 2.11, 0.99, 0.74, 3.02, 1.39, 2.45, 1.18, 3.19, 5.3, -0.05, 5.83, 1.83, 2.44, 2.54, 1.62, 1.86, 5.94, 7.57, 7.01, 0.37, 0.75, 6.05]} \ No newline at end of file diff --git a/annotations_filtered/ahuPW6_t-z0_filtered.json b/annotations_filtered/ahuPW6_t-z0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c6ccae4dd048989bba5d44f077f317900b0f458f --- /dev/null +++ b/annotations_filtered/ahuPW6_t-z0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.82], [6.0, 8.29], [10.0, 22.38], [33.0, 34.01], [44.0, 45.44], [47.0, 48.59], [52.0, 55.49], [56.0, 56.47], [60.0, 63.8], [67.0, 69.96]], "keep_status": [true, true, true, false, false, false, false, false, false, false], "silence_prob": [41.98, 39.99, 37.55, 0.0, 0.0, 0.0, 51.99, 0.0, 46.36, 53.72], "audiomae_on_audioset": [[["clang", 13.29], ["ding", 7.23], ["bell", 6.82]], [["bee, wasp, etc.", 26.07], ["fly, housefly", 20.29], ["speech", 16.84]], [["hum", 28.37], ["speech", 17.66], ["throbbing", 16.75]], null, null, null, null, null, [["crushing", 65.71], ["fart", 6.91], ["sidetone", 3.12]], null], "duration": [2.82, 2.29, 12.38, 1.01, 1.44, 1.59, 3.49, 0.47, 3.8, 2.96]} \ No newline at end of file diff --git a/annotations_filtered/ahxDiseuAak_filtered.json b/annotations_filtered/ahxDiseuAak_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ec49e992384edd844a95b7a2fffdc0632dcc10a --- /dev/null +++ b/annotations_filtered/ahxDiseuAak_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 25.25], [48.0, 49.55], [91.0, 103.06], [104.0, 105.38], [107.0, 112.77]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 59.68, 0.0, 69.34], "audiomae_on_audioset": [null, null, null, null, null], "duration": [0.25, 1.55, 12.06, 1.38, 5.77]} \ No newline at end of file diff --git a/annotations_filtered/aiJtAU0V_60_filtered.json b/annotations_filtered/aiJtAU0V_60_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1cfd10e6b60a9394d09a9a313e7c6d1e3f0036f --- /dev/null +++ b/annotations_filtered/aiJtAU0V_60_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 8.46], [9.0, 12.88], [16.0, 17.71], [19.0, 19.72], [22.0, 23.5], [32.0, 32.49], [36.0, 37.29], [40.0, 41.64], [43.0, 44.52], [52.0, 53.94], [67.0, 68.42], [77.0, 80.08], [82.0, 93.78], [95.0, 96.45], [104.0, 105.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.98, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.46, 3.88, 1.71, 0.72, 1.5, 0.49, 1.29, 1.64, 1.52, 1.94, 1.42, 3.08, 11.78, 1.45, 1.76]} \ No newline at end of file diff --git a/annotations_filtered/aiiJ0fBFjCQ_filtered.json b/annotations_filtered/aiiJ0fBFjCQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b28fbfc8e4ab238c3fe980678ae8b4f69ffe934d --- /dev/null +++ b/annotations_filtered/aiiJ0fBFjCQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.75], [3.0, 3.23], [7.0, 12.82], [15.0, 17.58], [18.0, 18.76], [22.0, 31.95], [34.0, 45.17], [46.0, 50.03], [51.0, 52.54], [54.0, 57.59], [59.0, 61.08], [62.0, 63.31], [64.0, 65.08], [67.0, 67.56], [69.0, 69.08], [72.0, 73.63], [75.0, 78.7], [80.0, 80.96], [83.0, 84.74], [86.0, 89.19], [90.0, 90.12], [92.0, 100.94], [102.0, 103.1], [105.0, 105.95], [113.0, 116.33], [120.0, 125.9], [129.0, 130.87], [132.0, 134.25], [135.0, 137.02], [138.0, 140.02], [143.0, 144.39]], "keep_status": [false, false, true, true, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 34.0, 40.48, 0.0, 32.79, 63.1, 46.68, 0.0, 99.16, 86.64, 0.0, 0.0, 0.0, 0.0, 0.0, 99.73, 0.0, 0.0, 75.23, 0.0, 44.9, 0.0, 0.0, 44.84, 45.11, 0.0, 98.51, 57.17, 91.47, 0.0], "audiomae_on_audioset": [null, null, [["music", 33.58], ["harp", 14.17], ["harmonic", 6.09]], [["music", 49.91], ["rowboat, canoe, kayak", 8.14], ["boat, water vehicle", 5.32]], null, [["livestock, farm animals, working animals", 41.3], ["sheep", 14.7], ["bleat", 6.98]], null, [["whale vocalization", 25.65], ["speech", 14.22], ["hum", 5.57]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["splash, splatter", 20.91], ["gurgling", 14.26], ["fly, housefly", 10.6]], null, null, [["liquid", 33.65], ["water", 10.79], ["trickle, dribble", 6.6]], [["whale vocalization", 43.57], ["speech", 17.94], ["music", 8.64]], null, null, null, null, null], "duration": [0.75, 0.23, 5.82, 2.58, 0.76, 9.95, 11.17, 4.03, 1.54, 3.59, 2.08, 1.31, 1.08, 0.56, 0.08, 1.63, 3.7, 0.96, 1.74, 3.19, 0.12, 8.94, 1.1, 0.95, 3.33, 5.9, 1.87, 2.25, 2.02, 2.02, 1.39]} \ No newline at end of file diff --git a/annotations_filtered/aiilV691CzY_filtered.json b/annotations_filtered/aiilV691CzY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..04380d9752a523a913675650f23ebee1cd251574 --- /dev/null +++ b/annotations_filtered/aiilV691CzY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.26], [21.0, 31.29], [37.0, 37.86], [48.0, 63.0], [65.0, 65.53], [73.0, 73.68], [76.0, 77.36]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [53.97, 39.4, 0.0, 36.44, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 52.57], ["speech", 17.64], ["guitar", 8.26]], null, [["music", 42.52], ["moo", 16.39], ["cattle, bovinae", 12.72]], null, null, null], "duration": [2.26, 10.29, 0.86, 15.0, 0.53, 0.68, 1.36]} \ No newline at end of file diff --git a/annotations_filtered/aikBhgSFE2A_filtered.json b/annotations_filtered/aikBhgSFE2A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b257251e9da25727a5fc2b0a1eb88474f87c68e --- /dev/null +++ b/annotations_filtered/aikBhgSFE2A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.88], [20.0, 19.84], [25.0, 25.69], [27.0, 28.46], [30.0, 31.45], [36.0, 36.71], [37.0, 38.03], [39.0, 39.26], [40.0, 41.69], [47.0, 48.2], [50.0, 51.43], [52.0, 59.54], [61.0, 63.09], [64.0, 65.97], [70.0, 72.96], [75.0, 76.5], [79.0, 78.92], [79.0, 80.43], [82.0, 83.84], [85.0, 87.34], [89.0, 90.71], [92.0, 95.07], [98.0, 100.09], [103.0, 105.0], [106.0, 107.42], [108.0, 110.32], [113.0, 114.74], [125.0, 126.6], [128.0, 129.15], [131.0, 132.27], [133.0, 139.62], [141.0, 149.74], [151.0, 154.97], [156.0, 158.01], [159.0, 160.46], [162.0, 163.75], [166.0, 166.65], [168.0, 176.23], [178.0, 179.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, true, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.11, 93.45, 0.0, 50.91, 0.0, 0.0, 0.0, 0.0, 39.05, 0.0, 53.53, 74.13, 34.88, 0.0, 33.86, 0.0, 0.0, 0.0, 0.0, 33.45, 66.27, 94.95, 71.0, 0.0, 0.0, 0.0, 32.52, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 48.71], ["didgeridoo", 19.58], ["speech", 10.27]], null, null, null, [["music", 41.07], ["mains hum", 7.36], ["speech", 7.36]], null, [["music", 27.37], ["speech", 10.28], ["mains hum", 9.9]], null, null, null, null, [["music", 25.63], ["speech", 21.7], ["mains hum", 13.69]], null, null, null, null, null, null, [["music", 32.42], ["whimper", 10.97], ["gasp", 10.11]], null], "duration": [0.88, -0.16, 0.69, 1.46, 1.45, 0.71, 1.03, 0.26, 1.69, 1.2, 1.43, 7.54, 2.09, 1.97, 2.96, 1.5, -0.08, 1.43, 1.84, 2.34, 1.71, 3.07, 2.09, 2.0, 1.42, 2.32, 1.74, 1.6, 1.15, 1.27, 6.62, 8.74, 3.97, 2.01, 1.46, 1.75, 0.65, 8.23, 1.98]} \ No newline at end of file diff --git a/annotations_filtered/aj-OpTHixpU_filtered.json b/annotations_filtered/aj-OpTHixpU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7480309d107f1801c06cae6a1ebbbb3ea3bc8105 --- /dev/null +++ b/annotations_filtered/aj-OpTHixpU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 27.82], [29.0, 35.78], [39.0, 42.38], [45.0, 46.65], [49.0, 49.57], [51.0, 52.03], [52.0, 55.43], [58.0, 59.85], [60.0, 62.23], [64.0, 67.2], [69.0, 69.23], [71.0, 70.92], [75.0, 77.26], [79.0, 79.59], [81.0, 82.04], [85.0, 90.56], [95.0, 95.98], [97.0, 97.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [84.43, 53.22, 81.53, 0.0, 0.0, 0.0, 67.13, 0.0, 90.78, 66.63, 0.0, 0.0, 78.04, 0.0, 0.0, 56.4, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [15.82, 6.78, 3.38, 1.65, 0.57, 1.03, 3.43, 1.85, 2.23, 3.2, 0.23, -0.08, 2.26, 0.59, 1.04, 5.56, 0.98, 0.9]} \ No newline at end of file diff --git a/annotations_filtered/aj71pJABFFU_filtered.json b/annotations_filtered/aj71pJABFFU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0206bad1ad9685662947056dd5a64ae2733feece --- /dev/null +++ b/annotations_filtered/aj71pJABFFU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.08], [4.0, 8.16], [10.0, 11.67], [12.0, 24.76], [27.0, 55.0], [58.0, 59.64], [62.0, 83.29]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 36.47, 0.0, 31.32, 40.93, 0.0, 38.68], "audiomae_on_audioset": [null, [["music", 62.05], ["hum", 5.41], ["cacophony", 5.31]], null, [["music", 53.6], ["hum", 17.37], ["throbbing", 7.38]], [["music", 49.1], ["hum", 23.17], ["throbbing", 11.49]], null, [["hum", 39.55], ["throbbing", 20.09], ["music", 19.1]]], "duration": [1.08, 4.16, 1.67, 12.76, 28.0, 1.64, 21.29]} \ No newline at end of file diff --git a/annotations_filtered/ajBHZKoKYbU_filtered.json b/annotations_filtered/ajBHZKoKYbU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..07f97d5b2f0a7d212d3f852cb0ada29abb6fa52e --- /dev/null +++ b/annotations_filtered/ajBHZKoKYbU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 25.42], [31.0, 32.32], [33.0, 33.98], [36.0, 37.49], [40.0, 40.96], [44.0, 45.54], [47.0, 48.88], [50.0, 51.68], [53.0, 53.64], [55.0, 56.13], [57.0, 58.43], [62.0, 62.87], [64.0, 64.57], [68.0, 68.96], [71.0, 71.04], [72.0, 72.47], [76.0, 78.14], [80.0, 80.18], [82.0, 82.24], [84.0, 86.7], [88.0, 89.92], [91.0, 91.79], [93.0, 99.33], [100.0, 100.79], [102.0, 103.35], [111.0, 111.97], [120.0, 120.73], [122.0, 126.72], [128.0, 128.29], [129.0, 130.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.73, 0.0, 0.0, 100.0, 0.0, 0.0, 96.17, 0.0, 0.0, 0.0, 0.0, 92.48, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [23.42, 1.32, 0.98, 1.49, 0.96, 1.54, 1.88, 1.68, 0.64, 1.13, 1.43, 0.87, 0.57, 0.96, 0.04, 0.47, 2.14, 0.18, 0.24, 2.7, 1.92, 0.79, 6.33, 0.79, 1.35, 0.97, 0.73, 4.72, 0.29, 1.25]} \ No newline at end of file diff --git a/annotations_filtered/ajBK8B_kYO0_filtered.json b/annotations_filtered/ajBK8B_kYO0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7c641b40db48d99dd80ac6068174bf1640781a0d --- /dev/null +++ b/annotations_filtered/ajBK8B_kYO0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 28.29], [35.0, 36.05], [37.0, 38.52], [40.0, 41.13], [43.0, 58.9], [62.0, 71.96], [73.0, 73.92], [79.0, 79.84], [103.0, 106.79], [109.0, 116.87]], "keep_status": [false, false, false, false, false, false, false, false, true, false], "silence_prob": [41.34, 0.0, 0.0, 0.0, 33.04, 52.62, 0.0, 0.0, 37.05, 52.92], "audiomae_on_audioset": [[["music", 66.54], ["synthesizer", 6.79], ["ambient music", 5.8]], null, null, null, [["music", 47.66], ["speech", 20.18], ["buzz", 8.64]], null, null, null, [["speech", 42.8], ["music", 8.83], ["mosquito", 3.59]], null], "duration": [6.29, 1.05, 1.52, 1.13, 15.9, 9.96, 0.92, 0.84, 3.79, 7.87]} \ No newline at end of file diff --git a/annotations_filtered/ajE9h1zUbMs_filtered.json b/annotations_filtered/ajE9h1zUbMs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b511230fbdba0c2428b5e31fd5f8b321c6e768b --- /dev/null +++ b/annotations_filtered/ajE9h1zUbMs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.91], [7.0, 6.98], [8.0, 9.59], [11.0, 11.13], [11.0, 11.99], [21.0, 21.12], [22.0, 23.67], [28.0, 29.15], [30.0, 31.46], [33.0, 34.45], [35.0, 44.32], [46.0, 47.14], [48.0, 49.05], [50.0, 52.86], [65.0, 64.89], [76.0, 76.42], [80.0, 80.18], [82.0, 81.82], [84.0, 84.52], [88.0, 90.58], [91.0, 93.75], [94.0, 95.64], [97.0, 101.24], [102.0, 104.26], [106.0, 106.91], [107.0, 107.81], [108.0, 108.68], [110.0, 111.5], [114.0, 114.22], [115.0, 116.36], [118.0, 118.72], [121.0, 121.73], [122.0, 122.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [58.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.33, 0.0, 0.0, 98.59, 0.0, 0.0, 0.0, 0.0, 0.0, 99.05, 78.72, 0.0, 99.68, 98.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.91, -0.02, 1.59, 0.13, 0.99, 0.12, 1.67, 1.15, 1.46, 1.45, 9.32, 1.14, 1.05, 2.86, -0.11, 0.42, 0.18, -0.18, 0.52, 2.58, 2.75, 1.64, 4.24, 2.26, 0.91, 0.81, 0.68, 1.5, 0.22, 1.36, 0.72, 0.73, 0.76]} \ No newline at end of file diff --git a/annotations_filtered/ajMVBGbsL_E_filtered.json b/annotations_filtered/ajMVBGbsL_E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da6da53fae4c5c1fd5c0a41c8a250dcc35561e05 --- /dev/null +++ b/annotations_filtered/ajMVBGbsL_E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.85], [10.0, 18.69], [20.0, 20.97], [21.0, 69.13], [69.0, 129.09]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 49.5, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 40.06], ["music", 18.28], ["throbbing", 12.1]], null, null, null], "duration": [0.85, 8.69, 0.97, 48.13, 60.09]} \ No newline at end of file diff --git a/annotations_filtered/ajRRS6NzMBU_filtered.json b/annotations_filtered/ajRRS6NzMBU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8f185120e993c73247164835201d580bd25534f3 --- /dev/null +++ b/annotations_filtered/ajRRS6NzMBU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.28], [5.0, 5.91], [7.0, 8.09], [12.0, 16.73], [17.0, 17.19], [18.0, 19.84], [22.0, 23.13], [24.0, 25.08], [30.0, 30.86], [32.0, 32.22], [38.0, 38.64], [46.0, 46.43], [49.0, 50.35], [53.0, 52.73], [54.0, 54.62], [59.0, 60.79], [62.0, 63.63], [66.0, 67.47], [74.0, 76.67], [79.0, 79.1], [80.0, 80.32], [84.0, 85.04], [86.0, 86.54], [91.0, 92.13], [94.0, 95.08], [100.0, 101.93], [103.0, 103.0], [107.0, 108.82], [115.0, 115.06], [116.0, 116.67], [118.0, 119.06], [121.0, 121.91], [123.0, 123.69], [125.0, 125.39], [133.0, 133.42], [134.0, 141.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.66], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.28, 0.91, 1.09, 4.73, 0.19, 1.84, 1.13, 1.08, 0.86, 0.22, 0.64, 0.43, 1.35, -0.27, 0.62, 1.79, 1.63, 1.47, 2.67, 0.1, 0.32, 1.04, 0.54, 1.13, 1.08, 1.93, 0.0, 1.82, 0.06, 0.67, 1.06, 0.91, 0.69, 0.39, 0.42, 7.02]} \ No newline at end of file diff --git a/annotations_filtered/ajb31pJMQmw_filtered.json b/annotations_filtered/ajb31pJMQmw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..29d0731ccc2edc2153145eaa2adaf74afd31cb7d --- /dev/null +++ b/annotations_filtered/ajb31pJMQmw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.87], [12.0, 13.15], [16.0, 16.36], [19.0, 23.38], [24.0, 26.59], [39.0, 39.97], [44.0, 53.6], [59.0, 62.85], [65.0, 80.11], [82.0, 84.13], [98.0, 99.79], [100.0, 101.21], [103.0, 104.41], [112.0, 114.51], [117.0, 124.48]], "keep_status": [false, false, false, false, true, false, false, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 29.32, 30.09, 0.0, 30.18, 29.88, 29.24, 29.03, 0.0, 0.0, 0.0, 31.15, 29.0], "audiomae_on_audioset": [null, null, null, [["music", 58.73], ["electric shaver, electric razor", 12.66], ["inside, small room", 2.17]], [["music", 44.16], ["mosquito", 7.04], ["boing", 5.88]], null, [["music", 43.49], ["boing", 18.75], ["whack, thwack", 10.24]], [["whack, thwack", 54.72], ["clang", 10.52], ["music", 9.39]], [["boing", 42.23], ["music", 19.9], ["speech", 5.58]], [["livestock, farm animals, working animals", 15.15], ["cattle, bovinae", 12.31], ["breaking", 8.34]], null, null, null, [["music", 44.7], ["foghorn", 27.42], ["speech", 3.25]], [["music", 56.71], ["speech", 10.55], ["buzz", 4.38]]], "duration": [0.87, 1.15, 0.36, 4.38, 2.59, 0.97, 9.6, 3.85, 15.11, 2.13, 1.79, 1.21, 1.41, 2.51, 7.48]} \ No newline at end of file diff --git a/annotations_filtered/ajgeUrUcqfE_filtered.json b/annotations_filtered/ajgeUrUcqfE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0093a826813ca65907b54fe597bdd388730c4c17 --- /dev/null +++ b/annotations_filtered/ajgeUrUcqfE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.63], [10.0, 11.8], [14.0, 15.85], [18.0, 19.8], [20.0, 27.01], [29.0, 35.92], [36.0, 42.04], [43.0, 45.55], [46.0, 53.59], [54.0, 56.4], [59.0, 59.0], [64.0, 66.01], [66.0, 68.32], [70.0, 70.48], [72.0, 78.34], [80.0, 82.32], [84.0, 84.82], [87.0, 88.21], [90.0, 90.71], [104.0, 104.8], [105.0, 106.29], [107.0, 108.77], [110.0, 112.67], [115.0, 116.45], [118.0, 121.42]], "keep_status": [true, false, false, false, false, false, true, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [46.26, 0.0, 0.0, 0.0, 71.29, 35.2, 39.86, 73.82, 48.56, 49.97, 0.0, 42.91, 52.22, 0.0, 51.66, 48.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.37, 0.0, 78.89], "audiomae_on_audioset": [[["speech", 38.66], ["chirp tone", 10.88], ["sine wave", 9.66]], null, null, null, null, [["speech", 60.84], ["throbbing", 12.33], ["hum", 11.67]], [["thunk", 20.12], ["fart", 17.71], ["hum", 13.96]], null, [["speech", 66.51], ["coin (dropping)", 9.19], ["glass", 4.37]], [["speech", 46.46], ["sidetone", 7.14], ["fart", 4.68]], null, [["sine wave", 56.31], ["chirp tone", 31.56], ["speech", 8.55]], null, null, null, [["speech", 31.45], ["animal", 6.43], ["chirp tone", 5.17]], null, null, null, null, null, null, null, null, null], "duration": [5.63, 1.8, 1.85, 1.8, 7.01, 6.92, 6.04, 2.55, 7.59, 2.4, 0.0, 2.01, 2.32, 0.48, 6.34, 2.32, 0.82, 1.21, 0.71, 0.8, 1.29, 1.77, 2.67, 1.45, 3.42]} \ No newline at end of file diff --git a/annotations_filtered/ajm_632U-Ac_filtered.json b/annotations_filtered/ajm_632U-Ac_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db26d1b97d31f7fb664994274f8a2615c7c2b874 --- /dev/null +++ b/annotations_filtered/ajm_632U-Ac_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.94], [11.0, 11.03], [11.0, 11.87], [13.0, 16.97], [32.0, 32.49], [35.0, 38.58], [42.0, 42.58], [46.0, 49.45], [50.0, 51.04], [62.0, 62.41], [63.0, 67.12], [76.0, 76.54], [96.0, 97.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 64.07, 0.0, 87.0, 0.0, 37.21, 0.0, 0.0, 40.59, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["mosquito", 37.81], ["insect", 23.24], ["fly, housefly", 20.08]], null, null, [["speech", 19.81], ["music", 18.85], ["boing", 6.87]], null, null], "duration": [-0.06, 0.03, 0.87, 3.97, 0.49, 3.58, 0.58, 3.45, 1.04, 0.41, 4.12, 0.54, 1.19]} \ No newline at end of file diff --git a/annotations_filtered/ajvCMC8Na3M_filtered.json b/annotations_filtered/ajvCMC8Na3M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7982244939086e2cb72170b402a4b99c697d5d73 --- /dev/null +++ b/annotations_filtered/ajvCMC8Na3M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.1], [8.0, 8.14], [12.0, 13.46], [16.0, 15.65]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [1.1, 0.14, 1.46, -0.35]} \ No newline at end of file diff --git a/annotations_filtered/akMZQpIbTm4_filtered.json b/annotations_filtered/akMZQpIbTm4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18ee052aa64f1215f2050d42e05b49e3bf093044 --- /dev/null +++ b/annotations_filtered/akMZQpIbTm4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.71], [8.0, 22.54], [24.0, 35.41], [37.0, 51.6], [52.0, 51.63], [52.0, 51.68], [52.0, 57.06], [63.0, 73.85], [86.0, 91.45], [96.0, 97.17], [102.0, 103.17], [104.0, 108.11]], "keep_status": [true, false, true, true, false, false, false, false, true, false, false, true], "silence_prob": [39.57, 35.77, 33.8, 30.65, 0.0, 0.0, 29.46, 29.38, 33.96, 0.0, 0.0, 44.84], "audiomae_on_audioset": [[["speech", 43.12], ["hum", 10.62], ["sidetone", 9.29]], [["music", 51.39], ["bleat", 15.13], ["sheep", 13.86]], [["music", 49.74], ["speech", 9.52], ["rumble", 7.88]], [["music", 44.44], ["hum", 11.48], ["mains hum", 5.35]], null, null, [["music", 43.3], ["speech", 24.45], ["musical instrument", 2.89]], [["music", 45.34], ["speech", 23.06], ["musical instrument", 2.68]], [["groan", 27.67], ["grunt", 11.21], ["cattle, bovinae", 8.04]], null, null, [["speech", 20.28], ["animal", 6.18], ["whimper", 4.89]]], "duration": [3.71, 14.54, 11.41, 14.6, -0.37, -0.32, 5.06, 10.85, 5.45, 1.17, 1.17, 4.11]} \ No newline at end of file diff --git a/annotations_filtered/akSjCFfKAMo_filtered.json b/annotations_filtered/akSjCFfKAMo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1883b9c755c6797ceab38704e6ff4c3e295c0078 --- /dev/null +++ b/annotations_filtered/akSjCFfKAMo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 23.41], [24.0, 28.7], [29.0, 29.69], [30.0, 44.69]], "keep_status": [false, false, false, false], "silence_prob": [100.0, 98.8, 0.0, 50.56], "audiomae_on_audioset": [null, null, null, null], "duration": [2.41, 4.7, 0.69, 14.69]} \ No newline at end of file diff --git a/annotations_filtered/akrTlYc40XE_filtered.json b/annotations_filtered/akrTlYc40XE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f69ff74f8d7300744745b722830b8f87e2ef431d --- /dev/null +++ b/annotations_filtered/akrTlYc40XE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.74], [20.0, 22.03], [32.0, 33.64], [37.0, 36.73], [42.0, 42.62], [47.0, 49.91], [54.0, 55.34], [56.0, 56.42]], "keep_status": [false, true, false, false, false, true, false, false], "silence_prob": [0.0, 36.9, 0.0, 0.0, 0.0, 46.33, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 23.6], ["sheep", 11.37], ["moo", 9.73]], null, null, null, [["speech", 27.26], ["fly, housefly", 12.45], ["mosquito", 11.88]], null, null], "duration": [0.74, 2.03, 1.64, -0.27, 0.62, 2.91, 1.34, 0.42]} \ No newline at end of file diff --git a/annotations_filtered/akyfR8zcmIo_filtered.json b/annotations_filtered/akyfR8zcmIo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4be68e6c8ebf7b5ee87244486707c21e75d7d21d --- /dev/null +++ b/annotations_filtered/akyfR8zcmIo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 29.93], [31.0, 31.18], [33.0, 34.38], [42.0, 44.69], [45.0, 72.33], [73.0, 76.94], [79.0, 80.01], [81.0, 81.63], [85.0, 84.7], [100.0, 102.81], [105.0, 105.43], [107.0, 106.62], [111.0, 112.21], [114.0, 114.07]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 77.53, 47.05, 32.65, 0.0, 0.0, 0.0, 92.8, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 45.11], ["music", 19.87], ["ice cream truck, ice cream van", 15.29]], [["music", 25.55], ["speech", 9.76], ["mains hum", 4.09]], null, null, null, null, null, null, null, null], "duration": [0.93, 0.18, 1.38, 2.69, 27.33, 3.94, 1.01, 0.63, -0.3, 2.81, 0.43, -0.38, 1.21, 0.07]} \ No newline at end of file diff --git a/annotations_filtered/al-tdoT3gL8_filtered.json b/annotations_filtered/al-tdoT3gL8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bab2087e6d8cf031fe7d54d9edc6330500ef2c22 --- /dev/null +++ b/annotations_filtered/al-tdoT3gL8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.13], [31.0, 32.51], [33.0, 34.6], [46.0, 49.87], [68.0, 69.4], [73.0, 73.45], [75.0, 75.22], [82.0, 90.34], [91.0, 95.94], [96.0, 98.85], [113.0, 115.48], [116.0, 116.34]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.92, 0.0, 0.0, 0.0, 31.52, 30.5, 30.99, 31.61, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 66.57], ["speech", 4.73], ["boing", 3.47]], null, null, null, [["music", 65.68], ["reggae", 7.64], ["musical instrument", 2.94]], [["music", 55.58], ["boing", 23.91], ["funny music", 3.26]], [["music", 32.84], ["boing", 30.52], ["didgeridoo", 6.33]], [["music", 50.94], ["speech", 11.49], ["musical instrument", 8.68]], null], "duration": [1.13, 1.51, 1.6, 3.87, 1.4, 0.45, 0.22, 8.34, 4.94, 2.85, 2.48, 0.34]} \ No newline at end of file diff --git a/annotations_filtered/alE17GLFoQE_filtered.json b/annotations_filtered/alE17GLFoQE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac4599fc26fd264c8f612c4f3ee4f575ecbd9cb5 --- /dev/null +++ b/annotations_filtered/alE17GLFoQE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.74], [9.0, 10.54], [12.0, 14.44], [17.0, 17.9], [19.0, 19.85], [21.0, 21.34], [24.0, 24.24], [26.0, 27.14], [35.0, 36.29], [41.0, 42.94], [45.0, 44.9], [53.0, 55.53], [63.0, 63.68], [67.0, 69.01], [70.0, 71.56], [72.0, 72.81], [79.0, 79.41], [80.0, 83.96], [86.0, 87.51], [89.0, 95.55], [100.0, 106.19], [115.0, 115.42], [122.0, 123.47], [124.0, 129.12], [132.0, 145.27], [149.0, 156.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, true, true, true], "silence_prob": [0.0, 0.0, 99.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.68, 0.0, 68.02, 0.0, 0.0, 0.0, 77.03, 0.0, 41.98, 39.12, 0.0, 0.0, 32.66, 34.19, 36.26], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 51.95], ["timpani", 4.41], ["shofar", 3.8]], null, null, null, null, null, null, null, [["cattle, bovinae", 39.74], ["moo", 34.87], ["livestock, farm animals, working animals", 22.54]], [["buzz", 21.92], ["mosquito", 14.21], ["electric shaver, electric razor", 13.78]], null, null, [["speech", 48.39], ["crying, sobbing", 7.29], ["electric shaver, electric razor", 6.71]], [["speech", 41.57], ["music", 15.11], ["fly, housefly", 3.54]], [["speech", 37.13], ["electric shaver, electric razor", 14.99], ["hum", 8.6]]], "duration": [0.74, 1.54, 2.44, 0.9, 0.85, 0.34, 0.24, 1.14, 1.29, 1.94, -0.1, 2.53, 0.68, 2.01, 1.56, 0.81, 0.41, 3.96, 1.51, 6.55, 6.19, 0.42, 1.47, 5.12, 13.27, 7.64]} \ No newline at end of file diff --git a/annotations_filtered/alQVZ9YxUJw_filtered.json b/annotations_filtered/alQVZ9YxUJw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/alQVZ9YxUJw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/alYZ8jQ5L3A_filtered.json b/annotations_filtered/alYZ8jQ5L3A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac463b8114720d2c64c66b96aaec3f1338d79855 --- /dev/null +++ b/annotations_filtered/alYZ8jQ5L3A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.34], [13.0, 13.81], [23.0, 23.58], [28.0, 29.07], [30.0, 43.7], [46.0, 58.7], [61.0, 70.33], [71.0, 71.25], [71.0, 73.47], [74.0, 76.74], [78.0, 78.19], [79.0, 79.12], [83.0, 93.07], [96.0, 96.74], [99.0, 99.77], [102.0, 103.4], [105.0, 104.84], [109.0, 109.02], [109.0, 113.04], [116.0, 116.83], [118.0, 118.52], [119.0, 123.21]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 40.52, 40.79, 30.99, 0.0, 30.57, 46.75, 0.0, 0.0, 32.68, 0.0, 0.0, 0.0, 0.0, 0.0, 31.48, 0.0, 0.0, 33.37], "audiomae_on_audioset": [null, null, null, null, [["music", 63.61], ["theremin", 8.14], ["didgeridoo", 5.42]], [["music", 70.11], ["throbbing", 4.94], ["hum", 3.85]], [["speech", 16.25], ["music", 6.86], ["beatboxing", 6.52]], null, [["speech", 77.36], ["boing", 2.12], ["inside, small room", 1.92]], [["speech", 36.14], ["mains hum", 24.51], ["hum", 19.09]], null, null, [["didgeridoo", 23.86], ["electric shaver, electric razor", 23.15], ["speech", 20.74]], null, null, null, null, null, [["fly, housefly", 26.95], ["insect", 19.32], ["speech", 16.14]], null, null, [["speech", 30.59], ["wail, moan", 20.38], ["whimper", 12.79]]], "duration": [0.34, 0.81, 0.58, 1.07, 13.7, 12.7, 9.33, 0.25, 2.47, 2.74, 0.19, 0.12, 10.07, 0.74, 0.77, 1.4, -0.16, 0.02, 4.04, 0.83, 0.52, 4.21]} \ No newline at end of file diff --git a/annotations_filtered/alh8b1lYuRU_filtered.json b/annotations_filtered/alh8b1lYuRU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..87a9a1cf0f5da78bb52fb8579bae0b3f9df3327a --- /dev/null +++ b/annotations_filtered/alh8b1lYuRU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.77], [7.0, 8.73], [11.0, 11.03], [12.0, 12.6], [16.0, 16.75], [19.0, 19.47], [20.0, 21.2], [26.0, 27.46], [31.0, 32.34], [35.0, 36.17], [42.0, 43.28], [48.0, 48.36], [51.0, 53.2], [55.0, 61.69], [72.0, 79.59], [83.0, 83.0], [90.0, 101.04], [102.0, 121.64], [122.0, 124.34], [125.0, 125.73], [126.0, 127.11], [130.0, 131.57], [133.0, 133.52], [140.0, 140.59], [141.0, 141.67], [143.0, 143.7], [144.0, 144.0], [149.0, 149.88], [152.0, 152.51], [154.0, 155.6], [157.0, 158.08], [161.0, 165.43], [167.0, 169.72], [171.0, 175.98], [178.0, 178.98], [183.0, 188.18], [188.0, 188.54], [190.0, 191.51], [193.0, 203.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.67, 83.88, 36.65, 0.0, 38.16, 39.12, 52.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.7, 38.7, 51.18, 0.0, 35.97, 0.0, 0.0, 48.65], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 72.82], ["didgeridoo", 4.64], ["throbbing", 2.56]], null, [["music", 66.08], ["speech", 12.98], ["thunk", 2.72]], [["music", 76.45], ["guitar", 5.71], ["musical instrument", 4.16]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 46.54], ["musical instrument", 5.25], ["guitar", 4.52]], [["music", 61.33], ["musical instrument", 5.2], ["synthesizer", 3.78]], null, null, [["speech", 37.6], ["music", 32.13], ["thunk", 7.44]], null, null, [["music", 45.41], ["speech", 17.12], ["synthesizer", 4.87]]], "duration": [-0.23, 1.73, 0.03, 0.6, 0.75, 0.47, 1.2, 1.46, 1.34, 1.17, 1.28, 0.36, 2.2, 6.69, 7.59, 0.0, 11.04, 19.64, 2.34, 0.73, 1.11, 1.57, 0.52, 0.59, 0.67, 0.7, 0.0, 0.88, 0.51, 1.6, 1.08, 4.43, 2.72, 4.98, 0.98, 5.18, 0.54, 1.51, 10.37]} \ No newline at end of file diff --git a/annotations_filtered/alhVUKh36_Q_filtered.json b/annotations_filtered/alhVUKh36_Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43b4210b3e8963f17e24fd8fdb87473e28e07ef7 --- /dev/null +++ b/annotations_filtered/alhVUKh36_Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 33.64], [37.0, 42.28], [45.0, 44.58], [45.0, 79.22], [81.0, 81.18], [87.0, 87.78], [101.0, 128.01], [136.0, 136.29], [137.0, 145.89], [151.0, 174.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.15, 28.67, 0.0, 0.0, 0.0, 0.0, 29.07, 0.0, 29.06, 28.83], "audiomae_on_audioset": [[["music", 83.19], ["house music", 1.87], ["sampler", 1.51]], [["music", 81.23], ["electronic music", 2.22], ["house music", 2.04]], null, null, null, null, [["music", 84.82], ["funk", 2.03], ["singing", 0.85]], null, [["music", 73.69], ["didgeridoo", 3.22], ["musical instrument", 2.47]], [["music", 89.1], ["swing music", 0.96], ["funk", 0.82]]], "duration": [9.64, 5.28, -0.42, 34.22, 0.18, 0.78, 27.01, 0.29, 8.89, 23.38]} \ No newline at end of file diff --git a/annotations_filtered/amtxyPO7At8_filtered.json b/annotations_filtered/amtxyPO7At8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/amtxyPO7At8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/an8Z9J29zWo_filtered.json b/annotations_filtered/an8Z9J29zWo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8d6726e61a0701118e63b138900c8789a9b1940d --- /dev/null +++ b/annotations_filtered/an8Z9J29zWo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.96], [5.0, 7.08], [7.0, 7.25], [8.0, 9.29], [13.0, 13.29], [18.0, 18.79], [21.0, 22.98], [25.0, 25.62], [28.0, 28.63], [31.0, 34.64], [40.0, 41.47], [42.0, 42.9], [44.0, 46.35], [52.0, 52.05], [58.0, 58.55], [59.0, 59.63], [61.0, 61.38], [62.0, 62.41], [65.0, 65.43], [68.0, 68.18], [71.0, 74.46], [75.0, 77.03], [78.0, 79.22], [80.0, 82.41], [83.0, 87.17], [87.0, 90.17], [94.0, 95.25], [96.0, 96.15], [98.0, 99.01], [101.0, 102.17], [104.0, 104.82], [111.0, 112.01], [118.0, 118.83], [126.0, 128.9], [130.0, 130.79], [134.0, 133.71], [136.0, 137.22], [139.0, 141.51], [142.0, 143.51], [145.0, 149.22], [153.0, 153.52]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 41.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.64, 0.0, 0.0, 90.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 96.77, 55.67, 72.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.66, 0.0, 0.0, 0.0, 80.11, 0.0, 44.32, 0.0], "audiomae_on_audioset": [null, [["speech", 42.07], ["music", 14.91], ["animal", 3.31]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 9.89], ["burping, eructation", 6.92], ["moo", 5.97]], null], "duration": [1.96, 2.08, 0.25, 1.29, 0.29, 0.79, 1.98, 0.62, 0.63, 3.64, 1.47, 0.9, 2.35, 0.05, 0.55, 0.63, 0.38, 0.41, 0.43, 0.18, 3.46, 2.03, 1.22, 2.41, 4.17, 3.17, 1.25, 0.15, 1.01, 1.17, 0.82, 1.01, 0.83, 2.9, 0.79, -0.29, 1.22, 2.51, 1.51, 4.22, 0.52]} \ No newline at end of file diff --git a/annotations_filtered/an9Zfn3IZCY_filtered.json b/annotations_filtered/an9Zfn3IZCY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17b138828e62dc8eaf64d83a678f21c9ec703920 --- /dev/null +++ b/annotations_filtered/an9Zfn3IZCY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[94.0, 110.4], [112.0, 112.35], [114.0, 138.91], [139.0, 145.98], [147.0, 152.93], [155.0, 192.84], [193.0, 192.94]], "keep_status": [true, false, false, true, false, false, false], "silence_prob": [46.26, 0.0, 50.02, 44.9, 51.6, 0.0, 0.0], "audiomae_on_audioset": [[["whale vocalization", 22.1], ["hum", 20.02], ["throbbing", 11.74]], null, null, [["whale vocalization", 33.31], ["animal", 12.88], ["music", 10.94]], null, null, null], "duration": [16.4, 0.35, 24.91, 6.98, 5.93, 37.84, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/aoBeDwBxv04_filtered.json b/annotations_filtered/aoBeDwBxv04_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1952cd69c1fe21c1aea637fddd65593313444886 --- /dev/null +++ b/annotations_filtered/aoBeDwBxv04_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.61], [3.0, 8.48], [12.0, 12.31], [13.0, 15.28], [17.0, 16.98], [27.0, 27.08], [29.0, 33.0], [37.0, 37.02], [38.0, 38.18], [43.0, 43.28], [45.0, 59.21], [60.0, 61.16], [63.0, 63.73], [67.0, 71.27], [73.0, 74.04], [79.0, 82.38], [84.0, 86.8], [89.0, 90.61], [92.0, 92.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 90.43, 0.0, 72.75, 0.0, 0.0, 33.18, 0.0, 0.0, 0.0, 59.07, 0.0, 0.0, 100.0, 0.0, 34.83, 95.51, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 62.87], ["fart", 11.96], ["crying, sobbing", 5.12]], null, null, null, null, null, null, null, null, [["moo", 40.51], ["cattle, bovinae", 34.17], ["livestock, farm animals, working animals", 24.97]], null, null, null], "duration": [0.61, 5.48, 0.31, 2.28, -0.02, 0.08, 4.0, 0.02, 0.18, 0.28, 14.21, 1.16, 0.73, 4.27, 1.04, 3.38, 2.8, 1.61, 0.79]} \ No newline at end of file diff --git a/annotations_filtered/aoXg7SSmGyk_filtered.json b/annotations_filtered/aoXg7SSmGyk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c24a940d1d1f781dbaa304b57c5480142c3a8c3 --- /dev/null +++ b/annotations_filtered/aoXg7SSmGyk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.36], [7.0, 11.4], [15.0, 14.96], [17.0, 18.93], [20.0, 20.39], [23.0, 24.0], [27.0, 29.32], [33.0, 34.38], [36.0, 36.68], [39.0, 38.91], [41.0, 41.88], [43.0, 43.7], [47.0, 47.73], [49.0, 49.77], [52.0, 52.91], [56.0, 57.18], [58.0, 59.29], [61.0, 62.92], [64.0, 65.25], [66.0, 67.59], [69.0, 69.48], [70.0, 70.73], [72.0, 72.76], [75.0, 76.4], [81.0, 80.62], [82.0, 88.25], [89.0, 89.58], [90.0, 91.77]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [33.98, 30.32, 0.0, 0.0, 0.0, 0.0, 81.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.3, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 27.53], ["clip-clop", 10.63], ["animal", 4.76]], [["honk", 31.68], ["goose", 15.16], ["cattle, bovinae", 9.45]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 76.34], ["musical instrument", 4.62], ["guitar", 2.29]], null, null], "duration": [2.36, 4.4, -0.04, 1.93, 0.39, 1.0, 2.32, 1.38, 0.68, -0.09, 0.88, 0.7, 0.73, 0.77, 0.91, 1.18, 1.29, 1.92, 1.25, 1.59, 0.48, 0.73, 0.76, 1.4, -0.38, 6.25, 0.58, 1.77]} \ No newline at end of file diff --git a/annotations_filtered/aoc1wqaK8cc_filtered.json b/annotations_filtered/aoc1wqaK8cc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2cd0c86889b63975bee721f5985b8735ccb2f91c --- /dev/null +++ b/annotations_filtered/aoc1wqaK8cc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.92], [4.0, 3.99], [11.0, 10.94], [13.0, 12.97], [14.0, 14.57], [15.0, 21.59], [23.0, 26.2], [28.0, 29.1], [32.0, 32.29], [35.0, 35.5], [40.0, 41.07], [44.0, 45.99], [59.0, 59.71], [79.0, 86.22], [87.0, 87.32], [89.0, 89.11], [104.0, 104.92], [120.0, 126.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 50.46, 42.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.86, 0.0, 0.0, 0.0, 29.61], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 53.57], ["guitar", 13.38], ["effects unit", 7.66]], null, null, null, null, null, null, [["music", 76.59], ["synthetic singing", 2.15], ["sidetone", 2.04]], null, null, null, [["music", 77.07], ["synthetic singing", 3.98], ["trombone", 1.84]]], "duration": [-0.08, -0.01, -0.06, -0.03, 0.57, 6.59, 3.2, 1.1, 0.29, 0.5, 1.07, 1.99, 0.71, 7.22, 0.32, 0.11, 0.92, 6.62]} \ No newline at end of file diff --git a/annotations_filtered/aogWdNKef2o_filtered.json b/annotations_filtered/aogWdNKef2o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1af4c47e1926533bfc86eaccbd24d1488e4fd2e --- /dev/null +++ b/annotations_filtered/aogWdNKef2o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.6], [5.0, 5.04], [6.0, 6.45], [8.0, 8.75], [11.0, 12.36], [15.0, 15.3], [17.0, 18.17], [19.0, 19.04], [20.0, 20.51], [24.0, 24.78], [25.0, 25.91], [33.0, 33.37], [37.0, 37.27], [40.0, 40.39], [42.0, 43.07], [44.0, 45.0], [48.0, 48.37], [50.0, 50.55], [52.0, 53.87], [54.0, 55.27], [56.0, 58.08], [60.0, 60.61], [63.0, 64.17], [65.0, 65.82], [68.0, 68.13], [69.0, 69.45], [71.0, 71.83], [72.0, 73.3], [75.0, 76.03], [79.0, 79.17], [80.0, 80.5], [82.0, 82.36], [83.0, 83.88], [85.0, 84.67], [86.0, 86.48], [89.0, 89.24], [90.0, 93.14], [97.0, 98.17], [100.0, 101.11], [102.0, 104.11], [105.0, 105.53], [107.0, 107.42], [108.0, 109.17], [111.0, 112.23], [114.0, 115.05], [118.0, 125.19], [126.0, 126.6], [129.0, 129.68], [134.0, 134.32], [136.0, 136.93], [141.0, 142.23], [143.0, 143.02], [144.0, 145.03], [146.0, 146.6], [147.0, 151.14], [152.0, 152.71], [164.0, 164.02], [168.0, 168.54], [169.0, 169.28], [171.0, 172.44], [174.0, 175.46], [177.0, 177.45], [178.0, 189.06], [191.0, 192.08], [193.0, 193.23], [194.0, 193.72], [197.0, 198.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.43, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.02, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 75.22], ["didgeridoo", 3.74], ["brass instrument", 3.72]], null, null, null, null], "duration": [0.6, 0.04, 0.45, 0.75, 1.36, 0.3, 1.17, 0.04, 0.51, 0.78, 0.91, 0.37, 0.27, 0.39, 1.07, 1.0, 0.37, 0.55, 1.87, 1.27, 2.08, 0.61, 1.17, 0.82, 0.13, 0.45, 0.83, 1.3, 1.03, 0.17, 0.5, 0.36, 0.88, -0.33, 0.48, 0.24, 3.14, 1.17, 1.11, 2.11, 0.53, 0.42, 1.17, 1.23, 1.05, 7.19, 0.6, 0.68, 0.32, 0.93, 1.23, 0.02, 1.03, 0.6, 4.14, 0.71, 0.02, 0.54, 0.28, 1.44, 1.46, 0.45, 11.06, 1.08, 0.23, -0.28, 1.83]} \ No newline at end of file diff --git a/annotations_filtered/aokJADOVMC0_filtered.json b/annotations_filtered/aokJADOVMC0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..01a0f885dea5680798dc2872bf3a2005059aed41 --- /dev/null +++ b/annotations_filtered/aokJADOVMC0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.71], [8.0, 9.26], [11.0, 14.74], [17.0, 18.66], [22.0, 24.61], [25.0, 27.03], [29.0, 29.59], [31.0, 33.02], [35.0, 34.99], [36.0, 37.0], [38.0, 39.36], [44.0, 45.81], [48.0, 48.24], [51.0, 52.44], [54.0, 57.99], [58.0, 64.54], [74.0, 81.06], [84.0, 85.21], [86.0, 88.55], [94.0, 95.28], [98.0, 105.97], [108.0, 110.57], [118.0, 120.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [79.94, 0.0, 100.0, 0.0, 99.99, 99.59, 0.0, 99.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.42, 35.44, 32.55, 0.0, 44.34, 0.0, 31.68, 32.67, 58.3], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 48.58], ["speech", 23.37], ["didgeridoo", 2.78]], [["music", 67.36], ["speech", 12.5], ["didgeridoo", 7.81]], null, [["music", 51.89], ["speech", 14.63], ["scary music", 8.03]], null, [["music", 49.81], ["speech", 17.55], ["synthesizer", 4.32]], [["music", 57.5], ["throbbing", 3.74], ["electronic music", 1.89]], null], "duration": [2.71, 1.26, 3.74, 1.66, 2.61, 2.03, 0.59, 2.02, -0.01, 1.0, 1.36, 1.81, 0.24, 1.44, 3.99, 6.54, 7.06, 1.21, 2.55, 1.28, 7.97, 2.57, 2.87]} \ No newline at end of file diff --git a/annotations_filtered/aopdD9Cu-So_filtered.json b/annotations_filtered/aopdD9Cu-So_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..475c87d348a4b1b98ba9b0516a424c2b892c700e --- /dev/null +++ b/annotations_filtered/aopdD9Cu-So_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.8], [8.0, 15.82], [25.0, 25.42], [26.0, 27.95], [28.0, 29.52], [30.0, 30.38], [35.0, 35.77], [41.0, 61.25], [63.0, 63.04], [64.0, 64.3], [66.0, 66.18], [67.0, 67.83], [77.0, 77.58], [78.0, 78.87]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 34.43, 0.0, 0.0, 0.0, 0.0, 0.0, 36.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["theremin", 74.57], ["music", 17.15], ["musical instrument", 0.72]], null, null, null, null, null, [["animal", 55.62], ["domestic animals, pets", 7.02], ["howl", 6.15]], null, null, null, null, null, null], "duration": [0.8, 7.82, 0.42, 1.95, 1.52, 0.38, 0.77, 20.25, 0.04, 0.3, 0.18, 0.83, 0.58, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/apasYYh6nEA_filtered.json b/annotations_filtered/apasYYh6nEA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3348c95219d62b89ade2a87ffc2a8ea97db6f64d --- /dev/null +++ b/annotations_filtered/apasYYh6nEA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 24.7], [25.0, 24.8], [25.0, 25.46], [25.0, 36.78], [39.0, 38.84], [39.0, 46.77], [58.0, 60.74], [62.0, 63.49], [65.0, 65.84], [69.0, 73.89], [79.0, 79.25], [79.0, 79.61], [80.0, 80.81], [85.0, 85.36], [93.0, 93.18], [98.0, 98.05], [99.0, 99.17], [100.0, 100.25], [101.0, 101.46], [106.0, 106.3], [107.0, 107.7], [109.0, 109.49], [110.0, 118.2], [125.0, 127.18], [130.0, 132.76], [136.0, 140.78], [143.0, 143.55], [146.0, 151.6]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 38.43, 0.0, 36.46, 46.54, 0.0, 0.0, 30.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.88, 39.58, 33.49, 38.12, 0.0, 36.84], "audiomae_on_audioset": [null, null, null, [["speech", 82.47], ["whack, thwack", 6.59], ["hammer", 3.21]], null, [["speech", 84.48], ["firecracker", 3.76], ["explosion", 3.57]], [["speech", 27.46], ["fly, housefly", 17.17], ["insect", 8.19]], null, null, [["fart", 66.72], ["speech", 19.08], ["groan", 1.27]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 12.38], ["police car (siren)", 11.07], ["groan", 10.63]], [["cowbell", 26.14], ["speech", 14.66], ["music", 5.07]], [["speech", 43.31], ["music", 4.96], ["fart", 3.85]], [["speech", 61.44], ["fart", 3.95], ["eruption", 2.15]], null, [["speech", 25.96], ["livestock, farm animals, working animals", 11.02], ["cowbell", 10.34]]], "duration": [-0.3, -0.2, 0.46, 11.78, -0.16, 7.77, 2.74, 1.49, 0.84, 4.89, 0.25, 0.61, 0.81, 0.36, 0.18, 0.05, 0.17, 0.25, 0.46, 0.3, 0.7, 0.49, 8.2, 2.18, 2.76, 4.78, 0.55, 5.6]} \ No newline at end of file diff --git a/annotations_filtered/aqIYxDk4vh8_filtered.json b/annotations_filtered/aqIYxDk4vh8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..895a0a53eeb7addd350ea308dfc2c993ddb82546 --- /dev/null +++ b/annotations_filtered/aqIYxDk4vh8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.7], [6.0, 10.07], [15.0, 22.79], [24.0, 30.33], [36.0, 36.0], [40.0, 46.04], [49.0, 55.71], [58.0, 58.04], [61.0, 62.13], [64.0, 64.34], [66.0, 70.68], [71.0, 72.57], [76.0, 78.16], [83.0, 89.45], [94.0, 98.61], [103.0, 104.85], [107.0, 114.62], [117.0, 118.18], [121.0, 127.52], [128.0, 127.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, true, false], "silence_prob": [0.0, 34.16, 31.01, 30.67, 0.0, 30.9, 31.07, 0.0, 0.0, 0.0, 31.92, 0.0, 33.54, 31.15, 30.92, 0.0, 30.55, 0.0, 31.36, 0.0], "audiomae_on_audioset": [null, [["music", 64.08], ["synthesizer", 6.68], ["sampler", 2.94]], [["music", 64.41], ["singing", 4.12], ["synthesizer", 2.82]], [["music", 76.61], ["middle eastern music", 2.32], ["singing", 1.75]], null, [["music", 78.72], ["didgeridoo", 3.04], ["vocal music", 3.02]], [["music", 58.5], ["synthesizer", 13.46], ["musical instrument", 5.57]], null, null, null, [["music", 72.76], ["singing", 1.75], ["carnatic music", 1.7]], null, [["music", 57.88], ["synthesizer", 14.68], ["sampler", 4.16]], [["music", 44.4], ["didgeridoo", 12.05], ["synthesizer", 9.08]], [["music", 83.76], ["singing", 1.61], ["musical instrument", 1.27]], null, [["music", 44.05], ["livestock, farm animals, working animals", 10.7], ["moo", 10.59]], null, [["music", 43.21], ["theremin", 17.82], ["guitar", 6.07]], null], "duration": [0.7, 4.07, 7.79, 6.33, 0.0, 6.04, 6.71, 0.04, 1.13, 0.34, 4.68, 1.57, 2.16, 6.45, 4.61, 1.85, 7.62, 1.18, 6.52, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/aqa74uEbtDE_filtered.json b/annotations_filtered/aqa74uEbtDE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dc9f2bb2fb7365c8e33a0a230ceac056ca427f04 --- /dev/null +++ b/annotations_filtered/aqa74uEbtDE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.16], [13.0, 33.83], [35.0, 42.45], [44.0, 43.95], [44.0, 67.44], [70.0, 70.16], [70.0, 70.19], [70.0, 94.29], [95.0, 101.22], [102.0, 129.54]], "keep_status": [false, false, false, false, false, false, false, false, false, true], "silence_prob": [54.5, 53.1, 50.06, 0.0, 50.36, 0.0, 0.0, 52.8, 55.25, 44.18], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 43.1], ["hum", 10.86], ["speech", 8.99]]], "duration": [5.16, 20.83, 7.45, -0.05, 23.44, 0.16, 0.19, 24.29, 6.22, 27.54]} \ No newline at end of file diff --git a/annotations_filtered/aqsJPtd8Cis_filtered.json b/annotations_filtered/aqsJPtd8Cis_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea45a0d1858452986d0deb46415b8e57c92be219 --- /dev/null +++ b/annotations_filtered/aqsJPtd8Cis_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.42], [8.0, 9.53], [12.0, 13.58], [16.0, 16.61], [18.0, 19.23], [21.0, 21.27], [24.0, 24.8], [28.0, 29.15], [30.0, 30.52], [36.0, 35.92], [36.0, 43.02], [43.0, 44.02], [48.0, 49.2], [50.0, 50.23], [55.0, 55.97], [57.0, 60.59], [62.0, 65.92], [69.0, 69.47], [71.0, 71.17], [73.0, 75.17], [78.0, 78.76], [82.0, 82.8], [87.0, 87.54], [89.0, 89.23], [90.0, 90.46], [91.0, 91.71], [96.0, 96.53], [98.0, 99.79], [102.0, 106.74], [107.0, 108.01], [109.0, 111.89], [115.0, 115.92], [119.0, 120.6], [121.0, 121.66], [128.0, 128.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.97, 0.0, 0.0, 0.0, 0.0, 72.9, 97.43, 0.0, 0.0, 94.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.51, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["bouncing", 19.13], ["noise", 11.46], ["speech", 9.26]], null, null, null, null, null, null], "duration": [1.42, 1.53, 1.58, 0.61, 1.23, 0.27, 0.8, 1.15, 0.52, -0.08, 7.02, 1.02, 1.2, 0.23, 0.97, 3.59, 3.92, 0.47, 0.17, 2.17, 0.76, 0.8, 0.54, 0.23, 0.46, 0.71, 0.53, 1.79, 4.74, 1.01, 2.89, 0.92, 1.6, 0.66, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/aqvTaYLP8yc_filtered.json b/annotations_filtered/aqvTaYLP8yc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2bfa6be6a7e7cfce0c33a3a83bcb00ca21021949 --- /dev/null +++ b/annotations_filtered/aqvTaYLP8yc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.55], [5.0, 5.36], [6.0, 6.05], [7.0, 7.43], [8.0, 8.92], [10.0, 10.3], [10.0, 19.28], [20.0, 20.6], [22.0, 22.67], [25.0, 26.28], [27.0, 29.61], [32.0, 32.97], [37.0, 38.13], [40.0, 40.46], [42.0, 42.28], [44.0, 44.71], [45.0, 45.35], [46.0, 46.25], [50.0, 51.49], [54.0, 54.08], [57.0, 57.52], [58.0, 58.56], [62.0, 62.7], [67.0, 67.09], [68.0, 68.42], [70.0, 71.05], [72.0, 74.75], [75.0, 77.89], [84.0, 85.97], [86.0, 86.78], [90.0, 90.36], [91.0, 91.03], [92.0, 92.37], [94.0, 94.46], [101.0, 101.39], [103.0, 104.11], [106.0, 106.34], [107.0, 107.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.22, 0.0, 0.0, 0.0, 99.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.11, 68.41, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.55, 0.36, 0.05, 0.43, 0.92, 0.3, 9.28, 0.6, 0.67, 1.28, 2.61, 0.97, 1.13, 0.46, 0.28, 0.71, 0.35, 0.25, 1.49, 0.08, 0.52, 0.56, 0.7, 0.09, 0.42, 1.05, 2.75, 2.89, 1.97, 0.78, 0.36, 0.03, 0.37, 0.46, 0.39, 1.11, 0.34, 0.11]} \ No newline at end of file diff --git a/annotations_filtered/ar0xLps7WSY_filtered.json b/annotations_filtered/ar0xLps7WSY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/ar0xLps7WSY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/ar5YGIFyEUY_filtered.json b/annotations_filtered/ar5YGIFyEUY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70960828d7bff0bd2c9d3cf32647783ba72d53fd --- /dev/null +++ b/annotations_filtered/ar5YGIFyEUY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 11.48], [19.0, 19.55], [20.0, 21.96], [23.0, 23.6], [29.0, 29.52], [30.0, 32.63], [40.0, 40.91], [50.0, 49.98], [66.0, 66.9], [75.0, 74.82], [84.0, 85.21], [88.0, 87.76], [96.0, 98.63], [101.0, 101.63], [121.0, 123.26], [126.0, 126.12], [127.0, 128.39]], "keep_status": [true, false, false, false, false, true, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [33.97, 0.0, 0.0, 0.0, 0.0, 37.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.34, 0.0, 44.84, 0.0, 0.0], "audiomae_on_audioset": [[["rumble", 33.12], ["speech", 14.76], ["hum", 12.29]], null, null, null, null, [["music", 24.06], ["synthesizer", 8.98], ["echo", 8.97]], null, null, null, null, null, null, [["speech", 29.97], ["hum", 19.99], ["rumble", 16.14]], null, [["sonar", 22.64], ["hum", 17.01], ["music", 15.33]], null, null], "duration": [6.48, 0.55, 1.96, 0.6, 0.52, 2.63, 0.91, -0.02, 0.9, -0.18, 1.21, -0.24, 2.63, 0.63, 2.26, 0.12, 1.39]} \ No newline at end of file diff --git a/annotations_filtered/ar72efkbkSo_filtered.json b/annotations_filtered/ar72efkbkSo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba126c0ab6ea124e08e9b4b2baeabe7d7969d84b --- /dev/null +++ b/annotations_filtered/ar72efkbkSo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.13], [5.0, 8.36], [9.0, 12.09], [14.0, 22.42], [23.0, 37.23], [38.0, 48.24], [48.0, 53.81], [54.0, 55.49], [56.0, 57.3], [60.0, 60.17], [61.0, 61.4], [64.0, 64.27], [67.0, 69.9], [77.0, 77.35], [79.0, 78.88], [92.0, 96.13], [109.0, 111.81], [112.0, 113.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 100.0, 100.0, 100.0, 100.0, 99.99, 99.1, 0.0, 0.0, 0.0, 0.0, 0.0, 81.0, 0.0, 0.0, 53.59, 81.71, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.13, 3.36, 3.09, 8.42, 14.23, 10.24, 5.81, 1.49, 1.3, 0.17, 0.4, 0.27, 2.9, 0.35, -0.12, 4.13, 2.81, 1.31]} \ No newline at end of file diff --git a/annotations_filtered/arQDNf6cjaw_filtered.json b/annotations_filtered/arQDNf6cjaw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb234195961544437178b6eb9f83f8d8b94a29a2 --- /dev/null +++ b/annotations_filtered/arQDNf6cjaw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.43], [22.0, 23.26], [56.0, 56.67], [78.0, 87.44], [88.0, 88.82], [90.0, 93.53], [97.0, 99.35], [100.0, 100.47]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 55.31, 0.0, 74.92, 70.3, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.43, 1.26, 0.67, 9.44, 0.82, 3.53, 2.35, 0.47]} \ No newline at end of file diff --git a/annotations_filtered/ar_o_qS68oA_filtered.json b/annotations_filtered/ar_o_qS68oA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e4e3dca489d28892fe80d8f43e12bd26af54d00 --- /dev/null +++ b/annotations_filtered/ar_o_qS68oA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.7], [11.0, 11.91], [14.0, 15.18], [15.0, 16.29], [17.0, 50.23], [52.0, 52.02], [53.0, 53.64], [54.0, 55.19], [57.0, 59.02], [60.0, 60.13], [63.0, 64.18], [67.0, 68.07], [70.0, 70.04], [80.0, 82.05], [84.0, 85.8], [87.0, 108.23], [109.0, 110.17], [113.0, 112.95], [116.0, 115.72], [117.0, 118.15], [119.0, 119.37], [119.0, 119.4], [119.0, 119.43], [119.0, 119.47], [119.0, 119.5], [121.0, 122.64], [125.0, 127.7], [134.0, 142.52], [144.0, 147.43], [149.0, 150.03], [150.0, 152.41], [156.0, 156.24], [158.0, 159.6]], "keep_status": [true, false, false, false, false, false, false, false, true, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [41.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.02, 0.0, 0.0, 0.0, 0.0, 48.14, 0.0, 29.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.8, 43.9, 30.2, 0.0, 37.73, 0.0, 0.0], "audiomae_on_audioset": [[["mains hum", 17.62], ["speech", 11.91], ["hum", 11.43]], null, null, null, null, null, null, null, [["speech", 25.95], ["sidetone", 24.98], ["radio", 16.7]], null, null, null, null, [["music", 28.69], ["hum", 17.11], ["radio", 10.88]], null, [["didgeridoo", 32.08], ["music", 18.57], ["mains hum", 14.89]], null, null, null, null, null, null, null, null, null, null, [["speech", 29.42], ["cattle, bovinae", 28.61], ["moo", 17.25]], [["mains hum", 73.94], ["hum", 17.21], ["buzz", 2.13]], [["music", 10.09], ["didgeridoo", 9.29], ["reverberation", 8.44]], null, [["mains hum", 35.42], ["hum", 29.7], ["speech", 12.82]], null, null], "duration": [2.7, 0.91, 1.18, 1.29, 33.23, 0.02, 0.64, 1.19, 2.02, 0.13, 1.18, 1.07, 0.04, 2.05, 1.8, 21.23, 1.17, -0.05, -0.28, 1.15, 0.37, 0.4, 0.43, 0.47, 0.5, 1.64, 2.7, 8.52, 3.43, 1.03, 2.41, 0.24, 1.6]} \ No newline at end of file diff --git a/annotations_filtered/arf7Bi4CCmU_filtered.json b/annotations_filtered/arf7Bi4CCmU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a8c11242439316ff897c7324685b5a19d04d28dc --- /dev/null +++ b/annotations_filtered/arf7Bi4CCmU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.86], [8.0, 37.91], [39.0, 42.06], [43.0, 45.82], [49.0, 50.38], [52.0, 54.13], [55.0, 89.43], [91.0, 93.66], [95.0, 97.7], [100.0, 104.77], [105.0, 106.56], [109.0, 113.1], [114.0, 116.56], [117.0, 119.48]], "keep_status": [false, false, false, true, false, false, false, true, true, false, false, true, true, true], "silence_prob": [0.0, 54.63, 53.1, 45.56, 0.0, 52.22, 0.0, 35.46, 35.18, 35.89, 0.0, 37.43, 38.54, 34.1], "audiomae_on_audioset": [null, null, null, [["buzz", 13.35], ["sine wave", 11.36], ["mains hum", 10.84]], null, null, null, [["music", 45.84], ["theremin", 8.09], ["foghorn", 7.56]], [["music", 51.26], ["foghorn", 9.6], ["scary music", 7.46]], [["speech", 40.15], ["music", 25.08], ["synthesizer", 5.24]], null, [["music", 37.02], ["speech", 19.44], ["buzz", 4.0]], [["music", 20.47], ["speech", 18.81], ["hum", 5.66]], [["speech", 19.6], ["mains hum", 14.99], ["hum", 14.13]]], "duration": [0.86, 29.91, 3.06, 2.82, 1.38, 2.13, 34.43, 2.66, 2.7, 4.77, 1.56, 4.1, 2.56, 2.48]} \ No newline at end of file diff --git a/annotations_filtered/arfamPuUOek_filtered.json b/annotations_filtered/arfamPuUOek_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..79e662676d390dcda3e161c6a1670e946788d08e --- /dev/null +++ b/annotations_filtered/arfamPuUOek_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.89], [9.0, 9.46], [12.0, 12.65], [14.0, 21.96], [23.0, 22.71], [24.0, 28.98], [30.0, 30.32], [34.0, 35.97], [37.0, 37.84], [42.0, 43.78], [45.0, 45.86], [49.0, 50.33], [58.0, 57.81], [66.0, 102.59], [108.0, 112.73], [113.0, 117.66], [120.0, 122.15], [125.0, 128.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [33.89, 0.0, 0.0, 32.46, 0.0, 41.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.42, 31.19, 33.69, 99.98], "audiomae_on_audioset": [[["music", 71.43], ["musical instrument", 6.31], ["guitar", 4.64]], null, null, [["music", 62.02], ["quack", 11.39], ["bleat", 4.32]], null, [["music", 58.82], ["guitar", 9.85], ["effects unit", 7.63]], null, null, null, null, null, null, null, null, [["music", 64.06], ["musical instrument", 7.35], ["guitar", 5.41]], [["music", 30.17], ["bass guitar", 20.55], ["speech", 11.49]], [["music", 63.3], ["musical instrument", 5.87], ["effects unit", 4.67]], null], "duration": [3.89, 0.46, 0.65, 7.96, -0.29, 4.98, 0.32, 1.97, 0.84, 1.78, 0.86, 1.33, -0.19, 36.59, 4.73, 4.66, 2.15, 3.87]} \ No newline at end of file diff --git a/annotations_filtered/ariuokNFhSw_filtered.json b/annotations_filtered/ariuokNFhSw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c5d967f1ab5a165bca181026ccbc0e7d7be31e8 --- /dev/null +++ b/annotations_filtered/ariuokNFhSw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 24.8], [26.0, 32.14], [33.0, 37.22], [43.0, 80.27], [83.0, 136.04], [138.0, 138.28], [142.0, 145.71], [146.0, 145.94], [146.0, 153.91], [155.0, 164.47], [166.0, 165.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.94, 30.83, 30.29, 0.0, 0.0, 0.0, 29.87, 0.0, 30.41, 30.89, 0.0], "audiomae_on_audioset": [[["music", 45.15], ["theremin", 22.79], ["musical instrument", 6.11]], [["theremin", 35.6], ["music", 30.11], ["brass instrument", 5.43]], [["music", 66.2], ["theremin", 16.41], ["musical instrument", 5.72]], null, null, null, [["music", 49.94], ["brass instrument", 11.39], ["musical instrument", 10.22]], null, [["music", 48.59], ["foghorn", 30.91], ["musical instrument", 6.51]], [["music", 59.5], ["musical instrument", 12.47], ["brass instrument", 7.74]], null], "duration": [9.8, 6.14, 4.22, 37.27, 53.04, 0.28, 3.71, -0.06, 7.91, 9.47, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/arsAllZIa1Y_filtered.json b/annotations_filtered/arsAllZIa1Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..883422ce9e65f52c617cb2b7812ac7238b3b1368 --- /dev/null +++ b/annotations_filtered/arsAllZIa1Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 36.17], [38.0, 57.25], [60.0, 60.03]], "keep_status": [false, false, false], "silence_prob": [0.0, 34.21, 0.0], "audiomae_on_audioset": [null, [["music", 65.8], ["soundtrack music", 7.56], ["scary music", 6.11]], null], "duration": [1.17, 19.25, 0.03]} \ No newline at end of file diff --git a/annotations_filtered/arzwnRoAQP0_filtered.json b/annotations_filtered/arzwnRoAQP0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b4ec7d03da5cf881cd77bfced05bb820999b8994 --- /dev/null +++ b/annotations_filtered/arzwnRoAQP0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.74], [8.0, 8.95], [14.0, 16.68], [17.0, 17.85], [26.0, 27.58], [40.0, 40.12], [41.0, 41.15], [42.0, 43.5], [52.0, 52.78], [53.0, 54.09], [55.0, 59.7], [61.0, 61.62], [63.0, 64.86], [96.0, 103.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 62.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.47, 0.0, 0.0, 32.44], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 64.08], ["hum", 2.7], ["speech", 2.59]]], "duration": [0.74, 0.95, 2.68, 0.85, 1.58, 0.12, 0.15, 1.5, 0.78, 1.09, 4.7, 0.62, 1.86, 7.62]} \ No newline at end of file diff --git a/annotations_filtered/asNSRS-UbHM_filtered.json b/annotations_filtered/asNSRS-UbHM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b2fc869758193ec69389e7b4c9eeeae3946a8622 --- /dev/null +++ b/annotations_filtered/asNSRS-UbHM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.2], [20.0, 21.17], [22.0, 23.63], [25.0, 52.39], [53.0, 58.19], [62.0, 65.8], [69.0, 69.35], [71.0, 71.41], [72.0, 71.69], [72.0, 71.74], [72.0, 71.79], [72.0, 72.44], [73.0, 73.25], [73.0, 73.28], [77.0, 85.45], [87.0, 91.62], [93.0, 93.99], [94.0, 94.63], [96.0, 105.38], [108.0, 109.98], [111.0, 111.5], [113.0, 114.0], [115.0, 115.59], [117.0, 118.08]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 36.27, 35.21, 35.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.08, 37.61, 0.0, 0.0, 33.81, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 40.91], ["mains hum", 23.29], ["fly, housefly", 8.01]], [["speech", 60.43], ["music", 7.53], ["thump, thud", 2.58]], [["speech", 46.1], ["music", 17.51], ["didgeridoo", 5.84]], null, null, null, null, null, null, null, null, [["didgeridoo", 34.78], ["speech", 20.34], ["music", 13.73]], [["whale vocalization", 34.53], ["speech", 24.75], ["animal", 12.65]], null, null, [["animal", 25.69], ["music", 19.44], ["buzz", 11.88]], null, null, null, null, null], "duration": [1.2, 1.17, 1.63, 27.39, 5.19, 3.8, 0.35, 0.41, -0.31, -0.26, -0.21, 0.44, 0.25, 0.28, 8.45, 4.62, 0.99, 0.63, 9.38, 1.98, 0.5, 1.0, 0.59, 1.08]} \ No newline at end of file diff --git a/annotations_filtered/as_lXF3HqCY_filtered.json b/annotations_filtered/as_lXF3HqCY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2b3e67688ca2fe1ef84170a6d8774b51d89f7a6c --- /dev/null +++ b/annotations_filtered/as_lXF3HqCY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.7], [10.0, 10.57], [15.0, 15.94], [18.0, 19.41], [20.0, 20.78], [23.0, 24.39], [29.0, 29.3], [36.0, 38.25], [52.0, 52.88], [55.0, 55.22], [57.0, 59.29], [65.0, 67.78], [70.0, 75.68], [76.0, 77.08], [78.0, 78.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 100.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.7, 0.57, 0.94, 1.41, 0.78, 1.39, 0.3, 2.25, 0.88, 0.22, 2.29, 2.78, 5.68, 1.08, 0.43]} \ No newline at end of file diff --git a/annotations_filtered/asxNFYNfOWI_filtered.json b/annotations_filtered/asxNFYNfOWI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e12904fd36adde6551d9ebf8d0c0ae90a1dc0640 --- /dev/null +++ b/annotations_filtered/asxNFYNfOWI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 26.03], [27.0, 31.5], [32.0, 32.56], [47.0, 48.66]], "keep_status": [true, true, false, false], "silence_prob": [40.38, 40.16, 0.0, 0.0], "audiomae_on_audioset": [[["music", 36.19], ["theremin", 20.59], ["musical instrument", 7.14]], [["hum", 13.02], ["tabla", 12.69], ["music", 11.95]], null, null], "duration": [5.03, 4.5, 0.56, 1.66]} \ No newline at end of file diff --git a/annotations_filtered/asySRpuqnTM_filtered.json b/annotations_filtered/asySRpuqnTM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..153706e0c97a4686d2741c584a55c43dbe4f2d1a --- /dev/null +++ b/annotations_filtered/asySRpuqnTM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.75], [22.0, 35.67], [43.0, 46.04], [48.0, 55.61], [68.0, 68.77], [70.0, 89.43], [94.0, 95.82], [98.0, 108.65]], "keep_status": [false, false, true, true, false, false, false, false], "silence_prob": [0.0, 31.83, 30.66, 30.81, 0.0, 31.31, 0.0, 31.8], "audiomae_on_audioset": [null, [["music", 75.69], ["musical instrument", 3.13], ["rock and roll", 2.52]], [["music", 31.78], ["boing", 7.24], ["speech", 6.69]], [["music", 23.44], ["sidetone", 17.52], ["boing", 10.32]], null, [["music", 63.26], ["speech", 7.01], ["synthesizer", 5.6]], null, [["music", 70.56], ["cacophony", 3.9], ["boing", 3.42]]], "duration": [1.75, 13.67, 3.04, 7.61, 0.77, 19.43, 1.82, 10.65]} \ No newline at end of file diff --git a/annotations_filtered/at0yN2HBrt8_filtered.json b/annotations_filtered/at0yN2HBrt8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d02d4ed0f590bcf244e6d95827a940e9023f421a --- /dev/null +++ b/annotations_filtered/at0yN2HBrt8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.39], [11.0, 12.38], [17.0, 17.46], [22.0, 79.12], [81.0, 91.29], [92.0, 95.77], [97.0, 98.51], [100.0, 101.92], [104.0, 108.03], [110.0, 111.25], [112.0, 114.69], [121.0, 122.91], [124.0, 140.26], [149.0, 153.23], [157.0, 160.83], [161.0, 169.1], [170.0, 175.12], [176.0, 180.17], [182.0, 183.22], [186.0, 187.69], [189.0, 192.5], [194.0, 198.63], [205.0, 205.98], [209.0, 213.95], [218.0, 224.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 82.97, 79.59, 0.0, 0.0, 98.8, 0.0, 97.33, 0.0, 79.07, 89.72, 89.54, 99.95, 100.0, 99.96, 0.0, 0.0, 100.0, 96.66, 0.0, 75.07, 60.32], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.39, 1.38, 0.46, 57.12, 10.29, 3.77, 1.51, 1.92, 4.03, 1.25, 2.69, 1.91, 16.26, 4.23, 3.83, 8.1, 5.12, 4.17, 1.22, 1.69, 3.5, 4.63, 0.98, 4.95, 6.85]} \ No newline at end of file diff --git a/annotations_filtered/atBUgwJAD0U_filtered.json b/annotations_filtered/atBUgwJAD0U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d073aaebaf8decb6a5484f34a0f1e935e5f2f42 --- /dev/null +++ b/annotations_filtered/atBUgwJAD0U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.88], [8.0, 9.21], [13.0, 14.72], [17.0, 23.87], [26.0, 123.8], [127.0, 126.98], [128.0, 131.75], [132.0, 165.27], [166.0, 175.69], [181.0, 182.19]], "keep_status": [false, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.76, 0.0, 0.0, 35.97, 0.0, 37.54, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 24.43], ["music", 24.12], ["throbbing", 15.97]], null, null, [["throbbing", 25.54], ["music", 23.49], ["hum", 18.69]], null, [["music", 40.54], ["hum", 16.88], ["throbbing", 14.54]], null], "duration": [0.88, 1.21, 1.72, 6.87, 97.8, -0.02, 3.75, 33.27, 9.69, 1.19]} \ No newline at end of file diff --git a/annotations_filtered/atGNvojXOvM_filtered.json b/annotations_filtered/atGNvojXOvM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3e2412921cbee35e9218b4f7010db5889f790c7 --- /dev/null +++ b/annotations_filtered/atGNvojXOvM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.76], [4.0, 5.19], [6.0, 6.86], [8.0, 15.65], [18.0, 18.22], [31.0, 31.48], [32.0, 33.29], [36.0, 36.44], [41.0, 41.42], [47.0, 48.52], [49.0, 50.89], [52.0, 52.81], [64.0, 64.34], [68.0, 69.33], [71.0, 72.4], [73.0, 74.06], [75.0, 77.4], [78.0, 80.74], [82.0, 84.18], [85.0, 86.19], [88.0, 89.73], [94.0, 93.77], [95.0, 96.35], [102.0, 103.3], [109.0, 111.23], [112.0, 113.29], [114.0, 116.72], [127.0, 127.99]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.35, 82.97, 95.23, 0.0, 0.0, 0.0, 0.0, 0.0, 95.37, 0.0, 89.01, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 15.33], ["explosion", 14.0], ["whale vocalization", 7.16]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.24, 1.19, 0.86, 7.65, 0.22, 0.48, 1.29, 0.44, 0.42, 1.52, 1.89, 0.81, 0.34, 1.33, 1.4, 1.06, 2.4, 2.74, 2.18, 1.19, 1.73, -0.23, 1.35, 1.3, 2.23, 1.29, 2.72, 0.99]} \ No newline at end of file diff --git a/annotations_filtered/atQYOl5KL-o_filtered.json b/annotations_filtered/atQYOl5KL-o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0dff3df03b1f8ed90e117a1cca5bb15f0d181d82 --- /dev/null +++ b/annotations_filtered/atQYOl5KL-o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 39.61], [40.0, 41.0], [41.0, 45.52], [46.0, 53.52], [54.0, 60.86], [69.0, 69.92]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 57.64, 63.42, 98.66, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [35.61, 1.0, 4.52, 7.52, 6.86, 0.92]} \ No newline at end of file diff --git a/annotations_filtered/ataOtn-F5s4_filtered.json b/annotations_filtered/ataOtn-F5s4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..adb9ff8bd85bff7995d18d5759b5a487ba6a5c96 --- /dev/null +++ b/annotations_filtered/ataOtn-F5s4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 74.26], [77.0, 91.18], [94.0, 107.62], [108.0, 118.47], [124.0, 124.23]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 32.64, 31.73, 37.4, 0.0], "audiomae_on_audioset": [null, [["music", 73.39], ["didgeridoo", 16.41], ["musical instrument", 1.75]], [["music", 59.09], ["speech", 16.15], ["hum", 2.77]], [["music", 44.73], ["hum", 21.24], ["mains hum", 15.98]], null], "duration": [73.26, 14.18, 13.62, 10.47, 0.23]} \ No newline at end of file diff --git a/annotations_filtered/athtiym8OYE_filtered.json b/annotations_filtered/athtiym8OYE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea2ed5d39b9b1049378271aede85de866c3628a0 --- /dev/null +++ b/annotations_filtered/athtiym8OYE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 16.16], [23.0, 24.92], [28.0, 28.05], [29.0, 30.38], [34.0, 33.83], [36.0, 37.25], [38.0, 39.29], [42.0, 42.2], [45.0, 45.1], [46.0, 47.24], [48.0, 49.15], [51.0, 51.48], [52.0, 52.78], [54.0, 54.43], [56.0, 56.91], [59.0, 58.9], [60.0, 62.68], [67.0, 66.88]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [29.06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.33, 0.0], "audiomae_on_audioset": [[["music", 21.91], ["throbbing", 20.81], ["sidetone", 9.55]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 33.91], ["throbbing", 14.24], ["hum", 12.2]], null], "duration": [4.16, 1.92, 0.05, 1.38, -0.17, 1.25, 1.29, 0.2, 0.1, 1.24, 1.15, 0.48, 0.78, 0.43, 0.91, -0.1, 2.68, -0.12]} \ No newline at end of file diff --git a/annotations_filtered/atzQpAlaojg_filtered.json b/annotations_filtered/atzQpAlaojg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..658a81b87fa9a66a5cd6ad5bf4aa8f99b00b6aaa --- /dev/null +++ b/annotations_filtered/atzQpAlaojg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.99], [15.0, 31.6], [33.0, 44.41]], "keep_status": [true, false, false], "silence_prob": [32.21, 33.97, 56.86], "audiomae_on_audioset": [[["music", 32.4], ["animal", 15.32], ["dog", 10.46]], [["music", 63.84], ["musical instrument", 6.45], ["didgeridoo", 3.5]], null], "duration": [3.99, 16.6, 11.41]} \ No newline at end of file diff --git a/annotations_filtered/au5XE48PEeU_filtered.json b/annotations_filtered/au5XE48PEeU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae28eb9422018bd4f4ee713b937e3eac41b77946 --- /dev/null +++ b/annotations_filtered/au5XE48PEeU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.95], [6.0, 6.64], [8.0, 8.34], [9.0, 12.19], [14.0, 14.74], [18.0, 18.52], [19.0, 19.52], [20.0, 24.11], [25.0, 25.2], [31.0, 31.45], [32.0, 35.48], [36.0, 36.98], [37.0, 37.84], [42.0, 42.11], [45.0, 52.49], [53.0, 53.49], [55.0, 56.84], [57.0, 57.6], [58.0, 59.56], [61.0, 62.6], [63.0, 63.85], [65.0, 67.05], [96.0, 98.52], [99.0, 99.49], [102.0, 102.32], [103.0, 103.05], [105.0, 105.48], [107.0, 107.62], [109.0, 109.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.95, 0.0, 0.0, 0.0, 90.6, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 35.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.29, 43.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["explosion", 24.85], ["firecracker", 14.94], ["burst, pop", 11.37]], null, null, null, null, null, null, [["music", 36.79], ["speech", 27.02], ["smash, crash", 5.23]], [["speech", 76.33], ["radio", 5.81], ["fart", 1.75]], null, null, null, null, null, null], "duration": [0.95, 0.64, 0.34, 3.19, 0.74, 0.52, 0.52, 4.11, 0.2, 0.45, 3.48, 0.98, 0.84, 0.11, 7.49, 0.49, 1.84, 0.6, 1.56, 1.6, 0.85, 2.05, 2.52, 0.49, 0.32, 0.05, 0.48, 0.62, 0.88]} \ No newline at end of file diff --git a/annotations_filtered/au9pGQ9AuUs_filtered.json b/annotations_filtered/au9pGQ9AuUs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d81146e905c08eaebcc8e5c075e91c661ca8154b --- /dev/null +++ b/annotations_filtered/au9pGQ9AuUs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.72], [5.0, 7.87], [11.0, 11.94], [17.0, 17.56], [19.0, 20.11], [30.0, 30.64], [32.0, 32.91], [34.0, 38.31], [44.0, 44.78], [48.0, 48.91], [52.0, 52.39], [69.0, 70.17], [71.0, 75.05], [76.0, 77.06], [82.0, 82.86], [96.0, 96.89], [103.0, 103.74], [117.0, 117.75], [123.0, 123.82], [127.0, 128.87], [129.0, 131.4], [135.0, 135.24], [138.0, 138.75], [142.0, 141.61], [145.0, 144.86], [145.0, 146.8], [151.0, 152.91], [160.0, 160.25], [168.0, 169.72], [174.0, 175.02], [217.0, 221.83], [224.0, 225.22], [227.0, 227.57], [230.0, 231.08], [237.0, 237.0]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 34.91, 0.0, 0.0, 0.0, 0.0, 0.0, 46.19, 0.0, 0.0, 0.0, 0.0, 32.49, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.26, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 38.17], ["synthesizer", 8.69], ["effects unit", 4.98]], null, null, null, null, null, [["speech", 71.06], ["sidetone", 6.88], ["hum", 4.89]], null, null, null, null, [["music", 64.93], ["synthesizer", 12.14], ["theremin", 3.79]], null, null, null, null, null, null, null, [["music", 48.61], ["theremin", 15.47], ["musical instrument", 3.14]], null, null, null, null, null, null, null, null, null, [["music", 50.61], ["middle eastern music", 5.83], ["singing", 3.77]], null, null, null, null], "duration": [1.72, 2.87, 0.94, 0.56, 1.11, 0.64, 0.91, 4.31, 0.78, 0.91, 0.39, 1.17, 4.05, 1.06, 0.86, 0.89, 0.74, 0.75, 0.82, 1.87, 2.4, 0.24, 0.75, -0.39, -0.14, 1.8, 1.91, 0.25, 1.72, 1.02, 4.83, 1.22, 0.57, 1.08, 0.0]} \ No newline at end of file diff --git a/annotations_filtered/auNkHDpPil4_filtered.json b/annotations_filtered/auNkHDpPil4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f48deeaf61038691386684d0ada0fe2b8a211945 --- /dev/null +++ b/annotations_filtered/auNkHDpPil4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 26.77], [36.0, 37.89], [38.0, 43.02], [44.0, 44.63], [48.0, 48.39], [50.0, 52.15], [59.0, 63.63], [72.0, 76.81], [82.0, 82.02], [82.0, 82.26], [83.0, 86.41], [87.0, 89.28], [90.0, 91.71], [95.0, 104.26], [106.0, 108.18], [110.0, 117.58], [121.0, 121.83], [124.0, 124.5], [125.0, 127.35], [130.0, 131.09], [138.0, 138.57], [139.0, 140.9], [143.0, 148.49], [152.0, 154.82], [157.0, 159.27], [160.0, 162.3], [163.0, 164.86], [166.0, 167.34], [169.0, 170.07], [171.0, 174.66]], "keep_status": [false, false, true, false, false, true, true, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, true, false, true, false, false, false, false, false], "silence_prob": [30.58, 0.0, 30.7, 0.0, 0.0, 31.28, 29.11, 62.17, 0.0, 0.0, 55.11, 56.1, 0.0, 52.45, 56.86, 43.93, 0.0, 0.0, 45.05, 0.0, 0.0, 0.0, 39.75, 61.18, 45.36, 53.1, 0.0, 0.0, 0.0, 56.55], "audiomae_on_audioset": [[["music", 55.64], ["didgeridoo", 15.11], ["musical instrument", 3.2]], null, [["music", 38.21], ["moo", 14.15], ["boing", 10.63]], null, null, [["speech", 33.9], ["livestock, farm animals, working animals", 11.9], ["moo", 8.37]], [["speech", 43.59], ["applause", 7.73], ["fart", 6.18]], null, null, null, null, null, null, null, null, [["music", 42.4], ["speech", 7.95], ["hum", 6.96]], null, null, [["music", 18.33], ["speech", 12.33], ["hum", 8.56]], null, null, null, [["frog", 20.31], ["whale vocalization", 12.89], ["speech", 9.71]], null, [["speech", 43.17], ["music", 6.1], ["fly, housefly", 3.89]], null, null, null, null, null], "duration": [21.77, 1.89, 5.02, 0.63, 0.39, 2.15, 4.63, 4.81, 0.02, 0.26, 3.41, 2.28, 1.71, 9.26, 2.18, 7.58, 0.83, 0.5, 2.35, 1.09, 0.57, 1.9, 5.49, 2.82, 2.27, 2.3, 1.86, 1.34, 1.07, 3.66]} \ No newline at end of file diff --git a/annotations_filtered/au_5dPh_Dm8_filtered.json b/annotations_filtered/au_5dPh_Dm8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52d1d11dc846781bcf2f5a6d0358c6bd3b061ffe --- /dev/null +++ b/annotations_filtered/au_5dPh_Dm8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.84], [25.0, 24.8], [31.0, 30.65], [32.0, 31.9], [38.0, 38.82], [42.0, 42.26], [48.0, 48.12], [48.0, 48.78]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.84, -0.2, -0.35, -0.1, 0.82, 0.26, 0.12, 0.78]} \ No newline at end of file diff --git a/annotations_filtered/auccmqO45a8_filtered.json b/annotations_filtered/auccmqO45a8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..551bcde5f907641a9c136a61af90931dd882665f --- /dev/null +++ b/annotations_filtered/auccmqO45a8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.45], [10.0, 10.27], [11.0, 11.37], [13.0, 14.2], [16.0, 18.57], [21.0, 21.41], [28.0, 29.02], [31.0, 34.52], [37.0, 37.83], [47.0, 47.85], [50.0, 50.46], [51.0, 52.46], [54.0, 55.02], [56.0, 56.66], [57.0, 57.62], [64.0, 64.1], [71.0, 72.0], [75.0, 78.26], [81.0, 83.34], [86.0, 87.51], [90.0, 90.09], [91.0, 92.4], [94.0, 94.36], [96.0, 96.5], [98.0, 98.81], [100.0, 100.11], [101.0, 101.53], [109.0, 112.24], [114.0, 122.88], [126.0, 129.27], [131.0, 134.45], [135.0, 135.68], [138.0, 139.67], [142.0, 144.51], [145.0, 148.15], [150.0, 156.1], [157.0, 157.33]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, true, false, false, false, true, false, false, false], "silence_prob": [64.07, 0.0, 0.0, 0.0, 31.97, 0.0, 0.0, 84.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.52, 44.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.42, 39.0, 37.31, 62.68, 0.0, 0.0, 42.81, 37.28, 95.78, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 27.9], ["speech", 17.64], ["radio", 15.39]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 38.11], ["cattle, bovinae", 12.27], ["moo", 9.22]], null, null, null, null, null, null, null, null, null, [["speech", 30.95], ["radio", 18.96], ["animal", 8.08]], [["radio", 46.08], ["splinter", 10.61], ["sidetone", 4.25]], null, null, null, [["speech", 52.67], ["radio", 8.43], ["telephone", 6.46]], [["sidetone", 75.13], ["speech", 13.33], ["radio", 3.98]], null, null], "duration": [4.45, 0.27, 0.37, 1.2, 2.57, 0.41, 1.02, 3.52, 0.83, 0.85, 0.46, 1.46, 1.02, 0.66, 0.62, 0.1, 1.0, 3.26, 2.34, 1.51, 0.09, 1.4, 0.36, 0.5, 0.81, 0.11, 0.53, 3.24, 8.88, 3.27, 3.45, 0.68, 1.67, 2.51, 3.15, 6.1, 0.33]} \ No newline at end of file diff --git a/annotations_filtered/aucs5KRFzhE_filtered.json b/annotations_filtered/aucs5KRFzhE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b72fa63a0307119beff3c521d5593a9a840f405 --- /dev/null +++ b/annotations_filtered/aucs5KRFzhE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.02], [16.0, 16.7], [20.0, 20.93], [43.0, 51.61], [55.0, 55.68], [56.0, 57.57], [61.0, 62.06], [65.0, 66.28], [68.0, 72.64], [77.0, 79.95], [80.0, 89.92], [94.0, 100.13], [105.0, 108.6], [109.0, 109.81], [111.0, 131.11], [132.0, 133.79], [135.0, 155.55], [159.0, 167.95], [169.0, 171.39], [171.0, 177.62], [180.0, 201.31]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, true, false, true, false, true, false, false, false, true], "silence_prob": [40.62, 0.0, 0.0, 28.8, 0.0, 0.0, 0.0, 0.0, 28.29, 28.42, 28.26, 28.37, 28.78, 0.0, 28.62, 0.0, 28.64, 28.97, 28.9, 28.67, 28.29], "audiomae_on_audioset": [[["music", 46.43], ["fart", 31.28], ["zipper (clothing)", 12.49]], null, null, [["mains hum", 44.99], ["hum", 29.79], ["throbbing", 13.19]], null, null, null, null, [["speech", 46.62], ["music", 18.22], ["explosion", 7.18]], [["music", 46.18], ["buzz", 5.55], ["mains hum", 5.0]], [["music", 18.81], ["car", 5.58], ["mains hum", 5.41]], [["music", 59.66], ["speech", 12.87], ["electronic music", 7.13]], [["speech", 28.65], ["music", 19.15], ["vehicle", 5.36]], null, [["music", 55.25], ["cacophony", 6.05], ["synthesizer", 3.72]], null, [["music", 29.86], ["speech", 25.01], ["machine gun", 11.04]], [["music", 62.73], ["didgeridoo", 6.26], ["musical instrument", 4.17]], [["speech", 43.93], ["music", 29.81], ["boing", 4.34]], [["music", 67.33], ["speech", 12.19], ["throbbing", 2.46]], [["hum", 24.27], ["music", 22.65], ["mains hum", 14.2]]], "duration": [2.02, 0.7, 0.93, 8.61, 0.68, 1.57, 1.06, 1.28, 4.64, 2.95, 9.92, 6.13, 3.6, 0.81, 20.11, 1.79, 20.55, 8.95, 2.39, 6.62, 21.31]} \ No newline at end of file diff --git a/annotations_filtered/aumRE2Eq88o_filtered.json b/annotations_filtered/aumRE2Eq88o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..187c8c75c4e56279b2ac37ee396b4bc80d70d4da --- /dev/null +++ b/annotations_filtered/aumRE2Eq88o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.24], [6.0, 12.06], [13.0, 14.69], [16.0, 21.25], [22.0, 22.11], [23.0, 26.86], [30.0, 31.46], [33.0, 34.05], [35.0, 36.51], [38.0, 40.76], [45.0, 47.46], [52.0, 58.65], [59.0, 66.5], [67.0, 74.68], [78.0, 78.29], [83.0, 115.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [100.0, 100.0, 0.0, 92.97, 0.0, 81.71, 0.0, 0.0, 0.0, 99.65, 97.92, 73.82, 42.26, 41.68, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 35.27], ["keyboard (musical)", 13.21], ["musical instrument", 11.38]], [["music", 22.68], ["speech", 15.01], ["keyboard (musical)", 8.83]], null, null], "duration": [2.24, 6.06, 1.69, 5.25, 0.11, 3.86, 1.46, 1.05, 1.51, 2.76, 2.46, 6.65, 7.5, 7.68, 0.29, 32.94]} \ No newline at end of file diff --git a/annotations_filtered/avH2K1iR8Oo_filtered.json b/annotations_filtered/avH2K1iR8Oo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c6c48f1e3bd24a319d1a419b5149b758dd513a3a --- /dev/null +++ b/annotations_filtered/avH2K1iR8Oo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.48], [8.0, 16.43], [17.0, 20.46], [22.0, 22.28], [23.0, 24.66], [26.0, 26.59], [27.0, 30.7], [33.0, 34.67], [39.0, 39.04], [41.0, 42.52], [45.0, 47.65], [51.0, 52.02], [54.0, 55.04], [56.0, 56.86], [57.0, 57.06], [57.0, 58.67], [60.0, 60.44], [61.0, 63.05], [64.0, 64.74], [65.0, 68.12], [70.0, 73.62], [74.0, 74.49], [75.0, 76.45], [87.0, 91.84], [94.0, 94.04], [95.0, 103.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 82.61, 53.91, 0.0, 0.0, 0.0, 78.89, 0.0, 0.0, 0.0, 55.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.9, 0.0, 82.79, 49.59, 0.0, 0.0, 88.46, 0.0, 57.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 27.92], ["fly, housefly", 21.48], ["insect", 13.23]], null, null, null, null, null], "duration": [0.48, 8.43, 3.46, 0.28, 1.66, 0.59, 3.7, 1.67, 0.04, 1.52, 2.65, 1.02, 1.04, 0.86, 0.06, 1.67, 0.44, 2.05, 0.74, 3.12, 3.62, 0.49, 1.45, 4.84, 0.04, 8.13]} \ No newline at end of file diff --git a/annotations_filtered/avXk2EamFs4_filtered.json b/annotations_filtered/avXk2EamFs4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60fe7745481e2bee0e3b9bce5005a61f5314e70e --- /dev/null +++ b/annotations_filtered/avXk2EamFs4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 15.69], [16.0, 64.5], [69.0, 72.23], [73.0, 74.19], [77.0, 87.44]], "keep_status": [false, false, false, false, false], "silence_prob": [36.85, 0.0, 33.43, 0.0, 31.09], "audiomae_on_audioset": [[["music", 31.76], ["mains hum", 21.05], ["hum", 20.9]], null, [["hum", 34.47], ["music", 30.31], ["mains hum", 10.29]], null, [["music", 33.63], ["speech", 19.92], ["hum", 17.85]]], "duration": [5.69, 48.5, 3.23, 1.19, 10.44]} \ No newline at end of file diff --git a/annotations_filtered/avjdKTqiVvQ_filtered.json b/annotations_filtered/avjdKTqiVvQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d95ab994506e30459d716fd0e9cb7b434c036a6 --- /dev/null +++ b/annotations_filtered/avjdKTqiVvQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[79.0, 89.56], [93.0, 117.04], [118.0, 117.95], [124.0, 124.17], [128.0, 133.96], [138.0, 138.82]], "keep_status": [false, false, false, false, false, false], "silence_prob": [86.82, 47.62, 0.0, 0.0, 83.7, 0.0], "audiomae_on_audioset": [null, [["music", 66.82], ["theremin", 20.3], ["ambient music", 4.36]], null, null, null, null], "duration": [10.56, 24.04, -0.05, 0.17, 5.96, 0.82]} \ No newline at end of file diff --git a/annotations_filtered/awPDaFp70yI_filtered.json b/annotations_filtered/awPDaFp70yI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..32a01fa9630037d760a49fb132c39d5708d5c9c6 --- /dev/null +++ b/annotations_filtered/awPDaFp70yI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.25], [15.0, 40.73], [41.0, 41.64], [43.0, 42.77], [43.0, 45.72], [48.0, 54.36], [55.0, 55.07], [58.0, 60.29], [66.0, 79.88], [82.0, 88.53]], "keep_status": [false, false, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 34.74, 0.0, 0.0, 33.4, 37.05, 0.0, 40.68, 41.62, 35.61], "audiomae_on_audioset": [null, [["music", 72.93], ["electronic music", 3.64], ["hum", 3.37]], null, null, [["music", 59.98], ["theremin", 29.28], ["video game music", 0.83]], [["music", 55.25], ["theremin", 5.65], ["musical instrument", 2.15]], null, [["music", 36.3], ["hum", 10.2], ["synthesizer", 8.91]], [["music", 37.06], ["theremin", 32.25], ["didgeridoo", 5.2]], [["music", 76.5], ["timpani", 5.3], ["animal", 3.52]]], "duration": [1.25, 25.73, 0.64, -0.23, 2.72, 6.36, 0.07, 2.29, 13.88, 6.53]} \ No newline at end of file diff --git a/annotations_filtered/awYi2rXf1Ws_filtered.json b/annotations_filtered/awYi2rXf1Ws_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..326c7f09826973e5908cbb29f3e223c8851ce52f --- /dev/null +++ b/annotations_filtered/awYi2rXf1Ws_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.98], [15.0, 18.13], [19.0, 19.67], [21.0, 21.27], [22.0, 27.75], [31.0, 70.41], [71.0, 71.76], [73.0, 73.38], [75.0, 78.14], [79.0, 79.74], [81.0, 81.36], [82.0, 90.39], [91.0, 94.05], [96.0, 96.79], [98.0, 99.17], [100.0, 100.92], [103.0, 104.18], [105.0, 105.48], [107.0, 109.53], [111.0, 111.45], [115.0, 116.07], [117.0, 118.08], [121.0, 120.99], [122.0, 123.35], [125.0, 130.45]], "keep_status": [false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 42.53, 0.0, 0.0, 52.62, 0.0, 0.0, 0.0, 42.53, 0.0, 0.0, 43.2, 42.42, 0.0, 0.0, 0.0, 0.0, 0.0, 99.9, 0.0, 0.0, 0.0, 0.0, 0.0, 51.77], "audiomae_on_audioset": [null, [["music", 27.6], ["cello", 15.88], ["double bass", 9.02]], null, null, null, null, null, null, [["singing bowl", 27.8], ["music", 26.3], ["guitar", 5.21]], null, null, [["music", 54.35], ["synthesizer", 12.78], ["singing bowl", 7.04]], [["music", 54.04], ["didgeridoo", 9.63], ["percussion", 7.23]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.98, 3.13, 0.67, 0.27, 5.75, 39.41, 0.76, 0.38, 3.14, 0.74, 0.36, 8.39, 3.05, 0.79, 1.17, 0.92, 1.18, 0.48, 2.53, 0.45, 1.07, 1.08, -0.01, 1.35, 5.45]} \ No newline at end of file diff --git a/annotations_filtered/awkGgPALfho_filtered.json b/annotations_filtered/awkGgPALfho_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f8e7e6c283bc229e64f53afcdf2594afa8cf4f3b --- /dev/null +++ b/annotations_filtered/awkGgPALfho_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.59], [30.0, 30.35], [31.0, 34.52], [41.0, 41.94], [59.0, 68.05], [70.0, 73.21], [75.0, 77.06], [79.0, 84.59], [85.0, 93.06], [97.0, 98.74], [102.0, 110.4], [126.0, 128.07], [128.0, 130.32], [137.0, 138.08], [138.0, 141.62], [144.0, 143.97], [145.0, 145.22], [146.0, 146.64], [155.0, 155.44]], "keep_status": [false, false, true, false, false, false, false, false, true, false, true, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 35.84, 0.0, 30.57, 32.64, 31.9, 29.97, 29.95, 0.0, 29.74, 54.76, 62.47, 0.0, 31.38, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 37.08], ["music", 22.35], ["bow-wow", 5.4]], null, [["music", 73.87], ["animal", 2.26], ["bow-wow", 1.92]], [["music", 59.33], ["music of latin america", 8.58], ["musical instrument", 4.59]], [["mosquito", 38.93], ["music", 27.48], ["fly, housefly", 7.91]], [["mosquito", 44.18], ["fly, housefly", 35.67], ["insect", 17.63]], [["fly, housefly", 17.36], ["music", 11.8], ["cattle, bovinae", 11.18]], null, [["fly, housefly", 26.66], ["mosquito", 24.29], ["music", 11.48]], null, null, null, [["crying, sobbing", 14.33], ["grunt", 12.72], ["fart", 8.2]], null, null, null, null], "duration": [0.59, 0.35, 3.52, 0.94, 9.05, 3.21, 2.06, 5.59, 8.06, 1.74, 8.4, 2.07, 2.32, 1.08, 3.62, -0.03, 0.22, 0.64, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/awuqJuO5WOc_filtered.json b/annotations_filtered/awuqJuO5WOc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8a52fc4138e83f5298f1534a1cfa844c62d051ec --- /dev/null +++ b/annotations_filtered/awuqJuO5WOc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 20.46], [21.0, 56.08], [57.0, 58.53], [59.0, 60.94], [61.0, 62.19], [64.0, 65.52], [68.0, 74.93], [78.0, 78.34], [80.0, 80.03], [82.0, 102.83], [106.0, 115.13], [116.0, 119.97], [123.0, 124.73], [131.0, 137.29], [139.0, 140.24], [141.0, 142.01], [143.0, 144.44], [145.0, 146.94], [148.0, 148.22], [149.0, 155.24]], "keep_status": [true, false, false, false, false, false, true, false, false, false, true, false, false, true, false, false, false, false, false, true], "silence_prob": [30.56, 0.0, 0.0, 0.0, 0.0, 0.0, 30.75, 0.0, 0.0, 30.6, 34.29, 55.6, 0.0, 46.72, 0.0, 0.0, 0.0, 0.0, 0.0, 44.49], "audiomae_on_audioset": [[["music", 48.94], ["synthesizer", 6.77], ["sound effect", 3.85]], null, null, null, null, null, [["music", 10.69], ["breaking", 10.37], ["whale vocalization", 8.25]], null, null, [["music", 79.26], ["musical instrument", 4.2], ["synthesizer", 2.09]], [["hum", 30.61], ["noise", 14.58], ["whale vocalization", 10.48]], null, null, [["hum", 24.39], ["speech", 22.09], ["music", 13.23]], null, null, null, null, null, [["hum", 36.53], ["whale vocalization", 23.21], ["throbbing", 6.34]]], "duration": [10.46, 35.08, 1.53, 1.94, 1.19, 1.52, 6.93, 0.34, 0.03, 20.83, 9.13, 3.97, 1.73, 6.29, 1.24, 1.01, 1.44, 1.94, 0.22, 6.24]} \ No newline at end of file diff --git a/annotations_filtered/ax0943uaZUk_filtered.json b/annotations_filtered/ax0943uaZUk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ad740cebff483fe24b6d80ac8e5653984333411 --- /dev/null +++ b/annotations_filtered/ax0943uaZUk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.17], [5.0, 8.43], [13.0, 24.53], [26.0, 26.49], [27.0, 39.43], [40.0, 40.47], [42.0, 42.6], [44.0, 44.56], [47.0, 47.97], [52.0, 52.52], [55.0, 64.0], [65.0, 79.22], [81.0, 83.71], [87.0, 89.45], [91.0, 91.72], [93.0, 93.19], [94.0, 95.42], [98.0, 99.96], [101.0, 104.77], [105.0, 105.65], [107.0, 110.15], [113.0, 114.17], [115.0, 115.75], [117.0, 119.55], [120.0, 121.85], [123.0, 123.62], [124.0, 132.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 56.33, 56.7, 0.0, 68.15, 0.0, 0.0, 0.0, 0.0, 0.0, 63.64, 32.85, 83.34, 78.55, 0.0, 0.0, 0.0, 0.0, 65.55, 0.0, 47.27, 0.0, 0.0, 58.22, 0.0, 0.0, 55.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["animal", 22.89], ["horse", 20.8], ["neigh, whinny", 15.93]], null, null, null, null, null, null, null, null, [["speech", 42.68], ["sidetone", 27.52], ["radio", 7.49]], null, null, null, null, null, null], "duration": [0.17, 3.43, 11.53, 0.49, 12.43, 0.47, 0.6, 0.56, 0.97, 0.52, 9.0, 14.22, 2.71, 2.45, 0.72, 0.19, 1.42, 1.96, 3.77, 0.65, 3.15, 1.17, 0.75, 2.55, 1.85, 0.62, 8.14]} \ No newline at end of file diff --git a/annotations_filtered/ax3ZNv5jqQY_filtered.json b/annotations_filtered/ax3ZNv5jqQY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1356a6a40ba48923b3245ac6b6ad17e8462eb67e --- /dev/null +++ b/annotations_filtered/ax3ZNv5jqQY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.16], [7.0, 7.23], [14.0, 15.31], [16.0, 16.65], [19.0, 19.75], [22.0, 40.78], [41.0, 43.87], [47.0, 53.42], [61.0, 62.56], [65.0, 76.35], [77.0, 84.75], [86.0, 88.38], [98.0, 98.36], [111.0, 111.81], [113.0, 113.58], [119.0, 120.16], [121.0, 130.2], [132.0, 157.89]], "keep_status": [false, false, false, false, false, true, true, true, false, true, true, true, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 29.39, 31.84, 29.91, 0.0, 29.04, 30.36, 42.96, 0.0, 0.0, 0.0, 0.0, 30.62, 31.17], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 21.66], ["music", 20.22], ["mains hum", 18.09]], [["music", 19.74], ["speech", 17.47], ["animal", 4.39]], [["foghorn", 33.4], ["fly, housefly", 19.69], ["music", 8.03]], null, [["motorcycle", 18.71], ["vehicle", 14.15], ["speech", 13.32]], [["speech", 9.77], ["grunt", 9.44], ["sound effect", 9.25]], [["speech", 26.51], ["sheep", 15.22], ["sine wave", 9.21]], null, null, null, null, [["speech", 30.36], ["music", 18.86], ["buzz", 16.26]], [["sheep", 22.22], ["bleat", 21.85], ["mosquito", 15.99]]], "duration": [1.16, 0.23, 1.31, 0.65, 0.75, 18.78, 2.87, 6.42, 1.56, 11.35, 7.75, 2.38, 0.36, 0.81, 0.58, 1.16, 9.2, 25.89]} \ No newline at end of file diff --git a/annotations_filtered/axWtCnuctw0_filtered.json b/annotations_filtered/axWtCnuctw0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..86880854117d11d7eebe66feeebdbea89d0d1ec7 --- /dev/null +++ b/annotations_filtered/axWtCnuctw0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 45.01], [47.0, 47.01], [47.0, 47.28], [52.0, 80.0], [84.0, 90.91]], "keep_status": [true, false, false, true, true], "silence_prob": [32.76, 0.0, 0.0, 28.55, 31.1], "audiomae_on_audioset": [[["music", 18.11], ["whale vocalization", 16.83], ["noise", 7.83]], null, null, [["whale vocalization", 18.4], ["music", 14.47], ["echo", 10.28]], [["gong", 33.69], ["music", 23.0], ["synthesizer", 6.07]]], "duration": [8.01, 0.01, 0.28, 28.0, 6.91]} \ No newline at end of file diff --git a/annotations_filtered/axcECZzlPVI_filtered.json b/annotations_filtered/axcECZzlPVI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..179976d7d12559d1d6be5e8917b71b8a7b0e3b46 --- /dev/null +++ b/annotations_filtered/axcECZzlPVI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.79], [11.0, 11.65], [13.0, 14.1], [19.0, 20.29], [24.0, 27.97], [30.0, 48.91], [54.0, 65.64], [69.0, 71.02], [76.0, 76.38], [81.0, 100.01], [103.0, 103.06], [111.0, 111.5]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.71, 31.95, 31.11, 30.65, 0.0, 30.38, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 35.98], ["throbbing", 20.41], ["speech", 17.48]], [["music", 58.08], ["speech", 9.08], ["drum and bass", 4.38]], [["music", 71.2], ["musical instrument", 3.34], ["guitar", 2.4]], null, [["music", 42.82], ["vehicle", 12.26], ["motorcycle", 6.59]], null, null], "duration": [1.79, 0.65, 1.1, 1.29, 3.97, 18.91, 11.64, 2.02, 0.38, 19.01, 0.06, 0.5]} \ No newline at end of file diff --git a/annotations_filtered/axhUtepWokA_filtered.json b/annotations_filtered/axhUtepWokA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dfba58030d1b8414f59c30682f2b6c2b3f146e6a --- /dev/null +++ b/annotations_filtered/axhUtepWokA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.56], [10.0, 11.42], [13.0, 12.7], [13.0, 15.23], [16.0, 28.19], [30.0, 32.9], [42.0, 57.01], [61.0, 73.09], [74.0, 80.57], [82.0, 83.03], [84.0, 84.27], [85.0, 85.6], [92.0, 98.51], [101.0, 100.97], [102.0, 102.95], [107.0, 109.09], [109.0, 126.59], [128.0, 128.92], [131.0, 133.08], [133.0, 133.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 50.41, 29.89, 29.76, 30.84, 34.81, 40.81, 0.0, 0.0, 0.0, 30.09, 0.0, 0.0, 32.1, 32.32, 0.0, 35.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 59.29], ["throbbing", 22.18], ["electronic music", 3.14]], [["music", 79.96], ["dubstep", 6.62], ["electronic music", 3.85]], [["music", 81.95], ["electronic music", 4.82], ["throbbing", 2.45]], [["music", 48.55], ["throbbing", 26.92], ["hum", 11.54]], [["throbbing", 33.9], ["music", 20.75], ["hum", 20.24]], null, null, null, [["music", 43.96], ["electronic music", 9.66], ["moo", 8.65]], null, null, [["speech", 26.94], ["music", 13.46], ["crowd", 13.03]], [["music", 52.76], ["didgeridoo", 8.1], ["throbbing", 4.49]], null, [["music", 40.26], ["throbbing", 11.71], ["cattle, bovinae", 5.84]], null], "duration": [0.56, 1.42, -0.3, 2.23, 12.19, 2.9, 15.01, 12.09, 6.57, 1.03, 0.27, 0.6, 6.51, -0.03, 0.95, 2.09, 17.59, 0.92, 2.08, 0.56]} \ No newline at end of file diff --git a/annotations_filtered/axqYHL-KPRk_filtered.json b/annotations_filtered/axqYHL-KPRk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/axqYHL-KPRk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/ay1hpFWZQnI_filtered.json b/annotations_filtered/ay1hpFWZQnI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b1f13b204a55ec6ee8c1966d8dee28141819587 --- /dev/null +++ b/annotations_filtered/ay1hpFWZQnI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.64], [28.0, 28.02], [30.0, 29.62], [30.0, 31.43], [34.0, 34.53], [48.0, 48.66], [50.0, 50.45], [51.0, 57.0], [60.0, 60.13], [61.0, 63.02], [64.0, 64.59], [88.0, 89.48]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.19, 0.0, 45.4, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 29.67], ["music", 22.04], ["electronic music", 5.65]], null, null], "duration": [0.64, 0.02, -0.38, 1.43, 0.53, 0.66, 0.45, 6.0, 0.13, 2.02, 0.59, 1.48]} \ No newline at end of file diff --git a/annotations_filtered/ayOLECuygTQ_filtered.json b/annotations_filtered/ayOLECuygTQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c83b192b0f0962baaf04e0e8ba2764fa5e67a148 --- /dev/null +++ b/annotations_filtered/ayOLECuygTQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.82], [12.0, 16.02], [18.0, 17.98], [19.0, 31.87], [34.0, 34.69], [36.0, 37.86], [39.0, 39.75], [42.0, 43.7], [46.0, 46.28], [55.0, 76.84], [78.0, 78.06], [80.0, 80.28], [87.0, 88.64], [91.0, 94.27], [95.0, 98.51], [101.0, 104.84], [106.0, 107.35], [109.0, 109.81], [112.0, 117.71]], "keep_status": [false, true, false, true, false, false, false, false, false, true, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 36.1, 0.0, 35.45, 0.0, 0.0, 0.0, 0.0, 0.0, 34.56, 0.0, 0.0, 0.0, 100.0, 100.0, 31.57, 0.0, 0.0, 32.12], "audiomae_on_audioset": [null, [["moo", 36.59], ["cattle, bovinae", 23.47], ["livestock, farm animals, working animals", 6.96]], null, [["music", 25.44], ["quack", 9.97], ["groan", 9.6]], null, null, null, null, null, [["speech", 34.61], ["livestock, farm animals, working animals", 7.28], ["cattle, bovinae", 6.99]], null, null, null, null, null, [["music", 27.1], ["speech", 15.73], ["breaking", 12.15]], null, null, [["whale vocalization", 24.37], ["hum", 18.06], ["mains hum", 15.4]]], "duration": [0.82, 4.02, -0.02, 12.87, 0.69, 1.86, 0.75, 1.7, 0.28, 21.84, 0.06, 0.28, 1.64, 3.27, 3.51, 3.84, 1.35, 0.81, 5.71]} \ No newline at end of file diff --git a/annotations_filtered/ayjftbSDeVA_filtered.json b/annotations_filtered/ayjftbSDeVA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad4156c94e5ac07b30015efa881ea31cbd6622cf --- /dev/null +++ b/annotations_filtered/ayjftbSDeVA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.69], [6.0, 8.72], [10.0, 11.55], [14.0, 15.4], [18.0, 18.18], [22.0, 23.5], [25.0, 25.71], [30.0, 29.83], [31.0, 33.08], [35.0, 35.4], [40.0, 40.46], [41.0, 41.28], [42.0, 43.97], [50.0, 51.51], [54.0, 55.92], [57.0, 56.88], [59.0, 59.37], [60.0, 61.26], [67.0, 67.41], [71.0, 82.46], [84.0, 86.68], [88.0, 96.4], [98.0, 116.9], [118.0, 122.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.88, 99.73, 99.88, 99.84, 99.73], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.69, 2.72, 1.55, 1.4, 0.18, 1.5, 0.71, -0.17, 2.08, 0.4, 0.46, 0.28, 1.97, 1.51, 1.92, -0.12, 0.37, 1.26, 0.41, 11.46, 2.68, 8.4, 18.9, 4.47]} \ No newline at end of file diff --git a/annotations_filtered/ayl2X5zfUAk_filtered.json b/annotations_filtered/ayl2X5zfUAk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..27b38abbe3fdcf7c59975b50b8dc85423bbc9875 --- /dev/null +++ b/annotations_filtered/ayl2X5zfUAk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 27.18], [33.0, 34.03], [36.0, 37.0], [39.0, 39.51], [41.0, 45.82], [47.0, 48.19], [50.0, 62.31], [75.0, 75.22], [80.0, 82.76], [90.0, 91.07], [92.0, 94.36], [97.0, 100.84], [101.0, 101.6], [102.0, 102.83], [103.0, 103.59], [106.0, 106.37], [111.0, 115.23]], "keep_status": [true, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, true], "silence_prob": [33.49, 0.0, 0.0, 0.0, 35.5, 0.0, 31.03, 0.0, 89.54, 0.0, 43.71, 35.08, 0.0, 0.0, 0.0, 0.0, 46.43], "audiomae_on_audioset": [[["music", 21.66], ["wind chime", 13.45], ["singing bowl", 11.32]], null, null, null, [["music", 33.1], ["chime", 12.88], ["wind chime", 12.1]], null, [["hum", 35.96], ["mains hum", 19.01], ["music", 11.53]], null, null, null, [["fly, housefly", 45.76], ["insect", 15.41], ["mosquito", 12.51]], [["sidetone", 30.01], ["mains hum", 23.52], ["hum", 23.37]], null, null, null, null, [["speech", 33.98], ["didgeridoo", 21.18], ["music", 8.06]]], "duration": [3.18, 1.03, 1.0, 0.51, 4.82, 1.19, 12.31, 0.22, 2.76, 1.07, 2.36, 3.84, 0.6, 0.83, 0.59, 0.37, 4.23]} \ No newline at end of file diff --git a/annotations_filtered/az-Q_fYNZrU_filtered.json b/annotations_filtered/az-Q_fYNZrU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..75714cafa01a928305c41952fda7ec1349e7d284 --- /dev/null +++ b/annotations_filtered/az-Q_fYNZrU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.57], [19.0, 23.26], [25.0, 27.58], [29.0, 54.18], [58.0, 59.63], [63.0, 65.38], [71.0, 72.32], [74.0, 74.66], [76.0, 78.48], [81.0, 83.27], [84.0, 86.66]], "keep_status": [false, false, true, true, false, true, false, false, false, true, false], "silence_prob": [36.96, 34.88, 36.8, 29.65, 0.0, 30.32, 0.0, 0.0, 32.38, 34.91, 38.2], "audiomae_on_audioset": [[["music", 72.82], ["didgeridoo", 3.57], ["electronic music", 2.79]], [["music", 86.37], ["electronic music", 2.61], ["ambient music", 1.33]], [["cattle, bovinae", 25.82], ["moo", 19.69], ["didgeridoo", 17.93]], [["music", 28.32], ["throbbing", 28.31], ["hum", 10.06]], null, [["music", 24.92], ["hum", 12.37], ["mains hum", 11.86]], null, null, [["music", 54.3], ["throbbing", 9.81], ["hum", 9.33]], [["music", 59.17], ["musical instrument", 6.9], ["didgeridoo", 3.92]], [["music", 62.26], ["ambient music", 8.88], ["harmonic", 2.96]]], "duration": [2.57, 4.26, 2.58, 25.18, 1.63, 2.38, 1.32, 0.66, 2.48, 2.27, 2.66]} \ No newline at end of file diff --git a/annotations_filtered/azYL1oPxMGg_filtered.json b/annotations_filtered/azYL1oPxMGg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/azYL1oPxMGg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/azkJMOVoNys_filtered.json b/annotations_filtered/azkJMOVoNys_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fedd66bd2e04fc93a4938fe814aced9609d3aea6 --- /dev/null +++ b/annotations_filtered/azkJMOVoNys_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.0], [6.0, 6.1], [7.0, 6.98], [8.0, 9.96], [17.0, 19.04], [28.0, 28.44], [34.0, 35.53], [37.0, 38.94], [39.0, 41.18], [41.0, 41.22], [46.0, 45.72], [53.0, 53.55], [58.0, 60.42], [64.0, 65.65], [71.0, 71.2], [72.0, 72.39], [74.0, 74.78], [76.0, 76.15], [76.0, 77.99], [80.0, 81.46], [83.0, 84.77], [88.0, 89.65], [97.0, 97.93], [102.0, 103.65], [106.0, 107.4], [112.0, 114.3], [118.0, 119.3], [123.0, 123.35], [130.0, 131.4], [133.0, 135.21], [139.0, 140.75], [145.0, 154.31], [157.0, 158.43], [160.0, 160.47], [161.0, 161.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 65.79, 0.0, 0.0, 0.0, 49.64, 0.0, 0.0, 0.0, 99.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.93, 0.0, 0.0, 0.0, 73.51, 0.0, 94.07, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 46.45], ["hum", 18.06], ["mains hum", 8.45]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.0, 0.1, -0.02, 1.96, 2.04, 0.44, 1.53, 1.94, 2.18, 0.22, -0.28, 0.55, 2.42, 1.65, 0.2, 0.39, 0.78, 0.15, 1.99, 1.46, 1.77, 1.65, 0.93, 1.65, 1.4, 2.3, 1.3, 0.35, 1.4, 2.21, 1.75, 9.31, 1.43, 0.47, 0.94]} \ No newline at end of file diff --git a/annotations_filtered/azot-mIuW3Y_filtered.json b/annotations_filtered/azot-mIuW3Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad59e2f4bcafa2b1e18274e280d6dabf9f6d2554 --- /dev/null +++ b/annotations_filtered/azot-mIuW3Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[45.0, 62.51], [65.0, 97.48], [98.0, 97.87], [99.0, 99.98], [104.0, 108.92]], "keep_status": [false, false, false, false, true], "silence_prob": [61.87, 0.0, 0.0, 0.0, 31.66], "audiomae_on_audioset": [null, null, null, null, [["music", 32.09], ["throbbing", 5.41], ["fart", 4.73]]], "duration": [17.51, 32.48, -0.13, 0.98, 4.92]} \ No newline at end of file diff --git a/app.py b/app.py index 41f22c594a48ae19ffc7a1aad296e67a0b95edb2..3d0996d01b81f6a7c25e647d2e7945c075b29567 100644 --- a/app.py +++ b/app.py @@ -51,7 +51,7 @@ def get_data_root_from_hostname(): return data_root -def load_clips_df(df_path, data_dir, verbose=True): +def load_clips_df(df_path, data_dir, verbose=True, use_local=False): assert exists(df_path), f"File {df_path} does not exist" df = pd.read_csv(df_path) print(df.columns) @@ -59,15 +59,18 @@ def load_clips_df(df_path, data_dir, verbose=True): print("Number of clips:", len(df)) # filter out clips that are not downloaded df["video_path"] = df["videoid"].apply(lambda x: join(data_dir, "pytube_videos", f"{x}.mp4")) - df = df[df["video_path"].apply(exists)] + if use_local: + df = df[df["video_path"].apply(exists)] if verbose: print("Number of clips (with videos available):", len(df)) df["audio_path"] = df["videoid"].apply(lambda x: join(data_dir, "pytube_audio", f"{x}.wav")) - df = df[df["audio_path"].apply(exists)] + if use_local: + df = df[df["audio_path"].apply(exists)] if verbose: print("Number of clips (with audio available):", len(df)) df["annot_path"] = df["videoid"].apply(lambda x: join(data_dir, "annotations", f"{x}.json")) - df = df[df["annot_path"].apply(exists)] + if use_local: + df = df[df["annot_path"].apply(exists)] if verbose: print("Number of clips (with annotations available):", len(df)) return df