diff --git a/annotations_filtered/d-2r0wMjfrY_filtered.json b/annotations_filtered/d-2r0wMjfrY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3ce2d459d19b351398e96da772c23b0f363fc6e1 --- /dev/null +++ b/annotations_filtered/d-2r0wMjfrY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.29], [3.0, 3.08], [5.0, 22.57]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 30.4], "audiomae_on_audioset": [null, null, [["music", 58.47], ["speech", 17.54], ["musical instrument", 3.9]]], "duration": [0.29, 0.08, 17.57]} \ No newline at end of file diff --git a/annotations_filtered/d-RR_vV7qDU_filtered.json b/annotations_filtered/d-RR_vV7qDU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc591e9a033ec5f94b7378a51b5734352f031972 --- /dev/null +++ b/annotations_filtered/d-RR_vV7qDU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.99], [16.0, 19.48], [22.0, 23.03], [27.0, 28.75], [30.0, 35.09], [41.0, 53.23], [55.0, 85.6], [87.0, 93.39], [96.0, 99.52], [102.0, 105.31], [108.0, 108.82], [109.0, 118.2], [125.0, 127.06], [129.0, 131.13]], "keep_status": [true, false, false, false, true, true, false, false, true, true, false, false, false, true], "silence_prob": [31.64, 30.83, 0.0, 0.0, 31.61, 32.3, 0.0, 31.11, 31.77, 32.18, 0.0, 31.62, 32.23, 33.24], "audiomae_on_audioset": [[["cacophony", 23.96], ["vehicle", 9.44], ["music", 8.97]], [["sidetone", 32.38], ["music", 29.07], ["speech", 17.33]], null, null, [["music", 38.68], ["hum", 16.72], ["throbbing", 9.88]], [["music", 24.24], ["speech", 23.55], ["sonar", 9.01]], null, [["speech", 46.38], ["sidetone", 20.62], ["music", 12.17]], [["music", 30.9], ["electronic music", 11.26], ["cacophony", 7.68]], [["music", 38.97], ["speech", 16.23], ["sidetone", 6.9]], null, [["speech", 79.81], ["music", 8.27], ["cacophony", 2.73]], [["music", 76.3], ["musical instrument", 5.27], ["theremin", 2.64]], [["speech", 38.32], ["music", 13.44], ["synthesizer", 5.86]]], "duration": [3.99, 3.48, 1.03, 1.75, 5.09, 12.23, 30.6, 6.39, 3.52, 3.31, 0.82, 9.2, 2.06, 2.13]} \ No newline at end of file diff --git a/annotations_filtered/d-kcczAff40_filtered.json b/annotations_filtered/d-kcczAff40_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..948ea2f9ffb6875bbf5625498dc5a2c7849e15b4 --- /dev/null +++ b/annotations_filtered/d-kcczAff40_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[101.0, 101.46], [102.0, 103.1], [104.0, 105.17], [106.0, 106.44]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [0.46, 1.1, 1.17, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/d-nJUGK8ABk_filtered.json b/annotations_filtered/d-nJUGK8ABk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec519593ea34d0c11e1338cc79d1cfe9631947c3 --- /dev/null +++ b/annotations_filtered/d-nJUGK8ABk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.91], [10.0, 10.45], [16.0, 32.12], [32.0, 32.16], [33.0, 33.2], [34.0, 35.16], [36.0, 46.97], [51.0, 90.78], [97.0, 98.15], [102.0, 102.74], [108.0, 108.87], [111.0, 112.16], [115.0, 115.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 33.44, 0.0, 0.0, 0.0, 33.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 65.94], ["drum machine", 13.79], ["speech", 12.33]], null, null, null, [["music", 61.13], ["speech", 17.13], ["drum machine", 2.44]], null, null, null, null, null, null], "duration": [0.91, 0.45, 16.12, 0.16, 0.2, 1.16, 10.97, 39.78, 1.15, 0.74, 0.87, 1.16, 0.45]} \ No newline at end of file diff --git a/annotations_filtered/d0ZOz1i5-PE_filtered.json b/annotations_filtered/d0ZOz1i5-PE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5cf28bd6763eee9c1ac7a938c2bb1878d3e7c6b8 --- /dev/null +++ b/annotations_filtered/d0ZOz1i5-PE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.53], [23.0, 24.8], [26.0, 26.22], [28.0, 29.3], [31.0, 36.14], [37.0, 37.23], [40.0, 40.46], [44.0, 46.06], [46.0, 46.6], [49.0, 49.11], [54.0, 54.43], [59.0, 59.48], [63.0, 68.88], [69.0, 70.17], [72.0, 72.15], [84.0, 86.59], [90.0, 91.18], [93.0, 96.3], [103.0, 103.89], [107.0, 109.21], [117.0, 118.34], [122.0, 125.56]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, true, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 43.15, 0.0, 0.0, 34.96, 0.0, 0.0, 0.0, 0.0, 33.86, 0.0, 0.0, 36.11, 0.0, 31.57, 0.0, 36.76, 0.0, 39.55], "audiomae_on_audioset": [null, null, null, null, [["speech", 39.08], ["fly, housefly", 17.56], ["insect", 13.84]], null, null, [["music", 32.73], ["speech", 19.45], ["timpani", 8.0]], null, null, null, null, [["music", 47.04], ["speech", 22.91], ["boing", 11.62]], null, null, [["speech", 26.29], ["boing", 17.4], ["music", 15.57]], null, [["music", 14.96], ["speech", 14.4], ["moo", 13.19]], null, [["music", 39.33], ["speech", 9.48], ["didgeridoo", 5.21]], null, [["music", 49.65], ["boing", 3.43], ["sampler", 2.9]]], "duration": [1.53, 1.8, 0.22, 1.3, 5.14, 0.23, 0.46, 2.06, 0.6, 0.11, 0.43, 0.48, 5.88, 1.17, 0.15, 2.59, 1.18, 3.3, 0.89, 2.21, 1.34, 3.56]} \ No newline at end of file diff --git a/annotations_filtered/d0c6KWKMAF8_filtered.json b/annotations_filtered/d0c6KWKMAF8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..731c01f8d96a24d937cfce3fef7b0fb7bb71b100 --- /dev/null +++ b/annotations_filtered/d0c6KWKMAF8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.35], [7.0, 7.69], [9.0, 11.2], [12.0, 20.8], [22.0, 47.97], [49.0, 50.6], [52.0, 53.18], [55.0, 56.15], [57.0, 62.46], [64.0, 65.57], [66.0, 67.26], [68.0, 68.39], [80.0, 93.93], [96.0, 103.32], [106.0, 106.86], [109.0, 114.91], [116.0, 117.22]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [38.15, 0.0, 84.25, 44.55, 36.2, 0.0, 0.0, 0.0, 36.47, 0.0, 0.0, 0.0, 31.59, 53.1, 0.0, 90.43, 0.0], "audiomae_on_audioset": [[["speech", 56.49], ["music", 8.86], ["synthesizer", 2.92]], null, null, [["hum", 46.55], ["throbbing", 30.95], ["mains hum", 16.7]], [["hum", 41.44], ["throbbing", 40.18], ["mains hum", 7.96]], null, null, null, [["throbbing", 27.99], ["music", 26.95], ["hum", 19.67]], null, null, null, [["hum", 33.15], ["speech", 15.04], ["throbbing", 14.93]], null, null, null, null], "duration": [3.35, 0.69, 2.2, 8.8, 25.97, 1.6, 1.18, 1.15, 5.46, 1.57, 1.26, 0.39, 13.93, 7.32, 0.86, 5.91, 1.22]} \ No newline at end of file diff --git a/annotations_filtered/d0hM2Ekkk-8_filtered.json b/annotations_filtered/d0hM2Ekkk-8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eb78b671029d6789fb1405872c581adaf7580e1b --- /dev/null +++ b/annotations_filtered/d0hM2Ekkk-8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.28], [24.0, 24.33], [33.0, 49.08], [77.0, 76.79], [101.0, 101.39], [135.0, 135.82]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 64.52, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [1.28, 0.33, 16.08, -0.21, 0.39, 0.82]} \ No newline at end of file diff --git a/annotations_filtered/d0x7-oo9NAk_filtered.json b/annotations_filtered/d0x7-oo9NAk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db01663b578c82513461769daa66a8573e4c8a56 --- /dev/null +++ b/annotations_filtered/d0x7-oo9NAk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[85.0, 85.85], [88.0, 87.83], [90.0, 100.82], [103.0, 106.05], [107.0, 120.41], [121.0, 122.76], [123.0, 140.53], [142.0, 142.92], [147.0, 183.22], [184.0, 185.53], [186.0, 194.43], [198.0, 203.5]], "keep_status": [false, false, false, true, false, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 29.67, 40.55, 29.93, 0.0, 32.82, 0.0, 0.0, 0.0, 33.46, 33.63], "audiomae_on_audioset": [null, null, [["hum", 33.27], ["throbbing", 24.19], ["music", 18.59]], [["music", 58.6], ["throbbing", 6.78], ["theme music", 3.25]], [["throbbing", 41.88], ["music", 28.89], ["hum", 16.73]], null, [["speech", 26.93], ["hum", 22.73], ["music", 14.61]], null, null, null, [["grunt", 67.15], ["speech", 4.83], ["sound effect", 4.43]], [["music", 30.39], ["effects unit", 26.24], ["musical instrument", 10.2]]], "duration": [0.85, -0.17, 10.82, 3.05, 13.41, 1.76, 17.53, 0.92, 36.22, 1.53, 8.43, 5.5]} \ No newline at end of file diff --git a/annotations_filtered/d1ZUnCbVoZQ_filtered.json b/annotations_filtered/d1ZUnCbVoZQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..57e8e0441de433fe7052eae36f6d52438774c402 --- /dev/null +++ b/annotations_filtered/d1ZUnCbVoZQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 5.58], [6.0, 9.66], [11.0, 14.17], [15.0, 15.7], [16.0, 16.09], [17.0, 17.37], [19.0, 21.57], [22.0, 23.36], [25.0, 25.78], [27.0, 29.49], [30.0, 39.73], [43.0, 42.79], [43.0, 45.35], [51.0, 51.54], [57.0, 57.33], [58.0, 58.48], [59.0, 60.35], [63.0, 63.36], [65.0, 71.52], [76.0, 76.1], [76.0, 78.24], [79.0, 80.01], [82.0, 82.58], [85.0, 86.83], [87.0, 88.32], [89.0, 90.14], [94.0, 95.77], [101.0, 102.63], [104.0, 105.48], [107.0, 107.7], [109.0, 109.75], [112.0, 112.8], [114.0, 114.44], [117.0, 117.37], [122.0, 123.63], [125.0, 126.15], [128.0, 128.97], [134.0, 133.88], [154.0, 154.09], [159.0, 161.06], [163.0, 164.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [94.07, 99.05, 93.29, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 57.4, 96.42, 0.0, 51.55, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 79.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.58, 3.66, 3.17, 0.7, 0.09, 0.37, 2.57, 1.36, 0.78, 2.49, 9.73, -0.21, 2.35, 0.54, 0.33, 0.48, 1.35, 0.36, 6.52, 0.1, 2.24, 1.01, 0.58, 1.83, 1.32, 1.14, 1.77, 1.63, 1.48, 0.7, 0.75, 0.8, 0.44, 0.37, 1.63, 1.15, 0.97, -0.12, 0.09, 2.06, 1.46]} \ No newline at end of file diff --git a/annotations_filtered/d1lql0Z0e-E_filtered.json b/annotations_filtered/d1lql0Z0e-E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e44e0e0f132852e82ad1e254c54a2a2d1d7fad95 --- /dev/null +++ b/annotations_filtered/d1lql0Z0e-E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.98], [6.0, 7.28], [13.0, 13.71], [16.0, 19.33], [20.0, 27.24], [29.0, 49.45], [50.0, 49.55], [50.0, 57.5], [58.0, 72.69], [76.0, 86.9], [89.0, 91.13], [92.0, 92.43], [93.0, 94.31], [96.0, 98.25], [101.0, 102.52], [104.0, 104.68], [108.0, 108.85], [111.0, 111.94]], "keep_status": [false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 28.63, 32.98, 37.89, 0.0, 38.19, 55.39, 41.72, 61.08, 0.0, 0.0, 77.03, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["crowd", 31.19], ["cheering", 19.04], ["cattle, bovinae", 16.75]], [["music", 44.16], ["theremin", 30.2], ["didgeridoo", 4.5]], [["music", 42.04], ["musical instrument", 13.75], ["gong", 8.69]], null, [["speech", 80.42], ["sidetone", 4.27], ["hum", 2.55]], null, [["didgeridoo", 44.64], ["music", 37.06], ["musical instrument", 3.67]], null, null, null, null, null, null, null, null], "duration": [0.98, 1.28, 0.71, 3.33, 7.24, 20.45, -0.45, 7.5, 14.69, 10.9, 2.13, 0.43, 1.31, 2.25, 1.52, 0.68, 0.85, 0.94]} \ No newline at end of file diff --git a/annotations_filtered/d2uvpiz5up0_filtered.json b/annotations_filtered/d2uvpiz5up0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..46ce078010198df4e2b3af6db53c3373725ae8a0 --- /dev/null +++ b/annotations_filtered/d2uvpiz5up0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 16.16], [17.0, 30.81], [34.0, 68.66], [70.0, 103.82], [107.0, 118.37]], "keep_status": [true, false, false, false, true], "silence_prob": [32.14, 31.49, 0.0, 0.0, 30.63], "audiomae_on_audioset": [[["hum", 27.24], ["speech", 25.41], ["mains hum", 15.35]], [["speech", 68.8], ["vehicle", 9.05], ["helicopter", 3.48]], null, null, [["hum", 36.31], ["music", 19.79], ["mains hum", 8.46]]], "duration": [9.16, 13.81, 34.66, 33.82, 11.37]} \ No newline at end of file diff --git a/annotations_filtered/d3-AXjkz3Pk_filtered.json b/annotations_filtered/d3-AXjkz3Pk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b9ca79fbb81781138a4cc8af506cb92d21d4eea --- /dev/null +++ b/annotations_filtered/d3-AXjkz3Pk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.4], [8.0, 7.99], [9.0, 10.08], [10.0, 11.91], [13.0, 20.92], [28.0, 29.25], [31.0, 34.16], [36.0, 39.63], [42.0, 44.91], [53.0, 53.96], [55.0, 56.24], [57.0, 60.44], [69.0, 69.8], [71.0, 71.44], [72.0, 73.09], [87.0, 87.61], [88.0, 88.23], [90.0, 91.47], [103.0, 107.55], [110.0, 110.89]], "keep_status": [true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.0, 0.0, 0.0, 0.0, 33.97, 0.0, 57.89, 49.36, 66.51, 0.0, 0.0, 80.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.82, 0.0], "audiomae_on_audioset": [[["music", 44.32], ["whip", 6.97], ["musical instrument", 4.6]], null, null, null, [["cattle, bovinae", 33.94], ["moo", 26.72], ["fly, housefly", 9.45]], null, null, [["mosquito", 22.84], ["fly, housefly", 10.68], ["insect", 7.64]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.4, -0.01, 1.08, 1.91, 7.92, 1.25, 3.16, 3.63, 2.91, 0.96, 1.24, 3.44, 0.8, 0.44, 1.09, 0.61, 0.23, 1.47, 4.55, 0.89]} \ No newline at end of file diff --git a/annotations_filtered/d35M7d-E_PY_filtered.json b/annotations_filtered/d35M7d-E_PY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b995c834871dfd270a13f7beb4a22a2ac4e4c35c --- /dev/null +++ b/annotations_filtered/d35M7d-E_PY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.24], [7.0, 7.65], [9.0, 9.69], [10.0, 11.23], [18.0, 18.32], [30.0, 30.67], [33.0, 33.17], [38.0, 39.5], [43.0, 43.04], [44.0, 44.59], [48.0, 49.59], [51.0, 51.11], [53.0, 53.82], [54.0, 55.53], [59.0, 59.81], [65.0, 65.42], [70.0, 70.55], [74.0, 74.36], [87.0, 87.54], [94.0, 95.01], [99.0, 99.72], [102.0, 102.54], [107.0, 107.62], [109.0, 109.26], [117.0, 118.5], [121.0, 121.86], [125.0, 125.58], [128.0, 129.03], [131.0, 131.68], [132.0, 132.34], [132.0, 133.68], [135.0, 136.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.24, 0.65, 0.69, 1.23, 0.32, 0.67, 0.17, 1.5, 0.04, 0.59, 1.59, 0.11, 0.82, 1.53, 0.81, 0.42, 0.55, 0.36, 0.54, 1.01, 0.72, 0.54, 0.62, 0.26, 1.5, 0.86, 0.58, 1.03, 0.68, 0.34, 1.68, 1.19]} \ No newline at end of file diff --git a/annotations_filtered/d3GeSiD2HIs_filtered.json b/annotations_filtered/d3GeSiD2HIs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f3441eb0c53f5c73bd52418b4c48f2d32234a916 --- /dev/null +++ b/annotations_filtered/d3GeSiD2HIs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 32.09], [37.0, 37.44], [39.0, 121.81], [122.0, 123.16], [124.0, 125.2], [128.0, 171.04]], "keep_status": [true, false, false, false, false, false], "silence_prob": [49.64, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["fly, housefly", 12.36], ["roaring cats (lions, tigers)", 12.33], ["stomach rumble", 9.94]], null, null, null, null, null], "duration": [14.09, 0.44, 82.81, 1.16, 1.2, 43.04]} \ No newline at end of file diff --git a/annotations_filtered/d3HAOZbAj1Q_filtered.json b/annotations_filtered/d3HAOZbAj1Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..160d21a3eb64e839e2d0bfcccefc6d29ec9a8bc8 --- /dev/null +++ b/annotations_filtered/d3HAOZbAj1Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 23.94], [25.0, 25.46], [30.0, 36.85], [45.0, 45.69], [53.0, 53.45], [53.0, 69.4]], "keep_status": [true, false, true, false, false, true], "silence_prob": [29.84, 0.0, 30.51, 0.0, 0.0, 29.74], "audiomae_on_audioset": [[["music", 28.79], ["hum", 14.97], ["mains hum", 14.13]], null, [["rumble", 22.82], ["speech", 16.18], ["hum", 13.03]], null, null, [["music", 51.69], ["hum", 11.58], ["grunt", 6.59]]], "duration": [3.94, 0.46, 6.85, 0.69, 0.45, 16.4]} \ No newline at end of file diff --git a/annotations_filtered/d3ZUSI1_lOc_filtered.json b/annotations_filtered/d3ZUSI1_lOc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3668a4c09b68035caee2298831393ef95eab4238 --- /dev/null +++ b/annotations_filtered/d3ZUSI1_lOc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 30.47], [37.0, 38.15], [44.0, 43.87], [53.0, 55.97]], "keep_status": [false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 30.38], "audiomae_on_audioset": [null, null, null, [["noise", 38.03], ["music", 9.97], ["livestock, farm animals, working animals", 6.98]]], "duration": [0.47, 1.15, -0.13, 2.97]} \ No newline at end of file diff --git a/annotations_filtered/d3hs2M_0vLE_filtered.json b/annotations_filtered/d3hs2M_0vLE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c39ba55fbaa7d22677e7415d3eff19c8d835b686 --- /dev/null +++ b/annotations_filtered/d3hs2M_0vLE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.08], [12.0, 13.09], [25.0, 27.51], [28.0, 29.52], [31.0, 31.18], [32.0, 32.29], [37.0, 37.77], [45.0, 46.06], [48.0, 50.85], [66.0, 66.51], [69.0, 69.36], [73.0, 83.54], [84.0, 84.96], [97.0, 100.79], [106.0, 107.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 53.72, 0.0, 0.0, 0.0, 0.0, 0.0, 75.07, 0.0, 0.0, 100.0, 0.0, 84.43, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.08, 1.09, 2.51, 1.52, 0.18, 0.29, 0.77, 1.06, 2.85, 0.51, 0.36, 10.54, 0.96, 3.79, 1.7]} \ No newline at end of file diff --git a/annotations_filtered/d46cDtFv_Rw_filtered.json b/annotations_filtered/d46cDtFv_Rw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..27e94b11ffa738dfff01a742d70d214a852f138b --- /dev/null +++ b/annotations_filtered/d46cDtFv_Rw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.55], [6.0, 6.45], [8.0, 9.04], [9.0, 10.37], [11.0, 12.83], [19.0, 21.81], [22.0, 23.65], [28.0, 31.46], [38.0, 40.29], [43.0, 43.95], [46.0, 50.99], [52.0, 54.3], [55.0, 57.11], [59.0, 60.57], [62.0, 65.26], [66.0, 67.24], [69.0, 73.84], [76.0, 79.29], [81.0, 82.81], [85.0, 95.61], [99.0, 108.31], [110.0, 111.45], [113.0, 112.78], [115.0, 116.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 95.64, 0.0, 97.43, 72.16, 0.0, 77.36, 65.55, 49.13, 0.0, 99.16, 0.0, 76.2, 65.67, 0.0, 72.31, 71.29, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 47.8], ["insect", 3.49], ["hum", 3.27]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.55, 0.45, 1.04, 1.37, 1.83, 2.81, 1.65, 3.46, 2.29, 0.95, 4.99, 2.3, 2.11, 1.57, 3.26, 1.24, 4.84, 3.29, 1.81, 10.61, 9.31, 1.45, -0.22, 1.9]} \ No newline at end of file diff --git a/annotations_filtered/d4Ljj8W1hE8_filtered.json b/annotations_filtered/d4Ljj8W1hE8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3985c1745ebb88e32a016c5474ba13f55116eb87 --- /dev/null +++ b/annotations_filtered/d4Ljj8W1hE8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.16], [18.0, 18.76], [19.0, 20.17], [24.0, 24.02], [32.0, 33.45], [35.0, 36.0], [37.0, 37.45], [38.0, 41.0], [43.0, 53.91], [55.0, 58.97], [61.0, 72.64], [73.0, 72.69], [73.0, 75.59], [76.0, 77.97], [79.0, 79.37], [80.0, 81.65], [84.0, 84.35], [88.0, 90.31], [91.0, 95.18], [96.0, 101.22], [102.0, 102.81], [105.0, 105.56], [109.0, 109.66], [110.0, 114.64], [116.0, 126.59], [129.0, 129.07], [132.0, 136.98], [138.0, 138.65]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [39.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.12, 36.0, 95.51, 36.71, 0.0, 69.34, 0.0, 0.0, 0.0, 0.0, 88.28, 97.22, 65.91, 0.0, 0.0, 0.0, 70.44, 62.17, 0.0, 40.55, 0.0], "audiomae_on_audioset": [[["speech", 82.42], ["fart", 5.38], ["radio", 2.72]], null, null, null, null, null, null, [["chirp tone", 49.29], ["sine wave", 17.16], ["noise", 11.24]], [["mains hum", 24.24], ["hum", 17.67], ["music", 17.07]], null, [["creak", 19.25], ["percussion", 15.43], ["tabla", 14.07]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fart", 43.27], ["speech", 7.1], ["hiccup", 4.23]], null], "duration": [3.16, 0.76, 1.17, 0.02, 1.45, 1.0, 0.45, 3.0, 10.91, 3.97, 11.64, -0.31, 2.59, 1.97, 0.37, 1.65, 0.35, 2.31, 4.18, 5.22, 0.81, 0.56, 0.66, 4.64, 10.59, 0.07, 4.98, 0.65]} \ No newline at end of file diff --git a/annotations_filtered/d4MZPbERTFs_filtered.json b/annotations_filtered/d4MZPbERTFs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da87738d275f5c43af7ffa3d02b6c7c2a07a4172 --- /dev/null +++ b/annotations_filtered/d4MZPbERTFs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.81], [4.0, 3.62], [4.0, 5.04], [6.0, 6.54], [7.0, 7.45], [8.0, 10.72], [11.0, 12.33], [15.0, 15.48], [16.0, 17.61], [18.0, 19.84], [20.0, 23.55], [24.0, 26.0], [27.0, 27.97], [29.0, 32.27], [33.0, 34.25], [42.0, 42.11], [43.0, 43.95], [44.0, 45.05], [46.0, 45.76], [46.0, 55.39], [66.0, 66.01], [71.0, 72.47], [73.0, 79.52], [81.0, 83.32], [84.0, 84.91], [87.0, 88.94], [92.0, 92.16], [94.0, 97.38], [103.0, 104.89], [107.0, 107.55], [108.0, 109.44], [112.0, 119.94], [121.0, 124.34], [127.0, 127.3], [128.0, 132.12], [135.0, 135.51], [141.0, 142.21], [145.0, 146.3], [147.0, 146.97], [149.0, 150.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 88.1, 0.0, 0.0, 0.0, 0.0, 84.8, 93.29, 0.0, 97.43, 0.0, 0.0, 0.0, 0.0, 0.0, 32.25, 0.0, 0.0, 32.95, 52.92, 0.0, 0.0, 0.0, 42.0, 0.0, 0.0, 0.0, 30.58, 56.86, 0.0, 42.51, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 54.47], ["music", 18.97], ["hum", 4.54]], null, null, [["hum", 25.88], ["mains hum", 15.84], ["speech", 15.61]], null, null, null, null, [["hum", 49.32], ["throbbing", 33.4], ["stomach rumble", 3.31]], null, null, null, [["hum", 19.8], ["whip", 10.36], ["explosion", 10.24]], null, null, [["mains hum", 35.26], ["hum", 25.43], ["speech", 8.37]], null, null, null, null, null], "duration": [0.81, -0.38, 1.04, 0.54, 0.45, 2.72, 1.33, 0.48, 1.61, 1.84, 3.55, 2.0, 0.97, 3.27, 1.25, 0.11, 0.95, 1.05, -0.24, 9.39, 0.01, 1.47, 6.52, 2.32, 0.91, 1.94, 0.16, 3.38, 1.89, 0.55, 1.44, 7.94, 3.34, 0.3, 4.12, 0.51, 1.21, 1.3, -0.03, 1.26]} \ No newline at end of file diff --git a/annotations_filtered/d4ftmOI5NnI_filtered.json b/annotations_filtered/d4ftmOI5NnI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..39547a47de2761fba454ad1629f1c8a4344200dd --- /dev/null +++ b/annotations_filtered/d4ftmOI5NnI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.41], [2.0, 1.98], [2.0, 2.91], [4.0, 4.8], [6.0, 5.97], [8.0, 8.75], [9.0, 10.0], [16.0, 17.78], [19.0, 19.52], [21.0, 22.65], [25.0, 26.27], [27.0, 28.02], [36.0, 36.68], [38.0, 38.1], [39.0, 41.07], [52.0, 53.67], [55.0, 54.73], [63.0, 63.04], [64.0, 64.23], [66.0, 72.47], [73.0, 74.02], [76.0, 75.71], [78.0, 78.39], [81.0, 85.68], [87.0, 86.85], [87.0, 89.09], [92.0, 92.52], [94.0, 93.7], [96.0, 96.96], [125.0, 125.29], [155.0, 156.07], [159.0, 159.54], [161.0, 163.21], [169.0, 173.87], [175.0, 175.8], [189.0, 189.89], [194.0, 194.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.27, 0.0, 0.0, 0.0, 0.0, 97.0, 0.0, 0.0, 0.0, 100.0, 0.0, 68.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.63, 87.92, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 11.32], ["boing", 8.13], ["animal", 7.5]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.41, -0.02, 0.91, 0.8, -0.03, 0.75, 1.0, 1.78, 0.52, 1.65, 1.27, 1.02, 0.68, 0.1, 2.07, 1.67, -0.27, 0.04, 0.23, 6.47, 1.02, -0.29, 0.39, 4.68, -0.15, 2.09, 0.52, -0.3, 0.96, 0.29, 1.07, 0.54, 2.21, 4.87, 0.8, 0.89, 0.05]} \ No newline at end of file diff --git a/annotations_filtered/d5MJBYofzhs_filtered.json b/annotations_filtered/d5MJBYofzhs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce48b1e9ccfa12741e1e8ad05cedf1c24acd480b --- /dev/null +++ b/annotations_filtered/d5MJBYofzhs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 57.69]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [40.69]} \ No newline at end of file diff --git a/annotations_filtered/d5Pc-tNsvT4_filtered.json b/annotations_filtered/d5Pc-tNsvT4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4561cfa53942a6ef1b7706a8dd66dd9d6da0071d --- /dev/null +++ b/annotations_filtered/d5Pc-tNsvT4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.23], [5.0, 5.54], [7.0, 7.21], [16.0, 17.22], [19.0, 19.77], [22.0, 23.95], [33.0, 33.15], [38.0, 38.64], [49.0, 49.47], [53.0, 54.08], [59.0, 59.54], [70.0, 70.02], [73.0, 72.91], [75.0, 75.19], [79.0, 79.88], [82.0, 82.53], [101.0, 107.59], [110.0, 110.96], [115.0, 115.05], [117.0, 116.95], [121.0, 121.58], [129.0, 128.82], [139.0, 145.15], [151.0, 156.63], [159.0, 160.32], [162.0, 165.87]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, true], "silence_prob": [40.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.21, 0.0, 0.0, 0.0, 0.0, 0.0, 29.29, 42.44, 0.0, 45.75], "audiomae_on_audioset": [[["music", 27.05], ["hum", 20.14], ["speech", 10.98]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 51.64], ["trombone", 10.17], ["brass instrument", 5.23]], [["hum", 40.68], ["mains hum", 14.25], ["rumble", 14.17]], null, [["music", 24.48], ["whale vocalization", 11.18], ["sidetone", 8.62]]], "duration": [2.23, 0.54, 0.21, 1.22, 0.77, 1.95, 0.15, 0.64, 0.47, 1.08, 0.54, 0.02, -0.09, 0.19, 0.88, 0.53, 6.59, 0.96, 0.05, -0.05, 0.58, -0.18, 6.15, 5.63, 1.32, 3.87]} \ No newline at end of file diff --git a/annotations_filtered/d5gSQLPcya0_filtered.json b/annotations_filtered/d5gSQLPcya0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..245b6dc04837831af18ac439e7fbc9c9fca1fb8b --- /dev/null +++ b/annotations_filtered/d5gSQLPcya0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 14.37], [15.0, 17.12], [18.0, 33.78], [37.0, 57.6], [60.0, 82.29], [84.0, 96.85], [98.0, 104.19], [106.0, 107.28], [111.0, 112.5], [123.0, 127.99], [131.0, 134.45], [138.0, 141.32], [143.0, 165.67]], "keep_status": [false, true, false, true, true, true, true, false, false, true, false, true, false], "silence_prob": [30.27, 46.94, 78.21, 30.87, 35.64, 31.96, 36.21, 0.0, 0.0, 31.29, 30.82, 30.15, 50.51], "audiomae_on_audioset": [[["music", 29.9], ["hum", 23.69], ["throbbing", 19.61]], [["speech", 20.15], ["sonar", 10.51], ["music", 9.41]], null, [["speech", 30.81], ["buzz", 13.54], ["livestock, farm animals, working animals", 7.68]], [["music", 36.4], ["hum", 17.42], ["throbbing", 6.06]], [["speech", 34.02], ["music", 14.55], ["hum", 9.58]], [["speech", 45.62], ["music", 9.59], ["sidetone", 6.24]], null, null, [["speech", 41.25], ["vehicle", 10.17], ["mains hum", 5.22]], [["speech", 48.47], ["music", 13.0], ["vehicle", 9.08]], [["speech", 21.31], ["music", 16.95], ["noise", 5.82]], null], "duration": [9.37, 2.12, 15.78, 20.6, 22.29, 12.85, 6.19, 1.28, 1.5, 4.99, 3.45, 3.32, 22.67]} \ No newline at end of file diff --git a/annotations_filtered/d5jxXkpstv4_filtered.json b/annotations_filtered/d5jxXkpstv4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f80bb8fe5b929b81552624769a5b78c6aad23f60 --- /dev/null +++ b/annotations_filtered/d5jxXkpstv4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 17.37], [20.0, 43.39], [48.0, 48.78], [50.0, 50.94], [53.0, 53.22], [55.0, 55.88], [57.0, 57.25], [58.0, 58.75], [61.0, 61.84], [63.0, 63.54], [68.0, 68.44], [74.0, 88.4], [90.0, 93.82], [97.0, 107.87], [115.0, 124.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [55.96, 52.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.45, 51.02, 41.03, 30.87], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 40.7], ["speech", 16.89], ["throbbing", 16.5]], null, [["speech", 35.36], ["music", 30.94], ["buzz", 2.03]], [["speech", 38.39], ["music", 17.25], ["cacophony", 9.03]]], "duration": [13.37, 23.39, 0.78, 0.94, 0.22, 0.88, 0.25, 0.75, 0.84, 0.54, 0.44, 14.4, 3.82, 10.87, 9.95]} \ No newline at end of file diff --git a/annotations_filtered/d5nAgnojNgk_filtered.json b/annotations_filtered/d5nAgnojNgk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..29721cda86083b68e8c2869cd3db3c9aa3bbd1b6 --- /dev/null +++ b/annotations_filtered/d5nAgnojNgk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.51], [8.0, 10.25], [11.0, 14.49], [15.0, 19.99], [22.0, 28.0], [37.0, 44.51], [48.0, 70.51], [72.0, 101.97], [107.0, 108.87], [110.0, 137.15], [138.0, 139.04], [141.0, 146.21], [147.0, 147.12]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 99.71, 77.7, 99.82, 99.88, 34.43, 38.56, 43.61, 0.0, 47.9, 0.0, 52.68, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 63.98], ["singing bowl", 15.83], ["ambient music", 6.12]], [["music", 54.89], ["singing bowl", 10.56], ["musical instrument", 4.91]], [["fly, housefly", 46.69], ["insect", 23.94], ["music", 7.17]], null, [["fly, housefly", 21.33], ["speech", 13.45], ["music", 11.62]], null, null, null], "duration": [1.51, 2.25, 3.49, 4.99, 6.0, 7.51, 22.51, 29.97, 1.87, 27.15, 1.04, 5.21, 0.12]} \ No newline at end of file diff --git a/annotations_filtered/d6263F3UkWo_filtered.json b/annotations_filtered/d6263F3UkWo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b660f419e9e06bb36debcd14623aa221a5d0262 --- /dev/null +++ b/annotations_filtered/d6263F3UkWo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 29.73], [30.0, 29.89], [31.0, 33.79], [36.0, 36.04], [37.0, 39.09], [40.0, 43.56], [44.0, 43.6], [44.0, 49.23], [50.0, 88.11], [89.0, 91.93], [94.0, 104.46], [105.0, 109.22], [112.0, 122.59], [124.0, 131.11], [133.0, 135.21], [138.0, 146.23], [147.0, 169.5], [171.0, 178.56], [184.0, 185.53], [186.0, 186.39]], "keep_status": [false, false, false, false, false, false, false, true, false, true, true, true, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 29.31, 0.0, 30.17, 31.18, 0.0, 30.84, 0.0, 29.99, 31.1, 29.49, 31.59, 49.36, 82.61, 79.24, 50.81, 46.97, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["boing", 66.53], ["music", 20.82], ["didgeridoo", 1.16]], null, [["music", 58.91], ["livestock, farm animals, working animals", 7.1], ["cattle, bovinae", 4.92]], [["music", 61.79], ["speech", 9.67], ["throbbing", 5.51]], null, [["music", 36.66], ["livestock, farm animals, working animals", 16.91], ["cattle, bovinae", 13.36]], null, [["whip", 38.3], ["music", 6.15], ["whack, thwack", 5.92]], [["music", 36.43], ["speech", 27.97], ["synthesizer", 3.52]], [["music", 15.84], ["buzz", 10.95], ["speech", 10.69]], [["music", 69.09], ["speech", 3.45], ["musical instrument", 2.64]], [["speech", 46.91], ["music", 25.64], ["foghorn", 15.04]], null, null, null, [["insect", 23.03], ["music", 21.98], ["fly, housefly", 16.5]], null, null], "duration": [-0.27, -0.11, 2.79, 0.04, 2.09, 3.56, -0.4, 5.23, 38.11, 2.93, 10.46, 4.22, 10.59, 7.11, 2.21, 8.23, 22.5, 7.56, 1.53, 0.39]} \ No newline at end of file diff --git a/annotations_filtered/d68yRIE9OvQ_filtered.json b/annotations_filtered/d68yRIE9OvQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bbe0e2562144d84233419758193b06805fe9fbee --- /dev/null +++ b/annotations_filtered/d68yRIE9OvQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 54.72], [56.0, 57.59], [61.0, 61.47], [65.0, 80.54], [82.0, 81.87], [111.0, 111.28], [112.0, 112.11]], "keep_status": [false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.77, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 58.91], ["synthesizer", 5.83], ["cacophony", 3.8]], null, null, null], "duration": [51.72, 1.59, 0.47, 15.54, -0.13, 0.28, 0.11]} \ No newline at end of file diff --git a/annotations_filtered/d6HReoQl6Mo_filtered.json b/annotations_filtered/d6HReoQl6Mo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c8520c8f3901907c5058630f26d003c1d2fd3d96 --- /dev/null +++ b/annotations_filtered/d6HReoQl6Mo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 26.4], [31.0, 43.98], [48.0, 48.76], [53.0, 53.89], [56.0, 60.0], [63.0, 71.52], [72.0, 74.11], [75.0, 77.19], [78.0, 77.94], [79.0, 80.28], [86.0, 87.07], [90.0, 92.16], [94.0, 96.28], [98.0, 99.94], [102.0, 104.4], [106.0, 108.3], [115.0, 118.59], [119.0, 120.34], [122.0, 123.58], [130.0, 135.06], [136.0, 136.9], [138.0, 142.94], [144.0, 161.0], [165.0, 165.01], [166.0, 165.99], [166.0, 166.06], [166.0, 166.09], [166.0, 166.13], [166.0, 166.16], [166.0, 166.19], [166.0, 169.35], [170.0, 171.07], [176.0, 176.77], [178.0, 181.28], [185.0, 190.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [30.86, 32.25, 0.0, 0.0, 63.74, 42.15, 64.41, 73.82, 0.0, 0.0, 0.0, 82.97, 48.91, 0.0, 69.47, 48.52, 58.81, 0.0, 0.0, 57.17, 0.0, 74.29, 33.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.22, 0.0, 0.0, 38.56, 34.85], "audiomae_on_audioset": [[["theremin", 58.17], ["music", 27.23], ["clarinet", 3.04]], [["theremin", 70.01], ["music", 24.25], ["musical instrument", 1.26]], null, null, null, [["theremin", 35.94], ["music", 31.99], ["wind instrument, woodwind instrument", 4.0]], null, null, null, null, null, null, [["music", 42.39], ["theremin", 20.9], ["whale vocalization", 6.15]], null, null, [["music", 30.99], ["domestic animals, pets", 10.03], ["animal", 7.15]], null, null, null, null, null, null, [["music", 56.01], ["theremin", 27.28], ["musical instrument", 3.81]], null, null, null, null, null, null, null, [["music", 30.19], ["speech", 20.21], ["radio", 9.03]], null, null, [["hum", 21.55], ["music", 21.41], ["mains hum", 14.45]], [["music", 45.13], ["theremin", 30.91], ["effects unit", 3.33]]], "duration": [18.4, 12.98, 0.76, 0.89, 4.0, 8.52, 2.11, 2.19, -0.06, 1.28, 1.07, 2.16, 2.28, 1.94, 2.4, 2.3, 3.59, 1.34, 1.58, 5.06, 0.9, 4.94, 17.0, 0.01, -0.01, 0.06, 0.09, 0.13, 0.16, 0.19, 3.35, 1.07, 0.77, 3.28, 5.56]} \ No newline at end of file diff --git a/annotations_filtered/d6NOGc2Dymo_filtered.json b/annotations_filtered/d6NOGc2Dymo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..51dd04e65597df1b5b3434bf129e4a400ac86b7f --- /dev/null +++ b/annotations_filtered/d6NOGc2Dymo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 20.24], [22.0, 27.08], [27.0, 36.53]], "keep_status": [false, true, false], "silence_prob": [31.5, 30.51, 32.26], "audiomae_on_audioset": [[["music", 45.0], ["speech", 39.69], ["whack, thwack", 3.15]], [["music", 21.73], ["speech", 20.67], ["fly, housefly", 10.19]], [["music", 59.43], ["electronic music", 6.5], ["hum", 5.15]]], "duration": [18.24, 5.08, 9.53]} \ No newline at end of file diff --git a/annotations_filtered/d6zX6-Rf4JY_filtered.json b/annotations_filtered/d6zX6-Rf4JY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..16e2f396658df709bea8b2034693ad81a34fd00b --- /dev/null +++ b/annotations_filtered/d6zX6-Rf4JY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.76], [4.0, 8.8], [10.0, 25.47], [26.0, 26.97], [28.0, 47.16], [48.0, 59.32], [68.0, 73.57], [74.0, 75.44]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.99, 77.36, 0.0, 77.03, 70.02, 73.36, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.76, 4.8, 15.47, 0.97, 19.16, 11.32, 5.57, 1.44]} \ No newline at end of file diff --git a/annotations_filtered/d7-pWfZgFKU_filtered.json b/annotations_filtered/d7-pWfZgFKU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a68559ba78998c6293573ba2b450958f14fe8167 --- /dev/null +++ b/annotations_filtered/d7-pWfZgFKU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.05], [7.0, 8.88], [9.0, 13.04], [13.0, 23.33], [25.0, 38.57], [39.0, 41.91], [43.0, 47.01], [48.0, 49.05], [51.0, 90.37], [91.0, 94.66], [96.0, 96.06], [102.0, 103.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.99, 0.0, 99.16, 57.09, 64.63, 94.07, 99.1, 0.0, 0.0, 82.61, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.05, 1.88, 4.04, 10.33, 13.57, 2.91, 4.01, 1.05, 39.37, 3.66, 0.06, 1.65]} \ No newline at end of file diff --git a/annotations_filtered/d76CwsWbV2E_filtered.json b/annotations_filtered/d76CwsWbV2E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f8dfeb35068344f988916fe694af7138bc64fc6 --- /dev/null +++ b/annotations_filtered/d76CwsWbV2E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.12], [9.0, 9.1], [16.0, 16.44], [18.0, 18.54], [19.0, 20.7], [22.0, 22.89], [24.0, 25.66], [26.0, 27.03]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [1.12, 0.1, 0.44, 0.54, 1.7, 0.89, 1.66, 1.03]} \ No newline at end of file diff --git a/annotations_filtered/d79o09D8cuo_filtered.json b/annotations_filtered/d79o09D8cuo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0c1a780da3d09c9a00e562d5f28d6ad3fa913d2b --- /dev/null +++ b/annotations_filtered/d79o09D8cuo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.18], [5.0, 12.19], [18.0, 19.63], [20.0, 21.19], [22.0, 24.16], [25.0, 26.25], [27.0, 29.35], [35.0, 36.75], [40.0, 41.22], [49.0, 49.23], [70.0, 71.05], [86.0, 86.05], [90.0, 91.02], [97.0, 98.12], [100.0, 100.58], [101.0, 102.12], [104.0, 109.83], [111.0, 111.25], [113.0, 115.42], [117.0, 119.26], [120.0, 121.71], [123.0, 123.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 78.38, 0.0, 0.0, 49.68, 0.0, 99.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.87, 0.0, 66.39, 83.52, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["sidetone", 76.78], ["speech", 4.07], ["radio", 2.89]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 53.84], ["music", 18.39], ["bang", 4.75]], null, null, null, null, null], "duration": [0.18, 7.19, 1.63, 1.19, 2.16, 1.25, 2.35, 1.75, 1.22, 0.23, 1.05, 0.05, 1.02, 1.12, 0.58, 1.12, 5.83, 0.25, 2.42, 2.26, 1.71, 0.97]} \ No newline at end of file diff --git a/annotations_filtered/d7Aot4Wr-Yo_filtered.json b/annotations_filtered/d7Aot4Wr-Yo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de758445de65ce47c6d889b9e12cef090b00ca05 --- /dev/null +++ b/annotations_filtered/d7Aot4Wr-Yo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 34.69], [35.0, 120.01], [121.0, 132.43], [135.0, 135.62], [136.0, 158.75], [159.0, 162.4], [167.0, 169.67], [170.0, 169.84], [170.0, 171.27], [173.0, 173.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [81.71, 0.0, 99.88, 0.0, 78.04, 99.31, 50.21, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [25.69, 85.01, 11.43, 0.62, 22.75, 3.4, 2.67, -0.16, 1.27, 0.23]} \ No newline at end of file diff --git a/annotations_filtered/d7RrYVI3Xw0_filtered.json b/annotations_filtered/d7RrYVI3Xw0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2b975cce1f67c7d831a1835435af473cb98b962c --- /dev/null +++ b/annotations_filtered/d7RrYVI3Xw0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 26.64], [29.0, 29.46], [32.0, 32.85], [41.0, 41.86], [43.0, 43.04], [43.0, 44.02], [47.0, 48.47], [50.0, 51.9], [61.0, 65.67], [66.0, 69.26], [71.0, 72.03], [74.0, 76.38], [78.0, 78.46], [79.0, 80.67], [83.0, 84.45]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.78, 47.39, 0.0, 88.64, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 57.15], ["theremin", 10.52], ["musical instrument", 5.16]], [["music", 31.17], ["theremin", 10.78], ["speech", 10.08]], null, null, null, null, null], "duration": [0.64, 0.46, 0.85, 0.86, 0.04, 1.02, 1.47, 1.9, 4.67, 3.26, 1.03, 2.38, 0.46, 1.67, 1.45]} \ No newline at end of file diff --git a/annotations_filtered/d7V9liYn-IA_filtered.json b/annotations_filtered/d7V9liYn-IA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..805cf72fd5fb837e2b55096521e55b7d6ca64e38 --- /dev/null +++ b/annotations_filtered/d7V9liYn-IA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.9], [10.0, 14.1], [19.0, 19.8], [21.0, 38.01], [39.0, 66.07], [67.0, 121.32], [123.0, 122.98], [126.0, 126.96], [128.0, 128.31], [129.0, 130.01], [132.0, 132.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 82.79, 0.0, 45.78, 35.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 59.19], ["synthesizer", 14.41], ["musical instrument", 4.15]], [["music", 52.59], ["theremin", 19.13], ["synthesizer", 12.02]], null, null, null, null, null, null], "duration": [1.9, 4.1, 0.8, 17.01, 27.07, 54.32, -0.02, 0.96, 0.31, 1.01, 0.04]} \ No newline at end of file diff --git a/annotations_filtered/d7WraA-roN8_filtered.json b/annotations_filtered/d7WraA-roN8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dd3b2cdfafeaa65acc1af12c0986c32794d2e4bd --- /dev/null +++ b/annotations_filtered/d7WraA-roN8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.56], [7.0, 7.4], [8.0, 11.11], [12.0, 12.97], [14.0, 15.77], [16.0, 18.52], [23.0, 25.07], [34.0, 39.24], [41.0, 52.05], [54.0, 58.04], [61.0, 61.7], [65.0, 65.87], [67.0, 96.72], [98.0, 102.47], [105.0, 105.7], [107.0, 110.15], [111.0, 111.55], [112.0, 117.09]], "keep_status": [false, false, true, false, false, true, false, true, true, true, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 45.02, 0.0, 0.0, 45.95, 39.21, 41.62, 28.82, 28.38, 0.0, 0.0, 32.85, 36.44, 0.0, 32.09, 0.0, 34.53], "audiomae_on_audioset": [null, null, [["hum", 19.0], ["sidetone", 17.9], ["speech", 15.49]], null, null, [["speech", 32.69], ["music", 11.39], ["mains hum", 8.17]], [["didgeridoo", 36.6], ["music", 24.77], ["trombone", 9.79]], [["speech", 38.5], ["hum", 17.19], ["throbbing", 7.34]], [["speech", 43.3], ["music", 10.99], ["whack, thwack", 7.03]], [["livestock, farm animals, working animals", 22.19], ["breaking", 16.03], ["cowbell", 8.28]], null, null, [["fly, housefly", 17.86], ["hum", 13.51], ["mosquito", 8.34]], [["music", 73.21], ["guitar", 3.82], ["effects unit", 3.57]], null, [["music", 64.51], ["speech", 9.64], ["guitar", 4.0]], null, [["music", 66.85], ["guitar", 7.46], ["musical instrument", 5.54]]], "duration": [1.56, 0.4, 3.11, 0.97, 1.77, 2.52, 2.07, 5.24, 11.05, 4.04, 0.7, 0.87, 29.72, 4.47, 0.7, 3.15, 0.55, 5.09]} \ No newline at end of file diff --git a/annotations_filtered/d7_F5P5PygM_filtered.json b/annotations_filtered/d7_F5P5PygM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db6e2994f6b4258260b5ede126ab2ae1ff56d100 --- /dev/null +++ b/annotations_filtered/d7_F5P5PygM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 13.04], [14.0, 14.2], [17.0, 19.3], [20.0, 20.41], [22.0, 23.52], [24.0, 25.56], [26.0, 33.47], [35.0, 35.7], [36.0, 37.98], [40.0, 45.1], [46.0, 53.43], [55.0, 58.04]], "keep_status": [true, false, true, false, false, false, false, false, false, true, true, true], "silence_prob": [31.92, 0.0, 32.3, 0.0, 0.0, 0.0, 33.23, 0.0, 0.0, 30.43, 34.45, 49.59], "audiomae_on_audioset": [[["hum", 23.66], ["music", 22.98], ["mains hum", 18.91]], null, [["white noise", 17.77], ["mains hum", 9.26], ["explosion", 8.34]], null, null, null, [["music", 65.19], ["synthesizer", 8.44], ["hum", 6.49]], null, null, [["music", 29.13], ["synthesizer", 13.11], ["speech", 9.85]], [["music", 39.39], ["mains hum", 13.94], ["hum", 12.49]], [["music", 38.7], ["ambient music", 9.26], ["synthesizer", 8.45]]], "duration": [3.04, 0.2, 2.3, 0.41, 1.52, 1.56, 7.47, 0.7, 1.98, 5.1, 7.43, 3.04]} \ No newline at end of file diff --git a/annotations_filtered/d7c4TXqkMso_filtered.json b/annotations_filtered/d7c4TXqkMso_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..624320aa75ba774149009040db9ce4ad11967c3d --- /dev/null +++ b/annotations_filtered/d7c4TXqkMso_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.73], [14.0, 13.66], [24.0, 29.39], [32.0, 42.87], [44.0, 44.88], [48.0, 48.49], [50.0, 50.48], [51.0, 51.68], [53.0, 53.06], [54.0, 54.65], [57.0, 58.21], [59.0, 59.73], [64.0, 65.11], [68.0, 67.9], [69.0, 70.07], [71.0, 71.52], [74.0, 74.61], [76.0, 76.28], [85.0, 85.19], [88.0, 88.3], [91.0, 91.23], [94.0, 94.19], [96.0, 97.83], [99.0, 99.22], [100.0, 101.12], [102.0, 103.1], [105.0, 106.1], [108.0, 108.46], [115.0, 116.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 50.02, 63.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.73, -0.34, 5.39, 10.87, 0.88, 0.49, 0.48, 0.68, 0.06, 0.65, 1.21, 0.73, 1.11, -0.1, 1.07, 0.52, 0.61, 0.28, 0.19, 0.3, 0.23, 0.19, 1.83, 0.22, 1.12, 1.1, 1.1, 0.46, 1.07]} \ No newline at end of file diff --git a/annotations_filtered/d7he8f2L_BE_filtered.json b/annotations_filtered/d7he8f2L_BE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/d7he8f2L_BE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/d7pioagkX5k_filtered.json b/annotations_filtered/d7pioagkX5k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/d7pioagkX5k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/d7ye5zFyuso_filtered.json b/annotations_filtered/d7ye5zFyuso_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6fa2395a1e2dd4f2e67df8359fdfd8be946e0d8a --- /dev/null +++ b/annotations_filtered/d7ye5zFyuso_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.68], [3.0, 3.05], [9.0, 17.42], [18.0, 23.31], [38.0, 38.01], [40.0, 40.53], [42.0, 42.35], [43.0, 43.83], [51.0, 54.35], [56.0, 56.74], [68.0, 70.09], [77.0, 77.55], [80.0, 80.62], [83.0, 83.47], [84.0, 110.56]], "keep_status": [false, false, true, true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 35.74, 44.81, 0.0, 0.0, 0.0, 0.0, 50.26, 0.0, 56.78, 0.0, 0.0, 0.0, 30.35], "audiomae_on_audioset": [null, null, [["speech", 31.63], ["music", 28.65], ["hum", 4.37]], [["music", 53.77], ["speech", 8.77], ["didgeridoo", 3.36]], null, null, null, null, null, null, null, null, null, null, [["music", 52.42], ["theremin", 12.29], ["speech", 3.87]]], "duration": [0.68, 0.05, 8.42, 5.31, 0.01, 0.53, 0.35, 0.83, 3.35, 0.74, 2.09, 0.55, 0.62, 0.47, 26.56]} \ No newline at end of file diff --git a/annotations_filtered/d87eHGVaoc8_filtered.json b/annotations_filtered/d87eHGVaoc8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..855f8ce30f982a4d5fa3e2ecf85ecaee3c43b8e1 --- /dev/null +++ b/annotations_filtered/d87eHGVaoc8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 15.2], [24.0, 23.94], [24.0, 27.08], [50.0, 50.3], [57.0, 60.39], [62.0, 63.12], [64.0, 71.66], [77.0, 77.25]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [96.77, 0.0, 54.5, 0.0, 47.78, 0.0, 34.42, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 69.45], ["electronic music", 3.71], ["timpani", 3.4]], null, [["speech", 56.78], ["music", 24.35], ["outside, rural or natural", 2.28]], null], "duration": [2.2, -0.06, 3.08, 0.3, 3.39, 1.12, 7.66, 0.25]} \ No newline at end of file diff --git a/annotations_filtered/d8Ff_W4-4VE_filtered.json b/annotations_filtered/d8Ff_W4-4VE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c898ee13a1133d6867db302e407a68acddc29f79 --- /dev/null +++ b/annotations_filtered/d8Ff_W4-4VE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.97], [13.0, 14.18], [15.0, 15.96], [17.0, 17.93], [34.0, 34.48], [45.0, 45.0], [49.0, 50.01], [54.0, 54.16], [55.0, 54.92], [63.0, 65.26], [69.0, 69.09], [73.0, 74.16], [77.0, 77.97], [83.0, 83.76], [88.0, 88.18], [89.0, 90.12], [101.0, 100.62], [102.0, 102.24], [108.0, 110.96], [116.0, 116.63], [119.0, 119.77], [123.0, 124.36], [126.0, 127.09], [129.0, 129.86], [132.0, 132.83], [133.0, 133.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 67.95], ["musical instrument", 6.51], ["guitar", 3.8]], null, null, null, null, null, null, null, null, [["speech", 59.51], ["radio", 9.67], ["sidetone", 4.16]], null, null, null, null, null, null, null], "duration": [0.97, 1.18, 0.96, 0.93, 0.48, 0.0, 1.01, 0.16, -0.08, 2.26, 0.09, 1.16, 0.97, 0.76, 0.18, 1.12, -0.38, 0.24, 2.96, 0.63, 0.77, 1.36, 1.09, 0.86, 0.83, 0.73]} \ No newline at end of file diff --git a/annotations_filtered/d8Gg9rPHKNU_filtered.json b/annotations_filtered/d8Gg9rPHKNU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..79c6ac898d2f7791b9f43b486ece3dff57c2a09a --- /dev/null +++ b/annotations_filtered/d8Gg9rPHKNU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.17], [7.0, 8.36], [10.0, 47.73]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [0.17, 1.36, 37.73]} \ No newline at end of file diff --git a/annotations_filtered/d8WHOiQZGok_filtered.json b/annotations_filtered/d8WHOiQZGok_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c0170fe6d96d8b00c7c3faacad3e8b23c9e7abe0 --- /dev/null +++ b/annotations_filtered/d8WHOiQZGok_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.33], [8.0, 8.09], [8.0, 9.58], [10.0, 15.74], [17.0, 32.48], [34.0, 34.26], [35.0, 35.68], [37.0, 37.22], [45.0, 45.3], [51.0, 51.61], [53.0, 53.18], [56.0, 56.44], [58.0, 58.24], [59.0, 61.65], [66.0, 75.56], [76.0, 77.33], [78.0, 79.29], [79.0, 85.83], [95.0, 98.12], [99.0, 99.12], [102.0, 103.03], [104.0, 105.06], [108.0, 109.71], [111.0, 111.62], [117.0, 117.34], [118.0, 118.76], [119.0, 124.09], [125.0, 128.6], [129.0, 131.11], [132.0, 133.47], [135.0, 135.63], [137.0, 137.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.62, 31.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.55, 39.25, 0.0, 0.0, 32.96, 34.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.55, 43.69, 37.65, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 71.25], ["trance music", 1.71], ["electronic music", 1.7]], [["music", 71.78], ["psychedelic rock", 5.99], ["swing music", 1.2]], null, null, null, null, null, null, null, null, [["music", 36.53], ["didgeridoo", 27.78], ["musical instrument", 4.03]], [["music", 53.75], ["speech", 12.76], ["throbbing", 3.26]], null, null, [["music", 36.91], ["speech", 36.4], ["sidetone", 8.81]], [["music", 34.85], ["throbbing", 27.1], ["hum", 15.7]], null, null, null, null, null, null, null, [["music", 40.41], ["speech", 23.32], ["didgeridoo", 13.54]], [["fly, housefly", 15.92], ["music", 9.65], ["creak", 8.99]], [["cattle, bovinae", 39.92], ["moo", 29.68], ["livestock, farm animals, working animals", 26.59]], null, null, null], "duration": [0.33, 0.09, 1.58, 5.74, 15.48, 0.26, 0.68, 0.22, 0.3, 0.61, 0.18, 0.44, 0.24, 2.65, 9.56, 1.33, 1.29, 6.83, 3.12, 0.12, 1.03, 1.06, 1.71, 0.62, 0.34, 0.76, 5.09, 3.6, 2.11, 1.47, 0.63, 0.39]} \ No newline at end of file diff --git a/annotations_filtered/d8sDpSZeDBE_filtered.json b/annotations_filtered/d8sDpSZeDBE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..49514db0b18665a68dcafdf39be6f932c7c8048c --- /dev/null +++ b/annotations_filtered/d8sDpSZeDBE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.49], [19.0, 19.55], [21.0, 21.2], [23.0, 24.31], [28.0, 28.93], [30.0, 30.08], [31.0, 33.62], [39.0, 39.06], [41.0, 41.34], [45.0, 47.6], [49.0, 49.67], [50.0, 51.14], [52.0, 52.52], [53.0, 53.82], [55.0, 66.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.22, 0.0, 0.0, 92.31, 0.0, 0.0, 0.0, 0.0, 86.27], "audiomae_on_audioset": [null, null, null, null, null, null, [["fly, housefly", 54.11], ["bee, wasp, etc.", 21.52], ["insect", 13.31]], null, null, null, null, null, null, null, null], "duration": [0.49, 0.55, 0.2, 1.31, 0.93, 0.08, 2.62, 0.06, 0.34, 2.6, 0.67, 1.14, 0.52, 0.82, 11.11]} \ No newline at end of file diff --git a/annotations_filtered/d9-DFXwcmFI_filtered.json b/annotations_filtered/d9-DFXwcmFI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e1a6a9f8660a6df9d8b08a8d458f0841858d7674 --- /dev/null +++ b/annotations_filtered/d9-DFXwcmFI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.06], [9.0, 9.54], [15.0, 16.68], [18.0, 18.62], [19.0, 20.68], [23.0, 23.97], [25.0, 25.86], [28.0, 29.32], [36.0, 38.01], [39.0, 40.36], [41.0, 41.82], [46.0, 47.06], [52.0, 52.17], [59.0, 59.97], [61.0, 62.55], [63.0, 64.27], [67.0, 68.01], [71.0, 73.04], [74.0, 74.65], [75.0, 76.86], [79.0, 79.71], [81.0, 83.51], [86.0, 87.27], [90.0, 90.59], [92.0, 93.21], [94.0, 95.03], [99.0, 106.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.9, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.06, 0.54, 1.68, 0.62, 1.68, 0.97, 0.86, 1.32, 2.01, 1.36, 0.82, 1.06, 0.17, 0.97, 1.55, 1.27, 1.01, 2.04, 0.65, 1.86, 0.71, 2.51, 1.27, 0.59, 1.21, 1.03, 7.95]} \ No newline at end of file diff --git a/annotations_filtered/d921M-ACMM4_filtered.json b/annotations_filtered/d921M-ACMM4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..963d89f95a4cde432eb7831b3b0154b8237cafab --- /dev/null +++ b/annotations_filtered/d921M-ACMM4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.32], [5.0, 5.32], [7.0, 16.17], [20.0, 33.56], [36.0, 48.91], [53.0, 59.76], [60.0, 64.3], [69.0, 79.57], [80.0, 81.58], [83.0, 83.27], [85.0, 84.59], [85.0, 85.67], [97.0, 96.9], [114.0, 114.39], [116.0, 117.42], [119.0, 122.55], [125.0, 147.63], [148.0, 148.64]], "keep_status": [false, false, false, true, false, true, true, true, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 30.98, 46.02, 45.78, 38.41, 43.69, 37.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.97, 31.78, 0.0], "audiomae_on_audioset": [null, null, [["speech", 44.39], ["eruption", 19.09], ["explosion", 7.67]], [["speech", 15.47], ["animal", 14.93], ["livestock, farm animals, working animals", 10.13]], [["livestock, farm animals, working animals", 34.01], ["cattle, bovinae", 28.85], ["animal", 20.85]], [["speech", 53.48], ["hum", 5.2], ["buzz", 3.51]], [["animal", 30.94], ["domestic animals, pets", 17.19], ["dog", 11.0]], [["whale vocalization", 34.08], ["animal", 16.39], ["speech", 6.46]], null, null, null, null, null, null, null, null, [["frog", 46.28], ["insect", 11.0], ["fly, housefly", 8.44]], null], "duration": [0.32, 0.32, 9.17, 13.56, 12.91, 6.76, 4.3, 10.57, 1.58, 0.27, -0.41, 0.67, -0.1, 0.39, 1.42, 3.55, 22.63, 0.64]} \ No newline at end of file diff --git a/annotations_filtered/d9K2p6NtV40_filtered.json b/annotations_filtered/d9K2p6NtV40_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d301358a0d14028626f0623518d8638edf02ea7 --- /dev/null +++ b/annotations_filtered/d9K2p6NtV40_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.57], [12.0, 13.37], [14.0, 17.44], [18.0, 18.32], [21.0, 21.81], [23.0, 23.84], [26.0, 26.86], [29.0, 29.37], [30.0, 30.81], [33.0, 33.52], [39.0, 39.85], [42.0, 42.2], [44.0, 44.56], [46.0, 46.4], [47.0, 48.39], [49.0, 50.4], [52.0, 52.35], [56.0, 57.28], [60.0, 63.78], [64.0, 66.09], [71.0, 72.66], [74.0, 75.3], [77.0, 79.2], [80.0, 81.51], [83.0, 84.37], [86.0, 87.88], [89.0, 90.68], [91.0, 92.65], [93.0, 98.42], [101.0, 104.03], [105.0, 105.31], [106.0, 107.2], [108.0, 108.35], [109.0, 111.15], [113.0, 114.42], [120.0, 119.94], [122.0, 128.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 98.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.59, 90.43, 0.0, 0.0, 94.66, 0.0, 0.0, 0.0, 0.0, 0.0, 92.8, 92.31, 0.0, 0.0, 0.0, 87.37, 0.0, 0.0, 53.59], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.57, 1.37, 3.44, 0.32, 0.81, 0.84, 0.86, 0.37, 0.81, 0.52, 0.85, 0.2, 0.56, 0.4, 1.39, 1.4, 0.35, 1.28, 3.78, 2.09, 1.66, 1.3, 2.2, 1.51, 1.37, 1.88, 1.68, 1.65, 5.42, 3.03, 0.31, 1.2, 0.35, 2.15, 1.42, -0.06, 6.14]} \ No newline at end of file diff --git a/annotations_filtered/d9PlKlirxT4_filtered.json b/annotations_filtered/d9PlKlirxT4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d56d015731d9804ed5891b379b256fc3d8f6233d --- /dev/null +++ b/annotations_filtered/d9PlKlirxT4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.82], [8.0, 7.86], [8.0, 7.99], [8.0, 35.04], [37.0, 39.31], [40.0, 39.95], [41.0, 41.54], [43.0, 44.66], [46.0, 49.23], [53.0, 53.37], [55.0, 59.31], [61.0, 61.53], [62.0, 61.92], [62.0, 61.96], [62.0, 67.19], [69.0, 70.24], [71.0, 73.85], [75.0, 76.81], [78.0, 81.21], [84.0, 99.4], [102.0, 115.08], [117.0, 129.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 41.64, 100.0, 0.0, 0.0, 0.0, 36.84, 0.0, 45.98, 0.0, 0.0, 0.0, 41.44, 0.0, 66.15, 0.0, 99.76, 36.84, 35.3, 37.64], "audiomae_on_audioset": [null, null, null, [["theremin", 55.3], ["music", 35.62], ["musical instrument", 2.1]], null, null, null, null, [["music", 72.11], ["ambient music", 4.92], ["synthesizer", 3.52]], null, [["music", 40.87], ["speech", 15.42], ["theremin", 5.45]], null, null, null, [["music", 60.98], ["theremin", 16.8], ["whale vocalization", 3.49]], null, null, null, null, [["music", 93.94], ["scary music", 0.91], ["ambient music", 0.86]], [["music", 62.27], ["theremin", 27.54], ["scary music", 1.35]], [["music", 52.03], ["theremin", 36.64], ["musical instrument", 1.72]]], "duration": [1.82, -0.14, -0.01, 27.04, 2.31, -0.05, 0.54, 1.66, 3.23, 0.37, 4.31, 0.53, -0.08, -0.04, 5.19, 1.24, 2.85, 1.81, 3.21, 15.4, 13.08, 12.71]} \ No newline at end of file diff --git a/annotations_filtered/d9TdwetEIQ8_filtered.json b/annotations_filtered/d9TdwetEIQ8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6450de9936000eb4608c78acfab6449c07da5005 --- /dev/null +++ b/annotations_filtered/d9TdwetEIQ8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 18.84], [23.0, 37.62], [39.0, 39.95], [41.0, 70.98], [74.0, 77.95], [80.0, 134.18], [140.0, 145.32], [147.0, 163.31], [165.0, 166.02], [170.0, 172.91]], "keep_status": [false, false, false, true, false, false, true, true, false, true], "silence_prob": [47.2, 30.3, 0.0, 28.27, 28.28, 0.0, 28.48, 34.57, 0.0, 33.45], "audiomae_on_audioset": [[["sidetone", 47.49], ["music", 21.59], ["hum", 4.17]], [["mains hum", 56.67], ["hum", 29.11], ["music", 4.36]], null, [["music", 46.84], ["hum", 12.13], ["mains hum", 9.13]], [["music", 61.91], ["electronic music", 7.96], ["throbbing", 6.08]], null, [["rumble", 31.98], ["eruption", 11.74], ["hum", 8.1]], [["hum", 25.09], ["music", 21.86], ["rumble", 12.13]], null, [["music", 39.44], ["speech", 10.16], ["didgeridoo", 10.03]]], "duration": [2.84, 14.62, 0.95, 29.98, 3.95, 54.18, 5.32, 16.31, 1.02, 2.91]} \ No newline at end of file diff --git a/annotations_filtered/d9YfIZP8qPE_filtered.json b/annotations_filtered/d9YfIZP8qPE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02d901e1a87de066e832163f9be2e90596dac04c --- /dev/null +++ b/annotations_filtered/d9YfIZP8qPE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[45.0, 54.23], [55.0, 56.67], [57.0, 60.52], [63.0, 63.93], [67.0, 74.63], [76.0, 94.31], [97.0, 100.79], [106.0, 114.27], [115.0, 114.96], [117.0, 132.81], [135.0, 135.97], [138.0, 141.57]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [100.0, 0.0, 100.0, 0.0, 99.99, 75.72, 89.01, 71.29, 0.0, 38.84, 0.0, 98.51], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["hum", 24.94], ["throbbing", 20.23], ["speech", 17.4]], null, null], "duration": [9.23, 1.67, 3.52, 0.93, 7.63, 18.31, 3.79, 8.27, -0.04, 15.81, 0.97, 3.57]} \ No newline at end of file diff --git a/annotations_filtered/d9ykU9FkH-g_filtered.json b/annotations_filtered/d9ykU9FkH-g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b30a15f31f71299950f8c508fbaeb0d908c5c768 --- /dev/null +++ b/annotations_filtered/d9ykU9FkH-g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.52], [3.0, 22.35], [26.0, 70.93], [73.0, 88.06], [88.0, 88.32], [88.0, 92.7], [94.0, 93.99], [97.0, 98.93], [101.0, 115.62]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 39.98, 0.0, 33.08, 0.0, 32.69, 0.0, 0.0, 31.82], "audiomae_on_audioset": [null, [["music", 61.68], ["sheep", 6.9], ["chirp tone", 3.83]], null, [["music", 73.02], ["boing", 5.46], ["speech", 4.28]], null, [["music", 66.17], ["speech", 5.8], ["electronic music", 4.19]], null, null, [["music", 84.1], ["theremin", 4.16], ["boing", 1.05]]], "duration": [0.52, 19.35, 44.93, 15.06, 0.32, 4.7, -0.01, 1.93, 14.62]} \ No newline at end of file diff --git a/annotations_filtered/dAE7uOO_4v4_filtered.json b/annotations_filtered/dAE7uOO_4v4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..26c4f3165a4c8899136083520c1afe3ac146afd5 --- /dev/null +++ b/annotations_filtered/dAE7uOO_4v4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.34], [14.0, 14.37], [29.0, 29.86], [39.0, 45.33], [46.0, 46.25], [47.0, 47.49], [54.0, 55.05], [60.0, 60.64], [62.0, 63.21], [65.0, 66.01], [73.0, 80.03], [82.0, 107.99], [108.0, 109.04], [109.0, 110.69], [114.0, 114.62], [116.0, 123.18], [127.0, 137.81], [138.0, 143.82], [145.0, 145.45]], "keep_status": [false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [33.82, 0.0, 0.0, 36.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.79, 33.19, 0.0, 0.0, 0.0, 32.22, 32.39, 41.93, 0.0], "audiomae_on_audioset": [[["music", 53.37], ["didgeridoo", 20.73], ["speech", 12.07]], null, null, [["music", 36.84], ["doorbell", 23.29], ["clang", 7.36]], null, null, null, null, null, null, [["music", 25.58], ["theremin", 12.22], ["noise", 5.89]], [["music", 62.99], ["synthesizer", 8.12], ["didgeridoo", 5.87]], null, null, null, [["music", 60.55], ["theremin", 10.1], ["harmonica", 5.19]], [["music", 39.67], ["speech", 32.59], ["didgeridoo", 3.55]], [["music", 46.07], ["fart", 20.71], ["didgeridoo", 10.55]], null], "duration": [5.34, 0.37, 0.86, 6.33, 0.25, 0.49, 1.05, 0.64, 1.21, 1.01, 7.03, 25.99, 1.04, 1.69, 0.62, 7.18, 10.81, 5.82, 0.45]} \ No newline at end of file diff --git a/annotations_filtered/dAMqMErPIIY_filtered.json b/annotations_filtered/dAMqMErPIIY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..68211f57f6fc943f11087191365a60dec094c932 --- /dev/null +++ b/annotations_filtered/dAMqMErPIIY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.25], [20.0, 24.11], [26.0, 26.0], [26.0, 26.11], [26.0, 31.21], [49.0, 51.46], [56.0, 55.8], [56.0, 57.97]], "keep_status": [false, true, false, false, true, false, false, false], "silence_prob": [0.0, 31.84, 0.0, 0.0, 30.47, 99.96, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 22.4], ["music", 10.49], ["insect", 8.84]], null, null, [["music", 30.99], ["speech", 17.96], ["electric shaver, electric razor", 9.14]], null, null, null], "duration": [0.25, 4.11, 0.0, 0.11, 5.21, 2.46, -0.2, 1.97]} \ No newline at end of file diff --git a/annotations_filtered/dAOw8dXcMpw_filtered.json b/annotations_filtered/dAOw8dXcMpw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42b08dacd30f8176199e9ffb5647ed428f74a03b --- /dev/null +++ b/annotations_filtered/dAOw8dXcMpw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.15], [9.0, 9.21], [16.0, 16.23], [21.0, 23.26], [25.0, 25.98], [27.0, 27.9], [31.0, 30.87], [32.0, 34.01], [35.0, 36.29], [39.0, 39.87], [46.0, 45.86], [51.0, 51.26], [54.0, 55.09], [68.0, 68.22], [69.0, 69.79], [70.0, 70.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 87.92, 0.0, 0.0, 0.0, 99.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.15, 0.21, 0.23, 2.26, 0.98, 0.9, -0.13, 2.01, 1.29, 0.87, -0.14, 0.26, 1.09, 0.22, 0.79, 0.7]} \ No newline at end of file diff --git a/annotations_filtered/dAlYuokC9R0_filtered.json b/annotations_filtered/dAlYuokC9R0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1054ca21ea8509130aaec9aade21548584129b25 --- /dev/null +++ b/annotations_filtered/dAlYuokC9R0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.87], [10.0, 11.21], [17.0, 17.02], [18.0, 17.93], [18.0, 18.81], [24.0, 24.06], [33.0, 33.24], [35.0, 35.73], [47.0, 50.67], [51.0, 54.84], [56.0, 62.24], [64.0, 64.98], [67.0, 67.26], [70.0, 72.45], [77.0, 77.3], [79.0, 81.3], [86.0, 89.48], [91.0, 91.93], [93.0, 99.45], [101.0, 101.51], [103.0, 109.38], [114.0, 118.96], [120.0, 121.0], [125.0, 133.25], [134.0, 134.54], [137.0, 137.64]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.72, 63.53, 97.64, 0.0, 0.0, 85.35, 0.0, 93.91, 97.11, 0.0, 99.36, 0.0, 98.19, 76.7, 0.0, 97.73, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 56.14], ["guitar", 6.83], ["plucked string instrument", 5.28]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.87, 1.21, 0.02, -0.07, 0.81, 0.06, 0.24, 0.73, 3.67, 3.84, 6.24, 0.98, 0.26, 2.45, 0.3, 2.3, 3.48, 0.93, 6.45, 0.51, 6.38, 4.96, 1.0, 8.25, 0.54, 0.64]} \ No newline at end of file diff --git a/annotations_filtered/dAoRRTPPIys_filtered.json b/annotations_filtered/dAoRRTPPIys_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..737cd0f35c286f018dc518c0749d772c36adac24 --- /dev/null +++ b/annotations_filtered/dAoRRTPPIys_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.83], [7.0, 7.21], [15.0, 15.58], [16.0, 17.47], [35.0, 37.18], [40.0, 40.96], [42.0, 46.95], [48.0, 50.48], [60.0, 61.18], [64.0, 65.38], [67.0, 67.46], [69.0, 69.35], [71.0, 81.46], [97.0, 107.33], [112.0, 112.55], [126.0, 127.16], [131.0, 131.62], [136.0, 140.59], [143.0, 149.15], [150.0, 151.65], [154.0, 154.38], [156.0, 160.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.56, 0.0, 99.56, 91.81, 0.0, 0.0, 0.0, 0.0, 42.93, 45.62, 0.0, 0.0, 0.0, 99.98, 78.72, 0.0, 0.0, 99.59], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 17.57], ["fly, housefly", 16.19], ["mosquito", 11.89]], [["noise", 58.93], ["hum", 7.08], ["radio", 4.47]], null, null, null, null, null, null, null, null], "duration": [0.83, 0.21, 0.58, 1.47, 2.18, 0.96, 4.95, 2.48, 1.18, 1.38, 0.46, 0.35, 10.46, 10.33, 0.55, 1.16, 0.62, 4.59, 6.15, 1.65, 0.38, 4.79]} \ No newline at end of file diff --git a/annotations_filtered/dApRtXZRw1Y_filtered.json b/annotations_filtered/dApRtXZRw1Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8a24d3dd101f03c9bef1a90ce30b7f26b23d9b32 --- /dev/null +++ b/annotations_filtered/dApRtXZRw1Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.11], [16.0, 21.41], [23.0, 23.33], [26.0, 28.63], [37.0, 37.59], [38.0, 39.56], [41.0, 41.93], [43.0, 44.07], [45.0, 46.52], [51.0, 52.1], [53.0, 53.37], [54.0, 54.84], [58.0, 57.84], [62.0, 62.82], [87.0, 87.42], [95.0, 96.38], [98.0, 98.58], [101.0, 101.41], [105.0, 105.6], [107.0, 106.91], [116.0, 116.73], [119.0, 119.11], [126.0, 126.01], [127.0, 128.11], [130.0, 135.11]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [36.78, 39.34, 0.0, 71.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.5], "audiomae_on_audioset": [[["electric shaver, electric razor", 37.71], ["music", 21.26], ["speech", 9.03]], [["mains hum", 36.1], ["hum", 20.31], ["music", 11.58]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 29.33], ["theremin", 17.09], ["civil defense siren", 4.86]]], "duration": [2.11, 5.41, 0.33, 2.63, 0.59, 1.56, 0.93, 1.07, 1.52, 1.1, 0.37, 0.84, -0.16, 0.82, 0.42, 1.38, 0.58, 0.41, 0.6, -0.09, 0.73, 0.11, 0.01, 1.11, 5.11]} \ No newline at end of file diff --git a/annotations_filtered/dAxijzivjlc_filtered.json b/annotations_filtered/dAxijzivjlc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92b28142b335de08c182c49f45ca7a54d19aa49f --- /dev/null +++ b/annotations_filtered/dAxijzivjlc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.72], [10.0, 13.64], [20.0, 21.93], [24.0, 23.95], [25.0, 26.92], [31.0, 32.61], [39.0, 39.88], [44.0, 51.61], [52.0, 66.18], [67.0, 68.66], [70.0, 70.68], [89.0, 89.28], [94.0, 95.08], [99.0, 99.76], [105.0, 117.59], [120.0, 134.92], [137.0, 140.91]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 86.64, 0.0, 0.0, 0.0, 0.0, 0.0, 32.54, 31.75, 0.0, 0.0, 0.0, 0.0, 0.0, 79.07, 81.35, 48.19], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 28.94], ["animal", 10.31], ["bow-wow", 8.23]], [["didgeridoo", 20.49], ["music", 11.33], ["speech", 6.79]], null, null, null, null, null, null, null, [["hum", 23.13], ["mains hum", 18.03], ["whale vocalization", 14.9]]], "duration": [0.72, 3.64, 1.93, -0.05, 1.92, 1.61, 0.88, 7.61, 14.18, 1.66, 0.68, 0.28, 1.08, 0.76, 12.59, 14.92, 3.91]} \ No newline at end of file diff --git a/annotations_filtered/dAzXib-thq8_filtered.json b/annotations_filtered/dAzXib-thq8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b6126c7ff2e17fe3187bb9079711984c31d69bc0 --- /dev/null +++ b/annotations_filtered/dAzXib-thq8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 10.27], [12.0, 12.21], [13.0, 14.4], [16.0, 17.14], [25.0, 26.6], [31.0, 31.97], [33.0, 33.71], [45.0, 64.17], [66.0, 65.8], [66.0, 66.07], [66.0, 72.71], [75.0, 88.97], [90.0, 99.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [68.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.04, 0.0, 0.0, 85.35, 70.3, 66.51], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.27, 0.21, 1.4, 1.14, 1.6, 0.97, 0.71, 19.17, -0.2, 0.07, 6.71, 13.97, 9.44]} \ No newline at end of file diff --git a/annotations_filtered/dB2iZKhWArQ_filtered.json b/annotations_filtered/dB2iZKhWArQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa085730fdfc34b77b3fdfe91ab48847a23520b2 --- /dev/null +++ b/annotations_filtered/dB2iZKhWArQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.56], [11.0, 12.7], [14.0, 16.26], [17.0, 18.93], [19.0, 20.46], [22.0, 22.0], [23.0, 30.5], [33.0, 34.52], [35.0, 37.98], [39.0, 40.39], [42.0, 46.43], [47.0, 47.55], [49.0, 49.92], [51.0, 54.21], [56.0, 59.49], [61.0, 63.26], [65.0, 65.67], [66.0, 69.55], [70.0, 72.55], [74.0, 76.38]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [45.78, 0.0, 43.33, 0.0, 0.0, 0.0, 55.46, 0.0, 36.02, 0.0, 52.16, 0.0, 0.0, 56.63, 85.35, 58.22, 0.0, 38.46, 81.0, 34.64], "audiomae_on_audioset": [[["sidetone", 29.98], ["chirp tone", 14.43], ["speech", 11.87]], null, [["sidetone", 81.67], ["speech", 5.29], ["hum", 2.61]], null, null, null, null, null, [["mains hum", 35.27], ["hum", 26.06], ["speech", 15.28]], null, null, null, null, null, null, null, null, [["sidetone", 54.29], ["mains hum", 12.76], ["speech", 10.23]], null, [["sidetone", 27.68], ["mains hum", 21.35], ["speech", 20.39]]], "duration": [2.56, 1.7, 2.26, 1.93, 1.46, 0.0, 7.5, 1.52, 2.98, 1.39, 4.43, 0.55, 0.92, 3.21, 3.49, 2.26, 0.67, 3.55, 2.55, 2.38]} \ No newline at end of file diff --git a/annotations_filtered/dBal-Rb366c_filtered.json b/annotations_filtered/dBal-Rb366c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f3da44469b4f0871f2755d2db2b88c55e48542d8 --- /dev/null +++ b/annotations_filtered/dBal-Rb366c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.96], [10.0, 10.76], [12.0, 12.87], [18.0, 18.82], [20.0, 21.2], [29.0, 29.86], [32.0, 33.22], [35.0, 35.65], [36.0, 36.96], [38.0, 38.64], [42.0, 43.12], [48.0, 48.59], [52.0, 52.25], [53.0, 53.65], [55.0, 56.46], [57.0, 57.0], [59.0, 59.71], [64.0, 64.39], [71.0, 73.7], [76.0, 76.38], [78.0, 79.08], [81.0, 81.63], [82.0, 82.44], [82.0, 84.1], [85.0, 86.66], [87.0, 90.19], [91.0, 93.5], [94.0, 95.81], [97.0, 99.55], [103.0, 104.31], [105.0, 105.95], [108.0, 109.8], [110.0, 112.28], [114.0, 115.53], [118.0, 119.1], [121.0, 121.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.37, 0.0, 0.0, 0.0, 0.0, 91.81, 0.0, 99.73, 97.54, 0.0, 92.64, 0.0, 0.0, 0.0, 99.71, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.96, 0.76, 0.87, 0.82, 1.2, 0.86, 1.22, 0.65, 0.96, 0.64, 1.12, 0.59, 0.25, 0.65, 1.46, 0.0, 0.71, 0.39, 2.7, 0.38, 1.08, 0.63, 0.44, 2.1, 1.66, 3.19, 2.5, 1.81, 2.55, 1.31, 0.95, 1.8, 2.28, 1.53, 1.1, 0.74]} \ No newline at end of file diff --git a/annotations_filtered/dC1bJ1qmOCo_filtered.json b/annotations_filtered/dC1bJ1qmOCo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..298c8afef54355674a201f9afe3cafa020539a71 --- /dev/null +++ b/annotations_filtered/dC1bJ1qmOCo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.22], [10.0, 11.21], [12.0, 14.15], [17.0, 17.19], [18.0, 18.22], [20.0, 20.6], [22.0, 22.65], [26.0, 26.5], [27.0, 28.34], [31.0, 37.39], [38.0, 37.72], [39.0, 42.38], [50.0, 51.44], [63.0, 63.07], [67.0, 68.17], [70.0, 70.8], [85.0, 85.24], [88.0, 89.9], [91.0, 93.16], [108.0, 109.04], [116.0, 117.95], [119.0, 121.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.92, 0.0, 99.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.27, 0.0, 0.0, 99.4], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.22, 1.21, 2.15, 0.19, 0.22, 0.6, 0.65, 0.5, 1.34, 6.39, -0.28, 3.38, 1.44, 0.07, 1.17, 0.8, 0.24, 1.9, 2.16, 1.04, 1.95, 2.96]} \ No newline at end of file diff --git a/annotations_filtered/dC1yHLp9bWA_filtered.json b/annotations_filtered/dC1yHLp9bWA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c33dd9fc12da668d08437e3d1547bc594e3e6db7 --- /dev/null +++ b/annotations_filtered/dC1yHLp9bWA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 6.86], [8.0, 8.85], [10.0, 13.49], [17.0, 18.23], [20.0, 20.92], [24.0, 24.83], [30.0, 29.84], [31.0, 31.89], [34.0, 35.34], [37.0, 36.53], [38.0, 39.43], [46.0, 48.84], [51.0, 51.66], [54.0, 55.49], [56.0, 61.42], [66.0, 68.72], [73.0, 76.59], [81.0, 84.81], [88.0, 89.83], [97.0, 98.58], [107.0, 107.94], [115.0, 116.18], [118.0, 119.28], [122.0, 123.38], [124.0, 125.51], [126.0, 127.2], [128.0, 128.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.36, 0.0, 0.0, 30.18, 32.04, 31.37, 31.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 44.85], ["cattle, bovinae", 20.2], ["moo", 16.13]], [["music", 19.49], ["throbbing", 19.28], ["hum", 15.4]], [["music", 37.99], ["fly, housefly", 14.16], ["insect", 8.28]], [["music", 45.44], ["hum", 7.95], ["throbbing", 7.49]], null, null, null, null, null, null, null, null, null], "duration": [-0.14, 0.85, 3.49, 1.23, 0.92, 0.83, -0.16, 0.89, 1.34, -0.47, 1.43, 2.84, 0.66, 1.49, 5.42, 2.72, 3.59, 3.81, 1.83, 1.58, 0.94, 1.18, 1.28, 1.38, 1.51, 1.2, 0.6]} \ No newline at end of file diff --git a/annotations_filtered/dCRen85hQ7Q_filtered.json b/annotations_filtered/dCRen85hQ7Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f9d703f1dbbdc5f2582701cf55776a5d7a51d38 --- /dev/null +++ b/annotations_filtered/dCRen85hQ7Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.73], [5.0, 5.66], [8.0, 9.54], [10.0, 11.72], [13.0, 14.13], [15.0, 15.52], [16.0, 17.88], [23.0, 25.05], [26.0, 28.22], [31.0, 34.6], [35.0, 38.23], [42.0, 43.21], [45.0, 46.31], [48.0, 57.43], [60.0, 63.12], [80.0, 80.94], [83.0, 89.88], [91.0, 97.77], [100.0, 107.94], [115.0, 118.25], [120.0, 120.66], [122.0, 125.44], [127.0, 127.48], [129.0, 130.4], [132.0, 132.34], [134.0, 136.21], [137.0, 138.57], [140.0, 148.54], [149.0, 148.58], [150.0, 150.04], [150.0, 150.16], [153.0, 153.71], [155.0, 167.48], [168.0, 169.42]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.9, 54.43, 37.37, 35.1, 0.0, 0.0, 31.2, 35.08, 0.0, 31.58, 32.33, 32.06, 31.63, 0.0, 34.85, 0.0, 0.0, 0.0, 34.98, 0.0, 32.07, 0.0, 0.0, 0.0, 0.0, 30.07, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["fart", 31.68], ["field recording", 11.0], ["moo", 10.43]], null, [["hum", 41.51], ["music", 27.28], ["mains hum", 15.07]], [["hum", 34.63], ["mains hum", 32.13], ["music", 8.26]], null, null, [["music", 40.25], ["reverberation", 14.8], ["echo", 7.27]], [["didgeridoo", 54.49], ["music", 23.34], ["musical instrument", 6.73]], null, [["music", 75.47], ["synthesizer", 2.79], ["musical instrument", 2.7]], [["music", 51.03], ["reverberation", 8.8], ["echo", 8.0]], [["music", 67.38], ["theremin", 6.49], ["reverberation", 4.9]], [["music", 26.25], ["speech", 7.79], ["musical instrument", 2.25]], null, [["hum", 48.08], ["mains hum", 17.57], ["music", 13.71]], null, null, null, [["music", 59.77], ["musical instrument", 10.25], ["guitar", 2.99]], null, [["music", 64.06], ["didgeridoo", 17.59], ["musical instrument", 7.22]], null, null, null, null, [["music", 48.06], ["didgeridoo", 33.62], ["musical instrument", 5.37]], null], "duration": [1.73, 0.66, 1.54, 1.72, 1.13, 0.52, 1.88, 2.05, 2.22, 3.6, 3.23, 1.21, 1.31, 9.43, 3.12, 0.94, 6.88, 6.77, 7.94, 3.25, 0.66, 3.44, 0.48, 1.4, 0.34, 2.21, 1.57, 8.54, -0.42, 0.04, 0.16, 0.71, 12.48, 1.42]} \ No newline at end of file diff --git a/annotations_filtered/dCTd1XHbliU_filtered.json b/annotations_filtered/dCTd1XHbliU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c2eb200edde41c05d4dd8a1732f91c7fec7a700a --- /dev/null +++ b/annotations_filtered/dCTd1XHbliU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.48], [9.0, 9.34], [12.0, 12.29], [15.0, 18.13], [21.0, 21.27], [24.0, 25.05], [28.0, 28.44], [35.0, 37.44], [40.0, 41.4], [43.0, 43.09], [44.0, 48.37], [54.0, 54.7], [69.0, 68.99], [73.0, 73.65], [78.0, 84.91]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 46.4, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 51.82, 0.0, 0.0, 0.0, 38.94], "audiomae_on_audioset": [null, null, null, [["boing", 16.59], ["speech", 15.93], ["music", 13.93]], null, null, null, null, null, null, null, null, null, null, [["speech", 35.24], ["music", 21.47], ["rumble", 8.02]]], "duration": [1.48, 0.34, 0.29, 3.13, 0.27, 1.05, 0.44, 2.44, 1.4, 0.09, 4.37, 0.7, -0.01, 0.65, 6.91]} \ No newline at end of file diff --git a/annotations_filtered/dCxgKZ5QV5E_filtered.json b/annotations_filtered/dCxgKZ5QV5E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bc0ab5d8b4e0eb37c6f30f7091f7dffdf43cab23 --- /dev/null +++ b/annotations_filtered/dCxgKZ5QV5E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.74], [4.0, 5.09], [6.0, 7.18], [12.0, 12.66], [17.0, 18.72], [20.0, 21.59], [22.0, 25.69], [27.0, 27.14], [32.0, 34.1], [37.0, 38.26], [39.0, 42.03], [43.0, 44.12], [45.0, 46.43], [48.0, 48.81], [50.0, 51.87], [57.0, 58.58], [59.0, 60.79], [64.0, 66.36], [67.0, 69.53], [71.0, 71.49], [76.0, 76.67], [80.0, 80.25], [85.0, 86.14], [90.0, 89.83], [91.0, 92.06], [97.0, 97.75], [107.0, 107.49], [108.0, 109.11], [110.0, 112.08], [113.0, 113.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.88, 0.0, 82.61, 0.0, 80.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.66, 54.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.78, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 37.66], ["speech", 7.47], ["didgeridoo", 4.72]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.74, 1.09, 1.18, 0.66, 1.72, 1.59, 3.69, 0.14, 2.1, 1.26, 3.03, 1.12, 1.43, 0.81, 1.87, 1.58, 1.79, 2.36, 2.53, 0.49, 0.67, 0.25, 1.14, -0.17, 1.06, 0.75, 0.49, 1.11, 2.08, 0.51]} \ No newline at end of file diff --git a/annotations_filtered/dCyrhdW9e8M_filtered.json b/annotations_filtered/dCyrhdW9e8M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b3a54397dcad0f3c289395ba595e8949e200d47 --- /dev/null +++ b/annotations_filtered/dCyrhdW9e8M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 25.69], [26.0, 25.73], [26.0, 25.76], [28.0, 27.87], [29.0, 79.88], [82.0, 84.37], [86.0, 93.85], [98.0, 107.94], [109.0, 113.91], [117.0, 121.53], [123.0, 153.32]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 28.5, 34.04, 35.81, 36.69, 37.22, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 13.41], ["whoosh, swoosh, swish", 9.81], ["music", 7.99]], [["hum", 45.36], ["music", 20.45], ["throbbing", 14.68]], [["music", 55.28], ["hum", 12.3], ["ambient music", 10.44]], [["music", 57.73], ["ambient music", 10.56], ["whale vocalization", 5.48]], [["music", 45.91], ["hum", 10.71], ["electronic music", 8.63]], null], "duration": [-0.31, -0.27, -0.24, -0.13, 50.88, 2.37, 7.85, 9.94, 4.91, 4.53, 30.32]} \ No newline at end of file diff --git a/annotations_filtered/dDDbmin38gg_filtered.json b/annotations_filtered/dDDbmin38gg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c53704e623dd696a44fa79fe29ebc9a4791d96d5 --- /dev/null +++ b/annotations_filtered/dDDbmin38gg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 19.63], [42.0, 42.58], [51.0, 53.15], [60.0, 70.93], [71.0, 74.88], [78.0, 106.76], [108.0, 108.26], [109.0, 111.48]], "keep_status": [false, false, true, true, true, true, false, false], "silence_prob": [49.97, 0.0, 40.34, 42.65, 48.27, 30.34, 0.0, 99.76], "audiomae_on_audioset": [[["speech", 58.5], ["telephone", 15.09], ["telephone bell ringing", 9.1]], null, [["speech", 38.27], ["music", 21.69], ["vehicle", 1.56]], [["music", 37.04], ["speech", 20.5], ["musical instrument", 5.71]], [["speech", 24.18], ["music", 17.27], ["mains hum", 14.92]], [["explosion", 28.78], ["eruption", 9.24], ["hum", 6.87]], null, null], "duration": [14.63, 0.58, 2.15, 10.93, 3.88, 28.76, 0.26, 2.48]} \ No newline at end of file diff --git a/annotations_filtered/dDGMTl1Ya78_filtered.json b/annotations_filtered/dDGMTl1Ya78_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fdf95e0d5ebcc7fe65300a0cae2ede2ea687b987 --- /dev/null +++ b/annotations_filtered/dDGMTl1Ya78_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.42], [5.0, 6.25], [10.0, 11.26], [13.0, 18.82], [20.0, 20.55], [24.0, 42.9], [57.0, 58.92], [60.0, 63.58], [66.0, 69.04], [69.0, 70.66], [76.0, 83.66], [85.0, 91.42], [99.0, 105.49], [110.0, 126.4], [128.0, 131.7], [132.0, 137.93]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, true, true, true, true, true], "silence_prob": [0.0, 0.0, 0.0, 29.26, 0.0, 29.5, 0.0, 30.33, 30.4, 0.0, 30.45, 30.99, 28.67, 29.73, 28.01, 28.24], "audiomae_on_audioset": [null, null, null, [["mains hum", 55.06], ["hum", 14.83], ["noise", 9.45]], null, [["music", 70.65], ["theremin", 11.04], ["speech", 3.02]], null, [["hum", 39.33], ["mains hum", 29.88], ["buzz", 4.18]], [["hum", 21.86], ["mains hum", 10.09], ["rumble", 9.1]], null, [["hum", 17.4], ["music", 16.74], ["rumble", 13.21]], [["vehicle", 21.39], ["aircraft", 18.27], ["fixed-wing aircraft, airplane", 13.27]], [["mains hum", 32.46], ["hum", 14.22], ["music", 11.02]], [["hum", 25.94], ["mains hum", 23.57], ["music", 9.93]], [["music", 23.51], ["cattle, bovinae", 21.3], ["livestock, farm animals, working animals", 9.68]], [["vehicle", 31.55], ["car", 12.04], ["race car, auto racing", 8.26]]], "duration": [0.42, 1.25, 1.26, 5.82, 0.55, 18.9, 1.92, 3.58, 3.04, 1.66, 7.66, 6.42, 6.49, 16.4, 3.7, 5.93]} \ No newline at end of file diff --git a/annotations_filtered/dDH3nlKHRQ8_filtered.json b/annotations_filtered/dDH3nlKHRQ8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..29f183901b4994defb8bd14d685b9a97fd82ce90 --- /dev/null +++ b/annotations_filtered/dDH3nlKHRQ8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.09], [17.0, 17.79], [18.0, 18.76], [20.0, 19.74], [23.0, 23.62], [26.0, 26.6], [29.0, 31.23], [35.0, 35.21], [49.0, 49.32], [57.0, 57.27], [61.0, 60.79], [79.0, 81.55], [82.0, 83.19], [95.0, 95.15], [97.0, 97.24], [100.0, 101.29], [103.0, 103.1], [110.0, 111.01], [113.0, 112.82], [139.0, 139.65], [146.0, 146.47], [151.0, 151.31], [155.0, 155.19], [156.0, 158.13], [158.0, 158.26], [159.0, 161.72], [162.0, 163.51], [168.0, 168.96], [171.0, 175.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.47, 0.0, 0.0, 0.0, 0.0, 98.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.17, 0.0, 99.9, 0.0, 0.0, 59.68], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.09, 0.79, 0.76, -0.26, 0.62, 0.6, 2.23, 0.21, 0.32, 0.27, -0.21, 2.55, 1.19, 0.15, 0.24, 1.29, 0.1, 1.01, -0.18, 0.65, 0.47, 0.31, 0.19, 2.13, 0.26, 2.72, 1.51, 0.96, 4.68]} \ No newline at end of file diff --git a/annotations_filtered/dDQ0rUdj0KM_filtered.json b/annotations_filtered/dDQ0rUdj0KM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c6cd282e87bd9ceea3e1bfcd9a8745a6bee0b71 --- /dev/null +++ b/annotations_filtered/dDQ0rUdj0KM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 22.52], [25.0, 36.17], [39.0, 56.64], [58.0, 58.23], [59.0, 95.69], [97.0, 104.16], [107.0, 111.27], [115.0, 115.77], [116.0, 117.02], [120.0, 122.59], [132.0, 131.75], [132.0, 131.82]], "keep_status": [true, true, true, false, false, true, true, false, false, true, false, false], "silence_prob": [30.64, 30.49, 31.7, 0.0, 0.0, 36.56, 29.32, 0.0, 0.0, 32.28, 0.0, 0.0], "audiomae_on_audioset": [[["car", 23.75], ["vehicle", 12.96], ["race car, auto racing", 9.34]], [["music", 19.86], ["cacophony", 7.52], ["vehicle", 6.01]], [["speech", 28.25], ["vehicle", 17.07], ["aircraft", 10.55]], null, null, [["speech", 31.19], ["sidetone", 17.31], ["buzz", 6.93]], [["vehicle", 23.7], ["fixed-wing aircraft, airplane", 17.0], ["aircraft", 14.68]], null, null, [["speech", 34.25], ["outside, rural or natural", 8.82], ["outside, urban or manmade", 8.06]], null, null], "duration": [3.52, 11.17, 17.64, 0.23, 36.69, 7.16, 4.27, 0.77, 1.02, 2.59, -0.25, -0.18]} \ No newline at end of file diff --git a/annotations_filtered/dDtFWw1mZuw_filtered.json b/annotations_filtered/dDtFWw1mZuw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c49ebca82ff02769f8c02c48bc5ef3a67809f5b6 --- /dev/null +++ b/annotations_filtered/dDtFWw1mZuw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.13], [5.0, 6.08], [11.0, 10.93], [12.0, 12.61], [14.0, 13.96], [16.0, 18.13], [19.0, 24.53], [25.0, 29.27], [31.0, 43.7], [44.0, 48.96], [50.0, 55.17], [56.0, 56.34], [58.0, 60.05], [61.0, 62.63], [64.0, 66.38], [68.0, 69.97], [71.0, 73.87], [79.0, 80.5], [81.0, 82.17], [83.0, 83.73], [84.0, 87.54], [90.0, 91.67], [99.0, 98.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.87, 0.0, 0.0, 0.0, 0.0, 98.19, 100.0, 62.17, 100.0, 88.64, 86.27, 0.0, 62.99, 0.0, 79.07, 0.0, 80.46, 0.0, 0.0, 0.0, 68.54, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.13, 1.08, -0.07, 0.61, -0.04, 2.13, 5.53, 4.27, 12.7, 4.96, 5.17, 0.34, 2.05, 1.63, 2.38, 1.97, 2.87, 1.5, 1.17, 0.73, 3.54, 1.67, -0.07]} \ No newline at end of file diff --git a/annotations_filtered/dEnoofPhBtE_filtered.json b/annotations_filtered/dEnoofPhBtE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..24a945d696a24609c8bc0e71b937cdaddb47a8ba --- /dev/null +++ b/annotations_filtered/dEnoofPhBtE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.25], [7.0, 10.02], [11.0, 15.4], [16.0, 16.77], [19.0, 22.11], [24.0, 26.64], [27.0, 67.12], [68.0, 73.5], [75.0, 97.12], [99.0, 141.74], [143.0, 145.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 100.0, 0.0, 100.0, 99.4, 0.0, 100.0, 99.99, 0.0, 99.94], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [1.25, 3.02, 4.4, 0.77, 3.11, 2.64, 40.12, 5.5, 22.12, 42.74, 2.61]} \ No newline at end of file diff --git a/annotations_filtered/dEqrnOk8P1Q_filtered.json b/annotations_filtered/dEqrnOk8P1Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a09fa340b2b640012add868178bebca5acb6292b --- /dev/null +++ b/annotations_filtered/dEqrnOk8P1Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.16], [19.0, 20.73], [26.0, 30.42], [32.0, 33.45], [37.0, 38.72], [40.0, 40.26], [42.0, 43.24], [47.0, 47.95], [50.0, 50.38], [57.0, 57.77], [59.0, 59.39], [60.0, 60.66], [62.0, 65.1], [66.0, 66.18], [68.0, 69.43], [70.0, 71.39], [78.0, 78.43], [79.0, 79.93], [82.0, 87.2], [89.0, 89.33], [92.0, 95.81], [96.0, 98.0], [99.0, 99.55], [101.0, 101.66], [108.0, 108.65], [110.0, 110.29], [114.0, 114.27], [115.0, 115.6], [120.0, 120.66], [122.0, 122.57], [124.0, 124.77], [126.0, 128.46], [129.0, 130.44], [132.0, 133.19], [134.0, 134.35], [140.0, 141.25], [146.0, 146.62], [149.0, 149.45], [152.0, 152.96], [158.0, 163.83], [166.0, 167.1], [170.0, 170.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.71, 0.0, 72.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.86, 0.0, 0.0, 0.0, 0.0, 0.0, 99.68, 0.0, 100.0, 98.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.16, 1.73, 4.42, 1.45, 1.72, 0.26, 1.24, 0.95, 0.38, 0.77, 0.39, 0.66, 3.1, 0.18, 1.43, 1.39, 0.43, 0.93, 5.2, 0.33, 3.81, 2.0, 0.55, 0.66, 0.65, 0.29, 0.27, 0.6, 0.66, 0.57, 0.77, 2.46, 1.44, 1.19, 0.35, 1.25, 0.62, 0.45, 0.96, 5.83, 1.1, 0.65]} \ No newline at end of file diff --git a/annotations_filtered/dFAd35ck7hY_filtered.json b/annotations_filtered/dFAd35ck7hY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b26c40e0b8d93c25180efdaae4bb705be6ccab83 --- /dev/null +++ b/annotations_filtered/dFAd35ck7hY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.66], [12.0, 12.51], [13.0, 14.07], [20.0, 21.14], [24.0, 25.57], [28.0, 30.45], [31.0, 32.64], [33.0, 33.61], [37.0, 37.34], [38.0, 38.11], [39.0, 41.79], [43.0, 43.48], [46.0, 46.85], [48.0, 48.69], [50.0, 51.19], [65.0, 66.19], [82.0, 83.17], [89.0, 90.8], [92.0, 93.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.36, 0.0, 0.0, 0.0, 0.0, 71.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.66, 0.51, 1.07, 1.14, 1.57, 2.45, 1.64, 0.61, 0.34, 0.11, 2.79, 0.48, 0.85, 0.69, 1.19, 1.19, 1.17, 1.8, 1.28]} \ No newline at end of file diff --git a/annotations_filtered/dFIsw8XfF30_filtered.json b/annotations_filtered/dFIsw8XfF30_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2853c950c5a0272371761cf6e33c0e9cef9cd770 --- /dev/null +++ b/annotations_filtered/dFIsw8XfF30_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 20.97], [22.0, 23.18], [33.0, 33.03], [34.0, 34.05], [34.0, 34.16], [50.0, 55.59], [58.0, 62.8], [64.0, 64.32], [76.0, 77.16], [78.0, 78.29], [80.0, 81.82], [85.0, 85.08], [86.0, 87.47], [88.0, 89.41], [90.0, 96.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [80.11, 0.0, 0.0, 0.0, 0.0, 100.0, 94.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.58], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.97, 1.18, 0.03, 0.05, 0.16, 5.59, 4.8, 0.32, 1.16, 0.29, 1.82, 0.08, 1.47, 1.41, 6.53]} \ No newline at end of file diff --git a/annotations_filtered/dFwt1vL1JOg_filtered.json b/annotations_filtered/dFwt1vL1JOg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/dFwt1vL1JOg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/dFxzdwS4yE8_filtered.json b/annotations_filtered/dFxzdwS4yE8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..df202de9a966d2546bac68479988611f716e314e --- /dev/null +++ b/annotations_filtered/dFxzdwS4yE8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 21.15], [22.0, 57.59], [58.0, 61.03], [62.0, 63.39], [65.0, 66.9], [69.0, 80.76], [81.0, 83.4], [84.0, 85.13], [86.0, 87.17], [87.0, 88.52], [89.0, 90.09], [91.0, 92.08], [93.0, 93.83], [95.0, 98.02], [99.0, 104.48], [107.0, 126.08], [128.0, 130.35], [134.0, 134.89], [139.0, 139.62]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [60.98, 0.0, 39.88, 0.0, 0.0, 38.27, 56.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.07, 57.81, 30.63, 52.27, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 29.14], ["whale vocalization", 24.7], ["hum", 5.02]], null, null, [["music", 60.89], ["hum", 5.05], ["ambient music", 4.74]], null, null, null, null, null, null, null, null, null, [["music", 50.0], ["mains hum", 16.25], ["hum", 15.64]], null, null, null], "duration": [5.15, 35.59, 3.03, 1.39, 1.9, 11.76, 2.4, 1.13, 1.17, 1.52, 1.09, 1.08, 0.83, 3.02, 5.48, 19.08, 2.35, 0.89, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/dG6C9JuB4YA_filtered.json b/annotations_filtered/dG6C9JuB4YA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d528453b501ce5e3dbab171c2495f5719fe68c50 --- /dev/null +++ b/annotations_filtered/dG6C9JuB4YA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.7], [5.0, 9.93], [11.0, 12.11], [14.0, 17.63], [22.0, 25.12], [27.0, 28.68], [33.0, 34.1], [37.0, 39.31], [47.0, 48.46], [50.0, 52.1], [54.0, 54.87], [61.0, 62.68], [66.0, 66.83], [68.0, 69.79], [71.0, 70.78], [71.0, 73.48], [75.0, 76.03], [76.0, 77.08], [79.0, 79.29], [80.0, 80.81], [81.0, 82.21], [84.0, 85.5], [86.0, 88.97], [89.0, 89.43], [90.0, 91.29], [94.0, 94.53], [96.0, 96.3], [97.0, 98.41], [100.0, 101.63], [103.0, 106.14], [108.0, 110.35], [112.0, 111.99], [115.0, 115.75], [117.0, 118.99], [124.0, 124.38], [125.0, 125.91], [129.0, 129.81], [131.0, 132.97], [134.0, 135.13], [137.0, 137.19], [138.0, 138.67], [142.0, 142.75], [147.0, 147.95], [148.0, 149.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 98.59, 0.0, 99.98, 99.84, 0.0, 0.0, 95.51, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.7, 4.93, 1.11, 3.63, 3.12, 1.68, 1.1, 2.31, 1.46, 2.1, 0.87, 1.68, 0.83, 1.79, -0.22, 2.48, 1.03, 1.08, 0.29, 0.81, 1.21, 1.5, 2.97, 0.43, 1.29, 0.53, 0.3, 1.41, 1.63, 3.14, 2.35, -0.01, 0.75, 1.99, 0.38, 0.91, 0.81, 1.97, 1.13, 0.19, 0.67, 0.75, 0.95, 1.12]} \ No newline at end of file diff --git a/annotations_filtered/dGmuICb8a7Y_filtered.json b/annotations_filtered/dGmuICb8a7Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0fe7dcc9b08a87ccb9cfee709512907013b64c23 --- /dev/null +++ b/annotations_filtered/dGmuICb8a7Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.97], [15.0, 18.62], [20.0, 22.35], [32.0, 36.96], [43.0, 44.95], [49.0, 48.52], [51.0, 82.27], [91.0, 92.11], [112.0, 111.89], [121.0, 122.34], [177.0, 177.9], [196.0, 195.93], [200.0, 200.8], [202.0, 205.8], [206.0, 206.81], [207.0, 207.76], [210.0, 212.28]], "keep_status": [true, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [33.96, 33.77, 33.17, 32.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.39, 0.0, 0.0, 64.97], "audiomae_on_audioset": [[["moo", 21.11], ["whale vocalization", 15.73], ["cattle, bovinae", 14.94]], [["cattle, bovinae", 35.31], ["livestock, farm animals, working animals", 31.9], ["moo", 31.57]], [["moo", 16.96], ["cattle, bovinae", 16.61], ["speech", 10.98]], [["noise", 15.63], ["music", 15.61], ["echo", 6.32]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.97, 3.62, 2.35, 4.96, 1.95, -0.48, 31.27, 1.11, -0.11, 1.34, 0.9, -0.07, 0.8, 3.8, 0.81, 0.76, 2.28]} \ No newline at end of file diff --git a/annotations_filtered/dGz9C2xMADc_filtered.json b/annotations_filtered/dGz9C2xMADc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c79ce00f9e10b73927431edb2608aa496d9c4a8c --- /dev/null +++ b/annotations_filtered/dGz9C2xMADc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 83.96], [86.0, 86.34], [88.0, 111.5], [114.0, 159.31]], "keep_status": [false, false, true, false], "silence_prob": [0.0, 0.0, 31.22, 0.0], "audiomae_on_audioset": [null, null, [["music", 53.32], ["synthesizer", 10.62], ["hum", 5.29]], null], "duration": [50.96, 0.34, 23.5, 45.31]} \ No newline at end of file diff --git a/annotations_filtered/dH1SeHOpEO8_filtered.json b/annotations_filtered/dH1SeHOpEO8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43741c0d706ade2743fb69f35cd2a672387f198b --- /dev/null +++ b/annotations_filtered/dH1SeHOpEO8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.87], [4.0, 5.17], [8.0, 8.21], [10.0, 10.37], [11.0, 11.25], [13.0, 17.12], [45.0, 44.96], [49.0, 51.29], [54.0, 54.19], [56.0, 57.13], [58.0, 65.25], [74.0, 74.85], [76.0, 76.45], [83.0, 83.39], [84.0, 84.67], [86.0, 87.2], [89.0, 90.83], [97.0, 99.91], [106.0, 105.7], [110.0, 110.02]], "keep_status": [false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 44.37, 0.0, 47.35, 0.0, 0.0, 33.06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.88, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 18.06], ["mains hum", 15.33], ["speech", 10.8]], null, [["music", 64.7], ["musical instrument", 5.17], ["guitar", 4.26]], null, null, [["music", 23.98], ["hum", 21.83], ["mains hum", 17.88]], null, null, null, null, null, null, null, null, null], "duration": [0.87, 1.17, 0.21, 0.37, 0.25, 4.12, -0.04, 2.29, 0.19, 1.13, 7.25, 0.85, 0.45, 0.39, 0.67, 1.2, 1.83, 2.91, -0.3, 0.02]} \ No newline at end of file diff --git a/annotations_filtered/dH3dqXHH0yU_filtered.json b/annotations_filtered/dH3dqXHH0yU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..360ed9a34378e14a33e28639d7482ee365837716 --- /dev/null +++ b/annotations_filtered/dH3dqXHH0yU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.68], [5.0, 8.75], [9.0, 12.83], [14.0, 17.32], [32.0, 57.57], [60.0, 80.2], [85.0, 85.62], [96.0, 96.28], [100.0, 101.92], [104.0, 104.48], [106.0, 107.1], [140.0, 140.7], [150.0, 151.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 94.22, 71.72, 39.94, 48.82, 97.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 66.8], ["speech", 13.77], ["groan", 1.78]], [["music", 49.24], ["theremin", 23.15], ["didgeridoo", 6.88]], null, null, null, null, null, null, null, null], "duration": [1.68, 3.75, 3.83, 3.32, 25.57, 20.2, 0.62, 0.28, 1.92, 0.48, 1.1, 0.7, 1.46]} \ No newline at end of file diff --git a/annotations_filtered/dHPnUPFcxdE_filtered.json b/annotations_filtered/dHPnUPFcxdE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..afce0e787d548e973e473d48aa9b386d425ea83b --- /dev/null +++ b/annotations_filtered/dHPnUPFcxdE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.04], [8.0, 8.02], [9.0, 9.76], [13.0, 13.76], [15.0, 15.9], [21.0, 22.91], [24.0, 24.44], [26.0, 26.13], [27.0, 27.6], [28.0, 29.4], [29.0, 29.76], [30.0, 30.0], [30.0, 30.08], [30.0, 31.97], [37.0, 37.12], [38.0, 39.21], [40.0, 41.07], [44.0, 44.64], [46.0, 47.6], [48.0, 49.22], [49.0, 49.3], [50.0, 49.71], [50.0, 49.98], [57.0, 57.21], [62.0, 62.78], [69.0, 69.62], [71.0, 70.88], [72.0, 72.82], [77.0, 78.46], [80.0, 80.08], [81.0, 81.4], [84.0, 85.16], [86.0, 92.7], [99.0, 99.99], [104.0, 105.54], [107.0, 107.35], [110.0, 114.59], [122.0, 123.08], [125.0, 125.98], [126.0, 127.43], [128.0, 128.39], [129.0, 129.59], [130.0, 130.59], [131.0, 132.02], [135.0, 135.08], [137.0, 137.71], [138.0, 139.11], [142.0, 141.74], [150.0, 149.84], [152.0, 154.58], [156.0, 158.33], [163.0, 163.44], [164.0, 165.25], [166.0, 167.64], [174.0, 174.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.04, 0.0, 0.0, 0.0, 42.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.35, 58.38, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 34.32], ["throbbing", 18.36], ["mains hum", 9.28]], null, null, null, [["speech", 40.21], ["hum", 22.17], ["throbbing", 10.83]], null, null, null, null, null, null, null, null, null, null, null, null, [["radio", 33.3], ["speech", 23.64], ["telephone", 8.1]], null, null, null, null, null], "duration": [1.04, 0.02, 0.76, 0.76, 0.9, 1.91, 0.44, 0.13, 0.6, 1.4, 0.76, 0.0, 0.08, 1.97, 0.12, 1.21, 1.07, 0.64, 1.6, 1.22, 0.3, -0.29, -0.02, 0.21, 0.78, 0.62, -0.12, 0.82, 1.46, 0.08, 0.4, 1.16, 6.7, 0.99, 1.54, 0.35, 4.59, 1.08, 0.98, 1.43, 0.39, 0.59, 0.59, 1.02, 0.08, 0.71, 1.11, -0.26, -0.16, 2.58, 2.33, 0.44, 1.25, 1.64, 0.5]} \ No newline at end of file diff --git a/annotations_filtered/dHXVvD4FFas_filtered.json b/annotations_filtered/dHXVvD4FFas_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac7542b878c2bd8b322ee8499059e134f11e11ba --- /dev/null +++ b/annotations_filtered/dHXVvD4FFas_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.1], [12.0, 13.81], [19.0, 19.95], [26.0, 27.55], [33.0, 34.69], [37.0, 39.28], [41.0, 64.12], [65.0, 73.3], [74.0, 90.32], [91.0, 92.23], [105.0, 105.29], [105.0, 108.73], [109.0, 110.27], [113.0, 113.51], [118.0, 120.18], [121.0, 125.12], [126.0, 132.76], [134.0, 144.49], [151.0, 152.22], [153.0, 174.95], [178.0, 180.27], [189.0, 190.22], [193.0, 201.24], [206.0, 207.01], [208.0, 208.52], [210.0, 211.55]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false], "silence_prob": [75.07, 0.0, 0.0, 0.0, 0.0, 34.94, 33.68, 46.33, 31.52, 0.0, 0.0, 32.22, 0.0, 0.0, 56.25, 70.86, 44.49, 31.15, 0.0, 30.34, 34.5, 0.0, 31.74, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 30.25], ["speech", 24.54], ["foghorn", 9.73]], [["music", 67.49], ["theremin", 13.23], ["ambient music", 4.56]], [["music", 77.48], ["hum", 4.94], ["theremin", 2.19]], [["music", 51.12], ["speech", 16.09], ["throbbing", 10.88]], null, null, [["music", 35.62], ["speech", 30.4], ["throbbing", 6.09]], null, null, null, null, [["music", 40.29], ["speech", 14.26], ["hum", 11.43]], [["music", 48.83], ["throbbing", 22.12], ["hum", 16.14]], null, [["music", 46.32], ["hum", 19.32], ["throbbing", 10.35]], [["music", 30.34], ["brass instrument", 4.67], ["speech", 4.31]], null, [["music", 64.38], ["throbbing", 6.37], ["hum", 4.71]], null, null, null], "duration": [3.1, 1.81, 0.95, 1.55, 1.69, 2.28, 23.12, 8.3, 16.32, 1.23, 0.29, 3.73, 1.27, 0.51, 2.18, 4.12, 6.76, 10.49, 1.22, 21.95, 2.27, 1.22, 8.24, 1.01, 0.52, 1.55]} \ No newline at end of file diff --git a/annotations_filtered/dIUK_wn5If4_filtered.json b/annotations_filtered/dIUK_wn5If4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..88934c084bd6e08173e97142824c013b3443bf5d --- /dev/null +++ b/annotations_filtered/dIUK_wn5If4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[63.0, 107.5], [111.0, 127.45]], "keep_status": [false, true], "silence_prob": [0.0, 30.63], "audiomae_on_audioset": [null, [["music", 39.92], ["cacophony", 11.87], ["synthesizer", 3.33]]], "duration": [44.5, 16.45]} \ No newline at end of file diff --git a/annotations_filtered/dIgGZA4qQoc_filtered.json b/annotations_filtered/dIgGZA4qQoc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9605d6f3e101c1ad9a0fb395d2182dad9928baec --- /dev/null +++ b/annotations_filtered/dIgGZA4qQoc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.33], [1.0, 1.97], [5.0, 5.61], [9.0, 10.42], [11.0, 11.5], [13.0, 19.35], [26.0, 25.78], [28.0, 27.99], [32.0, 32.24], [34.0, 34.05], [35.0, 36.19], [37.0, 38.45], [42.0, 47.85], [52.0, 53.18], [63.0, 63.17], [64.0, 64.83], [67.0, 67.68], [81.0, 82.9], [84.0, 85.13], [89.0, 89.01], [97.0, 98.09], [101.0, 100.82], [102.0, 102.17], [106.0, 108.24], [109.0, 111.15], [115.0, 116.83], [118.0, 119.47], [121.0, 123.97], [129.0, 131.01], [134.0, 134.2], [136.0, 135.95], [139.0, 140.83], [142.0, 144.68], [146.0, 147.63]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 33.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.66, 58.05, 0.0, 0.0, 49.68, 61.97, 0.0, 0.0, 0.0, 53.97, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 22.85], ["speech", 22.38], ["fly, housefly", 7.69]], null, null, null, null, null, null, [["music", 33.66], ["theremin", 19.06], ["didgeridoo", 7.14]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 54.57], ["insect", 17.91], ["mosquito", 10.56]], null, null, null, null, null, null], "duration": [0.33, 0.97, 0.61, 1.42, 0.5, 6.35, -0.22, -0.01, 0.24, 0.05, 1.19, 1.45, 5.85, 1.18, 0.17, 0.83, 0.68, 1.9, 1.13, 0.01, 1.09, -0.18, 0.17, 2.24, 2.15, 1.83, 1.47, 2.97, 2.01, 0.2, -0.05, 1.83, 2.68, 1.63]} \ No newline at end of file diff --git a/annotations_filtered/dIu418Y0TGY_filtered.json b/annotations_filtered/dIu418Y0TGY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..817186539188401ecbfbf558ca839744351db526 --- /dev/null +++ b/annotations_filtered/dIu418Y0TGY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.64], [8.0, 12.7], [16.0, 16.36], [19.0, 22.49], [31.0, 31.33], [33.0, 33.44], [37.0, 42.87], [45.0, 49.17], [51.0, 63.78], [64.0, 70.21]], "keep_status": [false, false, false, true, false, false, true, true, false, false], "silence_prob": [0.0, 37.38, 0.0, 38.79, 0.0, 0.0, 33.24, 32.44, 62.68, 54.56], "audiomae_on_audioset": [null, [["speech", 76.57], ["clip-clop", 1.5], ["radio", 1.3]], null, [["speech", 35.75], ["clip-clop", 10.47], ["eruption", 9.41]], null, null, [["speech", 41.76], ["rowboat, canoe, kayak", 7.94], ["chop", 4.27]], [["speech", 15.66], ["animal", 11.91], ["crowd", 9.25]], null, null], "duration": [0.64, 4.7, 0.36, 3.49, 0.33, 0.44, 5.87, 4.17, 12.78, 6.21]} \ No newline at end of file diff --git a/annotations_filtered/dIv1kqivuZc_filtered.json b/annotations_filtered/dIv1kqivuZc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f8e3947e7bc6aa1d9a5a61a744a641a75101744 --- /dev/null +++ b/annotations_filtered/dIv1kqivuZc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 27.43], [32.0, 49.27], [50.0, 51.09], [52.0, 52.83], [55.0, 57.81], [59.0, 61.1], [62.0, 62.26], [64.0, 67.91], [68.0, 68.74], [72.0, 72.86], [73.0, 81.31], [82.0, 83.24], [87.0, 87.78], [89.0, 91.57], [93.0, 94.71], [96.0, 97.56], [100.0, 100.72], [103.0, 103.4], [105.0, 108.99], [110.0, 110.78], [112.0, 114.56], [116.0, 121.27], [122.0, 125.51], [126.0, 130.33], [131.0, 134.32], [135.0, 137.57], [139.0, 143.55], [144.0, 163.9]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, true, true, false, true, true], "silence_prob": [28.55, 29.06, 0.0, 0.0, 36.66, 39.3, 0.0, 30.27, 0.0, 0.0, 35.09, 0.0, 0.0, 40.24, 0.0, 0.0, 0.0, 0.0, 30.52, 0.0, 73.51, 55.31, 59.68, 42.33, 40.47, 41.36, 39.64, 33.29], "audiomae_on_audioset": [[["music", 48.63], ["speech", 11.68], ["throbbing", 11.21]], [["speech", 41.49], ["music", 27.68], ["gunshot, gunfire", 8.93]], null, null, [["hum", 33.54], ["throbbing", 31.86], ["music", 14.18]], [["hum", 22.03], ["music", 14.56], ["speech", 13.06]], null, [["machine gun", 53.88], ["speech", 18.39], ["gunshot, gunfire", 2.95]], null, null, [["hum", 35.6], ["throbbing", 33.18], ["music", 11.05]], null, null, [["music", 30.38], ["speech", 25.02], ["hum", 7.14]], null, null, null, null, [["speech", 35.17], ["machine gun", 17.6], ["sound effect", 7.51]], null, null, null, null, [["singing bowl", 29.74], ["music", 13.68], ["sheep", 7.24]], [["music", 48.35], ["electronic music", 7.9], ["singing bowl", 5.42]], [["gong", 50.88], ["music", 25.53], ["electronic music", 4.47]], [["music", 23.82], ["singing bowl", 20.51], ["speech", 9.45]], [["music", 29.61], ["hum", 18.87], ["gong", 7.71]]], "duration": [22.43, 17.27, 1.09, 0.83, 2.81, 2.1, 0.26, 3.91, 0.74, 0.86, 8.31, 1.24, 0.78, 2.57, 1.71, 1.56, 0.72, 0.4, 3.99, 0.78, 2.56, 5.27, 3.51, 4.33, 3.32, 2.57, 4.55, 19.9]} \ No newline at end of file diff --git a/annotations_filtered/dIw0nCJpAqE_filtered.json b/annotations_filtered/dIw0nCJpAqE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf09eecfb1789121cdcf4be2cd264d2eecc0e2ca --- /dev/null +++ b/annotations_filtered/dIw0nCJpAqE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.89], [14.0, 14.64], [17.0, 18.99], [21.0, 21.52], [24.0, 26.27], [31.0, 32.53], [36.0, 49.57], [50.0, 51.93], [53.0, 54.78], [56.0, 60.79], [61.0, 64.99], [66.0, 66.93], [70.0, 72.1], [75.0, 75.56], [77.0, 80.37], [85.0, 86.71], [88.0, 88.79], [91.0, 92.13], [96.0, 103.5], [105.0, 105.07], [107.0, 107.65], [113.0, 121.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 81.35, 0.0, 46.4, 0.0, 0.0, 64.07, 42.46, 0.0, 78.72, 0.0, 31.29, 0.0, 0.0, 0.0, 29.72, 0.0, 0.0, 37.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 66.15], ["musical instrument", 6.72], ["theremin", 5.26]], null, null, null, [["chirp tone", 43.17], ["singing bowl", 11.86], ["music", 9.8]], null, null, null, [["music", 50.23], ["speech", 15.82], ["didgeridoo", 7.39]], null, null, null, [["music", 69.97], ["boing", 3.54], ["groan", 3.53]], null, null, [["music", 22.08], ["animal", 14.11], ["hum", 7.14]]], "duration": [0.89, 0.64, 1.99, 0.52, 2.27, 1.53, 13.57, 1.93, 1.78, 4.79, 3.99, 0.93, 2.1, 0.56, 3.37, 1.71, 0.79, 1.13, 7.5, 0.07, 0.65, 8.04]} \ No newline at end of file diff --git a/annotations_filtered/dIy6QpVNPuo_filtered.json b/annotations_filtered/dIy6QpVNPuo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17916554023e32969eeb7d24cff240e904ef3c8a --- /dev/null +++ b/annotations_filtered/dIy6QpVNPuo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.16], [5.0, 10.37], [22.0, 22.72], [23.0, 27.16], [31.0, 36.22], [45.0, 49.86], [52.0, 62.07], [64.0, 73.04], [76.0, 77.9], [79.0, 92.85], [96.0, 114.66]], "keep_status": [false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 30.91, 0.0, 30.27, 32.44, 30.18, 30.74, 31.46, 0.0, 30.68, 30.72], "audiomae_on_audioset": [null, [["speech", 57.03], ["vehicle", 14.38], ["rumble", 8.23]], null, [["music", 34.88], ["animal", 10.24], ["roaring cats (lions, tigers)", 9.3]], [["music", 72.83], ["hum", 4.03], ["musical instrument", 2.52]], [["music", 88.8], ["speech", 2.9], ["synthesizer", 0.72]], [["music", 68.06], ["throbbing", 5.3], ["hum", 2.65]], [["music", 34.16], ["skidding", 23.88], ["vehicle", 15.19]], null, [["music", 41.44], ["speech", 27.78], ["vehicle", 4.53]], [["vehicle", 22.55], ["music", 21.94], ["car", 17.28]]], "duration": [0.16, 5.37, 0.72, 4.16, 5.22, 4.86, 10.07, 9.04, 1.9, 13.85, 18.66]} \ No newline at end of file diff --git a/annotations_filtered/dJBnRYy3mFI_filtered.json b/annotations_filtered/dJBnRYy3mFI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eafe086d72b4176db591b6324fff3f0e287eda30 --- /dev/null +++ b/annotations_filtered/dJBnRYy3mFI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.04], [8.0, 8.33], [14.0, 17.02], [18.0, 19.31], [22.0, 24.95], [30.0, 30.91], [32.0, 32.1], [43.0, 44.31], [45.0, 48.44]], "keep_status": [false, false, true, false, false, false, false, false, true], "silence_prob": [30.88, 0.0, 38.3, 0.0, 32.22, 0.0, 0.0, 0.0, 33.98], "audiomae_on_audioset": [[["music", 82.73], ["speech", 6.37], ["sidetone", 1.72]], null, [["music", 42.47], ["speech", 13.54], ["throbbing", 6.39]], null, [["music", 67.88], ["speech", 13.34], ["gunshot, gunfire", 5.19]], null, null, null, [["music", 58.15], ["speech", 4.82], ["electronic music", 4.52]]], "duration": [3.04, 0.33, 3.02, 1.31, 2.95, 0.91, 0.1, 1.31, 3.44]} \ No newline at end of file diff --git a/annotations_filtered/dJFR7xbOIuw_filtered.json b/annotations_filtered/dJFR7xbOIuw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e4ab069ea91d96408f98ca5ddc15f0177eedc886 --- /dev/null +++ b/annotations_filtered/dJFR7xbOIuw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.98], [5.0, 12.19], [13.0, 17.22], [19.0, 19.11], [21.0, 21.86], [23.0, 23.41], [26.0, 27.6], [33.0, 34.16], [36.0, 36.07], [37.0, 38.85], [40.0, 41.59], [42.0, 43.9], [48.0, 49.71], [51.0, 52.25], [53.0, 54.11], [55.0, 55.09], [58.0, 58.78], [62.0, 62.4], [65.0, 65.84], [67.0, 88.64], [90.0, 94.34], [99.0, 111.81]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 88.83, 40.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.44, 70.02, 43.0], "audiomae_on_audioset": [null, null, [["music", 45.16], ["hum", 23.64], ["throbbing", 6.19]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["throbbing", 59.13], ["hum", 17.71], ["music", 15.59]], null, [["speech", 36.74], ["music", 36.54], ["hum", 5.56]]], "duration": [0.98, 7.19, 4.22, 0.11, 0.86, 0.41, 1.6, 1.16, 0.07, 1.85, 1.59, 1.9, 1.71, 1.25, 1.11, 0.09, 0.78, 0.4, 0.84, 21.64, 4.34, 12.81]} \ No newline at end of file diff --git a/annotations_filtered/dJS8Umi2b0Q_filtered.json b/annotations_filtered/dJS8Umi2b0Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a4f61b602f330211322f89d44daf9d4fba222632 --- /dev/null +++ b/annotations_filtered/dJS8Umi2b0Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.99], [7.0, 7.57], [11.0, 11.92], [17.0, 19.6], [23.0, 24.7], [26.0, 28.61], [31.0, 31.75], [33.0, 33.86], [35.0, 35.87], [37.0, 37.39], [39.0, 39.95], [41.0, 41.76], [44.0, 45.71], [47.0, 50.63], [51.0, 52.95], [54.0, 57.97], [60.0, 60.39], [62.0, 61.82], [64.0, 67.12], [68.0, 72.62], [73.0, 74.98], [79.0, 83.05], [85.0, 89.04], [90.0, 95.1], [96.0, 98.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.9, 0.0, 0.0, 50.56, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 100.0, 59.33, 0.0, 53.78, 71.72, 87.19, 90.43], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.99, 0.57, 0.92, 2.6, 1.7, 2.61, 0.75, 0.86, 0.87, 0.39, 0.95, 0.76, 1.71, 3.63, 1.95, 3.97, 0.39, -0.18, 3.12, 4.62, 1.98, 4.05, 4.04, 5.1, 2.1]} \ No newline at end of file diff --git a/annotations_filtered/dJU1SZIfK3Y_filtered.json b/annotations_filtered/dJU1SZIfK3Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3ef23ce393626f3fcab1720f81c7e45165e1c707 --- /dev/null +++ b/annotations_filtered/dJU1SZIfK3Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.33], [5.0, 5.49], [6.0, 6.37], [7.0, 7.86], [10.0, 11.01], [14.0, 14.07], [17.0, 16.85], [21.0, 26.67], [29.0, 28.98], [30.0, 32.31], [34.0, 36.66], [38.0, 39.01], [40.0, 58.83], [61.0, 61.92]], "keep_status": [false, false, false, false, false, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.52, 0.0, 32.36, 32.62, 0.0, 31.29, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 41.69], ["whale vocalization", 9.04], ["theremin", 6.39]], null, [["music", 74.76], ["didgeridoo", 3.45], ["musical instrument", 3.02]], [["music", 44.73], ["jingle bell", 5.1], ["musical instrument", 4.67]], null, [["music", 77.77], ["musical instrument", 6.61], ["synthesizer", 4.38]], null], "duration": [0.33, 0.49, 0.37, 0.86, 1.01, 0.07, -0.15, 5.67, -0.02, 2.31, 2.66, 1.01, 18.83, 0.92]} \ No newline at end of file diff --git a/annotations_filtered/dJma8pVAvH4_filtered.json b/annotations_filtered/dJma8pVAvH4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e283c0ae94732e374a07303fae34903c4f699ef5 --- /dev/null +++ b/annotations_filtered/dJma8pVAvH4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.83], [10.0, 13.19], [15.0, 16.29], [26.0, 28.9], [40.0, 40.95], [44.0, 45.15], [49.0, 49.23], [50.0, 66.19], [66.0, 77.35], [82.0, 86.17], [88.0, 89.67], [97.0, 97.14], [98.0, 99.3], [102.0, 104.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 69.47, 0.0, 75.72, 0.0, 0.0, 0.0, 35.49, 44.6, 50.76, 0.0, 0.0, 0.0, 41.5], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 61.47], ["hum", 4.7], ["synthesizer", 4.09]], [["speech", 32.12], ["music", 28.59], ["foghorn", 10.07]], null, null, null, null, [["music", 45.79], ["hum", 8.12], ["scary music", 4.84]]], "duration": [0.83, 3.19, 1.29, 2.9, 0.95, 1.15, 0.23, 16.19, 11.35, 4.17, 1.67, 0.14, 1.3, 2.25]} \ No newline at end of file diff --git a/annotations_filtered/dJsuwhIpSDQ_filtered.json b/annotations_filtered/dJsuwhIpSDQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/dJsuwhIpSDQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/dK2oGZK490w_filtered.json b/annotations_filtered/dK2oGZK490w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0bf795c7d1db48fd7fda0f2fdf6b70d82d1ba4e6 --- /dev/null +++ b/annotations_filtered/dK2oGZK490w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.33], [8.0, 9.37], [12.0, 12.78], [14.0, 21.36], [27.0, 28.02], [30.0, 35.78], [39.0, 39.01], [40.0, 41.54], [43.0, 48.32], [51.0, 53.94], [58.0, 60.17], [61.0, 61.92], [64.0, 64.49], [66.0, 66.7], [68.0, 67.83], [70.0, 70.23], [73.0, 87.91], [92.0, 92.35], [97.0, 106.0], [110.0, 112.46], [113.0, 115.25], [120.0, 120.51], [123.0, 123.74], [129.0, 130.2], [131.0, 134.52], [136.0, 137.88], [140.0, 142.48], [144.0, 144.76], [146.0, 146.65], [150.0, 153.49]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 40.81, 0.0, 41.7, 0.0, 0.0, 65.44, 47.31, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.29, 0.0, 77.87, 100.0, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 98.44], "audiomae_on_audioset": [null, null, null, [["music", 66.35], ["yodeling", 10.2], ["singing", 2.77]], null, [["music", 54.44], ["brass instrument", 10.9], ["trombone", 6.56]], null, null, null, [["speech", 26.23], ["animal", 11.7], ["music", 6.41]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.33, 1.37, 0.78, 7.36, 1.02, 5.78, 0.01, 1.54, 5.32, 2.94, 2.17, 0.92, 0.49, 0.7, -0.17, 0.23, 14.91, 0.35, 9.0, 2.46, 2.25, 0.51, 0.74, 1.2, 3.52, 1.88, 2.48, 0.76, 0.65, 3.49]} \ No newline at end of file diff --git a/annotations_filtered/dKAvAAT2q_U_filtered.json b/annotations_filtered/dKAvAAT2q_U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1960026c99d0efed20b55b67cc55e6d587e481f6 --- /dev/null +++ b/annotations_filtered/dKAvAAT2q_U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.45], [8.0, 14.86], [15.0, 14.89], [15.0, 14.93], [15.0, 14.96], [15.0, 14.99], [15.0, 15.11], [15.0, 15.25], [15.0, 15.42], [15.0, 15.52], [16.0, 18.69], [19.0, 36.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 64.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.77, 52.62], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.45, 6.86, -0.11, -0.07, -0.04, -0.01, 0.11, 0.25, 0.42, 0.52, 2.69, 17.58]} \ No newline at end of file diff --git a/annotations_filtered/dKC2CPS9AFI_filtered.json b/annotations_filtered/dKC2CPS9AFI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aafe20d7c68e3e0bfb7d83d3b5d28fd86efbb7c1 --- /dev/null +++ b/annotations_filtered/dKC2CPS9AFI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.18], [8.0, 8.4], [12.0, 12.23], [13.0, 13.15], [17.0, 17.95], [19.0, 20.92], [22.0, 22.77], [34.0, 34.01], [37.0, 37.98], [40.0, 40.19], [41.0, 41.05], [49.0, 50.26], [51.0, 53.16], [54.0, 54.92], [55.0, 56.15], [62.0, 63.59], [68.0, 78.66], [84.0, 84.13], [88.0, 95.01], [98.0, 102.51], [106.0, 106.2], [110.0, 110.57], [113.0, 126.55], [128.0, 129.3]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, false, true, false], "silence_prob": [48.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.07, 0.0, 0.0, 0.0, 37.92, 0.0, 36.56, 35.47, 0.0, 0.0, 37.98, 0.0], "audiomae_on_audioset": [[["music", 19.0], ["speech", 9.99], ["hum", 8.37]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 31.44], ["insect", 14.86], ["speech", 14.01]], null, [["theremin", 18.13], ["cattle, bovinae", 13.35], ["moo", 11.74]], [["civil defense siren", 42.07], ["speech", 13.22], ["siren", 12.87]], null, null, [["livestock, farm animals, working animals", 39.22], ["cattle, bovinae", 14.1], ["moo", 12.44]], null], "duration": [2.18, 0.4, 0.23, 0.15, 0.95, 1.92, 0.77, 0.01, 0.98, 0.19, 0.05, 1.26, 2.16, 0.92, 1.15, 1.59, 10.66, 0.13, 7.01, 4.51, 0.2, 0.57, 13.55, 1.3]} \ No newline at end of file diff --git a/annotations_filtered/dKFZ4T_Y9Pw_filtered.json b/annotations_filtered/dKFZ4T_Y9Pw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..78c5179566e60dca5d442cd5bf358b6f21b92f03 --- /dev/null +++ b/annotations_filtered/dKFZ4T_Y9Pw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.81], [19.0, 19.28], [20.0, 20.6], [22.0, 22.33], [26.0, 30.91], [31.0, 32.09], [33.0, 33.29], [34.0, 36.41], [39.0, 41.05], [42.0, 41.99], [43.0, 43.11], [44.0, 45.66], [47.0, 47.8], [48.0, 48.2], [52.0, 52.32], [53.0, 53.3], [54.0, 55.0], [55.0, 55.66], [59.0, 59.51], [60.0, 60.47], [64.0, 64.35], [65.0, 71.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.4, 0.0, 0.0, 100.0, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.81, 0.28, 0.6, 0.33, 4.91, 1.09, 0.29, 2.41, 2.05, -0.01, 0.11, 1.66, 0.8, 0.2, 0.32, 0.3, 1.0, 0.66, 0.51, 0.47, 0.35, 6.71]} \ No newline at end of file diff --git a/annotations_filtered/dKJa-KQNjQU_filtered.json b/annotations_filtered/dKJa-KQNjQU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c9fa8e4a5e0f343f989d75b685cffc745f1e0ba4 --- /dev/null +++ b/annotations_filtered/dKJa-KQNjQU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 11.45], [16.0, 16.44], [18.0, 18.33], [19.0, 34.67], [37.0, 43.26], [45.0, 55.95], [58.0, 73.45], [74.0, 90.29], [93.0, 94.86], [103.0, 105.29], [121.0, 121.41], [122.0, 123.72]], "keep_status": [false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [38.46, 0.0, 0.0, 34.53, 39.38, 35.24, 34.16, 31.69, 0.0, 36.09, 0.0, 0.0], "audiomae_on_audioset": [[["music", 71.4], ["soundtrack music", 4.82], ["video game music", 3.47]], null, null, [["music", 36.14], ["hum", 26.66], ["throbbing", 15.61]], [["music", 67.35], ["brass instrument", 4.46], ["musical instrument", 2.77]], [["hum", 29.49], ["music", 29.25], ["throbbing", 17.51]], [["music", 66.22], ["speech", 15.78], ["scary music", 2.94]], [["music", 23.42], ["speech", 21.61], ["hum", 14.35]], null, [["speech", 36.72], ["music", 12.03], ["hum", 4.93]], null, null], "duration": [8.45, 0.44, 0.33, 15.67, 6.26, 10.95, 15.45, 16.29, 1.86, 2.29, 0.41, 1.72]} \ No newline at end of file diff --git a/annotations_filtered/dKPw9-jpA3Y_filtered.json b/annotations_filtered/dKPw9-jpA3Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..adaaf9a7d4c5f181426f00ffba5530076457a383 --- /dev/null +++ b/annotations_filtered/dKPw9-jpA3Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 39.18], [40.0, 39.66], [40.0, 59.19], [59.0, 60.78], [62.0, 62.65], [66.0, 68.34], [70.0, 79.88], [82.0, 116.07], [117.0, 129.37], [130.0, 131.53], [132.0, 133.56]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 49.04, 0.0, 0.0, 96.04, 80.64, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 48.19], ["thunk", 10.11], ["hum", 7.13]], null, null, null, null, null, null, null, null], "duration": [31.18, -0.34, 19.19, 1.78, 0.65, 2.34, 9.88, 34.07, 12.37, 1.53, 1.56]} \ No newline at end of file diff --git a/annotations_filtered/dKSAKBEI4w0_filtered.json b/annotations_filtered/dKSAKBEI4w0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da10dfbff80688c4cf56be48bbd58c35177e68ac --- /dev/null +++ b/annotations_filtered/dKSAKBEI4w0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.98], [9.0, 12.01], [15.0, 30.16], [31.0, 31.16], [40.0, 45.79], [48.0, 49.62], [50.0, 57.72], [60.0, 60.93], [61.0, 62.94], [67.0, 69.21], [86.0, 86.34], [100.0, 104.16], [111.0, 112.77], [121.0, 122.05], [127.0, 126.84]], "keep_status": [false, true, true, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [60.51, 38.35, 34.04, 0.0, 39.69, 0.0, 38.8, 0.0, 0.0, 99.76, 0.0, 98.59, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 22.08], ["speech", 13.31], ["livestock, farm animals, working animals", 11.84]], [["music", 38.38], ["speech", 12.41], ["synthesizer", 6.46]], null, [["speech", 43.31], ["music", 19.33], ["thunk", 6.93]], null, [["speech", 50.15], ["music", 27.92], ["didgeridoo", 5.71]], null, null, null, null, null, null, null, null], "duration": [3.98, 3.01, 15.16, 0.16, 5.79, 1.62, 7.72, 0.93, 1.94, 2.21, 0.34, 4.16, 1.77, 1.05, -0.16]} \ No newline at end of file diff --git a/annotations_filtered/dKleqAHv-Zw_filtered.json b/annotations_filtered/dKleqAHv-Zw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..283ae068e4ece78501208e6c530de0e881d0f736 --- /dev/null +++ b/annotations_filtered/dKleqAHv-Zw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.95], [6.0, 7.4], [8.0, 8.56], [9.0, 10.77], [14.0, 17.15], [18.0, 19.38], [20.0, 21.78], [24.0, 24.44], [26.0, 27.51], [29.0, 30.87], [32.0, 33.22], [34.0, 34.86], [35.0, 36.41], [37.0, 38.65], [40.0, 41.39], [43.0, 43.48], [45.0, 45.08], [46.0, 46.97], [48.0, 49.98], [52.0, 53.28], [54.0, 53.76], [54.0, 53.79], [56.0, 56.62], [58.0, 64.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 72.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.33], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.17], ["effects unit", 14.08], ["distortion", 6.2]]], "duration": [1.95, 1.4, 0.56, 1.77, 3.15, 1.38, 1.78, 0.44, 1.51, 1.87, 1.22, 0.86, 1.41, 1.65, 1.39, 0.48, 0.08, 0.97, 1.98, 1.28, -0.24, -0.21, 0.62, 6.45]} \ No newline at end of file diff --git a/annotations_filtered/dKoFTEK7O_o_filtered.json b/annotations_filtered/dKoFTEK7O_o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..07d12a2d16e738dbda6939811147f04d050f1392 --- /dev/null +++ b/annotations_filtered/dKoFTEK7O_o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 26.76], [29.0, 31.38], [33.0, 33.1], [34.0, 36.19], [38.0, 54.55], [56.0, 57.18], [58.0, 60.0], [63.0, 64.59], [67.0, 67.49], [68.0, 80.64]], "keep_status": [false, false, false, false, false, false, true, false, false, true], "silence_prob": [39.09, 49.68, 0.0, 31.72, 34.55, 0.0, 31.45, 0.0, 0.0, 35.82], "audiomae_on_audioset": [[["whale vocalization", 40.47], ["music", 19.51], ["speech", 15.21]], [["speech", 59.72], ["sidetone", 19.76], ["hum", 4.66]], null, [["mains hum", 39.18], ["hum", 28.08], ["music", 11.15]], [["hum", 32.86], ["mains hum", 32.37], ["music", 11.18]], null, [["hum", 14.02], ["music", 11.84], ["noise", 11.43]], null, null, [["music", 57.07], ["hum", 6.16], ["mains hum", 5.86]]], "duration": [3.76, 2.38, 0.1, 2.19, 16.55, 1.18, 2.0, 1.59, 0.49, 12.64]} \ No newline at end of file diff --git a/annotations_filtered/dKsDjpKr2Mk_filtered.json b/annotations_filtered/dKsDjpKr2Mk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c8fefbfccaca8be64df27d35b82066f3f50d4c4e --- /dev/null +++ b/annotations_filtered/dKsDjpKr2Mk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.38], [9.0, 14.22], [17.0, 19.2], [22.0, 22.01], [23.0, 26.84], [46.0, 46.21], [50.0, 50.67], [52.0, 52.91], [55.0, 54.89], [56.0, 56.88], [59.0, 65.77], [69.0, 69.26], [71.0, 71.09], [72.0, 73.57], [76.0, 81.7], [82.0, 83.74], [85.0, 85.06], [88.0, 90.66], [107.0, 111.48], [113.0, 122.99], [124.0, 125.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 62.47, 91.3, 0.0, 34.36, 0.0, 0.0, 0.0, 0.0, 0.0, 36.62, 0.0, 0.0, 0.0, 81.71, 0.0, 0.0, 48.65, 88.83, 71.87, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 59.1], ["fart", 9.98], ["electric shaver, electric razor", 3.75]], null, null, null, null, null, [["speech", 66.68], ["hum", 6.15], ["mains hum", 5.23]], null, null, null, null, null, null, [["crack", 30.62], ["music", 26.68], ["crushing", 16.99]], null, null, null], "duration": [0.38, 5.22, 2.2, 0.01, 3.84, 0.21, 0.67, 0.91, -0.11, 0.88, 6.77, 0.26, 0.09, 1.57, 5.7, 1.74, 0.06, 2.66, 4.48, 9.99, 1.79]} \ No newline at end of file diff --git a/annotations_filtered/dL2_nbhJaTs_filtered.json b/annotations_filtered/dL2_nbhJaTs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..055f1c3fa4d29d7efdf1f0088d6c66c4a1b14853 --- /dev/null +++ b/annotations_filtered/dL2_nbhJaTs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 2.56], [3.0, 7.92], [11.0, 25.54], [28.0, 32.78], [38.0, 56.19], [61.0, 83.78], [86.0, 99.08], [100.0, 100.77], [101.0, 105.41]], "keep_status": [true, true, true, false, true, false, false, false, true], "silence_prob": [29.71, 30.46, 29.92, 37.26, 29.05, 34.36, 33.08, 0.0, 32.64], "audiomae_on_audioset": [[["fart", 21.81], ["sound effect", 12.39], ["music", 11.43]], [["speech", 27.83], ["music", 16.27], ["vehicle", 7.48]], [["electric shaver, electric razor", 29.86], ["buzz", 22.43], ["music", 11.47]], [["music", 45.13], ["hum", 13.29], ["mains hum", 12.33]], [["music", 52.37], ["musical instrument", 11.66], ["didgeridoo", 4.64]], [["music", 38.13], ["buzz", 25.74], ["smash, crash", 7.0]], [["music", 63.72], ["didgeridoo", 5.77], ["musical instrument", 4.85]], null, [["music", 18.04], ["theremin", 10.79], ["didgeridoo", 8.41]]], "duration": [2.56, 4.92, 14.54, 4.78, 18.19, 22.78, 13.08, 0.77, 4.41]} \ No newline at end of file diff --git a/annotations_filtered/dLLkOjKNanY_filtered.json b/annotations_filtered/dLLkOjKNanY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..366e01f7bdb27625e07a6c6b1ee291f6c4b613df --- /dev/null +++ b/annotations_filtered/dLLkOjKNanY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[52.0, 53.18], [57.0, 57.5], [59.0, 58.62], [61.0, 62.14], [90.0, 90.1], [95.0, 94.86], [95.0, 96.35], [98.0, 98.63], [102.0, 102.42], [103.0, 103.57], [115.0, 116.68], [118.0, 123.43], [124.0, 129.76], [130.0, 129.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.56, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.18, 0.5, -0.38, 1.14, 0.1, -0.14, 1.35, 0.63, 0.42, 0.57, 1.68, 5.43, 5.76, -0.05]} \ No newline at end of file diff --git a/annotations_filtered/dLVgEWrfdSg_filtered.json b/annotations_filtered/dLVgEWrfdSg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..81ba0dd00c9579a1daaaf2904cd137747497a236 --- /dev/null +++ b/annotations_filtered/dLVgEWrfdSg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.52]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [0.52]} \ No newline at end of file diff --git a/annotations_filtered/dLXri8sYr6Q_filtered.json b/annotations_filtered/dLXri8sYr6Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8db39c295f4587e9198a904414ee3b5c04099df9 --- /dev/null +++ b/annotations_filtered/dLXri8sYr6Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 18.98], [42.0, 43.34], [46.0, 49.49], [51.0, 52.35], [54.0, 57.6], [63.0, 64.39], [67.0, 68.76], [70.0, 70.44], [71.0, 71.25], [74.0, 79.68], [84.0, 86.12], [89.0, 90.56], [100.0, 101.68], [107.0, 107.89], [111.0, 112.41], [117.0, 118.52], [119.0, 129.56], [133.0, 134.4]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [99.99, 0.0, 44.9, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 99.31, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 49.45, 0.0], "audiomae_on_audioset": [null, null, [["speech", 57.94], ["chop", 4.98], ["hubbub, speech noise, speech babble", 2.12]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["vocal music", 22.1], ["chant", 17.27], ["music", 14.45]], null], "duration": [2.98, 1.34, 3.49, 1.35, 3.6, 1.39, 1.76, 0.44, 0.25, 5.68, 2.12, 1.56, 1.68, 0.89, 1.41, 1.52, 10.56, 1.4]} \ No newline at end of file diff --git a/annotations_filtered/dLjNzwEULG8_filtered.json b/annotations_filtered/dLjNzwEULG8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e8044fdb60f08a9a6fe2aed5d583f019acae785b --- /dev/null +++ b/annotations_filtered/dLjNzwEULG8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.34], [10.0, 11.18], [13.0, 12.68], [13.0, 23.92], [26.0, 25.89], [27.0, 28.0], [31.0, 35.53], [36.0, 38.94], [40.0, 45.05], [46.0, 47.34], [49.0, 49.74], [60.0, 59.93], [61.0, 62.07], [66.0, 83.56], [84.0, 85.11], [87.0, 88.52], [89.0, 95.57], [96.0, 99.77], [100.0, 100.75], [105.0, 110.22], [111.0, 112.14], [113.0, 114.61], [115.0, 116.63], [118.0, 119.16], [120.0, 120.33], [121.0, 122.76], [124.0, 128.75], [130.0, 134.79], [136.0, 136.38], [137.0, 137.51], [139.0, 140.46], [144.0, 144.71], [145.0, 146.21], [147.0, 153.01], [154.0, 159.41], [163.0, 170.24]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, true, true, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 34.89, 0.0, 0.0, 63.21, 64.75, 72.16, 0.0, 0.0, 0.0, 0.0, 38.31, 0.0, 0.0, 34.37, 63.96, 0.0, 33.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.45, 30.34, 0.0, 0.0, 0.0, 0.0, 0.0, 31.89, 37.8, 66.88], "audiomae_on_audioset": [null, null, null, [["speech", 46.92], ["noise", 10.81], ["male speech, man speaking", 3.38]], null, null, null, null, null, null, null, null, null, [["speech", 51.9], ["fart", 7.69], ["knock", 4.49]], null, null, [["speech", 51.33], ["radio", 15.92], ["noise", 13.15]], null, null, [["horse", 26.91], ["speech", 11.93], ["clip-clop", 7.0]], null, null, null, null, null, null, [["sheep", 16.41], ["chuckle, chortle", 10.39], ["snicker", 10.37]], [["animal", 31.36], ["dog", 12.45], ["bow-wow", 12.44]], null, null, null, null, null, [["snicker", 30.4], ["laughter", 12.08], ["chuckle, chortle", 10.96]], [["fly, housefly", 11.94], ["insect", 9.56], ["mosquito", 6.73]], null], "duration": [1.34, 1.18, -0.32, 10.92, -0.11, 1.0, 4.53, 2.94, 5.05, 1.34, 0.74, -0.07, 1.07, 17.56, 1.11, 1.52, 6.57, 3.77, 0.75, 5.22, 1.14, 1.61, 1.63, 1.16, 0.33, 1.76, 4.75, 4.79, 0.38, 0.51, 1.46, 0.71, 1.21, 6.01, 5.41, 7.24]} \ No newline at end of file diff --git a/annotations_filtered/dLjnIpWhLZ4_filtered.json b/annotations_filtered/dLjnIpWhLZ4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..44f9b0b6d00a87bdd689a3801c27e78ce03203d5 --- /dev/null +++ b/annotations_filtered/dLjnIpWhLZ4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.23], [13.0, 14.66], [15.0, 16.78], [18.0, 19.25], [21.0, 21.81], [23.0, 26.54], [28.0, 30.86], [32.0, 35.75], [37.0, 38.04]], "keep_status": [true, false, false, false, false, true, false, false, false], "silence_prob": [37.5, 0.0, 0.0, 0.0, 0.0, 39.02, 77.36, 53.78, 0.0], "audiomae_on_audioset": [[["sidetone", 36.54], ["hum", 15.93], ["noise", 8.4]], null, null, null, null, [["speech", 28.59], ["fly, housefly", 12.65], ["insect", 9.91]], null, null, null], "duration": [4.23, 1.66, 1.78, 1.25, 0.81, 3.54, 2.86, 3.75, 1.04]} \ No newline at end of file diff --git a/annotations_filtered/dLpCZ8g5uK8_filtered.json b/annotations_filtered/dLpCZ8g5uK8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..efa1f8ab090fe56251a46992703604e56c717ed8 --- /dev/null +++ b/annotations_filtered/dLpCZ8g5uK8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 24.51], [39.0, 42.16], [43.0, 45.37], [54.0, 55.58], [56.0, 57.13], [59.0, 60.47], [64.0, 64.3], [68.0, 68.59], [70.0, 70.68], [77.0, 79.3], [82.0, 81.9], [84.0, 84.21], [91.0, 91.66], [93.0, 93.63], [95.0, 116.87], [119.0, 119.38], [122.0, 122.03]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 32.17, 44.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.39, 0.0, 0.0, 0.0, 0.0, 30.65, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 39.0], ["effects unit", 12.39], ["synthesizer", 9.25]], [["music", 40.9], ["synthesizer", 6.94], ["musical instrument", 6.65]], null, null, null, null, null, null, null, null, null, null, null, [["music", 55.24], ["hum", 10.54], ["synthesizer", 3.35]], null, null], "duration": [0.51, 3.16, 2.37, 1.58, 1.13, 1.47, 0.3, 0.59, 0.68, 2.3, -0.1, 0.21, 0.66, 0.63, 21.87, 0.38, 0.03]} \ No newline at end of file diff --git a/annotations_filtered/dLxtD4f_DA4_filtered.json b/annotations_filtered/dLxtD4f_DA4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c30e8b12060a57763a3f5e3a3efb5aca28ad4a5 --- /dev/null +++ b/annotations_filtered/dLxtD4f_DA4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.13], [4.0, 4.75], [6.0, 7.64], [8.0, 9.54], [10.0, 11.37], [13.0, 13.73], [15.0, 15.01], [16.0, 30.42], [30.0, 30.48], [31.0, 76.03], [77.0, 78.06], [79.0, 83.69], [86.0, 124.61], [128.0, 160.02], [163.0, 163.78]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.66, 0.0, 0.0, 0.0, 29.95, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["hum", 37.86], ["mains hum", 18.23], ["music", 10.44]], null, null, null, [["music", 25.52], ["hum", 10.82], ["cacophony", 5.16]], null, null, null], "duration": [1.13, 0.75, 1.64, 1.54, 1.37, 0.73, 0.01, 14.42, 0.48, 45.03, 1.06, 4.69, 38.61, 32.02, 0.78]} \ No newline at end of file diff --git a/annotations_filtered/dM6waznJ7No_filtered.json b/annotations_filtered/dM6waznJ7No_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8cab572d82a5b39f0f8cc5e14cb023240673d84a --- /dev/null +++ b/annotations_filtered/dM6waznJ7No_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 10.44], [11.0, 10.69], [11.0, 11.01], [11.0, 11.45], [12.0, 11.64], [12.0, 30.33], [36.0, 36.75]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [31.95, 0.0, 0.0, 0.0, 0.0, 30.42, 0.0], "audiomae_on_audioset": [[["music", 42.27], ["drum machine", 18.21], ["speech", 13.36]], null, null, null, null, [["music", 77.4], ["electronic music", 3.51], ["speech", 3.35]], null], "duration": [6.44, -0.31, 0.01, 0.45, -0.36, 18.33, 0.75]} \ No newline at end of file diff --git a/annotations_filtered/dME9-07ZvJI_filtered.json b/annotations_filtered/dME9-07ZvJI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9e399fec71e0dc69af6b1a63bbc48d6e9b6b33f --- /dev/null +++ b/annotations_filtered/dME9-07ZvJI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[46.0, 56.81], [59.0, 64.49], [65.0, 64.94], [65.0, 65.3], [66.0, 67.22], [71.0, 81.8], [82.0, 86.04], [88.0, 92.75], [93.0, 94.53], [96.0, 96.79], [99.0, 117.14], [118.0, 119.58], [123.0, 130.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [49.73, 33.67, 0.0, 0.0, 0.0, 38.11, 58.22, 35.95, 0.0, 0.0, 32.01, 0.0, 32.53], "audiomae_on_audioset": [[["music", 64.97], ["throbbing", 4.3], ["boing", 3.76]], [["music", 58.69], ["groan", 14.17], ["throbbing", 4.87]], null, null, null, [["music", 62.13], ["throbbing", 9.98], ["hum", 5.62]], null, [["hum", 34.03], ["throbbing", 29.57], ["music", 17.69]], null, null, [["music", 43.85], ["hum", 18.27], ["throbbing", 6.71]], null, [["music", 26.97], ["vehicle", 22.49], ["car", 12.44]]], "duration": [10.81, 5.49, -0.06, 0.3, 1.22, 10.8, 4.04, 4.75, 1.53, 0.79, 18.14, 1.58, 7.71]} \ No newline at end of file diff --git a/annotations_filtered/dMJolQgBp38_filtered.json b/annotations_filtered/dMJolQgBp38_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dbd2d6317ffa07a2349a90c37282a09951caa8af --- /dev/null +++ b/annotations_filtered/dMJolQgBp38_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.68], [15.0, 16.17], [18.0, 20.01], [23.0, 28.04], [31.0, 39.99], [42.0, 55.95], [59.0, 88.25], [89.0, 90.9], [93.0, 97.44], [98.0, 104.45]], "keep_status": [false, false, true, true, true, true, false, false, false, true], "silence_prob": [0.0, 0.0, 29.92, 48.39, 33.87, 35.13, 32.99, 0.0, 51.94, 33.08], "audiomae_on_audioset": [null, null, [["vehicle", 15.17], ["music", 4.97], ["speech", 4.71]], [["music", 51.67], ["throbbing", 8.14], ["hum", 7.51]], [["music", 49.91], ["throbbing", 12.03], ["hum", 7.82]], [["music", 29.02], ["mains hum", 19.36], ["hum", 18.86]], [["music", 61.43], ["speech", 7.08], ["hum", 3.85]], null, null, [["speech", 39.67], ["music", 17.93], ["explosion", 6.12]]], "duration": [0.68, 1.17, 2.01, 5.04, 8.99, 13.95, 29.25, 1.9, 4.44, 6.45]} \ No newline at end of file diff --git a/annotations_filtered/dMOQv0rb6DY_filtered.json b/annotations_filtered/dMOQv0rb6DY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..74372af13bb0db92ba3a3258568b4793a877b850 --- /dev/null +++ b/annotations_filtered/dMOQv0rb6DY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.2], [7.0, 7.91], [22.0, 22.28], [30.0, 31.16], [39.0, 44.0], [53.0, 54.36], [57.0, 73.48], [74.0, 76.37], [86.0, 100.8], [102.0, 103.2], [103.0, 110.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.44, 0.0, 32.78, 31.79, 31.91, 0.0, 31.21], "audiomae_on_audioset": [null, null, null, null, [["music", 68.91], ["singing", 4.32], ["musical instrument", 2.84]], null, [["music", 36.75], ["synthetic singing", 23.37], ["male singing", 11.94]], [["music", 69.68], ["a capella", 6.67], ["singing", 5.38]], [["music", 84.77], ["male singing", 2.37], ["musical instrument", 2.27]], null, [["music", 83.48], ["speech", 3.51], ["musical instrument", 3.01]]], "duration": [0.2, 0.91, 0.28, 1.16, 5.0, 1.36, 16.48, 2.37, 14.8, 1.2, 7.88]} \ No newline at end of file diff --git a/annotations_filtered/dN1RMOrtK7A_filtered.json b/annotations_filtered/dN1RMOrtK7A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2911ffbf5f48a40691d7968194e0b0d0e1bfd244 --- /dev/null +++ b/annotations_filtered/dN1RMOrtK7A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 14.0], [14.0, 20.65], [25.0, 36.49], [43.0, 45.25], [50.0, 53.11], [58.0, 59.09], [67.0, 70.09], [71.0, 71.1], [73.0, 74.02], [75.0, 77.33], [79.0, 79.79], [84.0, 84.7], [87.0, 87.39], [103.0, 103.71], [105.0, 105.6], [114.0, 119.8], [123.0, 122.81], [123.0, 123.65], [125.0, 125.15], [126.0, 125.86], [126.0, 125.98], [138.0, 138.27], [147.0, 147.88], [149.0, 150.21], [155.0, 154.89], [172.0, 175.34], [177.0, 182.38], [184.0, 187.49], [188.0, 196.94], [197.0, 197.61]], "keep_status": [false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [38.16, 36.95, 45.82, 48.78, 36.42, 0.0, 55.11, 0.0, 0.0, 39.17, 0.0, 0.0, 0.0, 0.0, 0.0, 29.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.3, 29.0, 28.56, 86.09, 0.0], "audiomae_on_audioset": [[["speech", 66.66], ["noise", 5.2], ["groan", 2.83]], [["speech", 61.64], ["hum", 11.94], ["music", 10.2]], [["hum", 29.34], ["whale vocalization", 17.54], ["music", 15.81]], [["speech", 30.9], ["sidetone", 30.49], ["music", 13.86]], [["sidetone", 53.17], ["speech", 23.75], ["sine wave", 3.62]], null, null, null, null, [["speech", 32.9], ["music", 17.41], ["hum", 9.26]], null, null, null, null, null, [["music", 26.54], ["hum", 19.85], ["mains hum", 12.72]], null, null, null, null, null, null, null, null, null, [["speech", 75.86], ["animal", 16.54], ["roaring cats (lions, tigers)", 2.64]], [["music", 55.41], ["speech", 11.64], ["electronic music", 2.32]], [["whale vocalization", 32.26], ["sound effect", 5.39], ["music", 5.11]], null, null], "duration": [5.0, 6.65, 11.49, 2.25, 3.11, 1.09, 3.09, 0.1, 1.02, 2.33, 0.79, 0.7, 0.39, 0.71, 0.6, 5.8, -0.19, 0.65, 0.15, -0.14, -0.02, 0.27, 0.88, 1.21, -0.11, 3.34, 5.38, 3.49, 8.94, 0.61]} \ No newline at end of file diff --git a/annotations_filtered/dN9rfJvFHgw_filtered.json b/annotations_filtered/dN9rfJvFHgw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..193689ff6b693866f449fe99bbd022c3ce24cdbb --- /dev/null +++ b/annotations_filtered/dN9rfJvFHgw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 18.6], [26.0, 26.94], [30.0, 31.02], [43.0, 43.51], [49.0, 57.32], [59.0, 59.26], [64.0, 68.94], [70.0, 130.82]], "keep_status": [false, false, false, false, true, false, true, false], "silence_prob": [38.74, 0.0, 0.0, 0.0, 44.55, 0.0, 33.87, 0.0], "audiomae_on_audioset": [[["music", 34.96], ["hum", 23.87], ["mains hum", 14.81]], null, null, null, [["music", 41.56], ["speech", 15.32], ["percussion", 7.85]], null, [["music", 25.3], ["throbbing", 18.71], ["hum", 16.72]], null], "duration": [11.6, 0.94, 1.02, 0.51, 8.32, 0.26, 4.94, 60.82]} \ No newline at end of file diff --git a/annotations_filtered/dNlMe4kU9TA_filtered.json b/annotations_filtered/dNlMe4kU9TA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17651e51374d93f65e1e922077bccf895e36012b --- /dev/null +++ b/annotations_filtered/dNlMe4kU9TA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[104.0, 104.95]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [0.95]} \ No newline at end of file diff --git a/annotations_filtered/dOTGLArtfrQ_filtered.json b/annotations_filtered/dOTGLArtfrQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f7b6a7a72756eb86a2d19d794579ef95e6fa0ad6 --- /dev/null +++ b/annotations_filtered/dOTGLArtfrQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 11.55], [16.0, 17.96], [19.0, 19.92], [23.0, 26.82], [30.0, 42.87], [45.0, 44.85], [48.0, 47.87], [49.0, 69.72], [71.0, 73.97], [78.0, 78.9], [81.0, 87.42], [89.0, 89.38], [91.0, 91.79], [93.0, 94.49], [96.0, 96.85], [98.0, 99.15], [103.0, 108.16], [112.0, 112.8], [116.0, 116.38], [117.0, 120.97], [122.0, 124.02]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, true], "silence_prob": [57.32, 0.0, 0.0, 74.44, 39.22, 0.0, 0.0, 31.73, 42.17, 0.0, 33.9, 0.0, 0.0, 0.0, 0.0, 0.0, 38.88, 0.0, 0.0, 42.08, 38.04], "audiomae_on_audioset": [null, null, null, null, [["music", 52.12], ["whack, thwack", 16.71], ["boing", 4.38]], null, null, [["music", 57.94], ["speech", 14.77], ["synthesizer", 3.33]], [["music", 54.74], ["synthesizer", 6.35], ["throbbing", 4.38]], null, [["music", 40.56], ["drum machine", 14.28], ["synthesizer", 8.31]], null, null, null, null, null, [["music", 43.26], ["sidetone", 17.26], ["speech", 11.87]], null, null, [["music", 70.75], ["synthesizer", 5.31], ["drum machine", 4.51]], [["music", 18.15], ["drum", 9.85], ["drum machine", 6.55]]], "duration": [4.55, 1.96, 0.92, 3.82, 12.87, -0.15, -0.13, 20.72, 2.97, 0.9, 6.42, 0.38, 0.79, 1.49, 0.85, 1.15, 5.16, 0.8, 0.38, 3.97, 2.02]} \ No newline at end of file diff --git a/annotations_filtered/dOZndhz24OA_filtered.json b/annotations_filtered/dOZndhz24OA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c27a9471014defc16a1444c33934c7412be2439 --- /dev/null +++ b/annotations_filtered/dOZndhz24OA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.08], [4.0, 7.94], [10.0, 14.64], [16.0, 23.31], [25.0, 25.68], [38.0, 60.15], [60.0, 61.77], [67.0, 77.28], [78.0, 80.16], [81.0, 81.38], [81.0, 82.53], [87.0, 92.18], [99.0, 99.12], [99.0, 101.44], [104.0, 105.48], [106.0, 108.94], [110.0, 112.13], [115.0, 116.09], [118.0, 118.54], [126.0, 129.22], [130.0, 135.11], [139.0, 139.73], [141.0, 144.39], [162.0, 171.86]], "keep_status": [false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, true, true, false, false, false, true, false, true, false], "silence_prob": [0.0, 80.29, 78.89, 31.15, 0.0, 29.95, 0.0, 38.4, 57.64, 0.0, 0.0, 29.84, 0.0, 29.43, 0.0, 29.39, 32.39, 0.0, 0.0, 50.31, 33.46, 0.0, 29.36, 29.68], "audiomae_on_audioset": [null, null, null, [["speech", 26.53], ["sidetone", 20.27], ["whack, thwack", 13.94]], null, [["sidetone", 47.51], ["speech", 12.4], ["music", 7.37]], null, [["music", 73.6], ["whale vocalization", 10.14], ["buzz", 1.92]], null, null, null, [["speech", 86.2], ["grunt", 1.99], ["beatboxing", 1.74]], null, [["speech", 78.11], ["boing", 3.72], ["grunt", 3.5]], null, [["speech", 51.87], ["music", 8.17], ["beatboxing", 7.49]], [["hum", 31.39], ["mains hum", 13.77], ["music", 12.99]], null, null, null, [["speech", 28.11], ["sidetone", 20.74], ["music", 10.44]], null, [["speech", 30.83], ["music", 15.12], ["grunt", 11.13]], [["speech", 51.41], ["grunt", 32.44], ["music", 5.24]]], "duration": [0.08, 3.94, 4.64, 7.31, 0.68, 22.15, 1.77, 10.28, 2.16, 0.38, 1.53, 5.18, 0.12, 2.44, 1.48, 2.94, 2.13, 1.09, 0.54, 3.22, 5.11, 0.73, 3.39, 9.86]} \ No newline at end of file diff --git a/annotations_filtered/dO_D5ilNoZA_filtered.json b/annotations_filtered/dO_D5ilNoZA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..00823fed6f0b1914fc03a88b4c5c894194d65b05 --- /dev/null +++ b/annotations_filtered/dO_D5ilNoZA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.62], [7.0, 8.68], [9.0, 12.19], [13.0, 18.01], [20.0, 46.53], [47.0, 49.47], [50.0, 56.69], [58.0, 58.92], [60.0, 61.6], [63.0, 63.95], [67.0, 94.86], [96.0, 96.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [96.04, 0.0, 93.13, 94.66, 35.18, 77.7, 93.45, 0.0, 0.0, 0.0, 84.07, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 45.85], ["speech", 33.84], ["crack", 3.48]], null, null, null, null, null, null, null], "duration": [3.62, 1.68, 3.19, 5.01, 26.53, 2.47, 6.69, 0.92, 1.6, 0.95, 27.86, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/dObTXYa-_n4_filtered.json b/annotations_filtered/dObTXYa-_n4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..522e6244213e417a47c3bef4ffccaf6564c83ee2 --- /dev/null +++ b/annotations_filtered/dObTXYa-_n4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[110.0, 111.91]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [1.91]} \ No newline at end of file diff --git a/annotations_filtered/dOnoBJvtVMU_filtered.json b/annotations_filtered/dOnoBJvtVMU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b3f712b98bd5ac2fbc9c64a50f30f0cc50e56755 --- /dev/null +++ b/annotations_filtered/dOnoBJvtVMU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.46], [3.0, 4.51], [5.0, 6.66], [9.0, 10.29], [11.0, 11.35], [12.0, 12.99], [14.0, 14.66], [17.0, 17.05], [17.0, 18.28], [20.0, 20.6], [21.0, 22.98], [23.0, 24.65], [25.0, 25.73], [28.0, 36.36], [37.0, 41.44], [43.0, 45.01], [46.0, 48.83], [50.0, 52.56], [53.0, 56.32], [59.0, 60.96], [62.0, 63.1], [64.0, 65.67], [66.0, 67.32], [68.0, 68.2], [72.0, 72.69], [73.0, 74.68], [76.0, 75.9], [80.0, 80.52], [83.0, 83.67], [84.0, 84.62], [86.0, 87.74], [89.0, 89.16], [90.0, 90.58], [93.0, 94.91], [97.0, 100.43], [101.0, 101.61], [104.0, 105.73], [107.0, 108.48], [111.0, 112.77], [114.0, 114.94], [115.0, 115.89], [117.0, 117.71], [118.0, 118.5], [120.0, 119.97], [121.0, 120.68], [121.0, 121.36], [122.0, 122.76], [123.0, 123.65], [127.0, 128.06], [129.0, 129.37], [130.0, 130.59], [132.0, 133.07], [135.0, 136.11], [137.0, 138.13], [140.0, 141.07], [142.0, 142.18], [144.0, 144.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.37, 35.86, 45.18, 73.82, 62.89, 65.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 15.56], ["bow-wow", 11.25], ["mains hum", 9.63]], [["cattle, bovinae", 37.92], ["moo", 34.71], ["livestock, farm animals, working animals", 25.87]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 31.06], ["sidetone", 20.41], ["radio", 11.58]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.46, 1.51, 1.66, 1.29, 0.35, 0.99, 0.66, 0.05, 1.28, 0.6, 1.98, 1.65, 0.73, 8.36, 4.44, 2.01, 2.83, 2.56, 3.32, 1.96, 1.1, 1.67, 1.32, 0.2, 0.69, 1.68, -0.1, 0.52, 0.67, 0.62, 1.74, 0.16, 0.58, 1.91, 3.43, 0.61, 1.73, 1.48, 1.77, 0.94, 0.89, 0.71, 0.5, -0.03, -0.32, 0.36, 0.76, 0.65, 1.06, 0.37, 0.59, 1.07, 1.11, 1.13, 1.07, 0.18, 0.21]} \ No newline at end of file diff --git a/annotations_filtered/dOzGnmkbahw_filtered.json b/annotations_filtered/dOzGnmkbahw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1cc11fa931378bd7ba102c2786330c64a12c3c40 --- /dev/null +++ b/annotations_filtered/dOzGnmkbahw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.38], [20.0, 20.56], [21.0, 28.93], [34.0, 34.18], [35.0, 45.32], [49.0, 49.55], [50.0, 53.37], [54.0, 54.63], [59.0, 61.2], [64.0, 66.51], [70.0, 69.96], [70.0, 70.09], [71.0, 71.63], [77.0, 77.58], [83.0, 84.27], [90.0, 91.12], [97.0, 101.51], [103.0, 103.38], [105.0, 105.6], [108.0, 108.67], [111.0, 111.62], [112.0, 112.94], [114.0, 115.47], [118.0, 119.6], [122.0, 122.99], [124.0, 130.17]], "keep_status": [false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 28.28, 0.0, 28.84, 0.0, 28.79, 0.0, 47.78, 30.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.48], "audiomae_on_audioset": [null, null, [["music", 66.77], ["boom", 4.19], ["machine gun", 3.13]], null, [["speech", 60.1], ["music", 9.23], ["sound effect", 4.43]], null, [["speech", 25.68], ["whack, thwack", 10.56], ["thump, thud", 8.24]], null, [["chirp tone", 40.63], ["sine wave", 29.66], ["hum", 6.87]], [["breaking", 24.59], ["whale vocalization", 13.32], ["music", 11.31]], null, null, null, null, null, null, [["music", 44.03], ["hum", 31.47], ["throbbing", 4.83]], null, null, null, null, null, null, null, null, [["mains hum", 56.97], ["hum", 33.95], ["music", 3.37]]], "duration": [0.38, 0.56, 7.93, 0.18, 10.32, 0.55, 3.37, 0.63, 2.2, 2.51, -0.04, 0.09, 0.63, 0.58, 1.27, 1.12, 4.51, 0.38, 0.6, 0.67, 0.62, 0.94, 1.47, 1.6, 0.99, 6.17]} \ No newline at end of file diff --git a/annotations_filtered/dPKG3WMkMxQ_filtered.json b/annotations_filtered/dPKG3WMkMxQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f6d2aebcd1252cb03d8fda4be49e8f38780854c9 --- /dev/null +++ b/annotations_filtered/dPKG3WMkMxQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[63.0, 80.81], [87.0, 94.73], [98.0, 122.72]], "keep_status": [false, true, false], "silence_prob": [30.55, 31.27, 30.62], "audiomae_on_audioset": [[["music", 62.87], ["hum", 8.81], ["throbbing", 6.01]], [["music", 34.91], ["hum", 19.07], ["mains hum", 14.44]], [["music", 69.68], ["breaking", 3.87], ["boom", 2.72]]], "duration": [17.81, 7.73, 24.72]} \ No newline at end of file diff --git a/annotations_filtered/dPXGowa6p3Y_filtered.json b/annotations_filtered/dPXGowa6p3Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..800342a5f79db026c6f8a11699482e90c1bea3e4 --- /dev/null +++ b/annotations_filtered/dPXGowa6p3Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.9], [14.0, 14.76], [16.0, 16.14], [17.0, 17.25], [19.0, 25.62], [27.0, 27.31], [31.0, 35.67], [39.0, 39.78], [42.0, 45.71], [49.0, 56.91], [57.0, 59.71], [60.0, 64.02], [66.0, 66.92], [71.0, 71.25], [78.0, 78.33], [80.0, 81.84]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 92.64, 0.0, 65.67, 0.0, 83.34, 47.43, 62.17, 100.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 41.86], ["fart", 10.13], ["arrow", 9.06]], null, null, null, null, null, null], "duration": [0.9, 0.76, 0.14, 0.25, 6.62, 0.31, 4.67, 0.78, 3.71, 7.91, 2.71, 4.02, 0.92, 0.25, 0.33, 1.84]} \ No newline at end of file diff --git a/annotations_filtered/dPi40lQetew_filtered.json b/annotations_filtered/dPi40lQetew_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..26b4941e134c77525f180ba5a8baec57a488fc7f --- /dev/null +++ b/annotations_filtered/dPi40lQetew_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.72], [9.0, 10.77], [13.0, 16.48], [18.0, 18.69], [19.0, 39.34], [40.0, 41.52], [43.0, 44.29], [48.0, 49.35], [53.0, 54.63], [56.0, 55.98], [57.0, 58.23], [59.0, 59.95], [61.0, 61.72], [63.0, 63.59], [65.0, 65.25], [69.0, 70.61], [72.0, 72.93], [76.0, 76.92], [82.0, 82.09], [83.0, 84.65], [86.0, 86.61], [88.0, 88.05], [90.0, 91.83], [96.0, 97.61], [100.0, 100.72], [102.0, 102.54], [103.0, 104.06], [105.0, 109.38], [111.0, 113.05], [114.0, 114.07], [116.0, 118.88], [121.0, 123.75]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [30.76, 0.0, 31.03, 0.0, 30.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.07, 94.81, 0.0, 49.73, 40.97], "audiomae_on_audioset": [[["speech", 64.44], ["sidetone", 14.53], ["radio", 3.96]], null, [["cattle, bovinae", 43.24], ["moo", 40.13], ["livestock, farm animals, working animals", 8.13]], null, [["motorboat, speedboat", 14.6], ["boat, water vehicle", 13.08], ["fly, housefly", 10.1]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["vehicle", 30.96], ["hum", 11.27], ["car", 4.93]], [["speech", 22.6], ["sine wave", 16.94], ["sidetone", 16.2]]], "duration": [3.72, 1.77, 3.48, 0.69, 20.34, 1.52, 1.29, 1.35, 1.63, -0.02, 1.23, 0.95, 0.72, 0.59, 0.25, 1.61, 0.93, 0.92, 0.09, 1.65, 0.61, 0.05, 1.83, 1.61, 0.72, 0.54, 1.06, 4.38, 2.05, 0.07, 2.88, 2.75]} \ No newline at end of file diff --git a/annotations_filtered/dPk7S_LiI1I_filtered.json b/annotations_filtered/dPk7S_LiI1I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..87c61b1e5fd1a8a1641e2112658429356039a4b1 --- /dev/null +++ b/annotations_filtered/dPk7S_LiI1I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.24], [10.0, 10.13], [13.0, 13.32], [15.0, 15.43], [16.0, 16.33], [18.0, 18.99], [21.0, 21.46], [23.0, 23.3], [25.0, 26.4], [28.0, 28.22], [33.0, 33.3], [35.0, 35.01], [36.0, 36.95], [40.0, 40.78], [41.0, 43.34], [47.0, 47.88], [54.0, 55.21], [75.0, 84.97], [86.0, 86.85], [88.0, 88.42], [98.0, 98.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.95, 0.0, 0.0, 35.69, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 22.56], ["creak", 14.86], ["radio", 9.41]], null, null, [["speech", 55.64], ["sidetone", 6.43], ["explosion", 6.19]], null, null, null], "duration": [1.24, 0.13, 0.32, 0.43, 0.33, 0.99, 0.46, 0.3, 1.4, 0.22, 0.3, 0.01, 0.95, 0.78, 2.34, 0.88, 1.21, 9.97, 0.85, 0.42, 0.58]} \ No newline at end of file diff --git a/annotations_filtered/dQ0sgbvSQAk_filtered.json b/annotations_filtered/dQ0sgbvSQAk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..51e8ff17dc032fe15c7546a463d925ef421688e3 --- /dev/null +++ b/annotations_filtered/dQ0sgbvSQAk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.22], [6.0, 6.88], [14.0, 14.86], [20.0, 19.87], [24.0, 23.94], [25.0, 39.85], [41.0, 49.99], [53.0, 54.04], [54.0, 57.87], [59.0, 60.12], [63.0, 63.46], [65.0, 65.89], [68.0, 69.04], [69.0, 70.61], [71.0, 94.19], [96.0, 98.02], [100.0, 100.7], [102.0, 103.38], [106.0, 112.33], [113.0, 120.02], [123.0, 123.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 87.74, 71.72, 0.0, 85.54, 0.0, 0.0, 0.0, 0.0, 0.0, 49.64, 100.0, 0.0, 0.0, 99.95, 97.92, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["thunk", 27.17], ["livestock, farm animals, working animals", 8.11], ["groan", 6.17]], null, null, null, null, null, null], "duration": [1.22, 0.88, 0.86, -0.13, -0.06, 14.85, 8.99, 1.04, 3.87, 1.12, 0.46, 0.89, 1.04, 1.61, 23.19, 2.02, 0.7, 1.38, 6.33, 7.02, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/dQNrOoc3NTA_filtered.json b/annotations_filtered/dQNrOoc3NTA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..96eef079bb1de7851ac0d0c894892d3b72f54921 --- /dev/null +++ b/annotations_filtered/dQNrOoc3NTA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 25.35], [26.0, 27.09], [28.0, 28.85], [30.0, 32.36], [33.0, 33.93], [35.0, 37.05], [37.0, 38.8], [42.0, 44.22], [45.0, 46.52], [48.0, 58.29], [59.0, 63.8], [71.0, 109.0], [112.0, 132.98], [135.0, 135.28], [136.0, 137.71], [139.0, 139.28], [141.0, 141.44], [144.0, 144.69], [146.0, 147.61], [148.0, 148.59]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 45.49, 0.0, 41.05, 0.0, 42.51, 0.0, 66.39, 78.89, 0.0, 43.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["whale vocalization", 54.68], ["music", 12.52], ["livestock, farm animals, working animals", 2.98]], null, [["music", 32.69], ["speech", 17.17], ["hum", 10.36]], null, [["mains hum", 39.7], ["music", 19.27], ["hum", 18.42]], null, null, null, null, [["music", 65.44], ["whale vocalization", 10.63], ["didgeridoo", 2.97]], null, null, null, null, null, null, null], "duration": [0.35, 1.09, 0.85, 2.36, 0.93, 2.05, 1.8, 2.22, 1.52, 10.29, 4.8, 38.0, 20.98, 0.28, 1.71, 0.28, 0.44, 0.69, 1.61, 0.59]} \ No newline at end of file diff --git a/annotations_filtered/dQQd6s5gYhk_filtered.json b/annotations_filtered/dQQd6s5gYhk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..deacf0d06bb12922a3b95e3f4a01d96e3d500d3f --- /dev/null +++ b/annotations_filtered/dQQd6s5gYhk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.59], [23.0, 24.88], [26.0, 30.42], [31.0, 33.15], [36.0, 37.27], [46.0, 46.2], [47.0, 46.7], [49.0, 49.44], [53.0, 54.21], [62.0, 62.09], [63.0, 63.88], [65.0, 66.33], [69.0, 70.14], [73.0, 73.31], [77.0, 80.18], [81.0, 82.27], [95.0, 97.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 99.99, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.26, 0.0, 42.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 54.13], ["ping", 8.59], ["music", 7.51]], null, [["speech", 31.62], ["music", 15.27], ["sine wave", 14.62]]], "duration": [0.59, 1.88, 4.42, 2.15, 1.27, 0.2, -0.3, 0.44, 1.21, 0.09, 0.88, 1.33, 1.14, 0.31, 3.18, 1.27, 2.01]} \ No newline at end of file diff --git a/annotations_filtered/dQRfWqSj3Gw_filtered.json b/annotations_filtered/dQRfWqSj3Gw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..847c5e9c7d1c2df738b6235eca15653cb65c292b --- /dev/null +++ b/annotations_filtered/dQRfWqSj3Gw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.48], [21.0, 48.69], [50.0, 56.84], [61.0, 82.78], [84.0, 84.27], [95.0, 94.59], [96.0, 96.26]], "keep_status": [false, false, true, false, false, false, false], "silence_prob": [0.0, 32.97, 30.98, 32.19, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 68.46], ["hum", 3.8], ["throbbing", 3.7]], [["music", 29.21], ["throbbing", 20.22], ["hum", 10.58]], [["buzz", 31.29], ["music", 29.12], ["fart", 10.94]], null, null, null], "duration": [0.48, 27.69, 6.84, 21.78, 0.27, -0.41, 0.26]} \ No newline at end of file diff --git a/annotations_filtered/dQSK2gmtNMI_filtered.json b/annotations_filtered/dQSK2gmtNMI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..745153b54a902353eb85a626746eacbca641488c --- /dev/null +++ b/annotations_filtered/dQSK2gmtNMI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.21], [8.0, 9.42], [12.0, 12.72], [15.0, 15.31], [17.0, 17.56], [29.0, 29.81], [40.0, 40.07], [52.0, 53.3], [62.0, 61.7], [77.0, 78.73], [81.0, 81.7], [84.0, 86.17], [88.0, 88.77], [91.0, 92.2], [105.0, 108.77], [115.0, 116.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.53, 0.0, 0.0, 31.05, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 37.86], ["static", 9.89], ["hum", 7.69]], null], "duration": [1.21, 1.42, 0.72, 0.31, 0.56, 0.81, 0.07, 1.3, -0.3, 1.73, 0.7, 2.17, 0.77, 1.2, 3.77, 1.55]} \ No newline at end of file diff --git a/annotations_filtered/dQUjkTOrAn4_filtered.json b/annotations_filtered/dQUjkTOrAn4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a573094673cab5f63d954cf7de6e47e487c0c143 --- /dev/null +++ b/annotations_filtered/dQUjkTOrAn4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.26], [23.0, 24.29], [29.0, 29.57], [35.0, 35.4], [36.0, 41.44], [56.0, 81.04], [82.0, 82.75], [84.0, 83.98], [89.0, 89.9], [90.0, 93.5], [94.0, 93.53], [95.0, 95.1], [99.0, 106.79], [109.0, 109.39], [112.0, 112.72], [119.0, 119.3], [121.0, 125.56], [127.0, 129.54], [131.0, 132.93], [141.0, 141.25], [142.0, 143.46], [145.0, 148.41], [150.0, 151.17], [154.0, 162.97], [164.0, 165.81], [167.0, 168.24], [170.0, 171.14], [172.0, 172.79], [174.0, 176.69]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.27, 36.98, 0.0, 0.0, 0.0, 43.28, 0.0, 0.0, 46.43, 0.0, 0.0, 0.0, 48.23, 95.37, 0.0, 0.0, 0.0, 79.41, 0.0, 74.13, 0.0, 0.0, 0.0, 0.0, 64.63], "audiomae_on_audioset": [null, null, null, null, [["speech", 74.65], ["wail, moan", 11.48], ["screaming", 3.49]], [["speech", 40.25], ["moo", 14.29], ["cattle, bovinae", 13.9]], null, null, null, [["fly, housefly", 33.4], ["bee, wasp, etc.", 19.01], ["speech", 14.11]], null, null, [["speech", 70.16], ["whale vocalization", 6.55], ["vehicle", 3.99]], null, null, null, [["speech", 30.04], ["insect", 14.75], ["fly, housefly", 12.43]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.26, 1.29, 0.57, 0.4, 5.44, 25.04, 0.75, -0.02, 0.9, 3.5, -0.47, 0.1, 7.79, 0.39, 0.72, 0.3, 4.56, 2.54, 1.93, 0.25, 1.46, 3.41, 1.17, 8.97, 1.81, 1.24, 1.14, 0.79, 2.69]} \ No newline at end of file diff --git a/annotations_filtered/dQbpx5Be5rI_filtered.json b/annotations_filtered/dQbpx5Be5rI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7125c64520ec47c8ef67c6147d3fdd1b6ae4d9ec --- /dev/null +++ b/annotations_filtered/dQbpx5Be5rI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.01], [9.0, 11.16], [14.0, 14.13], [31.0, 31.51], [45.0, 50.82], [52.0, 51.87], [53.0, 54.21], [57.0, 57.27], [58.0, 62.92], [71.0, 70.88], [72.0, 75.24], [78.0, 81.4], [81.0, 82.98], [84.0, 84.84], [94.0, 94.32], [102.0, 102.76], [103.0, 103.72], [115.0, 118.1], [119.0, 122.42], [123.0, 124.07], [126.0, 126.72], [130.0, 130.52]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [31.4, 32.98, 0.0, 0.0, 43.13, 0.0, 0.0, 0.0, 46.19, 0.0, 34.53, 32.43, 0.0, 0.0, 0.0, 0.0, 0.0, 46.12, 52.33, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 48.35], ["vehicle", 9.55], ["car", 8.15]], [["speech", 75.53], ["vehicle", 2.54], ["throbbing", 1.55]], null, null, [["telephone", 86.86], ["telephone bell ringing", 4.51], ["telephone dialing, dtmf", 2.38]], null, null, null, [["rumble", 41.78], ["hum", 21.36], ["throbbing", 15.83]], null, [["speech", 65.45], ["sidetone", 13.29], ["hum", 2.17]], [["speech", 40.58], ["music", 17.77], ["sidetone", 12.51]], null, null, null, null, null, [["speech", 46.15], ["hum", 7.29], ["busy signal", 5.6]], null, null, null, null], "duration": [5.01, 2.16, 0.13, 0.51, 5.82, -0.13, 1.21, 0.27, 4.92, -0.12, 3.24, 3.4, 1.98, 0.84, 0.32, 0.76, 0.72, 3.1, 3.42, 1.07, 0.72, 0.52]} \ No newline at end of file diff --git a/annotations_filtered/dQoqvTs4lvg_filtered.json b/annotations_filtered/dQoqvTs4lvg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..51eb0529d8da90f5bcba36f31c90293a20b136e6 --- /dev/null +++ b/annotations_filtered/dQoqvTs4lvg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.73], [3.0, 3.5], [21.0, 22.96], [26.0, 27.36], [29.0, 30.92]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [0.73, 0.5, 1.96, 1.36, 1.92]} \ No newline at end of file diff --git a/annotations_filtered/dR0_tMYKwXE_filtered.json b/annotations_filtered/dR0_tMYKwXE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e2f595c758b22db8c6117529a940bef8ee70bdc --- /dev/null +++ b/annotations_filtered/dR0_tMYKwXE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.63], [6.0, 9.46], [10.0, 14.3], [15.0, 16.48], [32.0, 32.78], [37.0, 38.16], [54.0, 54.51], [71.0, 71.0], [73.0, 73.67], [80.0, 79.88], [109.0, 109.59], [112.0, 112.36], [116.0, 116.33], [119.0, 118.99], [121.0, 122.0], [127.0, 127.57], [132.0, 132.61], [134.0, 133.98], [142.0, 142.91], [144.0, 145.74], [146.0, 149.93], [150.0, 159.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.26, 99.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.76, 99.95], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.63, 3.46, 4.3, 1.48, 0.78, 1.16, 0.51, 0.0, 0.67, -0.12, 0.59, 0.36, 0.33, -0.01, 1.0, 0.57, 0.61, -0.02, 0.91, 1.74, 3.93, 9.41]} \ No newline at end of file diff --git a/annotations_filtered/dR3cjXncoSk_filtered.json b/annotations_filtered/dR3cjXncoSk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb72b0a56673a9d3770fd7005c9e6983f434215b --- /dev/null +++ b/annotations_filtered/dR3cjXncoSk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 11.43], [12.0, 12.66], [17.0, 17.29], [18.0, 18.47], [27.0, 30.13], [34.0, 42.2], [42.0, 55.98], [63.0, 76.96], [79.0, 84.5], [85.0, 85.43], [86.0, 88.33], [89.0, 89.48], [91.0, 95.57], [97.0, 119.75], [120.0, 120.72], [122.0, 130.23], [132.0, 136.8], [139.0, 139.24], [145.0, 145.13], [149.0, 155.09], [164.0, 170.92], [173.0, 176.01], [183.0, 183.56], [185.0, 186.56], [188.0, 188.65], [189.0, 194.14], [195.0, 198.83]], "keep_status": [true, false, false, false, true, true, true, false, false, false, false, false, true, false, false, true, false, false, false, true, true, true, false, false, false, false, false], "silence_prob": [41.24, 0.0, 0.0, 0.0, 36.91, 45.52, 30.58, 29.67, 31.5, 0.0, 31.26, 0.0, 29.66, 28.89, 0.0, 28.7, 29.29, 0.0, 0.0, 31.77, 29.37, 32.42, 0.0, 0.0, 0.0, 32.77, 69.2], "audiomae_on_audioset": [[["hum", 23.32], ["noise", 15.92], ["throbbing", 10.42]], null, null, null, [["speech", 26.39], ["sidetone", 24.52], ["hum", 11.47]], [["frog", 17.13], ["hum", 16.34], ["music", 15.79]], [["music", 32.42], ["throbbing", 16.42], ["cacophony", 5.56]], [["speech", 54.33], ["music", 30.88], ["explosion", 1.79]], [["music", 49.2], ["speech", 16.72], ["electronic music", 5.47]], null, [["speech", 66.05], ["music", 21.63], ["helicopter", 2.51]], null, [["speech", 36.16], ["music", 15.17], ["hum", 11.75]], [["music", 39.68], ["speech", 34.04], ["buzz", 2.8]], null, [["music", 22.7], ["speech", 17.56], ["electric shaver, electric razor", 7.37]], [["livestock, farm animals, working animals", 43.6], ["cattle, bovinae", 27.42], ["moo", 21.45]], null, null, [["music", 34.1], ["speech", 22.32], ["fart", 10.19]], [["music", 33.68], ["speech", 14.72], ["hum", 9.68]], [["music", 49.18], ["speech", 13.24], ["explosion", 4.04]], null, null, null, [["clang", 43.54], ["ding", 40.26], ["fly, housefly", 1.62]], null], "duration": [7.43, 0.66, 0.29, 0.47, 3.13, 8.2, 13.98, 13.96, 5.5, 0.43, 2.33, 0.48, 4.57, 22.75, 0.72, 8.23, 4.8, 0.24, 0.13, 6.09, 6.92, 3.01, 0.56, 1.56, 0.65, 5.14, 3.83]} \ No newline at end of file diff --git a/annotations_filtered/dRTKQQtFoRU_filtered.json b/annotations_filtered/dRTKQQtFoRU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bdec40d81fbaa8de59201c7e6a00955c82ed45d6 --- /dev/null +++ b/annotations_filtered/dRTKQQtFoRU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 24.92], [32.0, 33.0], [38.0, 51.54], [52.0, 55.04], [57.0, 58.82], [59.0, 69.62], [70.0, 73.28], [74.0, 76.1], [77.0, 79.54], [80.0, 81.21], [82.0, 82.68], [83.0, 84.25], [86.0, 86.83], [88.0, 94.59], [95.0, 96.36], [97.0, 98.44], [107.0, 130.77]], "keep_status": [false, false, true, false, false, true, false, true, false, false, false, false, false, false, false, false, true], "silence_prob": [37.91, 0.0, 48.95, 54.43, 0.0, 48.39, 56.93, 48.91, 52.16, 0.0, 0.0, 0.0, 0.0, 41.01, 0.0, 0.0, 35.0], "audiomae_on_audioset": [[["hum", 36.42], ["mains hum", 27.94], ["buzz", 7.98]], null, [["hum", 38.49], ["mains hum", 14.66], ["music", 12.07]], null, null, [["mains hum", 22.89], ["hum", 16.43], ["livestock, farm animals, working animals", 13.42]], null, [["sine wave", 35.87], ["hum", 26.81], ["mains hum", 6.63]], null, null, null, null, null, [["frog", 55.29], ["didgeridoo", 11.61], ["animal", 3.73]], null, null, [["speech", 53.42], ["eruption", 8.02], ["sidetone", 5.64]]], "duration": [15.92, 1.0, 13.54, 3.04, 1.82, 10.62, 3.28, 2.1, 2.54, 1.21, 0.68, 1.25, 0.83, 6.59, 1.36, 1.44, 23.77]} \ No newline at end of file diff --git a/annotations_filtered/dRVq4Um7E5Q_filtered.json b/annotations_filtered/dRVq4Um7E5Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f2bdd6ea629ead4615199007a0d176ced633c895 --- /dev/null +++ b/annotations_filtered/dRVq4Um7E5Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 15.01], [17.0, 31.8], [32.0, 34.48], [35.0, 65.74], [67.0, 72.03], [74.0, 82.09], [85.0, 85.43], [88.0, 88.38], [91.0, 93.01], [95.0, 94.69], [99.0, 99.13], [100.0, 132.61], [135.0, 139.14], [143.0, 145.29], [146.0, 152.39], [154.0, 161.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [69.88, 35.91, 77.03, 0.0, 63.42, 96.54, 0.0, 0.0, 62.78, 0.0, 0.0, 0.0, 50.11, 99.9, 97.83, 89.9], "audiomae_on_audioset": [null, [["music", 39.96], ["neigh, whinny", 21.15], ["horse", 21.1]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [9.01, 14.8, 2.48, 30.74, 5.03, 8.09, 0.43, 0.38, 2.01, -0.31, 0.13, 32.61, 4.14, 2.29, 6.39, 7.59]} \ No newline at end of file diff --git a/annotations_filtered/dRz8OjNEtaI_filtered.json b/annotations_filtered/dRz8OjNEtaI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..acebb2a2f50a299b21b9f9ffa6ea00f75dee95ca --- /dev/null +++ b/annotations_filtered/dRz8OjNEtaI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 23.14], [25.0, 78.26]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [1.14, 53.26]} \ No newline at end of file diff --git a/annotations_filtered/dSRxB66FLV4_filtered.json b/annotations_filtered/dSRxB66FLV4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b973553f681ab9cb08d8fedb48c1b7f71b9fd57b --- /dev/null +++ b/annotations_filtered/dSRxB66FLV4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.8], [9.0, 9.19], [11.0, 11.01], [17.0, 17.74], [18.0, 18.77], [19.0, 20.63], [21.0, 22.42], [24.0, 27.11], [33.0, 34.45], [38.0, 38.58], [41.0, 40.59], [41.0, 42.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.51, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.2, 0.19, 0.01, 0.74, 0.77, 1.63, 1.42, 3.11, 1.45, 0.58, -0.41, 1.4]} \ No newline at end of file diff --git a/annotations_filtered/dSdY41CWixQ_filtered.json b/annotations_filtered/dSdY41CWixQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd5c0221286b62b97dd062b960a5e9e17f06cf8d --- /dev/null +++ b/annotations_filtered/dSdY41CWixQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.37], [15.0, 16.71], [23.0, 23.33], [38.0, 39.18], [40.0, 41.72], [49.0, 49.18], [55.0, 55.58], [59.0, 59.54], [60.0, 61.91], [64.0, 68.18], [71.0, 71.93], [73.0, 81.16], [82.0, 88.87], [93.0, 98.61], [101.0, 103.52], [114.0, 118.52], [119.0, 122.5], [129.0, 129.74], [131.0, 132.39], [135.0, 144.66], [145.0, 145.83], [154.0, 169.32], [171.0, 173.53], [177.0, 177.53], [179.0, 178.87], [180.0, 180.05], [180.0, 180.86], [186.0, 189.31], [199.0, 200.13], [202.0, 203.12], [204.0, 206.04], [215.0, 216.55]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.74, 0.0, 28.9, 29.35, 84.62, 65.91, 52.86, 49.68, 0.0, 0.0, 31.92, 0.0, 30.31, 31.39, 0.0, 0.0, 0.0, 0.0, 32.44, 0.0, 0.0, 51.71, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 32.01], ["music", 19.01], ["foghorn", 5.19]], null, [["moo", 17.47], ["cattle, bovinae", 16.16], ["buzz", 14.03]], [["thunk", 70.77], ["whack, thwack", 13.6], ["speech", 5.89]], null, null, null, [["hoot", 34.42], ["owl", 15.95], ["music", 14.12]], null, null, [["music", 83.72], ["speech", 4.47], ["groan", 1.85]], null, [["music", 37.3], ["speech", 21.88], ["hum", 7.85]], [["moo", 34.93], ["livestock, farm animals, working animals", 32.13], ["cattle, bovinae", 28.67]], null, null, null, null, [["fart", 41.16], ["speech", 15.68], ["fly, housefly", 10.75]], null, null, null, null], "duration": [1.37, 1.71, 0.33, 1.18, 1.72, 0.18, 0.58, 0.54, 1.91, 4.18, 0.93, 8.16, 6.87, 5.61, 2.52, 4.52, 3.5, 0.74, 1.39, 9.66, 0.83, 15.32, 2.53, 0.53, -0.13, 0.05, 0.86, 3.31, 1.13, 1.12, 2.04, 1.55]} \ No newline at end of file diff --git a/annotations_filtered/dShmoHD7PdM_filtered.json b/annotations_filtered/dShmoHD7PdM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18a0cc24f2b766dab96281ede37e716869e3ffec --- /dev/null +++ b/annotations_filtered/dShmoHD7PdM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 14.45], [20.0, 20.48], [22.0, 24.85], [27.0, 27.95], [29.0, 29.29], [31.0, 31.83], [33.0, 34.96], [37.0, 37.42], [39.0, 39.66], [42.0, 42.87], [46.0, 47.85], [50.0, 50.5], [52.0, 53.35], [60.0, 60.81], [64.0, 65.77], [68.0, 68.81], [73.0, 74.87], [77.0, 78.63], [82.0, 84.08], [88.0, 89.21], [91.0, 91.86], [93.0, 94.88], [95.0, 96.18], [97.0, 97.93], [102.0, 102.76], [104.0, 104.55], [106.0, 106.81], [107.0, 107.84], [110.0, 110.71], [113.0, 114.81], [117.0, 117.63], [119.0, 120.51], [121.0, 121.76], [124.0, 124.88], [128.0, 128.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [94.66, 0.0, 99.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.45, 0.48, 2.85, 0.95, 0.29, 0.83, 1.96, 0.42, 0.66, 0.87, 1.85, 0.5, 1.35, 0.81, 1.77, 0.81, 1.87, 1.63, 2.08, 1.21, 0.86, 1.88, 1.18, 0.93, 0.76, 0.55, 0.81, 0.84, 0.71, 1.81, 0.63, 1.51, 0.76, 0.88, 0.31]} \ No newline at end of file diff --git a/annotations_filtered/dSpTTf_dzDI_filtered.json b/annotations_filtered/dSpTTf_dzDI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6192b6f803e9cec18b7307651858cd105889d89a --- /dev/null +++ b/annotations_filtered/dSpTTf_dzDI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 18.82], [20.0, 44.09], [47.0, 71.47]], "keep_status": [false, true, false], "silence_prob": [30.39, 31.09, 30.57], "audiomae_on_audioset": [[["music", 65.7], ["musical instrument", 7.74], ["didgeridoo", 4.6]], [["speech", 43.95], ["hum", 12.06], ["music", 8.99]], [["music", 60.19], ["skidding", 5.58], ["vehicle", 4.44]]], "duration": [11.82, 24.09, 24.47]} \ No newline at end of file diff --git a/annotations_filtered/dStxLpnwvWs_filtered.json b/annotations_filtered/dStxLpnwvWs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d57c6a17e22c81a65111952b2759cdeb1a1e4eaf --- /dev/null +++ b/annotations_filtered/dStxLpnwvWs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.45], [9.0, 10.05], [11.0, 14.44], [15.0, 16.97], [18.0, 21.93], [27.0, 27.55], [32.0, 33.51], [36.0, 39.29], [40.0, 51.83], [55.0, 56.12], [60.0, 60.66], [63.0, 64.47], [69.0, 69.11], [73.0, 125.32], [126.0, 127.75], [134.0, 136.78], [140.0, 144.09], [149.0, 148.95], [149.0, 149.15], [152.0, 154.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 53.16, 0.0, 90.78, 0.0, 0.0, 98.1, 70.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.33, 87.19, 0.0, 0.0, 94.66], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.45, 1.05, 3.44, 1.97, 3.93, 0.55, 1.51, 3.29, 11.83, 1.12, 0.66, 1.47, 0.11, 52.32, 1.75, 2.78, 4.09, -0.05, 0.15, 2.23]} \ No newline at end of file diff --git a/annotations_filtered/dTM13gYxkoQ_filtered.json b/annotations_filtered/dTM13gYxkoQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e4a6f9be943adf07f9384f6e265311fd15893c7 --- /dev/null +++ b/annotations_filtered/dTM13gYxkoQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 17.34], [23.0, 24.75], [26.0, 26.65], [28.0, 28.19], [34.0, 36.04], [37.0, 37.81], [39.0, 41.96], [42.0, 42.35], [43.0, 45.1], [49.0, 50.45], [55.0, 55.27], [57.0, 74.41], [76.0, 76.08], [76.0, 77.19], [78.0, 78.16], [78.0, 83.35], [86.0, 92.13], [93.0, 99.66], [102.0, 102.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [96.42, 0.0, 0.0, 0.0, 99.97, 0.0, 66.15, 0.0, 81.71, 0.0, 0.0, 84.25, 0.0, 0.0, 0.0, 84.07, 60.32, 62.89, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.34, 1.75, 0.65, 0.19, 2.04, 0.81, 2.96, 0.35, 2.1, 1.45, 0.27, 17.41, 0.08, 1.19, 0.16, 5.35, 6.13, 6.66, 0.32]} \ No newline at end of file diff --git a/annotations_filtered/dTSXhhHDOk0_filtered.json b/annotations_filtered/dTSXhhHDOk0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b2c686fece23dd96247006429977c2d763873566 --- /dev/null +++ b/annotations_filtered/dTSXhhHDOk0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.4], [15.0, 15.58], [16.0, 16.9], [21.0, 25.17], [31.0, 31.45], [41.0, 41.89], [43.0, 69.23], [69.0, 71.07], [71.0, 74.38], [75.0, 75.78], [77.0, 78.43], [85.0, 87.05], [88.0, 89.53], [91.0, 91.72], [102.0, 103.74], [106.0, 107.91], [109.0, 109.59], [118.0, 118.94], [127.0, 127.65], [129.0, 128.75], [130.0, 130.11]], "keep_status": [false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 48.35, 0.0, 0.0, 30.47, 74.29, 67.76, 0.0, 0.0, 86.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["fly, housefly", 32.69], ["insect", 20.3], ["horse", 14.08]], null, null, [["music", 31.28], ["speech", 12.22], ["cattle, bovinae", 6.11]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.4, 0.58, 0.9, 4.17, 0.45, 0.89, 26.23, 2.07, 3.38, 0.78, 1.43, 2.05, 1.53, 0.72, 1.74, 1.91, 0.59, 0.94, 0.65, -0.25, 0.11]} \ No newline at end of file diff --git a/annotations_filtered/dTVEd7WtyAw_filtered.json b/annotations_filtered/dTVEd7WtyAw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..59d1406d706d36de1de094b7abdedc6bff46c587 --- /dev/null +++ b/annotations_filtered/dTVEd7WtyAw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.08], [6.0, 8.02], [9.0, 10.25], [10.0, 11.23], [12.0, 13.58], [14.0, 33.56], [34.0, 40.37], [41.0, 45.2], [48.0, 50.04], [52.0, 54.82], [56.0, 55.63], [56.0, 55.66], [56.0, 55.7], [56.0, 67.95], [68.0, 74.34], [76.0, 78.22], [80.0, 93.5], [96.0, 98.46], [99.0, 100.41], [101.0, 102.25], [115.0, 116.13], [118.0, 154.14], [156.0, 158.84], [170.0, 170.72], [173.0, 176.52], [177.0, 185.52], [189.0, 189.75], [191.0, 191.84]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, true, false, false, false], "silence_prob": [0.0, 76.7, 0.0, 0.0, 0.0, 39.91, 36.25, 37.26, 38.37, 41.09, 0.0, 0.0, 0.0, 36.11, 39.33, 68.02, 36.89, 35.52, 0.0, 0.0, 0.0, 0.0, 35.43, 0.0, 37.0, 39.31, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 59.96], ["speech", 9.57], ["hum", 5.89]], [["music", 70.75], ["musical instrument", 3.92], ["guitar", 2.72]], [["music", 77.1], ["chorus effect", 2.78], ["singing", 2.55]], [["throbbing", 23.51], ["music", 18.46], ["moo", 9.11]], [["music", 64.96], ["synthesizer", 7.75], ["sampler", 3.7]], null, null, null, [["music", 73.57], ["singing", 4.91], ["male singing", 1.85]], [["music", 47.57], ["effects unit", 11.17], ["guitar", 10.55]], null, [["music", 77.07], ["speech", 2.0], ["synthesizer", 1.87]], [["music", 73.97], ["electronic music", 3.0], ["synthesizer", 2.86]], null, null, null, null, [["music", 30.96], ["moo", 14.86], ["cattle, bovinae", 6.85]], null, [["music", 16.26], ["fly, housefly", 16.17], ["grunt", 8.52]], [["music", 41.72], ["speech", 32.76], ["sidetone", 14.26]], null, null], "duration": [1.08, 2.02, 1.25, 1.23, 1.58, 19.56, 6.37, 4.2, 2.04, 2.82, -0.37, -0.34, -0.3, 11.95, 6.34, 2.22, 13.5, 2.46, 1.41, 1.25, 1.13, 36.14, 2.84, 0.72, 3.52, 8.52, 0.75, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/dTllG2KdPMQ_filtered.json b/annotations_filtered/dTllG2KdPMQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9458f233a2b42bb6574ccbe1ea61294ca26216d0 --- /dev/null +++ b/annotations_filtered/dTllG2KdPMQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.94], [4.0, 5.54], [8.0, 9.05], [10.0, 22.64], [23.0, 29.52], [32.0, 42.6], [46.0, 49.33], [52.0, 52.59], [53.0, 53.92], [54.0, 54.53], [55.0, 55.71], [58.0, 59.0], [63.0, 63.37], [64.0, 64.54], [67.0, 68.13], [72.0, 80.25], [83.0, 83.17], [86.0, 85.89], [87.0, 87.27], [89.0, 89.04], [90.0, 90.48], [100.0, 101.98], [103.0, 103.94], [107.0, 127.52]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 98.01, 71.87, 33.18, 94.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.02], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 14.04], ["hum", 10.41], ["music", 9.17]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 34.71], ["explosion", 11.76], ["boing", 6.51]]], "duration": [0.94, 1.54, 1.05, 12.64, 6.52, 10.6, 3.33, 0.59, 0.92, 0.53, 0.71, 1.0, 0.37, 0.54, 1.13, 8.25, 0.17, -0.11, 0.27, 0.04, 0.48, 1.98, 0.94, 20.52]} \ No newline at end of file diff --git a/annotations_filtered/dTr8dXob7YI_filtered.json b/annotations_filtered/dTr8dXob7YI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6bb626cbfc4a879b3eb6e2e08af525103bcb2048 --- /dev/null +++ b/annotations_filtered/dTr8dXob7YI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 13.74], [15.0, 15.58], [16.0, 16.97], [18.0, 24.78], [26.0, 26.74], [30.0, 32.58], [35.0, 35.53], [39.0, 39.55], [42.0, 48.03], [49.0, 50.5], [52.0, 52.88], [54.0, 55.24], [56.0, 56.61], [58.0, 60.99], [63.0, 64.42], [66.0, 66.66], [69.0, 70.04], [71.0, 72.81], [73.0, 75.61], [77.0, 76.99], [79.0, 79.95], [85.0, 86.63], [87.0, 89.02], [90.0, 95.1], [97.0, 97.65], [99.0, 99.28], [101.0, 102.07], [103.0, 102.84], [105.0, 105.29], [108.0, 110.34], [112.0, 112.23], [113.0, 114.4], [115.0, 115.77], [117.0, 120.78], [121.0, 124.39], [125.0, 126.72], [127.0, 135.16], [136.0, 136.71], [139.0, 138.84], [139.0, 140.95], [141.0, 152.66], [154.0, 153.94], [156.0, 155.75], [157.0, 157.23], [158.0, 158.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [73.67, 0.0, 0.0, 44.78, 0.0, 63.85, 0.0, 0.0, 73.06, 0.0, 0.0, 0.0, 0.0, 76.04, 0.0, 0.0, 0.0, 0.0, 47.82, 0.0, 0.0, 0.0, 35.0, 73.51, 0.0, 0.0, 0.0, 0.0, 0.0, 78.38, 0.0, 0.0, 0.0, 80.29, 43.53, 0.0, 44.93, 0.0, 0.0, 0.0, 43.28, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["sidetone", 33.96], ["speech", 32.53], ["white noise", 11.96]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 38.35], ["mains hum", 6.4], ["speech", 5.53]], null, null, null, [["sidetone", 59.44], ["speech", 28.61], ["busy signal", 2.26]], null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 42.81], ["speech", 25.06], ["radio", 6.13]], null, [["speech", 29.61], ["hum", 22.69], ["mains hum", 16.17]], null, null, null, [["speech", 65.12], ["hum", 7.72], ["sidetone", 6.37]], null, null, null, null], "duration": [6.74, 0.58, 0.97, 6.78, 0.74, 2.58, 0.53, 0.55, 6.03, 1.5, 0.88, 1.24, 0.61, 2.99, 1.42, 0.66, 1.04, 1.81, 2.61, -0.01, 0.95, 1.63, 2.02, 5.1, 0.65, 0.28, 1.07, -0.16, 0.29, 2.34, 0.23, 1.4, 0.77, 3.78, 3.39, 1.72, 8.16, 0.71, -0.16, 1.95, 11.66, -0.06, -0.25, 0.23, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/dUCUs8EtHoM_filtered.json b/annotations_filtered/dUCUs8EtHoM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d1f3d7eac4cb67687682411b218060dba9102a94 --- /dev/null +++ b/annotations_filtered/dUCUs8EtHoM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.96], [5.0, 30.13], [36.0, 36.64], [37.0, 38.38], [46.0, 59.81]], "keep_status": [false, false, false, false, true], "silence_prob": [0.0, 34.76, 0.0, 0.0, 30.86], "audiomae_on_audioset": [null, [["hum", 60.29], ["mains hum", 33.95], ["throbbing", 3.9]], null, null, [["vehicle", 21.39], ["car", 17.42], ["speech", 16.37]]], "duration": [1.96, 25.13, 0.64, 1.38, 13.81]} \ No newline at end of file diff --git a/annotations_filtered/dUFtkBtGIgg_filtered.json b/annotations_filtered/dUFtkBtGIgg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e9dc5e4d8700b1546f4b99dade8a9e75d9fc5d08 --- /dev/null +++ b/annotations_filtered/dUFtkBtGIgg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 83.29], [85.0, 112.62]], "keep_status": [false, false], "silence_prob": [0.0, 31.82], "audiomae_on_audioset": [null, [["music", 39.22], ["theremin", 25.46], ["synthesizer", 8.53]]], "duration": [79.29, 27.62]} \ No newline at end of file diff --git a/annotations_filtered/dUMW1YRsWcY_filtered.json b/annotations_filtered/dUMW1YRsWcY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92942b83de28f58f3bce3137ae73356d1df261d8 --- /dev/null +++ b/annotations_filtered/dUMW1YRsWcY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 14.91], [16.0, 47.12], [58.0, 58.99], [61.0, 68.08], [69.0, 70.87], [73.0, 74.02], [77.0, 81.55], [83.0, 87.07], [89.0, 91.37], [92.0, 96.87], [97.0, 99.84], [101.0, 105.17], [106.0, 109.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [44.32, 0.0, 0.0, 90.08, 0.0, 0.0, 89.54, 87.92, 84.07, 89.19, 36.37, 84.62, 84.8], "audiomae_on_audioset": [[["hum", 33.54], ["music", 25.6], ["mains hum", 15.14]], null, null, null, null, null, null, null, null, null, [["speech", 40.98], ["whale vocalization", 10.71], ["hum", 6.62]], null, null], "duration": [8.91, 31.12, 0.99, 7.08, 1.87, 1.02, 4.55, 4.07, 2.37, 4.87, 2.84, 4.17, 3.21]} \ No newline at end of file diff --git a/annotations_filtered/dUYCIwyMZTQ_filtered.json b/annotations_filtered/dUYCIwyMZTQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4b3378108b030e68d40cb09cdb618b9a91406f3a --- /dev/null +++ b/annotations_filtered/dUYCIwyMZTQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.36], [8.0, 8.85], [16.0, 16.46], [20.0, 20.58], [21.0, 21.71], [24.0, 25.41], [27.0, 28.11], [28.0, 28.53], [30.0, 30.55], [33.0, 33.22], [37.0, 37.27], [39.0, 38.8], [41.0, 44.59], [45.0, 46.9], [55.0, 55.68], [62.0, 63.46], [68.0, 70.77], [72.0, 77.7], [78.0, 77.95], [78.0, 78.65], [81.0, 81.35], [88.0, 89.58], [91.0, 90.71], [91.0, 92.15], [93.0, 94.34], [96.0, 97.5], [104.0, 104.95], [111.0, 112.16], [115.0, 115.89], [117.0, 118.62], [120.0, 120.85], [122.0, 122.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 97.83, 73.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.36, 0.85, 0.46, 0.58, 0.71, 1.41, 1.11, 0.53, 0.55, 0.22, 0.27, -0.2, 3.59, 1.9, 0.68, 1.46, 2.77, 5.7, -0.05, 0.65, 0.35, 1.58, -0.29, 1.15, 1.34, 1.5, 0.95, 1.16, 0.89, 1.62, 0.85, 0.98]} \ No newline at end of file diff --git a/annotations_filtered/dUbNFv_h6Kc_filtered.json b/annotations_filtered/dUbNFv_h6Kc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d4fba173ccfcfcbccf39552ad25c9917e77f3e23 --- /dev/null +++ b/annotations_filtered/dUbNFv_h6Kc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 10.62], [14.0, 58.56], [59.0, 59.56], [64.0, 69.87], [72.0, 73.21], [74.0, 75.25], [79.0, 79.34], [81.0, 81.55], [97.0, 98.86], [100.0, 100.2], [102.0, 102.49], [107.0, 107.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [36.31, 0.0, 0.0, 37.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 88.49], ["musical instrument", 1.14], ["tick-tock", 1.07]], null, null, [["theremin", 40.7], ["music", 31.87], ["musical instrument", 7.06]], null, null, null, null, null, null, null, null], "duration": [6.62, 44.56, 0.56, 5.87, 1.21, 1.25, 0.34, 0.55, 1.86, 0.2, 0.49, 0.91]} \ No newline at end of file diff --git a/annotations_filtered/dUi0j-vedRE_filtered.json b/annotations_filtered/dUi0j-vedRE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..308a6b7180894a1ad1de0a793d6f2fbc915230b7 --- /dev/null +++ b/annotations_filtered/dUi0j-vedRE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.41], [8.0, 14.1], [15.0, 15.5], [29.0, 31.35], [33.0, 34.79], [41.0, 41.96], [44.0, 43.97], [45.0, 47.6], [52.0, 52.78], [55.0, 55.12], [57.0, 57.16], [62.0, 62.36], [68.0, 68.08], [73.0, 73.77], [75.0, 79.24], [85.0, 92.28], [92.0, 96.28], [97.0, 98.51], [99.0, 100.35], [103.0, 104.04], [105.0, 105.68], [106.0, 106.12], [107.0, 114.12], [116.0, 115.97], [118.0, 117.93], [122.0, 123.72], [124.0, 127.26], [128.0, 137.89], [139.0, 139.62], [140.0, 142.06], [143.0, 143.51], [144.0, 146.04], [151.0, 151.04], [152.0, 152.09], [153.0, 157.71], [161.0, 161.1]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 49.45, 0.0, 86.64, 0.0, 0.0, 0.0, 79.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.11, 59.42, 65.91, 0.0, 0.0, 0.0, 0.0, 0.0, 61.08, 0.0, 0.0, 0.0, 65.09, 79.59, 0.0, 80.64, 0.0, 82.43, 0.0, 0.0, 31.79, 0.0], "audiomae_on_audioset": [null, [["livestock, farm animals, working animals", 24.21], ["music", 19.67], ["speech", 10.67]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["animal", 15.25], ["speech", 12.98], ["crowd", 9.53]], null], "duration": [0.41, 6.1, 0.5, 2.35, 1.79, 0.96, -0.03, 2.6, 0.78, 0.12, 0.16, 0.36, 0.08, 0.77, 4.24, 7.28, 4.28, 1.51, 1.35, 1.04, 0.68, 0.12, 7.12, -0.03, -0.07, 1.72, 3.26, 9.89, 0.62, 2.06, 0.51, 2.04, 0.04, 0.09, 4.71, 0.1]} \ No newline at end of file diff --git a/annotations_filtered/dUoKiRrGu4c_filtered.json b/annotations_filtered/dUoKiRrGu4c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c3d098be61601f4ffd51a09d9f0f9da6f0527cd9 --- /dev/null +++ b/annotations_filtered/dUoKiRrGu4c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.93], [11.0, 11.7], [12.0, 12.7], [13.0, 15.35], [16.0, 20.19], [23.0, 23.04], [24.0, 34.21], [35.0, 36.19], [38.0, 44.49], [46.0, 47.38], [49.0, 48.95], [50.0, 115.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.85, 90.25, 0.0, 64.07, 0.0, 53.72, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.93, 0.7, 0.7, 2.35, 4.19, 0.04, 10.21, 1.19, 6.49, 1.38, -0.05, 65.82]} \ No newline at end of file diff --git a/annotations_filtered/dVCki9kwF_4_filtered.json b/annotations_filtered/dVCki9kwF_4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e68ba716aa08db0a54f4d2d0e993a7393ed92cc9 --- /dev/null +++ b/annotations_filtered/dVCki9kwF_4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.06], [9.0, 38.89]], "keep_status": [false, true], "silence_prob": [0.0, 30.97], "audiomae_on_audioset": [null, [["speech", 47.09], ["music", 13.31], ["synthesizer", 7.13]]], "duration": [1.06, 29.89]} \ No newline at end of file diff --git a/annotations_filtered/dVFDYCPO19A_filtered.json b/annotations_filtered/dVFDYCPO19A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e38c3c425cb0dc44be5c6ac72487a5c3804d119f --- /dev/null +++ b/annotations_filtered/dVFDYCPO19A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.91], [25.0, 28.81], [31.0, 31.33], [33.0, 32.98], [37.0, 37.66], [46.0, 46.67], [48.0, 56.17], [58.0, 58.6], [59.0, 59.83], [67.0, 67.58], [71.0, 76.01], [77.0, 89.06], [90.0, 90.69], [92.0, 92.57], [96.0, 96.65], [97.0, 98.31], [99.0, 99.54], [100.0, 100.79], [103.0, 103.84], [104.0, 104.77], [107.0, 108.94]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [39.52, 77.87, 0.0, 0.0, 0.0, 0.0, 33.03, 0.0, 0.0, 0.0, 40.04, 35.24, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 49.7], ["speech", 7.96], ["musical instrument", 2.76]], null, null, null, null, null, [["slap, smack", 47.99], ["whack, thwack", 26.36], ["whip", 5.9]], null, null, null, [["burping, eructation", 50.85], ["thunk", 8.85], ["knock", 5.66]], [["speech", 59.07], ["fart", 28.33], ["animal", 3.51]], null, null, null, null, null, null, null, null, null], "duration": [2.91, 3.81, 0.33, -0.02, 0.66, 0.67, 8.17, 0.6, 0.83, 0.58, 5.01, 12.06, 0.69, 0.57, 0.65, 1.31, 0.54, 0.79, 0.84, 0.77, 1.94]} \ No newline at end of file diff --git a/annotations_filtered/dVLMfoIop9M_filtered.json b/annotations_filtered/dVLMfoIop9M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0cb52715f1684e3c60bfd338cb214396262fbd40 --- /dev/null +++ b/annotations_filtered/dVLMfoIop9M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.17], [6.0, 7.62], [9.0, 9.58], [11.0, 11.99], [13.0, 14.35], [18.0, 19.94], [21.0, 20.97], [21.0, 25.47], [27.0, 30.5], [33.0, 33.96], [37.0, 37.94], [41.0, 41.39], [44.0, 45.39], [49.0, 49.28], [59.0, 59.88], [72.0, 74.31], [84.0, 86.12], [91.0, 97.46], [110.0, 111.77], [123.0, 124.73], [133.0, 133.74], [149.0, 148.91], [149.0, 149.47], [151.0, 151.75], [153.0, 153.77], [168.0, 170.41], [180.0, 183.32], [191.0, 195.08]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.07, 33.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.33, 48.31, 30.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.53, 56.78, 29.3], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 39.16], ["speech", 9.94], ["wind instrument, woodwind instrument", 9.76]], [["music", 40.34], ["wind instrument, woodwind instrument", 19.16], ["shofar", 8.55]], null, null, null, null, null, null, [["music", 51.99], ["musical instrument", 2.8], ["piano", 2.31]], [["speech", 33.24], ["busy signal", 18.78], ["sidetone", 7.44]], [["music", 69.55], ["funny music", 2.71], ["musical instrument", 2.52]], null, null, null, null, null, null, null, [["music", 61.27], ["marimba, xylophone", 5.76], ["glockenspiel", 4.38]], null, [["music", 46.55], ["synthetic singing", 6.86], ["theremin", 4.05]]], "duration": [1.17, 1.62, 0.58, 0.99, 1.35, 1.94, -0.03, 4.47, 3.5, 0.96, 0.94, 0.39, 1.39, 0.28, 0.88, 2.31, 2.12, 6.46, 1.77, 1.73, 0.74, -0.09, 0.47, 0.75, 0.77, 2.41, 3.32, 4.08]} \ No newline at end of file diff --git a/annotations_filtered/dVzFy-4c-AY_filtered.json b/annotations_filtered/dVzFy-4c-AY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..30c05f6f970d9e25d1efb7585d8b872f9e1c2bcf --- /dev/null +++ b/annotations_filtered/dVzFy-4c-AY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[76.0, 93.93], [97.0, 99.2], [100.0, 102.37], [103.0, 104.57], [109.0, 109.61], [111.0, 112.35], [114.0, 118.29], [119.0, 122.88], [124.0, 131.31], [132.0, 134.37], [139.0, 147.26], [150.0, 150.52], [151.0, 152.49], [154.0, 155.76], [157.0, 157.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.2, 66.51, 62.68, 0.0, 0.0, 0.0, 47.31, 98.8, 54.36, 89.72, 50.51, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["throbbing", 37.54], ["music", 31.31], ["hum", 14.85]], null, null, null, null, null, [["music", 55.0], ["sonar", 17.37], ["electronic music", 4.36]], null, null, null, null, null, null, null, null], "duration": [17.93, 2.2, 2.37, 1.57, 0.61, 1.35, 4.29, 3.88, 7.31, 2.37, 8.26, 0.52, 1.49, 1.76, 0.54]} \ No newline at end of file diff --git a/annotations_filtered/dWJuJlmcabY_filtered.json b/annotations_filtered/dWJuJlmcabY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c5f7a1511c83f85e096dc1b6f4eec0903df2399a --- /dev/null +++ b/annotations_filtered/dWJuJlmcabY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.96], [12.0, 11.79], [14.0, 15.08], [16.0, 16.85], [20.0, 26.52], [28.0, 29.22], [31.0, 31.68], [34.0, 34.47], [45.0, 45.35], [46.0, 46.48], [54.0, 54.95], [56.0, 64.64], [67.0, 68.2], [72.0, 72.57], [73.0, 74.11], [76.0, 76.67], [78.0, 78.73], [81.0, 87.94], [94.0, 93.88], [95.0, 94.91], [97.0, 97.01], [98.0, 99.89], [103.0, 105.97], [108.0, 107.77], [113.0, 114.13], [115.0, 117.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 56.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.27, 0.0, 0.0, 0.0, 0.0, 0.0, 87.92, 0.0, 0.0, 0.0, 0.0, 60.14, 0.0, 0.0, 75.55], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["whack, thwack", 31.7], ["speech", 9.69], ["fly, housefly", 7.19]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.96, -0.21, 1.08, 0.85, 6.52, 1.22, 0.68, 0.47, 0.35, 0.48, 0.95, 8.64, 1.2, 0.57, 1.11, 0.67, 0.73, 6.94, -0.12, -0.09, 0.01, 1.89, 2.97, -0.23, 1.13, 2.29]} \ No newline at end of file diff --git a/annotations_filtered/dWQ3B8qTpes_filtered.json b/annotations_filtered/dWQ3B8qTpes_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b7962c024752744311338b777383d8ccdc5a831 --- /dev/null +++ b/annotations_filtered/dWQ3B8qTpes_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[39.0, 42.2], [44.0, 44.19], [46.0, 47.41], [50.0, 56.15], [59.0, 89.88], [94.0, 108.75], [112.0, 118.22], [122.0, 122.77]], "keep_status": [true, false, false, true, false, true, true, false], "silence_prob": [43.58, 0.0, 0.0, 45.33, 0.0, 33.69, 40.14, 0.0], "audiomae_on_audioset": [[["fly, housefly", 23.21], ["bee, wasp, etc.", 18.08], ["insect", 14.99]], null, null, [["music", 37.2], ["hum", 23.61], ["mains hum", 8.87]], null, [["music", 34.94], ["speech", 19.05], ["hum", 7.29]], [["music", 49.2], ["hum", 5.39], ["throbbing", 4.96]], null], "duration": [3.2, 0.19, 1.41, 6.15, 30.88, 14.75, 6.22, 0.77]} \ No newline at end of file diff --git a/annotations_filtered/dX0dcSJE7ek_filtered.json b/annotations_filtered/dX0dcSJE7ek_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb3a5714f7bb72e7ec956b7b0548fd8c843e17fe --- /dev/null +++ b/annotations_filtered/dX0dcSJE7ek_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.24], [13.0, 13.42], [16.0, 16.24], [17.0, 18.72], [21.0, 21.36], [23.0, 24.61], [26.0, 27.92], [46.0, 46.92], [62.0, 62.09], [63.0, 63.14], [65.0, 70.98], [88.0, 88.43], [89.0, 90.68], [93.0, 93.58], [99.0, 100.95], [101.0, 102.46], [107.0, 107.77], [114.0, 114.34], [117.0, 120.38], [131.0, 131.55], [132.0, 131.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.72, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["mosquito", 55.56], ["fly, housefly", 23.4], ["insect", 5.86]], null, null, null, null, null, null, null, [["explosion", 16.82], ["mosquito", 11.14], ["music", 9.13]], null, null], "duration": [0.24, 0.42, 0.24, 1.72, 0.36, 1.61, 1.92, 0.92, 0.09, 0.14, 5.98, 0.43, 1.68, 0.58, 1.95, 1.46, 0.77, 0.34, 3.38, 0.55, -0.37]} \ No newline at end of file diff --git a/annotations_filtered/dX762k_3zWg_filtered.json b/annotations_filtered/dX762k_3zWg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95aa58c19e79b532d627ae847655e8985597f085 --- /dev/null +++ b/annotations_filtered/dX762k_3zWg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 70.92], [74.0, 133.37], [134.0, 134.03], [134.0, 134.42], [135.0, 148.69], [152.0, 153.1]], "keep_status": [false, false, false, false, false, false], "silence_prob": [30.41, 0.0, 0.0, 0.0, 30.16, 0.0], "audiomae_on_audioset": [[["music", 78.78], ["musical instrument", 3.94], ["throbbing", 1.57]], null, null, null, [["music", 79.38], ["musical instrument", 5.71], ["didgeridoo", 0.99]], null], "duration": [29.92, 59.37, 0.03, 0.42, 13.69, 1.1]} \ No newline at end of file diff --git a/annotations_filtered/dXBUdCvqpNg_filtered.json b/annotations_filtered/dXBUdCvqpNg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..88dc2a907662767e2431a9fc0af9cd8fbffd3907 --- /dev/null +++ b/annotations_filtered/dXBUdCvqpNg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 10.57], [12.0, 54.35], [58.0, 59.26], [69.0, 71.54], [77.0, 78.36], [81.0, 108.87], [110.0, 123.35], [125.0, 125.64], [127.0, 145.56], [146.0, 147.66], [150.0, 162.5]], "keep_status": [true, false, false, true, false, false, false, false, false, false, false], "silence_prob": [40.19, 0.0, 0.0, 39.18, 0.0, 42.96, 67.38, 0.0, 55.89, 0.0, 41.6], "audiomae_on_audioset": [[["music", 25.65], ["hum", 13.84], ["speech", 10.92]], null, null, [["music", 51.3], ["speech", 4.75], ["synthesizer", 3.67]], null, [["hum", 43.7], ["mains hum", 22.44], ["speech", 7.14]], null, null, null, null, [["music", 64.09], ["speech", 6.75], ["synthesizer", 2.91]]], "duration": [4.57, 42.35, 1.26, 2.54, 1.36, 27.87, 13.35, 0.64, 18.56, 1.66, 12.5]} \ No newline at end of file diff --git a/annotations_filtered/dXNmLJXEgQU_filtered.json b/annotations_filtered/dXNmLJXEgQU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6baaf7cf50e104e592851ebff23fb54cbe2bc693 --- /dev/null +++ b/annotations_filtered/dXNmLJXEgQU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.09], [12.0, 11.74], [13.0, 14.86], [15.0, 15.99], [32.0, 36.66], [37.0, 47.02], [52.0, 52.05], [55.0, 56.98], [63.0, 64.05], [66.0, 66.95], [68.0, 70.02], [71.0, 75.69], [82.0, 85.29], [87.0, 96.42], [108.0, 108.58], [110.0, 110.71], [114.0, 114.51], [117.0, 117.46], [121.0, 121.51], [122.0, 123.63], [126.0, 128.04], [133.0, 132.75], [134.0, 134.99], [137.0, 141.79], [142.0, 143.34], [144.0, 144.66]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [61.27, 0.0, 0.0, 0.0, 74.13, 33.5, 0.0, 0.0, 0.0, 0.0, 89.54, 66.51, 84.07, 35.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.97, 0.0, 0.0, 42.81, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["emergency vehicle", 22.52], ["siren", 21.36], ["speech", 15.47]], null, null, null, null, null, null, null, [["music", 48.13], ["whale vocalization", 8.64], ["throbbing", 7.68]], null, null, null, null, null, null, [["fly, housefly", 31.94], ["mosquito", 18.38], ["insect", 16.5]], null, null, [["music", 62.25], ["musical instrument", 6.05], ["trombone", 5.68]], null, null], "duration": [2.09, -0.26, 1.86, 0.99, 4.66, 10.02, 0.05, 1.98, 1.05, 0.95, 2.02, 4.69, 3.29, 9.42, 0.58, 0.71, 0.51, 0.46, 0.51, 1.63, 2.04, -0.25, 0.99, 4.79, 1.34, 0.66]} \ No newline at end of file diff --git a/annotations_filtered/dXNu5a3KmMg_filtered.json b/annotations_filtered/dXNu5a3KmMg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f5ce4d17207c53a4e2de84c5ed5daabcf02c7c1 --- /dev/null +++ b/annotations_filtered/dXNu5a3KmMg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.33], [17.0, 23.03], [26.0, 26.67], [27.0, 27.65], [28.0, 28.51], [29.0, 29.37], [30.0, 29.88], [34.0, 33.89], [37.0, 37.79], [39.0, 38.91], [48.0, 49.2], [50.0, 54.78], [66.0, 66.29], [78.0, 78.9], [81.0, 82.36], [85.0, 85.89], [87.0, 87.25], [97.0, 97.38], [102.0, 102.86], [105.0, 105.11], [110.0, 109.88], [113.0, 114.02], [115.0, 114.98], [139.0, 139.53], [144.0, 145.72], [151.0, 152.1], [155.0, 156.19], [157.0, 158.13], [160.0, 161.69]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 38.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 45.56], ["frog", 6.46], ["whale vocalization", 4.86]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.33, 6.03, 0.67, 0.65, 0.51, 0.37, -0.12, -0.11, 0.79, -0.09, 1.2, 4.78, 0.29, 0.9, 1.36, 0.89, 0.25, 0.38, 0.86, 0.11, -0.12, 1.02, -0.02, 0.53, 1.72, 1.1, 1.19, 1.13, 1.69]} \ No newline at end of file diff --git a/annotations_filtered/dXe45jbpElA_filtered.json b/annotations_filtered/dXe45jbpElA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48e0e7e43f6848baeccb661e9f5ac46c600ce5a6 --- /dev/null +++ b/annotations_filtered/dXe45jbpElA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.03], [67.0, 67.98], [69.0, 70.68], [72.0, 72.33], [72.0, 72.45], [77.0, 77.52], [81.0, 83.84], [86.0, 86.54], [91.0, 93.29], [95.0, 94.71], [97.0, 109.44]], "keep_status": [false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.09, 0.0, 31.04, 0.0, 30.85], "audiomae_on_audioset": [null, null, null, null, null, null, [["stomach rumble", 12.42], ["hum", 9.86], ["throbbing", 7.37]], null, [["speech", 39.9], ["boing", 22.28], ["music", 10.87]], null, [["speech", 41.1], ["whack, thwack", 11.76], ["noise", 11.35]]], "duration": [0.03, 0.98, 1.68, 0.33, 0.45, 0.52, 2.84, 0.54, 2.29, -0.29, 12.44]} \ No newline at end of file diff --git a/annotations_filtered/dXk2wGeBUHE_filtered.json b/annotations_filtered/dXk2wGeBUHE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3a2505e8dcb6bf2f73d01d11b0ee00fe5b720ea5 --- /dev/null +++ b/annotations_filtered/dXk2wGeBUHE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.1], [3.0, 3.87], [5.0, 5.7], [7.0, 7.53], [9.0, 10.66], [12.0, 23.3], [24.0, 24.26], [25.0, 26.28], [30.0, 30.84], [31.0, 31.95], [33.0, 33.81], [35.0, 36.14], [43.0, 44.71], [45.0, 49.67], [53.0, 54.41], [55.0, 56.39], [57.0, 57.33], [59.0, 78.58], [87.0, 87.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 46.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.02, 0.0, 0.0, 0.0, 31.52, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 81.43], ["telephone", 4.85], ["hum", 2.92]], null, null, null, null, null, null, null, [["music", 40.89], ["speech", 24.56], ["theremin", 9.58]], null, null, null, [["throbbing", 37.87], ["hum", 20.96], ["music", 20.45]], null], "duration": [1.1, 0.87, 0.7, 0.53, 1.66, 11.3, 0.26, 1.28, 0.84, 0.95, 0.81, 1.14, 1.71, 4.67, 1.41, 1.39, 0.33, 19.58, 0.88]} \ No newline at end of file diff --git a/annotations_filtered/dXngQtk0BCU_filtered.json b/annotations_filtered/dXngQtk0BCU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca049b8ee3c8aaa3cf77c595e7058d9e8ea5b52a --- /dev/null +++ b/annotations_filtered/dXngQtk0BCU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.39], [9.0, 9.78], [12.0, 12.51], [14.0, 14.17], [21.0, 21.76], [24.0, 24.61], [28.0, 28.56], [30.0, 30.86], [34.0, 34.43], [38.0, 48.34], [50.0, 49.99], [53.0, 53.67], [54.0, 63.37], [64.0, 65.1], [67.0, 77.26], [78.0, 78.36], [80.0, 80.81], [82.0, 84.2], [86.0, 86.24], [88.0, 88.2], [90.0, 90.91], [94.0, 94.63], [97.0, 97.41], [101.0, 101.22], [104.0, 105.83], [107.0, 107.82], [109.0, 111.01], [112.0, 113.24], [118.0, 119.43], [120.0, 121.66], [124.0, 125.27]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [60.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.65, 0.0, 0.0, 30.8, 0.0, 34.94, 0.0, 0.0, 79.24, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.36, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 20.7], ["thunk", 12.37], ["whack, thwack", 8.12]], null, null, [["speech", 38.53], ["music", 28.71], ["didgeridoo", 4.79]], null, [["theremin", 59.26], ["music", 19.11], ["musical instrument", 6.06]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.39, 0.78, 0.51, 0.17, 0.76, 0.61, 0.56, 0.86, 0.43, 10.34, -0.01, 0.67, 9.37, 1.1, 10.26, 0.36, 0.81, 2.2, 0.24, 0.2, 0.91, 0.63, 0.41, 0.22, 1.83, 0.82, 2.01, 1.24, 1.43, 1.66, 1.27]} \ No newline at end of file diff --git a/annotations_filtered/dXqs6yH3KF8_filtered.json b/annotations_filtered/dXqs6yH3KF8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e7b06c3e6aae7ff90b101a5a4d720a6787af80a9 --- /dev/null +++ b/annotations_filtered/dXqs6yH3KF8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.23], [7.0, 7.3], [8.0, 8.48], [10.0, 10.44], [11.0, 11.85], [12.0, 14.23], [16.0, 21.57], [22.0, 23.7], [24.0, 24.6], [26.0, 28.54], [30.0, 31.51], [34.0, 36.15], [38.0, 40.54], [44.0, 44.56], [46.0, 48.36], [51.0, 53.11], [55.0, 58.51], [60.0, 63.22], [64.0, 65.37], [68.0, 72.44], [75.0, 76.03], [83.0, 84.1], [85.0, 86.66], [88.0, 88.79], [90.0, 91.23], [92.0, 102.09], [102.0, 102.9], [105.0, 107.08], [109.0, 110.47], [111.0, 112.6], [116.0, 116.88], [118.0, 119.89], [121.0, 121.02], [124.0, 125.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 95.23, 100.0, 0.0, 0.0, 100.0, 0.0, 100.0, 99.91, 0.0, 89.36, 100.0, 95.64, 68.67, 0.0, 99.92, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.23, 0.3, 0.48, 0.44, 0.85, 2.23, 5.57, 1.7, 0.6, 2.54, 1.51, 2.15, 2.54, 0.56, 2.36, 2.11, 3.51, 3.22, 1.37, 4.44, 1.03, 1.1, 1.66, 0.79, 1.23, 10.09, 0.9, 2.08, 1.47, 1.6, 0.88, 1.89, 0.02, 1.12]} \ No newline at end of file diff --git a/annotations_filtered/dYDxxHrlmUg_filtered.json b/annotations_filtered/dYDxxHrlmUg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a51fa157ca97da2741c83abbcaeae46fe913f56b --- /dev/null +++ b/annotations_filtered/dYDxxHrlmUg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.85], [6.0, 19.43], [20.0, 28.49], [33.0, 33.83], [37.0, 37.74], [42.0, 42.21], [44.0, 44.39], [56.0, 56.52], [66.0, 68.82], [71.0, 71.25], [72.0, 72.66], [75.0, 76.72], [85.0, 86.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 61.87, 63.85, 0.0, 0.0, 0.0, 0.0, 0.0, 89.9, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.85, 13.43, 8.49, 0.83, 0.74, 0.21, 0.39, 0.52, 2.82, 0.25, 0.66, 1.72, 1.02]} \ No newline at end of file diff --git a/annotations_filtered/dYafG2EuZjs_filtered.json b/annotations_filtered/dYafG2EuZjs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c91a60df7c8d8c54e5faa66596e8f9968d6e6ee3 --- /dev/null +++ b/annotations_filtered/dYafG2EuZjs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.56], [8.0, 9.91], [10.0, 11.35], [14.0, 14.67], [23.0, 23.73], [27.0, 27.82], [29.0, 30.38], [34.0, 36.85], [38.0, 38.03], [39.0, 39.04], [40.0, 40.15], [43.0, 44.9], [46.0, 46.43], [47.0, 56.56], [57.0, 58.08], [59.0, 60.13], [61.0, 61.43], [63.0, 63.14], [66.0, 66.92], [77.0, 80.7], [85.0, 103.87], [104.0, 127.52], [133.0, 133.03], [134.0, 135.62], [136.0, 137.71], [138.0, 138.48], [139.0, 140.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.73, 0.0, 0.0, 0.0, 0.0, 0.0, 98.8, 0.0, 0.0, 0.0, 0.0, 0.0, 37.72, 53.4, 97.22, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 44.96], ["hum", 8.78], ["thunk", 5.16]], null, null, null, null, null, null, null], "duration": [2.56, 1.91, 1.35, 0.67, 0.73, 0.82, 1.38, 2.85, 0.03, 0.04, 0.15, 1.9, 0.43, 9.56, 1.08, 1.13, 0.43, 0.14, 0.92, 3.7, 18.87, 23.52, 0.03, 1.62, 1.71, 0.48, 1.56]} \ No newline at end of file diff --git a/annotations_filtered/dZ-teGgl2tw_filtered.json b/annotations_filtered/dZ-teGgl2tw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6af2182b20b54325f2689746a54f5d3d5625ed9a --- /dev/null +++ b/annotations_filtered/dZ-teGgl2tw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.26], [13.0, 13.1], [16.0, 17.31], [28.0, 28.04], [30.0, 30.94], [36.0, 37.56], [38.0, 38.97], [40.0, 40.69], [44.0, 44.81], [46.0, 46.92], [48.0, 49.54], [52.0, 57.16], [65.0, 65.89], [66.0, 66.9], [68.0, 68.79], [75.0, 76.05], [80.0, 80.57], [84.0, 84.0], [89.0, 89.19], [93.0, 93.18], [95.0, 96.84], [99.0, 99.06], [100.0, 100.01], [101.0, 102.51], [105.0, 105.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.26, 0.1, 1.31, 0.04, 0.94, 1.56, 0.97, 0.69, 0.81, 0.92, 1.54, 5.16, 0.89, 0.9, 0.79, 1.05, 0.57, 0.0, 0.19, 0.18, 1.84, 0.06, 0.01, 1.51, 0.33]} \ No newline at end of file diff --git a/annotations_filtered/dZb8CGMC1zA_filtered.json b/annotations_filtered/dZb8CGMC1zA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8ab6b793ae6569c17b0716db507741428868e97 --- /dev/null +++ b/annotations_filtered/dZb8CGMC1zA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 7.82], [8.0, 7.94], [8.0, 8.06], [17.0, 29.84], [30.0, 31.46], [31.0, 31.5], [32.0, 32.63], [33.0, 33.61], [34.0, 35.56], [36.0, 41.4], [42.0, 43.85], [45.0, 46.85], [49.0, 49.23], [54.0, 54.31], [54.0, 57.65], [58.0, 59.73], [60.0, 71.34], [72.0, 74.06], [79.0, 79.71], [81.0, 81.53], [84.0, 86.26], [87.0, 88.13], [90.0, 90.12], [91.0, 91.02], [92.0, 92.91], [93.0, 93.82], [99.0, 100.55], [101.0, 104.01], [104.0, 105.39], [106.0, 107.89], [108.0, 110.71], [111.0, 111.97], [113.0, 113.27], [115.0, 115.37], [116.0, 116.92], [118.0, 120.56], [121.0, 125.12], [127.0, 128.48], [130.0, 132.31], [148.0, 147.95], [157.0, 158.09], [160.0, 160.73], [161.0, 161.94], [164.0, 166.94], [180.0, 200.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [32.04, 0.0, 0.0, 30.26, 0.0, 0.0, 0.0, 0.0, 0.0, 59.59, 0.0, 0.0, 0.0, 0.0, 39.96, 0.0, 41.81, 44.78, 0.0, 0.0, 45.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.21, 0.0, 0.0, 80.46, 0.0, 0.0, 0.0, 0.0, 78.89, 98.19, 0.0, 71.29, 0.0, 0.0, 0.0, 0.0, 28.98, 48.48], "audiomae_on_audioset": [[["speech", 83.36], ["whack, thwack", 4.76], ["fart", 2.28]], null, null, [["speech", 78.53], ["whack, thwack", 4.29], ["inside, large room or hall", 2.19]], null, null, null, null, null, null, null, null, null, null, [["speech", 69.21], ["music", 4.49], ["sidetone", 3.33]], null, [["music", 33.32], ["electric shaver, electric razor", 19.91], ["speech", 12.85]], [["music", 46.75], ["speech", 35.13], ["musical instrument", 1.35]], null, null, [["music", 46.78], ["sheep", 5.89], ["livestock, farm animals, working animals", 5.32]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sound effect", 19.47], ["whack, thwack", 18.57], ["speech", 14.32]], [["music", 54.37], ["hum", 11.81], ["throbbing", 6.74]]], "duration": [6.82, -0.06, 0.06, 12.84, 1.46, 0.5, 0.63, 0.61, 1.56, 5.4, 1.85, 1.85, 0.23, 0.31, 3.65, 1.73, 11.34, 2.06, 0.71, 0.53, 2.26, 1.13, 0.12, 0.02, 0.91, 0.82, 1.55, 3.01, 1.39, 1.89, 2.71, 0.97, 0.27, 0.37, 0.92, 2.56, 4.12, 1.48, 2.31, -0.05, 1.09, 0.73, 0.94, 2.94, 20.82]} \ No newline at end of file diff --git a/annotations_filtered/dZjgSYTxWsY_filtered.json b/annotations_filtered/dZjgSYTxWsY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5958bdc350bb22c68f898b373775042ddf80ed0 --- /dev/null +++ b/annotations_filtered/dZjgSYTxWsY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.88], [12.0, 13.66], [23.0, 23.33], [31.0, 35.33], [36.0, 37.5], [39.0, 40.17], [42.0, 42.89], [44.0, 44.52], [47.0, 47.48], [55.0, 56.12], [58.0, 58.75], [63.0, 64.62], [85.0, 85.16], [95.0, 95.44], [103.0, 103.5], [109.0, 110.17], [110.0, 111.18], [112.0, 112.29], [117.0, 117.34], [118.0, 119.7], [124.0, 124.33], [125.0, 125.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 47.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 80.73], ["sidetone", 6.47], ["hum", 1.99]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.88, 1.66, 0.33, 4.33, 1.5, 1.17, 0.89, 0.52, 0.48, 1.12, 0.75, 1.62, 0.16, 0.44, 0.5, 1.17, 1.18, 0.29, 0.34, 1.7, 0.33, 0.59]} \ No newline at end of file diff --git a/annotations_filtered/dZmGh0bXqqw_filtered.json b/annotations_filtered/dZmGh0bXqqw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e2605fe8a8e3614fca745ad4de7f121ef96973a5 --- /dev/null +++ b/annotations_filtered/dZmGh0bXqqw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 14.91], [20.0, 21.09], [24.0, 24.61], [27.0, 28.09], [33.0, 36.17], [39.0, 41.81], [44.0, 44.27], [46.0, 46.84], [77.0, 78.46], [80.0, 81.08], [86.0, 86.02], [90.0, 90.22], [94.0, 98.22], [100.0, 101.36], [105.0, 105.66], [108.0, 109.78], [117.0, 118.18], [131.0, 132.53], [150.0, 151.38], [158.0, 159.16], [163.0, 162.68], [163.0, 165.5], [170.0, 173.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [78.89, 0.0, 0.0, 0.0, 92.48, 65.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.21, 34.79], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 51.11], ["theremin", 40.57], ["musical instrument", 1.71]], null, null, null, null, null, null, null, null, [["music", 63.26], ["electronica", 2.08], ["didgeridoo", 1.58]], [["music", 58.85], ["disco", 3.0], ["pop music", 1.84]]], "duration": [3.91, 1.09, 0.61, 1.09, 3.17, 2.81, 0.27, 0.84, 1.46, 1.08, 0.02, 0.22, 4.22, 1.36, 0.66, 1.78, 1.18, 1.53, 1.38, 1.16, -0.32, 2.5, 3.1]} \ No newline at end of file diff --git a/annotations_filtered/dZt3TeTClV8_filtered.json b/annotations_filtered/dZt3TeTClV8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2707d4c210eaea1ccd77e92d44f81e2c1c3a87c1 --- /dev/null +++ b/annotations_filtered/dZt3TeTClV8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.1], [15.0, 17.12], [22.0, 23.38], [29.0, 30.21], [36.0, 36.85], [39.0, 39.19], [42.0, 43.58], [46.0, 47.9], [49.0, 55.66], [58.0, 59.97], [60.0, 64.29], [67.0, 69.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.01, 99.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.43, 0.0, 95.64, 72.9], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.1, 2.12, 1.38, 1.21, 0.85, 0.19, 1.58, 1.9, 6.66, 1.97, 4.29, 2.52]} \ No newline at end of file diff --git a/annotations_filtered/dZwnXa6XHSI_filtered.json b/annotations_filtered/dZwnXa6XHSI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..650c258dd0ebadb3edf9d20578290297b46ac452 --- /dev/null +++ b/annotations_filtered/dZwnXa6XHSI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.66], [7.0, 7.94], [9.0, 11.33], [12.0, 13.41], [15.0, 15.9], [19.0, 18.96], [20.0, 20.01], [23.0, 23.5], [27.0, 27.92], [29.0, 30.86], [32.0, 32.93], [34.0, 34.55], [38.0, 41.5], [49.0, 49.92], [54.0, 54.87], [56.0, 56.56], [62.0, 62.5], [65.0, 65.65], [66.0, 66.72], [68.0, 68.1], [71.0, 71.24], [84.0, 85.24], [87.0, 89.46], [90.0, 89.87], [92.0, 93.58], [97.0, 98.51], [99.0, 99.82], [103.0, 104.08], [105.0, 109.76], [111.0, 111.77], [113.0, 113.97], [115.0, 115.4], [117.0, 117.48], [122.0, 128.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.84, 0.0, 0.0, 0.0, 0.0, 0.0, 99.65, 0.0, 0.0, 0.0, 0.0, 43.77], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 42.05], ["sidetone", 28.66], ["noise", 17.9]]], "duration": [0.66, 0.94, 2.33, 1.41, 0.9, -0.04, 0.01, 0.5, 0.92, 1.86, 0.93, 0.55, 3.5, 0.92, 0.87, 0.56, 0.5, 0.65, 0.72, 0.1, 0.24, 1.24, 2.46, -0.13, 1.58, 1.51, 0.82, 1.08, 4.76, 0.77, 0.97, 0.4, 0.48, 6.09]} \ No newline at end of file diff --git a/annotations_filtered/d_A4tfEukp4_filtered.json b/annotations_filtered/d_A4tfEukp4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d6dd27f1e8738a6cdab6efd9bf35b25f34f5128 --- /dev/null +++ b/annotations_filtered/d_A4tfEukp4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [9.0, 10.57], [11.0, 12.8], [14.0, 18.18], [24.0, 25.83], [29.0, 30.5], [31.0, 32.48], [34.0, 35.31], [36.0, 41.94], [51.0, 78.46], [80.0, 81.55], [83.0, 139.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 36.25, 0.0, 0.0, 0.0, 0.0, 33.5, 29.36, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 77.28], ["hum", 4.74], ["throbbing", 2.26]], null, null, null, null, [["speech", 59.06], ["animal", 14.67], ["music", 2.81]], [["music", 48.74], ["speech", 31.65], ["throbbing", 6.24]], null, null], "duration": [0.5, 1.57, 1.8, 4.18, 1.83, 1.5, 1.48, 1.31, 5.94, 27.46, 1.55, 56.09]} \ No newline at end of file diff --git a/annotations_filtered/d_hNjBBdcyU_filtered.json b/annotations_filtered/d_hNjBBdcyU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b37e63c10a5e97de9c801142295fa86cdc88013b --- /dev/null +++ b/annotations_filtered/d_hNjBBdcyU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.31], [8.0, 11.13], [16.0, 16.83], [19.0, 19.43], [21.0, 22.27], [23.0, 25.2], [26.0, 27.28], [31.0, 31.67], [35.0, 35.55], [39.0, 38.91], [46.0, 46.7], [58.0, 59.68], [65.0, 65.92], [75.0, 75.05], [82.0, 82.49], [83.0, 87.39], [88.0, 101.43], [102.0, 103.1], [104.0, 104.14], [106.0, 106.14], [108.0, 110.1], [114.0, 115.77], [119.0, 119.7], [121.0, 128.53], [139.0, 141.88], [145.0, 151.12], [163.0, 172.44]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, true], "silence_prob": [37.8, 46.12, 0.0, 0.0, 0.0, 77.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.42, 43.69, 0.0, 0.0, 0.0, 51.99, 0.0, 0.0, 29.08, 42.33, 30.87, 30.09], "audiomae_on_audioset": [[["speech", 62.87], ["telephone bell ringing", 10.19], ["telephone", 6.65]], [["music", 24.1], ["didgeridoo", 11.61], ["speech", 7.21]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.5], ["singing bowl", 20.19], ["sonar", 5.09]], null, null, null, null, null, null, [["whack, thwack", 27.26], ["speech", 23.95], ["music", 9.25]], [["music", 24.51], ["rumble", 12.53], ["hum", 7.11]], [["music", 26.06], ["rumble", 25.78], ["mains hum", 21.92]], [["hum", 19.69], ["buzz", 18.71], ["mains hum", 10.86]]], "duration": [2.31, 3.13, 0.83, 0.43, 1.27, 2.2, 1.28, 0.67, 0.55, -0.09, 0.7, 1.68, 0.92, 0.05, 0.49, 4.39, 13.43, 1.1, 0.14, 0.14, 2.1, 1.77, 0.7, 7.53, 2.88, 6.12, 9.44]} \ No newline at end of file diff --git a/annotations_filtered/d_jEVMQc0ig_filtered.json b/annotations_filtered/d_jEVMQc0ig_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd577bc496aaff110e04e6b57de30113b7e431d9 --- /dev/null +++ b/annotations_filtered/d_jEVMQc0ig_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.2], [4.0, 4.6]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [1.2, 0.6]} \ No newline at end of file diff --git a/annotations_filtered/d_t77ai5GEk_filtered.json b/annotations_filtered/d_t77ai5GEk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..654cf1ded4ba9b3ac89aa6efa36d578ddba62210 --- /dev/null +++ b/annotations_filtered/d_t77ai5GEk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.48], [5.0, 17.19], [19.0, 21.39], [22.0, 22.94], [24.0, 24.73], [27.0, 27.53], [29.0, 30.82], [35.0, 40.78], [45.0, 49.77], [51.0, 52.81], [54.0, 55.8], [59.0, 59.24], [60.0, 62.4], [64.0, 64.74], [67.0, 68.57], [74.0, 74.87], [77.0, 97.51], [101.0, 128.6], [131.0, 130.94]], "keep_status": [false, true, false, false, false, false, false, true, true, false, false, false, false, false, false, false, true, false, false], "silence_prob": [32.0, 31.33, 34.09, 0.0, 0.0, 0.0, 0.0, 31.57, 37.74, 0.0, 0.0, 0.0, 38.6, 0.0, 0.0, 0.0, 32.13, 45.65, 0.0], "audiomae_on_audioset": [[["hum", 29.81], ["mains hum", 24.45], ["music", 18.23]], [["music", 38.83], ["hum", 10.84], ["ambient music", 8.34]], [["music", 47.33], ["didgeridoo", 26.09], ["guitar", 3.66]], null, null, null, null, [["music", 11.44], ["gong", 10.44], ["livestock, farm animals, working animals", 8.36]], [["music", 30.63], ["hum", 14.95], ["mains hum", 11.84]], null, null, null, [["music", 54.3], ["didgeridoo", 9.02], ["hum", 8.71]], null, null, null, [["music", 44.62], ["thunk", 7.77], ["speech", 7.62]], [["speech", 39.69], ["music", 24.23], ["hum", 11.37]], null], "duration": [2.48, 12.19, 2.39, 0.94, 0.73, 0.53, 1.82, 5.78, 4.77, 1.81, 1.8, 0.24, 2.4, 0.74, 1.57, 0.87, 20.51, 27.6, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/daUvbGlC3CY_filtered.json b/annotations_filtered/daUvbGlC3CY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f44c9b1574b3ebdba9bb203d534912a2ea66229f --- /dev/null +++ b/annotations_filtered/daUvbGlC3CY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.62], [5.0, 6.78], [9.0, 11.48], [13.0, 13.27], [14.0, 15.23], [16.0, 18.45], [19.0, 21.17], [23.0, 25.24], [27.0, 26.82], [27.0, 29.32], [30.0, 40.74], [41.0, 42.62], [45.0, 44.78], [45.0, 47.97], [49.0, 52.91], [54.0, 56.56], [58.0, 59.61], [61.0, 62.87], [64.0, 79.61], [80.0, 84.94], [86.0, 90.59], [91.0, 112.26], [113.0, 123.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [97.54, 0.0, 99.9, 0.0, 0.0, 99.82, 92.48, 99.97, 0.0, 65.2, 90.43, 0.0, 0.0, 100.0, 100.0, 100.0, 0.0, 0.0, 97.83, 100.0, 100.0, 99.99, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.62, 1.78, 2.48, 0.27, 1.23, 2.45, 2.17, 2.24, -0.18, 2.32, 10.74, 1.62, -0.22, 2.97, 3.91, 2.56, 1.61, 1.87, 15.61, 4.94, 4.59, 21.26, 10.3]} \ No newline at end of file diff --git a/annotations_filtered/daVOnsL2wkU_filtered.json b/annotations_filtered/daVOnsL2wkU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bafdcb773bd9398b9696945e6a7bd4f1bcee1777 --- /dev/null +++ b/annotations_filtered/daVOnsL2wkU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.23], [10.0, 10.69], [12.0, 12.12], [13.0, 14.44], [15.0, 26.59], [27.0, 29.22], [30.0, 31.11], [32.0, 34.47], [36.0, 38.15], [39.0, 42.15], [43.0, 46.04], [47.0, 49.37], [50.0, 52.03], [53.0, 54.46], [55.0, 56.86], [59.0, 77.67], [79.0, 85.18], [87.0, 89.65], [90.0, 94.37], [96.0, 99.47], [101.0, 123.38], [124.0, 125.29], [126.0, 129.44]], "keep_status": [true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [37.82, 0.0, 0.0, 0.0, 46.4, 53.84, 0.0, 61.97, 68.41, 53.04, 72.46, 70.44, 54.04, 0.0, 0.0, 40.48, 71.57, 63.96, 61.37, 59.42, 56.18, 0.0, 45.62], "audiomae_on_audioset": [[["fly, housefly", 28.21], ["sidetone", 15.96], ["insect", 14.24]], null, null, null, [["fly, housefly", 30.93], ["bee, wasp, etc.", 24.31], ["animal", 11.68]], null, null, null, null, null, null, null, null, null, null, [["speech", 25.1], ["radio", 17.86], ["hum", 10.28]], null, null, null, null, null, null, [["music", 52.51], ["musical instrument", 7.35], ["guitar", 6.08]]], "duration": [2.23, 0.69, 0.12, 1.44, 11.59, 2.22, 1.11, 2.47, 2.15, 3.15, 3.04, 2.37, 2.03, 1.46, 1.86, 18.67, 6.18, 2.65, 4.37, 3.47, 22.38, 1.29, 3.44]} \ No newline at end of file diff --git a/annotations_filtered/daoD1UtU5XI_filtered.json b/annotations_filtered/daoD1UtU5XI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e2c466578c4d2eab07afd05d26ff6e8739fbeefb --- /dev/null +++ b/annotations_filtered/daoD1UtU5XI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 18.13], [20.0, 21.74], [23.0, 25.49], [28.0, 28.59], [32.0, 33.13], [37.0, 37.27], [38.0, 37.98], [38.0, 40.04], [42.0, 43.41], [48.0, 49.23], [51.0, 51.8], [79.0, 79.2], [92.0, 92.2], [93.0, 93.7], [95.0, 95.28], [96.0, 96.77], [99.0, 99.15], [103.0, 104.48], [106.0, 106.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [89.72, 0.0, 99.78, 0.0, 0.0, 0.0, 0.0, 91.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [12.13, 1.74, 2.49, 0.59, 1.13, 0.27, -0.02, 2.04, 1.41, 1.23, 0.8, 0.2, 0.2, 0.7, 0.28, 0.77, 0.15, 1.48, 0.34]} \ No newline at end of file diff --git a/annotations_filtered/dapP5W153YE_filtered.json b/annotations_filtered/dapP5W153YE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..231d6b068247a45c1899830b0c043b9186c25d3f --- /dev/null +++ b/annotations_filtered/dapP5W153YE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 32.59], [37.0, 45.99], [48.0, 58.28], [59.0, 77.65], [79.0, 94.42], [97.0, 98.63], [100.0, 118.96], [121.0, 126.57], [127.0, 136.29], [139.0, 148.04], [150.0, 153.25], [155.0, 157.59], [159.0, 177.31], [180.0, 205.97], [208.0, 207.81], [209.0, 209.65]], "keep_status": [false, true, true, false, false, false, false, true, false, true, false, false, false, false, false, false], "silence_prob": [30.38, 30.75, 30.43, 30.47, 29.95, 0.0, 30.36, 30.28, 30.24, 30.52, 30.47, 31.05, 30.33, 30.12, 0.0, 0.0], "audiomae_on_audioset": [[["music", 63.1], ["speech", 8.81], ["throbbing", 5.54]], [["music", 38.89], ["hum", 18.22], ["throbbing", 11.78]], [["livestock, farm animals, working animals", 24.52], ["music", 22.15], ["cattle, bovinae", 20.11]], [["music", 37.81], ["hum", 24.28], ["throbbing", 10.07]], [["music", 67.24], ["speech", 12.29], ["synthesizer", 5.43]], null, [["music", 37.96], ["hum", 25.14], ["throbbing", 13.09]], [["music", 47.43], ["throbbing", 6.46], ["hum", 4.49]], [["music", 49.72], ["speech", 15.64], ["synthesizer", 10.57]], [["vehicle", 21.38], ["speech", 19.3], ["car", 17.06]], [["music", 75.76], ["electronic music", 2.79], ["hum", 1.98]], [["music", 54.06], ["throbbing", 13.44], ["hum", 12.13]], [["music", 71.5], ["speech", 9.38], ["synthesizer", 4.08]], [["throbbing", 34.24], ["hum", 28.8], ["music", 15.58]], null, null], "duration": [13.59, 8.99, 10.28, 18.65, 15.42, 1.63, 18.96, 5.57, 9.29, 9.04, 3.25, 2.59, 18.31, 25.97, -0.19, 0.65]} \ No newline at end of file diff --git a/annotations_filtered/darXVyyQUlc_filtered.json b/annotations_filtered/darXVyyQUlc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..63059fb843738853e23fba69255110c53e3e191b --- /dev/null +++ b/annotations_filtered/darXVyyQUlc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.98], [7.0, 7.86], [10.0, 11.13], [12.0, 84.15], [86.0, 88.25], [90.0, 96.33], [97.0, 101.24], [102.0, 108.9], [111.0, 126.4]], "keep_status": [true, false, false, false, true, false, false, false, false], "silence_prob": [45.33, 0.0, 0.0, 0.0, 38.0, 53.04, 59.68, 52.22, 53.72], "audiomae_on_audioset": [[["speech", 53.1], ["hum", 8.08], ["mains hum", 4.06]], null, null, null, [["whale vocalization", 31.77], ["speech", 15.29], ["hum", 10.66]], null, null, null, null], "duration": [2.98, 0.86, 1.13, 72.15, 2.25, 6.33, 4.24, 6.9, 15.4]} \ No newline at end of file diff --git a/annotations_filtered/dazYs4DgYtc_filtered.json b/annotations_filtered/dazYs4DgYtc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c469639ad3e365284f86c1e229d9460ed2bbbe68 --- /dev/null +++ b/annotations_filtered/dazYs4DgYtc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [13.0, 18.86], [21.0, 22.08]], "keep_status": [false, false, false], "silence_prob": [0.0, 29.26, 0.0], "audiomae_on_audioset": [null, [["speech", 78.88], ["hum", 4.69], ["thunk", 3.37]], null], "duration": [0.5, 5.86, 1.08]} \ No newline at end of file diff --git a/annotations_filtered/db1o8mTCBXU_filtered.json b/annotations_filtered/db1o8mTCBXU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e5e59f62aea65ca54ee6d77f893da2d7a8eaba3 --- /dev/null +++ b/annotations_filtered/db1o8mTCBXU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.66], [14.0, 17.14], [18.0, 19.18], [20.0, 22.65], [24.0, 27.58], [29.0, 40.78], [41.0, 41.13], [41.0, 41.2], [42.0, 50.33], [53.0, 52.95], [56.0, 61.7], [64.0, 64.96], [66.0, 67.04], [69.0, 71.52], [72.0, 73.99], [75.0, 78.27], [79.0, 79.76], [82.0, 83.3], [86.0, 87.49], [88.0, 90.31], [91.0, 91.64], [94.0, 95.62], [98.0, 99.1], [103.0, 102.64], [108.0, 108.26], [111.0, 112.36], [114.0, 115.32], [117.0, 116.95], [118.0, 120.73], [121.0, 126.39], [128.0, 128.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 73.51, 0.0, 82.25, 62.47, 50.36, 0.0, 0.0, 62.89, 0.0, 46.33, 0.0, 0.0, 48.91, 0.0, 62.47, 0.0, 0.0, 0.0, 70.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.31, 60.89, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 19.63], ["electric shaver, electric razor", 18.18], ["hum", 10.09]], null, null, [["speech", 33.63], ["music", 24.01], ["musical instrument", 8.19]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 22.31], ["throbbing", 9.39], ["musical instrument", 6.25]], null, null], "duration": [0.66, 3.14, 1.18, 2.65, 3.58, 11.78, 0.13, 0.2, 8.33, -0.05, 5.7, 0.96, 1.04, 2.52, 1.99, 3.27, 0.76, 1.3, 1.49, 2.31, 0.64, 1.62, 1.1, -0.36, 0.26, 1.36, 1.32, -0.05, 2.73, 5.39, 0.19]} \ No newline at end of file diff --git a/annotations_filtered/db50XeSEtv4_filtered.json b/annotations_filtered/db50XeSEtv4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9803fee7e696e002fe0d45c600aceec54179f225 --- /dev/null +++ b/annotations_filtered/db50XeSEtv4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 11.2], [12.0, 14.55], [16.0, 17.88], [19.0, 20.38], [23.0, 26.96], [28.0, 28.98], [31.0, 33.57], [37.0, 39.85], [40.0, 40.47], [41.0, 45.39], [48.0, 49.32], [51.0, 51.24], [51.0, 56.03], [57.0, 57.89], [58.0, 60.69], [61.0, 63.14], [64.0, 65.57], [67.0, 67.93], [68.0, 70.97], [73.0, 83.61], [85.0, 91.79], [94.0, 97.78], [98.0, 100.21], [101.0, 102.52], [105.0, 106.2], [106.0, 106.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, true, false, false, false], "silence_prob": [97.11, 100.0, 0.0, 0.0, 100.0, 0.0, 100.0, 99.91, 0.0, 82.43, 0.0, 0.0, 65.2, 0.0, 51.18, 73.06, 0.0, 0.0, 57.01, 45.24, 29.98, 56.25, 40.06, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 27.46], ["speech", 23.45], ["didgeridoo", 7.22]], [["speech", 23.67], ["explosion", 23.04], ["burst, pop", 7.14]], null, [["music", 57.42], ["speech", 6.5], ["singing bowl", 2.7]], null, null, null], "duration": [4.2, 2.55, 1.88, 1.38, 3.96, 0.98, 2.57, 2.85, 0.47, 4.39, 1.32, 0.24, 5.03, 0.89, 2.69, 2.14, 1.57, 0.93, 2.97, 10.61, 6.79, 3.78, 2.21, 1.52, 1.2, 0.39]} \ No newline at end of file diff --git a/annotations_filtered/dbE2-VU-4SM_filtered.json b/annotations_filtered/dbE2-VU-4SM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56627c95fdd8a5e91dfde8e504026f1959337cbb --- /dev/null +++ b/annotations_filtered/dbE2-VU-4SM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.66], [14.0, 14.47], [16.0, 15.96], [16.0, 17.32], [19.0, 19.04], [21.0, 21.51], [23.0, 23.06], [26.0, 27.13], [27.0, 28.44], [30.0, 30.64], [32.0, 33.25], [35.0, 34.89], [36.0, 39.6], [56.0, 56.29], [59.0, 60.07], [61.0, 61.57], [64.0, 64.13], [66.0, 66.72], [69.0, 69.31], [72.0, 72.13], [73.0, 74.09], [76.0, 76.33], [77.0, 77.5], [91.0, 93.14], [94.0, 94.51], [95.0, 97.24], [98.0, 98.39], [100.0, 104.89], [114.0, 115.47], [116.0, 116.48], [117.0, 119.35], [123.0, 124.19], [127.0, 127.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.93, 0.0, 68.54, 0.0, 41.93, 0.0, 0.0, 46.94, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 63.16], ["noise", 13.76], ["sidetone", 3.4]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["chirp tone", 67.6], ["sine wave", 20.8], ["tuning fork", 1.37]], null, null, [["noise", 13.72], ["hum", 10.04], ["tuning fork", 8.68]], null, null], "duration": [0.66, 0.47, -0.04, 1.32, 0.04, 0.51, 0.06, 1.13, 1.44, 0.64, 1.25, -0.11, 3.6, 0.29, 1.07, 0.57, 0.13, 0.72, 0.31, 0.13, 1.09, 0.33, 0.5, 2.14, 0.51, 2.24, 0.39, 4.89, 1.47, 0.48, 2.35, 1.19, 0.53]} \ No newline at end of file diff --git a/annotations_filtered/dbH4Amzn-Rk_filtered.json b/annotations_filtered/dbH4Amzn-Rk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d8e1759ceac0c1108fefbc6b0aea6ad8feb5e96 --- /dev/null +++ b/annotations_filtered/dbH4Amzn-Rk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.68], [7.0, 11.5], [13.0, 14.39], [15.0, 15.23], [16.0, 17.64], [21.0, 22.62], [26.0, 27.09], [29.0, 30.59], [32.0, 33.69], [35.0, 35.68], [42.0, 42.85], [47.0, 47.92], [54.0, 54.68], [58.0, 59.17], [60.0, 60.56], [62.0, 63.24], [65.0, 65.11], [73.0, 74.58], [76.0, 76.94], [78.0, 79.17], [80.0, 80.81], [84.0, 84.62], [85.0, 87.02], [88.0, 88.55], [89.0, 89.68], [95.0, 95.05], [96.0, 97.16], [99.0, 99.3], [103.0, 103.67], [108.0, 108.55], [110.0, 111.06], [115.0, 119.18], [120.0, 121.42], [124.0, 126.1], [127.0, 127.79], [129.0, 130.77]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 36.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.41, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.0, 0.0, 79.41, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 37.83], ["bouncing", 13.24], ["whack, thwack", 7.61]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 60.15], ["sidetone", 22.29], ["dial tone", 7.88]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.68, 4.5, 1.39, 0.23, 1.64, 1.62, 1.09, 1.59, 1.69, 0.68, 0.85, 0.92, 0.68, 1.17, 0.56, 1.24, 0.11, 1.58, 0.94, 1.17, 0.81, 0.62, 2.02, 0.55, 0.68, 0.05, 1.16, 0.3, 0.67, 0.55, 1.06, 4.18, 1.42, 2.1, 0.79, 1.77]} \ No newline at end of file diff --git a/annotations_filtered/dbX-ekoWGWE_filtered.json b/annotations_filtered/dbX-ekoWGWE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2d2bfebf10ace4a5ea304b067bb5ea577c030caa --- /dev/null +++ b/annotations_filtered/dbX-ekoWGWE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.81], [11.0, 11.65], [15.0, 17.0], [21.0, 22.5], [26.0, 27.92], [34.0, 34.59], [36.0, 36.44], [39.0, 40.34], [42.0, 43.16], [45.0, 45.89], [52.0, 54.85], [56.0, 56.59], [61.0, 62.4], [67.0, 68.1], [74.0, 74.04], [78.0, 79.74], [81.0, 82.56], [84.0, 85.4], [88.0, 88.13], [92.0, 96.08], [101.0, 102.0], [107.0, 107.84], [113.0, 113.71], [117.0, 118.99], [121.0, 122.17], [124.0, 124.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 53.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 49.39], ["speech", 13.22], ["musical instrument", 10.09]], null, null, null, null, null, null, null, null, [["music", 72.97], ["guitar", 7.76], ["musical instrument", 4.84]], null, null, null, null, null, null], "duration": [0.81, 0.65, 2.0, 1.5, 1.92, 0.59, 0.44, 1.34, 1.16, 0.89, 2.85, 0.59, 1.4, 1.1, 0.04, 1.74, 1.56, 1.4, 0.13, 4.08, 1.0, 0.84, 0.71, 1.99, 1.17, 0.85]} \ No newline at end of file diff --git a/annotations_filtered/dbgOACJpZg0_filtered.json b/annotations_filtered/dbgOACJpZg0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d41240ae605ffaf13b26d03b994199a515aa43cf --- /dev/null +++ b/annotations_filtered/dbgOACJpZg0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.13], [4.0, 4.65], [10.0, 15.35], [19.0, 54.06], [56.0, 60.84], [62.0, 62.26], [64.0, 64.67], [65.0, 66.29], [69.0, 70.23], [72.0, 79.3], [86.0, 86.86], [89.0, 93.11], [95.0, 95.3], [96.0, 97.43], [100.0, 102.2], [103.0, 103.84], [107.0, 108.09], [112.0, 113.34], [116.0, 117.54], [119.0, 119.3], [121.0, 121.54], [123.0, 124.11]], "keep_status": [false, false, true, false, true, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 37.71, 0.0, 39.3, 0.0, 0.0, 0.0, 0.0, 51.34, 0.0, 49.27, 0.0, 0.0, 42.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["fly, housefly", 24.1], ["hum", 19.11], ["insect", 12.12]], null, [["sidetone", 36.52], ["radio", 7.08], ["frog", 5.41]], null, null, null, null, null, null, [["frog", 42.16], ["hum", 18.31], ["throbbing", 5.16]], null, null, [["throbbing", 13.3], ["hum", 8.82], ["mosquito", 8.08]], null, null, null, null, null, null, null], "duration": [0.13, 0.65, 5.35, 35.06, 4.84, 0.26, 0.67, 1.29, 1.23, 7.3, 0.86, 4.11, 0.3, 1.43, 2.2, 0.84, 1.09, 1.34, 1.54, 0.3, 0.54, 1.11]} \ No newline at end of file diff --git a/annotations_filtered/dc8glsGbIus_filtered.json b/annotations_filtered/dc8glsGbIus_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0c7755a150c30e0f8a8a996ca1e2fd37ddf2f45f --- /dev/null +++ b/annotations_filtered/dc8glsGbIus_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.01], [6.0, 6.47], [7.0, 8.51], [9.0, 9.75], [11.0, 11.28], [13.0, 15.18], [18.0, 20.92], [25.0, 29.03], [33.0, 53.89], [54.0, 54.77], [55.0, 55.81], [56.0, 56.51], [58.0, 64.57], [65.0, 85.77], [87.0, 88.13], [89.0, 110.29], [114.0, 119.45], [120.0, 120.55], [124.0, 124.6], [126.0, 127.23], [130.0, 130.13], [131.0, 132.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, true, true, false, false, false, false, false], "silence_prob": [52.56, 0.0, 0.0, 0.0, 0.0, 59.07, 71.14, 53.65, 29.26, 0.0, 0.0, 0.0, 29.18, 30.81, 0.0, 30.32, 31.89, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 49.06], ["buzz", 24.06], ["cacophony", 6.51]], null, null, null, [["speech", 33.27], ["music", 21.47], ["explosion", 10.38]], [["cattle, bovinae", 19.01], ["explosion", 9.91], ["speech", 8.48]], null, [["music", 38.18], ["musical instrument", 3.74], ["explosion", 3.51]], [["music", 30.99], ["hum", 8.82], ["cacophony", 7.78]], null, null, null, null, null], "duration": [2.01, 0.47, 1.51, 0.75, 0.28, 2.18, 2.92, 4.03, 20.89, 0.77, 0.81, 0.51, 6.57, 20.77, 1.13, 21.29, 5.45, 0.55, 0.6, 1.23, 0.13, 1.12]} \ No newline at end of file diff --git a/annotations_filtered/dcCsAQTY9lQ_filtered.json b/annotations_filtered/dcCsAQTY9lQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de89f9faf7c3c6f07bf661705a2b9dc75c084d3d --- /dev/null +++ b/annotations_filtered/dcCsAQTY9lQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.26], [10.0, 10.79], [22.0, 21.83], [26.0, 27.82], [29.0, 29.29], [31.0, 38.26], [43.0, 43.21], [59.0, 67.91], [71.0, 71.2], [75.0, 78.73], [81.0, 83.17], [91.0, 95.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 29.78, 0.0, 29.22, 0.0, 29.06, 28.86, 29.04], "audiomae_on_audioset": [null, null, null, null, null, [["music", 45.69], ["crowd", 22.23], ["electronic music", 6.24]], null, [["music", 68.48], ["speech", 14.74], ["boing", 6.09]], null, [["music", 76.94], ["electronic music", 2.3], ["reggae", 1.37]], [["music", 85.04], ["speech", 1.93], ["boing", 0.95]], [["music", 82.81], ["middle eastern music", 1.79], ["singing", 1.7]]], "duration": [0.26, 0.79, -0.17, 1.82, 0.29, 7.26, 0.21, 8.91, 0.2, 3.73, 2.17, 4.05]} \ No newline at end of file diff --git a/annotations_filtered/dcSalZZ5YjM_filtered.json b/annotations_filtered/dcSalZZ5YjM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7cd220b99904ba195027a9f3c0f7ff6b438d2478 --- /dev/null +++ b/annotations_filtered/dcSalZZ5YjM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.11], [4.0, 12.29], [25.0, 28.22], [36.0, 46.92], [47.0, 54.7], [70.0, 71.86], [76.0, 76.65], [80.0, 81.4], [82.0, 82.68], [87.0, 87.49], [95.0, 95.22], [97.0, 97.87], [99.0, 101.66], [104.0, 108.36], [112.0, 113.8], [117.0, 118.29], [122.0, 136.93], [142.0, 145.05], [145.0, 148.8], [150.0, 150.5], [151.0, 151.6], [152.0, 153.66], [154.0, 162.06]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 32.61, 35.01, 37.41, 40.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.52, 34.57, 0.0, 0.0, 34.46, 32.2, 31.3, 0.0, 0.0, 0.0, 30.34], "audiomae_on_audioset": [null, [["music", 33.69], ["hum", 28.99], ["throbbing", 18.63]], [["music", 23.46], ["throbbing", 15.88], ["speech", 13.92]], [["music", 46.15], ["throbbing", 17.38], ["hum", 12.87]], [["music", 55.87], ["throbbing", 13.85], ["hum", 12.7]], null, null, null, null, null, null, null, [["music", 34.16], ["hum", 14.53], ["throbbing", 13.18]], [["music", 23.45], ["insect", 16.98], ["fly, housefly", 14.46]], null, null, [["hum", 46.38], ["mains hum", 17.48], ["throbbing", 12.32]], [["hum", 47.19], ["mains hum", 26.15], ["throbbing", 15.57]], [["music", 30.12], ["hum", 18.01], ["throbbing", 15.21]], null, null, null, [["throbbing", 30.15], ["music", 29.46], ["hum", 28.38]]], "duration": [0.11, 8.29, 3.22, 10.92, 7.7, 1.86, 0.65, 1.4, 0.68, 0.49, 0.22, 0.87, 2.66, 4.36, 1.8, 1.29, 14.93, 3.05, 3.8, 0.5, 0.6, 1.66, 8.06]} \ No newline at end of file diff --git a/annotations_filtered/dcmwPYCUysw_filtered.json b/annotations_filtered/dcmwPYCUysw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..75b9ae59fbe5846c9faeecaca6ae67a370bff7da --- /dev/null +++ b/annotations_filtered/dcmwPYCUysw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.88], [6.0, 6.13], [11.0, 13.85], [17.0, 61.6], [62.0, 71.31], [73.0, 73.65], [75.0, 75.81], [85.0, 86.17], [87.0, 87.57], [88.0, 88.84], [94.0, 95.34], [99.0, 100.4], [116.0, 116.87]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 33.48, 0.0, 29.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 75.93], ["vehicle", 4.51], ["rumble", 2.43]], null, [["hum", 20.05], ["mains hum", 15.37], ["noise", 14.24]], null, null, null, null, null, null, null, null], "duration": [0.88, 0.13, 2.85, 44.6, 9.31, 0.65, 0.81, 1.17, 0.57, 0.84, 1.34, 1.4, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/dcsByxGdYO0_filtered.json b/annotations_filtered/dcsByxGdYO0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..be8adb260eb6735407c27d5052437548b352c5f4 --- /dev/null +++ b/annotations_filtered/dcsByxGdYO0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.87], [11.0, 11.69], [19.0, 19.5], [21.0, 20.78], [33.0, 33.54], [35.0, 35.04], [42.0, 42.38], [50.0, 50.63], [54.0, 58.09], [59.0, 58.97], [59.0, 60.07], [62.0, 61.8], [68.0, 69.33], [69.0, 69.36], [69.0, 70.12], [74.0, 73.99], [77.0, 77.38], [90.0, 90.63], [96.0, 96.38], [100.0, 100.35], [103.0, 103.38], [104.0, 104.43], [105.0, 105.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.87, 0.69, 0.5, -0.22, 0.54, 0.04, 0.38, 0.63, 4.09, -0.03, 1.07, -0.2, 1.33, 0.36, 1.12, -0.01, 0.38, 0.63, 0.38, 0.35, 0.38, 0.43, 0.49]} \ No newline at end of file diff --git a/annotations_filtered/dcsVnpHXXX0_filtered.json b/annotations_filtered/dcsVnpHXXX0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f811ce513789603183563b2e4ec06b4f8f75d22f --- /dev/null +++ b/annotations_filtered/dcsVnpHXXX0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.16], [10.0, 16.33], [17.0, 18.27], [23.0, 23.06], [31.0, 31.77], [33.0, 33.81], [34.0, 35.26], [39.0, 40.09], [42.0, 44.66], [46.0, 51.85], [53.0, 71.14], [72.0, 74.31], [75.0, 78.16], [80.0, 86.14]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 31.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.93, 59.24, 31.75, 40.95, 53.34, 44.23], "audiomae_on_audioset": [null, [["speech", 25.51], ["music", 18.58], ["didgeridoo", 8.03]], null, null, null, null, null, null, null, null, [["music", 70.24], ["theremin", 7.0], ["musical instrument", 4.95]], [["speech", 36.38], ["music", 13.34], ["hum", 8.8]], null, [["music", 51.41], ["foghorn", 6.66], ["theremin", 5.47]]], "duration": [0.16, 6.33, 1.27, 0.06, 0.77, 0.81, 1.26, 1.09, 2.66, 5.85, 18.14, 2.31, 3.16, 6.14]} \ No newline at end of file diff --git a/annotations_filtered/ddGwvveSXxM_filtered.json b/annotations_filtered/ddGwvveSXxM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8f3299f6b33222f0aed2f867745dcbf5221d7414 --- /dev/null +++ b/annotations_filtered/ddGwvveSXxM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.22], [5.0, 14.07], [14.0, 32.32], [33.0, 88.05], [94.0, 95.25], [100.0, 109.05], [116.0, 119.3], [121.0, 123.43], [128.0, 128.93], [130.0, 131.19]], "keep_status": [false, false, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 60.7, 45.08, 0.0, 0.0, 29.93, 28.66, 56.63, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["noise", 47.23], ["speech", 15.67], ["chirp tone", 5.04]], null, null, [["speech", 43.05], ["music", 25.05], ["trombone", 8.37]], [["speech", 29.32], ["ship", 16.14], ["foghorn", 9.3]], null, null, null], "duration": [1.22, 9.07, 18.32, 55.05, 1.25, 9.05, 3.3, 2.43, 0.93, 1.19]} \ No newline at end of file diff --git a/annotations_filtered/ddQe0gG79zk_filtered.json b/annotations_filtered/ddQe0gG79zk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..977830a516156378e8b2db85dabea6b20b63b85b --- /dev/null +++ b/annotations_filtered/ddQe0gG79zk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[97.0, 100.97], [101.0, 102.22], [104.0, 132.07], [133.0, 138.94], [140.0, 150.25], [151.0, 158.97], [160.0, 170.43], [171.0, 171.75], [173.0, 174.88], [175.0, 176.35]], "keep_status": [false, false, false, false, false, false, true, false, false, false], "silence_prob": [99.87, 0.0, 99.98, 70.44, 96.54, 96.89, 29.96, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["tuning fork", 46.88], ["sine wave", 6.68], ["music", 4.89]], null, null, null], "duration": [3.97, 1.22, 28.07, 5.94, 10.25, 7.97, 10.43, 0.75, 1.88, 1.35]} \ No newline at end of file diff --git a/annotations_filtered/ddQniqjrVdo_filtered.json b/annotations_filtered/ddQniqjrVdo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c0accf12d7919de6390c5ec2fc58b12ae377d71d --- /dev/null +++ b/annotations_filtered/ddQniqjrVdo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 10.64], [14.0, 17.51], [21.0, 21.71], [27.0, 28.41], [29.0, 29.64], [30.0, 31.8], [38.0, 42.87], [48.0, 48.81]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 71.43, 0.0, 0.0, 0.0, 0.0, 46.9, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 69.11], ["speech", 9.19], ["throbbing", 1.28]], null], "duration": [-0.36, 3.51, 0.71, 1.41, 0.64, 1.8, 4.87, 0.81]} \ No newline at end of file diff --git a/annotations_filtered/ddXUQu9RC4U_filtered.json b/annotations_filtered/ddXUQu9RC4U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..005495c0685d3d4c1f667833023bd3d379e4e357 --- /dev/null +++ b/annotations_filtered/ddXUQu9RC4U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[67.0, 89.23], [90.0, 90.93], [91.0, 94.44]], "keep_status": [true, false, false], "silence_prob": [37.98, 0.0, 64.18], "audiomae_on_audioset": [[["music", 25.85], ["speech", 13.99], ["musical instrument", 6.99]], null, null], "duration": [22.23, 0.93, 3.44]} \ No newline at end of file diff --git a/annotations_filtered/dd_IWBNSKY0_filtered.json b/annotations_filtered/dd_IWBNSKY0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e237bf9adc29aec87ac6d64b692da1ebb3f0e3d --- /dev/null +++ b/annotations_filtered/dd_IWBNSKY0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.26], [9.0, 8.92], [13.0, 13.19], [14.0, 14.76], [15.0, 17.04], [32.0, 35.46], [37.0, 37.62], [42.0, 42.79], [46.0, 47.22], [54.0, 54.5], [56.0, 57.1], [59.0, 60.13], [66.0, 66.77], [70.0, 69.82], [71.0, 104.04], [118.0, 119.33], [120.0, 122.93], [123.0, 124.78], [125.0, 125.78], [131.0, 130.74], [133.0, 133.47], [139.0, 139.89], [141.0, 141.86], [147.0, 148.86], [150.0, 150.18], [151.0, 153.94], [155.0, 155.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 60.98, 90.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.51, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.26, -0.08, 0.19, 0.76, 2.04, 3.46, 0.62, 0.79, 1.22, 0.5, 1.1, 1.13, 0.77, -0.18, 33.04, 1.33, 2.93, 1.78, 0.78, -0.26, 0.47, 0.89, 0.86, 1.86, 0.18, 2.94, 0.51]} \ No newline at end of file diff --git a/annotations_filtered/de1vEYiEMro_filtered.json b/annotations_filtered/de1vEYiEMro_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d82beb217167a1ff9cf9835fcd4fef837a90d9a --- /dev/null +++ b/annotations_filtered/de1vEYiEMro_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 28.88], [30.0, 37.79], [40.0, 76.77], [78.0, 111.47], [113.0, 151.43]], "keep_status": [false, true, false, false, false], "silence_prob": [0.0, 41.46, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 28.84], ["didgeridoo", 25.1], ["music", 13.18]], null, null, null], "duration": [0.88, 7.79, 36.77, 33.47, 38.43]} \ No newline at end of file diff --git a/annotations_filtered/deUgUoJ4z5I_filtered.json b/annotations_filtered/deUgUoJ4z5I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e5612526f2d37aaec1351948b0da9c5f32d50ab --- /dev/null +++ b/annotations_filtered/deUgUoJ4z5I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 5.98], [8.0, 9.22], [13.0, 13.93], [14.0, 14.91], [17.0, 18.13], [21.0, 24.14], [25.0, 27.18], [35.0, 36.63], [38.0, 41.1], [44.0, 44.85], [49.0, 50.62], [52.0, 52.96], [56.0, 58.24], [70.0, 73.89], [76.0, 77.53], [85.0, 86.95], [88.0, 89.41], [91.0, 91.1], [91.0, 91.56], [98.0, 100.45], [102.0, 104.35], [105.0, 106.37], [110.0, 111.43], [112.0, 113.31], [116.0, 118.32], [155.0, 163.48], [164.0, 170.31], [171.0, 177.89], [179.0, 182.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.59, 0.0, 0.0, 0.0, 0.0, 59.42, 54.23, 0.0, 87.74, 0.0, 0.0, 0.0, 63.85, 95.51, 0.0, 0.0, 0.0, 0.0, 0.0, 64.07, 94.07, 0.0, 0.0, 0.0, 45.62, 30.73, 77.87, 89.72, 95.78], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 57.58], ["musical instrument", 7.73], ["brass instrument", 5.57]], [["music", 62.05], ["theremin", 22.21], ["synthesizer", 2.39]], null, null, null], "duration": [5.98, 1.22, 0.93, 0.91, 1.13, 3.14, 2.18, 1.63, 3.1, 0.85, 1.62, 0.96, 2.24, 3.89, 1.53, 1.95, 1.41, 0.1, 0.56, 2.45, 2.35, 1.37, 1.43, 1.31, 2.32, 8.48, 6.31, 6.89, 3.02]} \ No newline at end of file diff --git a/annotations_filtered/deUroRuOCwM_filtered.json b/annotations_filtered/deUroRuOCwM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42a8d484c2eb77545f5b43fad39f5b55e07a0093 --- /dev/null +++ b/annotations_filtered/deUroRuOCwM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.22], [22.0, 22.32], [24.0, 25.27], [27.0, 27.97], [29.0, 30.38], [33.0, 33.93], [35.0, 35.16], [35.0, 37.25], [38.0, 38.85], [40.0, 41.39], [42.0, 43.63], [45.0, 47.34], [48.0, 49.08], [53.0, 54.18], [61.0, 63.07], [64.0, 64.96], [67.0, 70.11], [71.0, 72.84], [74.0, 79.84], [81.0, 85.62], [87.0, 86.98], [95.0, 96.23], [114.0, 114.37], [115.0, 115.37], [123.0, 129.66], [134.0, 134.99], [135.0, 135.18], [136.0, 135.73], [136.0, 136.58], [142.0, 151.73], [152.0, 153.99], [155.0, 155.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.06, 0.0, 0.0, 0.0, 49.4, 0.0, 0.0, 99.99, 0.0, 100.0, 0.0, 67.13, 100.0, 0.0, 0.0, 0.0, 0.0, 30.2, 0.0, 0.0, 0.0, 0.0, 38.54, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 91.72], ["speech", 4.41], ["dial tone", 0.92]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 54.99], ["explosion", 6.49], ["screaming", 5.61]], null, null, null, null, [["fly, housefly", 23.38], ["mosquito", 11.07], ["insect", 9.56]], null, null], "duration": [0.22, 0.32, 1.27, 0.97, 1.38, 0.93, 0.16, 2.25, 0.85, 1.39, 1.63, 2.34, 1.08, 1.18, 2.07, 0.96, 3.11, 1.84, 5.84, 4.62, -0.02, 1.23, 0.37, 0.37, 6.66, 0.99, 0.18, -0.27, 0.58, 9.73, 1.99, 0.66]} \ No newline at end of file diff --git a/annotations_filtered/de_Dik7HT6E_filtered.json b/annotations_filtered/de_Dik7HT6E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..590544eb1139b70e6a56916534fd8f0b8f1ce76b --- /dev/null +++ b/annotations_filtered/de_Dik7HT6E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 17.27], [18.0, 21.37], [22.0, 32.05], [32.0, 33.1], [38.0, 39.99], [46.0, 47.93], [55.0, 55.46], [56.0, 56.74], [70.0, 69.96], [72.0, 72.17], [81.0, 81.55], [85.0, 85.56], [89.0, 89.5], [99.0, 99.69], [105.0, 108.72], [112.0, 116.6], [119.0, 124.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [87.74, 89.36, 41.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.77, 83.88, 45.33], "audiomae_on_audioset": [null, null, [["speech", 37.86], ["hum", 21.47], ["music", 11.57]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["noise", 28.02], ["mains hum", 26.63], ["hum", 7.19]]], "duration": [14.27, 3.37, 10.05, 1.1, 1.99, 1.93, 0.46, 0.74, -0.04, 0.17, 0.55, 0.56, 0.5, 0.69, 3.72, 4.6, 5.14]} \ No newline at end of file diff --git a/annotations_filtered/dejp7HK8Owc_filtered.json b/annotations_filtered/dejp7HK8Owc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..50151fab182cdf9f3caa72782fa85e3b46949091 --- /dev/null +++ b/annotations_filtered/dejp7HK8Owc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 109.8], [111.0, 124.95], [126.0, 129.27]], "keep_status": [false, false, false], "silence_prob": [0.0, 57.72, 57.89], "audiomae_on_audioset": [null, null, null], "duration": [105.8, 13.95, 3.27]} \ No newline at end of file diff --git a/annotations_filtered/delffcg5VZU_filtered.json b/annotations_filtered/delffcg5VZU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e816bdf7cdbcd6403932a9748eef80a1dfd17ec --- /dev/null +++ b/annotations_filtered/delffcg5VZU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 14.4], [20.0, 20.36], [21.0, 22.13], [29.0, 29.69], [32.0, 38.35], [42.0, 42.85], [48.0, 52.44], [54.0, 58.48], [63.0, 73.09], [75.0, 75.1], [78.0, 81.36], [84.0, 84.87], [89.0, 90.68], [93.0, 98.83], [100.0, 101.26], [104.0, 104.67], [108.0, 108.24], [114.0, 114.67], [115.0, 116.55], [119.0, 120.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [80.11, 0.0, 0.0, 0.0, 99.82, 0.0, 95.78, 93.29, 95.23, 0.0, 57.01, 0.0, 0.0, 80.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.4, 0.36, 1.13, 0.69, 6.35, 0.85, 4.44, 4.48, 10.09, 0.1, 3.36, 0.87, 1.68, 5.83, 1.26, 0.67, 0.24, 0.67, 1.55, 1.61]} \ No newline at end of file diff --git a/annotations_filtered/df-YzAnQJpU_filtered.json b/annotations_filtered/df-YzAnQJpU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f3ae411dea1a871c0652de5d9b6061c5c6adab6 --- /dev/null +++ b/annotations_filtered/df-YzAnQJpU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 64.69], [65.0, 65.23], [65.0, 103.17], [108.0, 107.94], [108.0, 109.59], [110.0, 153.0], [157.0, 160.27]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.19], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 58.16], ["quack", 13.02], ["musical instrument", 6.58]]], "duration": [39.69, 0.23, 38.17, -0.06, 1.59, 43.0, 3.27]} \ No newline at end of file diff --git a/annotations_filtered/df1mSOyvsXU_filtered.json b/annotations_filtered/df1mSOyvsXU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..81c48683604510c4cbcf7cf55d9113f015fec7ac --- /dev/null +++ b/annotations_filtered/df1mSOyvsXU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.79], [9.0, 10.59], [11.0, 13.07], [18.0, 21.2], [23.0, 29.88], [34.0, 36.36], [38.0, 39.34], [44.0, 44.74], [48.0, 48.68], [50.0, 52.32], [60.0, 60.72], [63.0, 65.47], [68.0, 71.69], [75.0, 96.52], [97.0, 100.47], [101.0, 111.6], [113.0, 130.4], [130.0, 130.6], [131.0, 130.82], [131.0, 130.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 99.87, 100.0, 100.0, 100.0, 0.0, 0.0, 0.0, 99.95, 0.0, 99.85, 100.0, 100.0, 100.0, 100.0, 100.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.79, 1.59, 2.07, 3.2, 6.88, 2.36, 1.34, 0.74, 0.68, 2.32, 0.72, 2.47, 3.69, 21.52, 3.47, 10.6, 17.4, 0.6, -0.18, -0.01]} \ No newline at end of file diff --git a/annotations_filtered/df2QdWqKC6Q_filtered.json b/annotations_filtered/df2QdWqKC6Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..accda8097195bc4378a268a526b6eb2c0bbf8827 --- /dev/null +++ b/annotations_filtered/df2QdWqKC6Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [27.0, 28.09], [32.0, 32.19], [36.0, 56.46], [58.0, 58.51], [61.0, 62.56], [63.0, 64.42], [68.0, 68.45], [91.0, 91.42], [132.0, 132.92], [134.0, 133.84], [147.0, 148.61], [150.0, 151.39], [168.0, 168.62], [170.0, 171.49], [172.0, 172.64], [173.0, 175.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.19], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 1.09, 0.19, 20.46, 0.51, 1.56, 1.42, 0.45, 0.42, 0.92, -0.16, 1.61, 1.39, 0.62, 1.49, 0.64, 2.2]} \ No newline at end of file diff --git a/annotations_filtered/dfFFgV624TA_filtered.json b/annotations_filtered/dfFFgV624TA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17c89d3df14dfb9ed783ea7bf6df81bea7af449c --- /dev/null +++ b/annotations_filtered/dfFFgV624TA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.05], [20.0, 20.51], [29.0, 29.59], [31.0, 31.92], [34.0, 43.04], [47.0, 47.98], [51.0, 53.7], [56.0, 59.19]], "keep_status": [false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 34.73, 0.0, 34.73, 40.92], "audiomae_on_audioset": [null, null, null, null, [["music", 59.75], ["musical instrument", 6.54], ["didgeridoo", 4.66]], null, [["music", 39.51], ["guitar", 11.47], ["musical instrument", 11.12]], [["music", 64.41], ["didgeridoo", 9.21], ["musical instrument", 7.6]]], "duration": [1.05, 0.51, 0.59, 0.92, 9.04, 0.98, 2.7, 3.19]} \ No newline at end of file diff --git a/annotations_filtered/dfLN2aPZ5sM_filtered.json b/annotations_filtered/dfLN2aPZ5sM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..389bb16fd52c4b9027a3667fd8ff9a2cea04957c --- /dev/null +++ b/annotations_filtered/dfLN2aPZ5sM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 34.08], [35.0, 96.25], [97.0, 97.12], [102.0, 104.09], [106.0, 107.67], [108.0, 111.96], [112.0, 117.58], [121.0, 121.42], [125.0, 130.47], [131.0, 131.53], [135.0, 135.55]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 41.03, 0.0, 65.55, 38.43, 0.0, 52.68, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 52.13], ["pulse", 17.9], ["synthesizer", 7.1]], null, null, [["music", 30.84], ["speech", 28.8], ["siren", 5.05]], null, null, null, null], "duration": [31.08, 61.25, 0.12, 2.09, 1.67, 3.96, 5.58, 0.42, 5.47, 0.53, 0.55]} \ No newline at end of file diff --git a/annotations_filtered/dfWdmxCHwfc_filtered.json b/annotations_filtered/dfWdmxCHwfc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ab265c9fce1bcb93130bd316308066c6f34e2d0 --- /dev/null +++ b/annotations_filtered/dfWdmxCHwfc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 28.58], [30.0, 31.63], [33.0, 35.14], [38.0, 38.42], [42.0, 56.24], [67.0, 69.92], [78.0, 89.87], [90.0, 89.9], [91.0, 91.64], [94.0, 98.32], [99.0, 106.35], [108.0, 109.49], [112.0, 114.37], [116.0, 117.64], [119.0, 121.78], [123.0, 128.09], [129.0, 130.08], [132.0, 132.33], [134.0, 133.84], [136.0, 136.66], [144.0, 145.05], [149.0, 166.46]], "keep_status": [false, false, true, false, true, true, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, true], "silence_prob": [29.78, 0.0, 39.8, 0.0, 35.61, 37.17, 29.93, 0.0, 0.0, 34.8, 41.42, 0.0, 49.22, 0.0, 46.83, 34.89, 0.0, 0.0, 0.0, 0.0, 0.0, 29.79], "audiomae_on_audioset": [[["speech", 41.2], ["music", 33.71], ["trombone", 4.23]], null, [["fly, housefly", 15.15], ["music", 14.32], ["bee, wasp, etc.", 7.4]], null, [["fly, housefly", 28.35], ["insect", 15.4], ["bee, wasp, etc.", 13.08]], [["music", 19.53], ["speech", 17.57], ["foghorn", 4.96]], [["moo", 41.15], ["cattle, bovinae", 35.48], ["livestock, farm animals, working animals", 14.11]], null, null, [["hum", 41.07], ["music", 19.97], ["mains hum", 19.94]], [["insect", 18.3], ["fly, housefly", 17.01], ["hum", 11.89]], null, [["music", 26.62], ["hum", 13.26], ["mains hum", 9.08]], null, [["mains hum", 54.5], ["hum", 36.08], ["livestock, farm animals, working animals", 2.23]], [["mains hum", 43.67], ["hum", 34.32], ["noise", 3.92]], null, null, null, null, null, [["speech", 34.75], ["music", 15.88], ["livestock, farm animals, working animals", 9.18]]], "duration": [24.58, 1.63, 2.14, 0.42, 14.24, 2.92, 11.87, -0.1, 0.64, 4.32, 7.35, 1.49, 2.37, 1.64, 2.78, 5.09, 1.08, 0.33, -0.16, 0.66, 1.05, 17.46]} \ No newline at end of file diff --git a/annotations_filtered/dfofju459FA_filtered.json b/annotations_filtered/dfofju459FA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..36eb8f7a79cf8f41888591423dd3b259e55c5ad7 --- /dev/null +++ b/annotations_filtered/dfofju459FA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.2], [40.0, 40.86], [61.0, 69.94], [70.0, 70.12], [76.0, 76.59], [80.0, 80.54], [82.0, 85.94], [89.0, 89.94], [98.0, 99.22], [101.0, 101.53], [104.0, 105.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 50.61, 0.0, 0.0, 0.0, 61.87, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [1.2, 0.86, 8.94, 0.12, 0.59, 0.54, 3.94, 0.94, 1.22, 0.53, 1.44]} \ No newline at end of file diff --git a/annotations_filtered/dfrJhivMJJY_filtered.json b/annotations_filtered/dfrJhivMJJY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb0bbb3e76c2a4bbfbde6cf46980ebca0b162937 --- /dev/null +++ b/annotations_filtered/dfrJhivMJJY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.89], [7.0, 7.7], [13.0, 14.07], [16.0, 17.73], [21.0, 22.79], [24.0, 24.7], [27.0, 27.33], [33.0, 33.29], [35.0, 34.96], [35.0, 37.56], [39.0, 38.75], [39.0, 40.81], [44.0, 45.32], [47.0, 48.0], [51.0, 52.83], [59.0, 59.73], [62.0, 62.99], [68.0, 71.39], [74.0, 75.29], [80.0, 83.44], [84.0, 88.64]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.03, 0.0, 63.64, 71.43], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 29.54], ["music", 7.82], ["throbbing", 4.52]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.89, 0.7, 1.07, 1.73, 1.79, 0.7, 0.33, 0.29, -0.04, 2.56, -0.25, 1.81, 1.32, 1.0, 1.83, 0.73, 0.99, 3.39, 1.29, 3.44, 4.64]} \ No newline at end of file diff --git a/annotations_filtered/dg6PaO0e6wA_filtered.json b/annotations_filtered/dg6PaO0e6wA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c64c59805437a4be6d8cf27396499beed359a49 --- /dev/null +++ b/annotations_filtered/dg6PaO0e6wA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 24.21], [24.0, 29.73], [31.0, 49.81], [52.0, 55.49], [58.0, 62.48], [63.0, 73.09], [75.0, 87.29], [92.0, 94.24], [96.0, 101.43], [103.0, 110.81], [112.0, 114.93], [116.0, 121.12], [122.0, 126.55], [127.0, 168.29], [169.0, 177.8], [179.0, 196.6]], "keep_status": [true, false, false, true, false, false, true, true, false, false, true, true, true, false, true, true], "silence_prob": [35.8, 35.83, 33.73, 33.41, 35.43, 36.52, 29.14, 29.81, 29.51, 29.95, 29.57, 29.61, 29.23, 0.0, 34.36, 36.79], "audiomae_on_audioset": [[["music", 45.07], ["synthesizer", 11.58], ["keyboard (musical)", 7.75]], [["music", 65.63], ["musical instrument", 13.56], ["keyboard (musical)", 3.79]], [["music", 51.9], ["keyboard (musical)", 9.82], ["electric piano", 9.05]], [["music", 50.86], ["synthesizer", 12.09], ["mains hum", 4.65]], [["music", 65.17], ["guitar", 6.61], ["musical instrument", 6.45]], [["music", 64.38], ["ambient music", 5.9], ["synthesizer", 4.18]], [["music", 59.93], ["breaking", 3.3], ["didgeridoo", 3.22]], [["music", 46.85], ["theremin", 9.09], ["electronic music", 4.03]], [["music", 57.21], ["throbbing", 8.54], ["mechanisms", 4.54]], [["music", 89.8], ["synthesizer", 1.39], ["electronic music", 1.17]], [["cattle, bovinae", 24.91], ["livestock, farm animals, working animals", 18.31], ["moo", 16.17]], [["music", 38.51], ["foghorn", 21.12], ["theremin", 4.37]], [["hum", 24.31], ["music", 23.36], ["mains hum", 21.8]], null, [["music", 47.32], ["speech", 16.49], ["singing bowl", 4.96]], [["music", 58.87], ["musical instrument", 5.57], ["synthesizer", 4.56]]], "duration": [18.21, 5.73, 18.81, 3.49, 4.48, 10.09, 12.29, 2.24, 5.43, 7.81, 2.93, 5.12, 4.55, 41.29, 8.8, 17.6]} \ No newline at end of file diff --git a/annotations_filtered/dgGvAQ3kcs4_filtered.json b/annotations_filtered/dgGvAQ3kcs4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..38f4c92ea194ee42dfb81e098aa49fcb928aa008 --- /dev/null +++ b/annotations_filtered/dgGvAQ3kcs4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.44], [4.0, 5.68], [12.0, 12.51], [13.0, 13.91], [16.0, 15.96], [20.0, 20.71], [26.0, 27.23], [31.0, 31.41], [32.0, 35.46], [36.0, 36.42], [39.0, 40.58], [41.0, 41.89], [44.0, 44.64], [47.0, 49.57], [51.0, 51.95], [58.0, 58.26], [61.0, 61.48], [67.0, 70.38], [72.0, 73.84], [76.0, 76.38], [77.0, 78.93], [81.0, 81.9], [85.0, 85.87], [87.0, 93.88], [94.0, 95.67], [96.0, 97.09], [97.0, 99.76], [101.0, 102.24], [105.0, 107.64], [109.0, 109.54], [110.0, 112.23], [116.0, 117.69], [123.0, 124.71], [126.0, 130.17], [131.0, 133.3], [134.0, 135.23], [137.0, 139.48], [142.0, 145.32], [147.0, 151.16], [153.0, 159.38], [162.0, 163.07], [164.0, 164.27], [165.0, 167.09], [168.0, 170.13], [171.0, 172.3], [173.0, 192.08], [197.0, 197.56], [200.0, 202.49], [203.0, 206.66], [209.0, 209.9], [214.0, 214.68], [215.0, 216.24], [219.0, 218.84], [220.0, 222.45], [225.0, 225.24], [226.0, 229.0], [230.0, 231.11], [231.0, 232.43], [233.0, 235.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, true, false, true, false, false, true, false, false, false, false, true, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.42, 0.0, 0.0, 0.0, 0.0, 36.68, 0.0, 0.0, 0.0, 39.67, 0.0, 0.0, 0.0, 0.0, 0.0, 35.27, 0.0, 0.0, 33.26, 0.0, 59.77, 0.0, 43.56, 0.0, 0.0, 50.46, 82.61, 0.0, 39.99, 53.53, 52.8, 38.93, 0.0, 0.0, 33.88, 34.93, 0.0, 37.2, 0.0, 43.53, 47.43, 0.0, 0.0, 0.0, 0.0, 40.4, 0.0, 34.18, 0.0, 0.0, 37.13], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["whoosh, swoosh, swish", 9.76], ["white noise", 7.46], ["radio", 6.6]], null, null, null, [["microwave oven", 8.17], ["whale vocalization", 6.26], ["noise", 5.22]], null, null, null, null, null, [["radio", 53.65], ["speech", 22.33], ["sidetone", 8.03]], null, null, [["frog", 27.84], ["sidetone", 24.13], ["croak", 14.86]], null, null, null, [["radio", 22.31], ["speech", 20.98], ["sidetone", 10.55]], null, null, null, null, null, [["sidetone", 35.21], ["radio", 11.87], ["buzz", 4.62]], null, null, [["animal", 55.48], ["domestic animals, pets", 12.06], ["dog", 6.03]], null, null, [["sidetone", 83.25], ["radio", 5.68], ["noise", 1.9]], [["sidetone", 28.56], ["noise", 13.31], ["radio", 12.52]], null, [["noise", 40.66], ["radio", 5.59], ["effects unit", 4.53]], null, [["sidetone", 76.51], ["hum", 7.6], ["mains hum", 6.22]], [["speech", 18.87], ["animal", 7.36], ["radio", 5.97]], null, null, null, null, [["dog", 12.9], ["animal", 6.96], ["domestic animals, pets", 6.27]], null, [["frog", 39.76], ["croak", 13.03], ["radio", 8.75]], null, null, [["noise", 31.05], ["speech", 14.45], ["radio", 10.0]]], "duration": [1.44, 1.68, 0.51, 0.91, -0.04, 0.71, 1.23, 0.41, 3.46, 0.42, 1.58, 0.89, 0.64, 2.57, 0.95, 0.26, 0.48, 3.38, 1.84, 0.38, 1.93, 0.9, 0.87, 6.88, 1.67, 1.09, 2.76, 1.24, 2.64, 0.54, 2.23, 1.69, 1.71, 4.17, 2.3, 1.23, 2.48, 3.32, 4.16, 6.38, 1.07, 0.27, 2.09, 2.13, 1.3, 19.08, 0.56, 2.49, 3.66, 0.9, 0.68, 1.24, -0.16, 2.45, 0.24, 3.0, 1.11, 1.43, 2.68]} \ No newline at end of file diff --git a/annotations_filtered/dgJKcCZkXxY_filtered.json b/annotations_filtered/dgJKcCZkXxY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d221f6d64353b7b6799910328bc309acd451be97 --- /dev/null +++ b/annotations_filtered/dgJKcCZkXxY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 9.63], [10.0, 18.47], [25.0, 25.41], [26.0, 28.21], [29.0, 32.32], [41.0, 41.79], [45.0, 49.98], [51.0, 56.94], [59.0, 59.8]], "keep_status": [false, false, false, false, true, false, true, true, false], "silence_prob": [29.41, 30.12, 0.0, 45.14, 32.44, 0.0, 29.72, 30.31, 0.0], "audiomae_on_audioset": [[["speech", 39.89], ["music", 23.99], ["mains hum", 10.12]], [["music", 50.98], ["hum", 13.76], ["mains hum", 8.85]], null, [["music", 52.17], ["didgeridoo", 20.91], ["throbbing", 4.28]], [["mosquito", 22.71], ["fly, housefly", 14.81], ["music", 12.41]], null, [["speech", 33.49], ["music", 16.22], ["hum", 14.34]], [["music", 46.23], ["mains hum", 12.32], ["hum", 10.36]], null], "duration": [6.63, 8.47, 0.41, 2.21, 3.32, 0.79, 4.98, 5.94, 0.8]} \ No newline at end of file diff --git a/annotations_filtered/dgM9V3lEZvE_filtered.json b/annotations_filtered/dgM9V3lEZvE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ced4b2eb9efc2018ad1ca2ff6822c557a75b900 --- /dev/null +++ b/annotations_filtered/dgM9V3lEZvE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.93], [11.0, 20.01], [22.0, 22.82], [24.0, 25.07], [26.0, 26.2], [28.0, 28.43], [32.0, 31.77], [32.0, 32.71], [33.0, 33.78], [36.0, 37.3], [41.0, 45.1], [48.0, 48.15], [50.0, 52.05], [53.0, 53.64], [59.0, 59.22], [60.0, 64.35], [66.0, 65.8], [67.0, 67.56], [69.0, 68.66], [70.0, 75.24], [77.0, 77.67], [79.0, 82.24], [85.0, 87.84], [89.0, 90.63], [91.0, 92.16], [107.0, 106.98], [112.0, 112.19], [114.0, 115.16], [117.0, 122.08], [122.0, 122.3], [122.0, 122.77], [134.0, 135.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false], "silence_prob": [76.53, 44.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.88, 0.0, 84.43, 0.0, 0.0, 67.76, 0.0, 0.0, 0.0, 72.46, 0.0, 52.27, 34.04, 0.0, 0.0, 0.0, 0.0, 0.0, 47.43, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 34.53], ["speech", 23.89], ["hum", 13.26]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 47.12], ["hum", 6.26], ["throbbing", 5.36]], null, null, null, null, null, [["speech", 49.91], ["busy signal", 4.75], ["radio", 4.69]], null, null, null], "duration": [2.93, 9.01, 0.82, 1.07, 0.2, 0.43, -0.23, 0.71, 0.78, 1.3, 4.1, 0.15, 2.05, 0.64, 0.22, 4.35, -0.2, 0.56, -0.34, 5.24, 0.67, 3.24, 2.84, 1.63, 1.16, -0.02, 0.19, 1.16, 5.08, 0.3, 0.77, 1.57]} \ No newline at end of file diff --git a/annotations_filtered/dgXARu_D5d8_filtered.json b/annotations_filtered/dgXARu_D5d8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b85327668ff6f65b067e70c665a92f7baeb0870 --- /dev/null +++ b/annotations_filtered/dgXARu_D5d8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.04], [15.0, 17.52], [21.0, 38.96], [40.0, 67.64], [68.0, 69.8], [71.0, 74.98], [76.0, 77.06], [78.0, 79.59], [86.0, 89.78], [93.0, 93.34], [96.0, 97.17], [101.0, 104.13], [106.0, 107.79], [110.0, 119.37], [121.0, 121.14], [123.0, 123.69], [129.0, 128.95], [130.0, 136.24], [138.0, 141.91], [146.0, 146.47], [148.0, 148.8], [151.0, 153.1], [155.0, 156.2], [158.0, 159.0]], "keep_status": [false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 38.98, 33.49, 35.52, 0.0, 34.3, 0.0, 0.0, 80.11, 0.0, 0.0, 87.55, 0.0, 72.46, 0.0, 0.0, 0.0, 57.72, 57.01, 0.0, 0.0, 90.25, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 78.71], ["whale vocalization", 1.97], ["electronic music", 1.53]], [["music", 47.49], ["speech", 9.84], ["hum", 6.96]], [["hum", 22.92], ["mains hum", 17.08], ["music", 16.28]], null, [["speech", 60.82], ["music", 8.36], ["explosion", 3.18]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.04, 2.52, 17.96, 27.64, 1.8, 3.98, 1.06, 1.59, 3.78, 0.34, 1.17, 3.13, 1.79, 9.37, 0.14, 0.69, -0.05, 6.24, 3.91, 0.47, 0.8, 2.1, 1.2, 1.0]} \ No newline at end of file diff --git a/annotations_filtered/dgdEr-mXQT4_filtered.json b/annotations_filtered/dgdEr-mXQT4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..084a2039bc9911eb0653d02b21b0cd023001eeef --- /dev/null +++ b/annotations_filtered/dgdEr-mXQT4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.72], [14.0, 14.4], [19.0, 19.68], [21.0, 20.98], [26.0, 26.45], [27.0, 27.7], [29.0, 28.88], [35.0, 35.5], [36.0, 36.86], [37.0, 37.93], [47.0, 47.07], [70.0, 71.42], [86.0, 86.86], [91.0, 91.37], [94.0, 94.54], [97.0, 97.5], [98.0, 98.58], [107.0, 107.28], [108.0, 108.57], [111.0, 111.37], [118.0, 117.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.72, 0.4, 0.68, -0.02, 0.45, 0.7, -0.12, 0.5, 0.86, 0.93, 0.07, 1.42, 0.86, 0.37, 0.54, 0.5, 0.58, 0.28, 0.57, 0.37, -0.14]} \ No newline at end of file diff --git a/annotations_filtered/dgoDvnebHRw_filtered.json b/annotations_filtered/dgoDvnebHRw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b2558ad85c542ca6e8843d7e1b8773595ecc55a4 --- /dev/null +++ b/annotations_filtered/dgoDvnebHRw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.44], [15.0, 16.82]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [1.44, 1.82]} \ No newline at end of file diff --git a/annotations_filtered/dhJPm7NolLc_filtered.json b/annotations_filtered/dhJPm7NolLc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3957b9541de7188e88a0d1ae220bd47937f3a515 --- /dev/null +++ b/annotations_filtered/dhJPm7NolLc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.11], [7.0, 10.72], [12.0, 12.7], [19.0, 19.16], [27.0, 33.22], [38.0, 37.99], [42.0, 43.01], [57.0, 56.96], [58.0, 59.02], [60.0, 60.52], [69.0, 71.59], [79.0, 80.54], [90.0, 90.46], [91.0, 93.31], [94.0, 103.25], [105.0, 104.95], [107.0, 107.33], [110.0, 113.02], [115.0, 116.8], [118.0, 118.57], [128.0, 128.48], [132.0, 132.48], [135.0, 138.82], [139.0, 146.79], [148.0, 147.92]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [48.1, 36.24, 0.0, 0.0, 48.95, 0.0, 0.0, 0.0, 0.0, 0.0, 79.76, 0.0, 0.0, 48.95, 39.11, 0.0, 0.0, 46.33, 0.0, 0.0, 0.0, 0.0, 44.55, 32.27, 0.0], "audiomae_on_audioset": [[["music", 24.02], ["hum", 6.76], ["throbbing", 6.45]], [["animal", 39.94], ["dog", 27.21], ["domestic animals, pets", 16.25]], null, null, [["sine wave", 67.1], ["chirp tone", 17.53], ["crying, sobbing", 1.65]], null, null, null, null, null, null, null, null, [["music", 40.45], ["speech", 39.0], ["didgeridoo", 2.25]], [["music", 74.84], ["speech", 13.65], ["didgeridoo", 1.71]], null, null, [["music", 58.62], ["speech", 21.49], ["sidetone", 3.82]], null, null, null, null, [["music", 78.19], ["didgeridoo", 4.62], ["musical instrument", 2.57]], [["music", 74.28], ["speech", 18.47], ["smash, crash", 0.73]], null], "duration": [2.11, 3.72, 0.7, 0.16, 6.22, -0.01, 1.01, -0.04, 1.02, 0.52, 2.59, 1.54, 0.46, 2.31, 9.25, -0.05, 0.33, 3.02, 1.8, 0.57, 0.48, 0.48, 3.82, 7.79, -0.08]} \ No newline at end of file diff --git a/annotations_filtered/dhPSvTyGSgs_filtered.json b/annotations_filtered/dhPSvTyGSgs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d35b3049eea8a557265a3a53360be697e5768f9f --- /dev/null +++ b/annotations_filtered/dhPSvTyGSgs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.03], [11.0, 11.62], [16.0, 19.36], [20.0, 21.69], [24.0, 23.9], [27.0, 39.14], [42.0, 46.89], [48.0, 48.86], [56.0, 56.2], [61.0, 60.94], [62.0, 63.53], [64.0, 65.52], [69.0, 69.43], [70.0, 70.75], [74.0, 73.9], [75.0, 77.28], [78.0, 97.16], [98.0, 109.27], [110.0, 115.11], [117.0, 119.04], [121.0, 121.41], [122.0, 126.08], [127.0, 131.18]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, true, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 70.44, 0.0, 0.0, 43.35, 77.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.29, 32.71, 31.58, 31.06, 35.54, 0.0, 45.82, 41.4], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 24.33], ["throbbing", 12.45], ["walk, footsteps", 9.92]], null, null, null, null, null, null, null, null, null, [["music", 52.73], ["mains hum", 4.37], ["hum", 3.91]], [["music", 48.26], ["musical instrument", 5.27], ["harp", 4.42]], [["music", 48.14], ["theremin", 33.22], ["synthesizer", 3.01]], [["theremin", 55.97], ["music", 34.47], ["musical instrument", 1.29]], [["music", 57.17], ["theremin", 4.78], ["didgeridoo", 3.83]], null, [["music", 57.98], ["ambient music", 6.76], ["throbbing", 5.44]], [["music", 30.5], ["speech", 28.86], ["hum", 7.6]]], "duration": [0.03, 0.62, 3.36, 1.69, -0.1, 12.14, 4.89, 0.86, 0.2, -0.06, 1.53, 1.52, 0.43, 0.75, -0.1, 2.28, 19.16, 11.27, 5.11, 2.04, 0.41, 4.08, 4.18]} \ No newline at end of file diff --git a/annotations_filtered/di3Xh95aXp8_filtered.json b/annotations_filtered/di3Xh95aXp8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aab3900408105fd9f65648d7b9b066c036e15274 --- /dev/null +++ b/annotations_filtered/di3Xh95aXp8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.17], [9.0, 9.96], [12.0, 12.92], [15.0, 16.65], [18.0, 19.21], [24.0, 25.25], [27.0, 29.12], [30.0, 33.47], [36.0, 37.47], [45.0, 45.76], [47.0, 47.73], [50.0, 51.31], [53.0, 52.96], [54.0, 54.62], [58.0, 59.93], [63.0, 63.34], [72.0, 72.77], [75.0, 76.47], [77.0, 78.75], [80.0, 81.55], [82.0, 83.88], [85.0, 86.21], [89.0, 90.05], [97.0, 98.42], [101.0, 101.46], [106.0, 106.71], [111.0, 111.52], [117.0, 117.17], [119.0, 120.11], [122.0, 127.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.13, 89.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.17, 0.96, 0.92, 1.65, 1.21, 1.25, 2.12, 3.47, 1.47, 0.76, 0.73, 1.31, -0.04, 0.62, 1.93, 0.34, 0.77, 1.47, 1.75, 1.55, 1.88, 1.21, 1.05, 1.42, 0.46, 0.71, 0.52, 0.17, 1.11, 5.97]} \ No newline at end of file diff --git a/annotations_filtered/diFDBNNmnnU_filtered.json b/annotations_filtered/diFDBNNmnnU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..55d08133f12c60ee00d77c58a62f8590971c2de6 --- /dev/null +++ b/annotations_filtered/diFDBNNmnnU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.21], [10.0, 11.58], [14.0, 15.38], [16.0, 16.87], [18.0, 18.27], [20.0, 20.39], [27.0, 30.47], [38.0, 37.84], [49.0, 49.22], [52.0, 52.69], [65.0, 65.31], [66.0, 66.92], [69.0, 71.98], [72.0, 78.41], [79.0, 86.32], [91.0, 91.17], [92.0, 98.32]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.84, 0.0, 0.0, 0.0, 0.0, 0.0, 37.15, 31.09, 29.14, 0.0, 29.2], "audiomae_on_audioset": [null, null, null, null, null, null, [["shofar", 33.42], ["wind instrument, woodwind instrument", 27.8], ["music", 7.33]], null, null, null, null, null, [["music", 34.28], ["synthesizer", 11.63], ["didgeridoo", 7.58]], [["music", 68.1], ["synthesizer", 12.12], ["musical instrument", 3.34]], [["music", 58.02], ["speech", 8.17], ["throbbing", 6.58]], null, [["vehicle", 38.51], ["car", 20.99], ["outside, urban or manmade", 6.66]]], "duration": [0.21, 1.58, 1.38, 0.87, 0.27, 0.39, 3.47, -0.16, 0.22, 0.69, 0.31, 0.92, 2.98, 6.41, 7.32, 0.17, 6.32]} \ No newline at end of file diff --git a/annotations_filtered/diLE4umndNM_filtered.json b/annotations_filtered/diLE4umndNM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..69f97a890942cc778e7606391528b18a08932070 --- /dev/null +++ b/annotations_filtered/diLE4umndNM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.31], [1.0, 98.73], [100.0, 111.11], [113.0, 120.45], [123.0, 156.88]], "keep_status": [false, false, true, false, false], "silence_prob": [0.0, 0.0, 30.91, 31.21, 0.0], "audiomae_on_audioset": [null, null, [["whale vocalization", 14.65], ["buzz", 10.35], ["music", 6.09]], [["speech", 67.87], ["explosion", 12.3], ["hubbub, speech noise, speech babble", 3.66]], null], "duration": [0.31, 97.73, 11.11, 7.45, 33.88]} \ No newline at end of file diff --git a/annotations_filtered/diNo0cO2Je0_filtered.json b/annotations_filtered/diNo0cO2Je0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ebd3d2946e9c90004ff014714247a31b15e6206f --- /dev/null +++ b/annotations_filtered/diNo0cO2Je0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 41.82], [45.0, 101.22], [103.0, 127.47], [128.0, 128.53], [129.0, 129.51], [134.0, 142.89], [145.0, 166.92], [169.0, 185.25], [188.0, 204.9], [206.0, 213.6]], "keep_status": [false, false, true, false, false, true, false, false, true, false], "silence_prob": [28.6, 0.0, 30.64, 0.0, 0.0, 29.77, 29.47, 28.75, 28.61, 28.18], "audiomae_on_audioset": [[["hum", 42.75], ["mains hum", 30.81], ["throbbing", 13.35]], null, [["music", 40.6], ["whack, thwack", 11.82], ["whip", 8.05]], null, null, [["music", 55.0], ["throbbing", 7.96], ["didgeridoo", 6.29]], [["music", 66.85], ["hum", 7.85], ["throbbing", 7.25]], [["music", 45.81], ["speech", 33.43], ["machine gun", 2.93]], [["cacophony", 26.45], ["mains hum", 21.55], ["hum", 20.61]], [["music", 66.75], ["buzz", 3.77], ["throbbing", 3.71]]], "duration": [21.82, 56.22, 24.47, 0.53, 0.51, 8.89, 21.92, 16.25, 16.9, 7.6]} \ No newline at end of file diff --git a/annotations_filtered/diX4myfR6vU_filtered.json b/annotations_filtered/diX4myfR6vU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c74418aa90cd5191f693b354e8fe0346220652ae --- /dev/null +++ b/annotations_filtered/diX4myfR6vU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.82], [13.0, 13.88], [16.0, 16.09], [17.0, 17.41], [18.0, 18.49], [21.0, 24.44], [32.0, 32.43], [34.0, 34.84], [37.0, 37.4], [53.0, 53.03], [57.0, 58.95], [59.0, 61.77], [63.0, 63.81], [66.0, 68.61], [70.0, 79.39], [82.0, 82.53], [83.0, 83.56], [96.0, 96.47], [99.0, 100.7], [102.0, 102.15], [104.0, 104.67], [108.0, 108.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 92.97, 0.0, 0.0, 0.0, 0.0, 0.0, 99.78, 0.0, 50.41, 84.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.82, 0.88, 0.09, 0.41, 0.49, 3.44, 0.43, 0.84, 0.4, 0.03, 1.95, 2.77, 0.81, 2.61, 9.39, 0.53, 0.56, 0.47, 1.7, 0.15, 0.67, 0.68]} \ No newline at end of file diff --git a/annotations_filtered/diteeSODzTQ_filtered.json b/annotations_filtered/diteeSODzTQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..138dec2abdb14810399592911117b19f931697ff --- /dev/null +++ b/annotations_filtered/diteeSODzTQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.73], [3.0, 6.86], [13.0, 13.88], [14.0, 15.69], [17.0, 17.68], [19.0, 19.79], [22.0, 28.02], [30.0, 33.72], [38.0, 52.74], [57.0, 58.33], [60.0, 61.86], [65.0, 71.96], [75.0, 88.38], [91.0, 92.03], [93.0, 96.18], [98.0, 99.27], [100.0, 100.21], [102.0, 103.28], [105.0, 112.62], [115.0, 114.64], [118.0, 119.18]], "keep_status": [false, false, false, false, false, false, true, true, true, false, false, true, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 89.01, 0.0, 0.0, 0.0, 0.0, 30.62, 30.01, 33.03, 0.0, 0.0, 33.4, 31.71, 0.0, 100.0, 0.0, 0.0, 0.0, 41.01, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 34.87], ["speech", 27.8], ["explosion", 3.84]], [["music", 43.42], ["speech", 16.18], ["electronic music", 3.29]], [["music", 45.31], ["didgeridoo", 6.44], ["speech", 5.96]], null, null, [["music", 21.75], ["hum", 13.96], ["breaking", 5.55]], [["music", 52.15], ["speech", 11.04], ["livestock, farm animals, working animals", 10.21]], null, null, null, null, null, [["noise", 28.81], ["speech", 18.6], ["animal", 9.44]], null, null], "duration": [0.73, 3.86, 0.88, 1.69, 0.68, 0.79, 6.02, 3.72, 14.74, 1.33, 1.86, 6.96, 13.38, 1.03, 3.18, 1.27, 0.21, 1.28, 7.62, -0.36, 1.18]} \ No newline at end of file diff --git a/annotations_filtered/dj0MEV7d1NE_filtered.json b/annotations_filtered/dj0MEV7d1NE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e3ff48419577ada6ba4e15f55e4de0f2cfb6490c --- /dev/null +++ b/annotations_filtered/dj0MEV7d1NE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 23.79], [25.0, 27.26], [29.0, 43.68], [49.0, 49.13], [53.0, 53.11], [60.0, 62.31], [68.0, 87.67], [94.0, 97.43]], "keep_status": [false, false, false, false, false, true, false, false], "silence_prob": [91.13, 77.36, 36.19, 0.0, 0.0, 42.35, 30.33, 50.97], "audiomae_on_audioset": [null, null, [["music", 71.72], ["hum", 5.12], ["mains hum", 2.77]], null, null, [["speech", 22.89], ["mains hum", 22.06], ["hum", 21.41]], [["hum", 43.02], ["music", 21.06], ["mains hum", 19.59]], null], "duration": [20.79, 2.26, 14.68, 0.13, 0.11, 2.31, 19.67, 3.43]} \ No newline at end of file diff --git a/annotations_filtered/dj5zbxA4bEI_filtered.json b/annotations_filtered/dj5zbxA4bEI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d4c1576366371e8e5489b3751d88f5a7a9dc195e --- /dev/null +++ b/annotations_filtered/dj5zbxA4bEI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.7], [4.0, 4.5], [7.0, 7.26], [7.0, 7.52], [13.0, 13.78], [18.0, 18.59], [22.0, 23.36], [36.0, 66.77], [73.0, 75.64], [78.0, 84.84], [89.0, 103.57], [111.0, 112.73], [115.0, 123.92]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.74, 43.15, 67.76, 0.0, 35.07], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 37.87], ["music", 21.28], ["buzz", 5.17]], null, null, [["speech", 55.56], ["groan", 10.87], ["outside, rural or natural", 4.08]]], "duration": [0.7, 0.5, 0.26, 0.52, 0.78, 0.59, 1.36, 30.77, 2.64, 6.84, 14.57, 1.73, 8.92]} \ No newline at end of file diff --git a/annotations_filtered/djIvmaYI9LQ_filtered.json b/annotations_filtered/djIvmaYI9LQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8a7f62cdb04fb681a47c6fa9dbbd79a5a137eed7 --- /dev/null +++ b/annotations_filtered/djIvmaYI9LQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.08], [5.0, 6.71], [9.0, 9.81], [16.0, 16.71], [20.0, 22.01], [27.0, 28.12], [30.0, 32.19], [34.0, 40.29], [44.0, 48.15], [51.0, 51.75], [52.0, 53.69], [57.0, 59.14], [61.0, 61.38], [63.0, 68.28], [78.0, 93.73], [94.0, 94.73], [96.0, 96.08], [98.0, 104.36]], "keep_status": [false, false, false, false, false, false, true, false, true, false, false, true, false, true, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 45.11, 0.0, 46.12, 34.29, 31.46, 0.0, 0.0, 39.49, 0.0, 35.05, 30.52, 0.0, 0.0, 36.22], "audiomae_on_audioset": [null, null, null, null, [["speech", 37.34], ["sidetone", 34.77], ["music", 2.97]], null, [["hum", 37.27], ["music", 8.36], ["throbbing", 6.42]], [["speech", 64.37], ["vehicle", 7.9], ["explosion", 5.39]], [["speech", 46.15], ["hum", 8.87], ["eruption", 4.67]], null, null, [["speech", 30.16], ["sidetone", 23.28], ["music", 12.36]], null, [["speech", 51.58], ["hum", 8.32], ["vehicle", 7.72]], [["speech", 23.36], ["music", 14.84], ["reverberation", 4.93]], null, null, [["speech", 22.92], ["hum", 15.66], ["mains hum", 13.95]]], "duration": [0.08, 1.71, 0.81, 0.71, 2.01, 1.12, 2.19, 6.29, 4.15, 0.75, 1.69, 2.14, 0.38, 5.28, 15.73, 0.73, 0.08, 6.36]} \ No newline at end of file diff --git a/annotations_filtered/djMYTM1p318_filtered.json b/annotations_filtered/djMYTM1p318_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..914afd578b782ec20faf844e3ebb9990130983eb --- /dev/null +++ b/annotations_filtered/djMYTM1p318_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.49], [11.0, 11.4], [12.0, 12.95], [14.0, 14.96], [16.0, 17.98], [22.0, 23.68], [27.0, 27.01], [28.0, 28.76], [30.0, 30.18], [32.0, 32.36], [34.0, 34.89], [36.0, 37.2], [39.0, 42.03], [45.0, 45.91], [47.0, 47.78], [66.0, 67.32], [68.0, 69.92], [73.0, 74.63], [75.0, 77.8], [80.0, 81.36], [91.0, 92.16], [94.0, 97.92], [106.0, 106.35], [106.0, 106.42], [106.0, 106.46], [107.0, 111.99], [113.0, 114.37], [116.0, 117.88], [119.0, 119.16], [122.0, 123.77], [125.0, 131.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.49, 0.4, 0.95, 0.96, 1.98, 1.68, 0.01, 0.76, 0.18, 0.36, 0.89, 1.2, 3.03, 0.91, 0.78, 1.32, 1.92, 1.63, 2.8, 1.36, 1.16, 3.92, 0.35, 0.42, 0.46, 4.99, 1.37, 1.88, 0.16, 1.77, 6.63]} \ No newline at end of file diff --git a/annotations_filtered/djPS3AC9DKk_filtered.json b/annotations_filtered/djPS3AC9DKk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d10d60d8d58227b3cee3998cc2c3268ccd634e47 --- /dev/null +++ b/annotations_filtered/djPS3AC9DKk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.29], [7.0, 7.57], [9.0, 9.96], [43.0, 44.02], [72.0, 75.22], [78.0, 84.27], [88.0, 88.42], [90.0, 90.69], [93.0, 92.72]], "keep_status": [false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 29.67, 35.08, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["applause", 19.54], ["clapping", 17.0], ["fart", 14.54]], [["moo", 30.56], ["cattle, bovinae", 29.93], ["livestock, farm animals, working animals", 13.62]], null, null, null], "duration": [1.29, 0.57, 0.96, 1.02, 3.22, 6.27, 0.42, 0.69, -0.28]} \ No newline at end of file diff --git a/annotations_filtered/djTx7slpfHI_filtered.json b/annotations_filtered/djTx7slpfHI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..390211033a78318cc055d46b2175cc039f4dd0db --- /dev/null +++ b/annotations_filtered/djTx7slpfHI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 43.04], [44.0, 90.36], [92.0, 102.59], [103.0, 103.28]], "keep_status": [false, false, true, false], "silence_prob": [0.0, 0.0, 32.31, 0.0], "audiomae_on_audioset": [null, null, [["whack, thwack", 34.53], ["music", 12.27], ["mechanisms", 7.07]], null], "duration": [42.04, 46.36, 10.59, 0.28]} \ No newline at end of file diff --git a/annotations_filtered/djUYiJu6K48_filtered.json b/annotations_filtered/djUYiJu6K48_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bc2d3f9db853d694efe7c342d3291ce116cf075a --- /dev/null +++ b/annotations_filtered/djUYiJu6K48_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.21], [13.0, 15.92], [20.0, 20.95], [21.0, 22.91], [27.0, 27.87], [32.0, 31.78], [33.0, 34.82], [39.0, 39.41], [70.0, 73.5], [78.0, 92.55], [93.0, 113.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 72.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.77, 33.77, 33.14], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["hum", 49.57], ["mains hum", 18.25], ["throbbing", 9.49]], [["speech", 29.09], ["buzz", 23.21], ["vehicle", 5.36]]], "duration": [0.21, 2.92, 0.95, 1.91, 0.87, -0.22, 1.82, 0.41, 3.5, 14.55, 20.12]} \ No newline at end of file diff --git a/annotations_filtered/djh21tkgGJ4_filtered.json b/annotations_filtered/djh21tkgGJ4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..76d604763bb6d8f1b2e174d12bce0cab7bdab283 --- /dev/null +++ b/annotations_filtered/djh21tkgGJ4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.43], [14.0, 15.08], [22.0, 22.65], [26.0, 27.16], [28.0, 35.55], [38.0, 37.76], [38.0, 39.55], [41.0, 40.91], [48.0, 52.59], [54.0, 54.46], [56.0, 57.01], [58.0, 58.02], [58.0, 59.66], [61.0, 61.28], [74.0, 81.57], [83.0, 83.88], [86.0, 89.45], [90.0, 90.32], [93.0, 96.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [88.64, 0.0, 0.0, 0.0, 95.51, 0.0, 0.0, 0.0, 99.56, 0.0, 0.0, 0.0, 0.0, 0.0, 98.01, 0.0, 85.35, 0.0, 91.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.43, 1.08, 0.65, 1.16, 7.55, -0.24, 1.55, -0.09, 4.59, 0.46, 1.01, 0.02, 1.66, 0.28, 7.57, 0.88, 3.45, 0.32, 3.18]} \ No newline at end of file diff --git a/annotations_filtered/djr5QNJG73k_filtered.json b/annotations_filtered/djr5QNJG73k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb139d2b1d1190ffbee730b10ca34e0370e81834 --- /dev/null +++ b/annotations_filtered/djr5QNJG73k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.81], [35.0, 35.6], [39.0, 39.19], [40.0, 40.37], [41.0, 41.15], [42.0, 42.45], [48.0, 48.15], [59.0, 60.56], [70.0, 70.01]], "keep_status": [true, false, false, false, false, false, false, false, false], "silence_prob": [32.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 15.39], ["music", 8.6], ["explosion", 1.97]], null, null, null, null, null, null, null, null], "duration": [2.81, 0.6, 0.19, 0.37, 0.15, 0.45, 0.15, 1.56, 0.01]} \ No newline at end of file diff --git a/annotations_filtered/djv5gGXEyXo_filtered.json b/annotations_filtered/djv5gGXEyXo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..64ae718c57e39a5d0c8248f3e844496bf7d80bbf --- /dev/null +++ b/annotations_filtered/djv5gGXEyXo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.44], [7.0, 6.96], [11.0, 12.65], [17.0, 17.2], [20.0, 21.07], [22.0, 24.14], [27.0, 28.49], [29.0, 36.86], [38.0, 43.16], [43.0, 45.94], [47.0, 60.99], [64.0, 84.45], [85.0, 87.1], [88.0, 94.64], [96.0, 103.08], [109.0, 109.38], [111.0, 112.73], [113.0, 112.95], [113.0, 141.94], [145.0, 146.4], [148.0, 149.15], [150.0, 151.12], [153.0, 154.95], [156.0, 156.3], [158.0, 158.36], [164.0, 164.25], [166.0, 167.16], [168.0, 175.85]], "keep_status": [false, false, false, false, false, true, false, true, true, true, true, true, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 46.33, 0.0, 41.85, 44.63, 44.46, 41.54, 44.04, 50.46, 41.2, 44.55, 0.0, 0.0, 0.0, 46.57, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.7], "audiomae_on_audioset": [null, null, null, null, null, [["sine wave", 23.12], ["sidetone", 16.11], ["chirp tone", 8.96]], null, [["hum", 31.04], ["speech", 12.05], ["rumble", 11.59]], [["hum", 21.88], ["speech", 11.37], ["rumble", 7.79]], [["speech", 46.94], ["rumble", 12.54], ["sidetone", 6.52]], [["speech", 25.32], ["sidetone", 22.22], ["hum", 18.55]], [["music", 46.63], ["hum", 13.47], ["mains hum", 5.92]], null, [["sidetone", 21.06], ["hum", 13.27], ["music", 11.29]], [["hum", 40.21], ["throbbing", 19.11], ["speech", 15.54]], null, null, null, [["hum", 23.31], ["sidetone", 23.13], ["radio", 9.05]], null, null, null, null, null, null, null, null, [["throbbing", 51.88], ["hum", 23.79], ["music", 13.71]]], "duration": [0.44, -0.04, 1.65, 0.2, 1.07, 2.14, 1.49, 7.86, 5.16, 2.94, 13.99, 20.45, 2.1, 6.64, 7.08, 0.38, 1.73, -0.05, 28.94, 1.4, 1.15, 1.12, 1.95, 0.3, 0.36, 0.25, 1.16, 7.85]} \ No newline at end of file diff --git a/annotations_filtered/dk3BfcWrx8c_filtered.json b/annotations_filtered/dk3BfcWrx8c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95bd280b9bc3bc678b7fcdbc923096331de63a16 --- /dev/null +++ b/annotations_filtered/dk3BfcWrx8c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 12.28], [12.0, 15.92], [17.0, 18.0], [19.0, 21.14], [24.0, 24.31], [26.0, 26.57], [28.0, 31.06], [34.0, 34.32], [35.0, 35.99], [38.0, 38.96], [42.0, 43.16], [44.0, 45.3], [47.0, 47.8], [52.0, 53.37], [56.0, 56.96], [58.0, 58.01], [58.0, 62.56], [63.0, 65.06], [66.0, 68.84], [70.0, 70.65], [72.0, 73.31], [76.0, 78.09], [79.0, 86.02], [88.0, 88.86], [90.0, 91.05], [93.0, 94.02], [95.0, 100.62], [101.0, 101.14], [102.0, 102.3], [104.0, 106.32], [114.0, 114.51], [118.0, 119.01]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [38.56, 35.26, 0.0, 59.86, 0.0, 0.0, 79.24, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.88, 99.98, 100.0, 0.0, 0.0, 84.43, 92.15, 0.0, 0.0, 0.0, 46.61, 0.0, 0.0, 87.37, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 78.88], ["fart", 2.11], ["livestock, farm animals, working animals", 1.68]], [["speech", 38.02], ["livestock, farm animals, working animals", 11.05], ["animal", 4.71]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["crow", 35.09], ["speech", 8.36], ["caw", 8.29]], null, null, null, null, null], "duration": [11.28, 3.92, 1.0, 2.14, 0.31, 0.57, 3.06, 0.32, 0.99, 0.96, 1.16, 1.3, 0.8, 1.37, 0.96, 0.01, 4.56, 2.06, 2.84, 0.65, 1.31, 2.09, 7.02, 0.86, 1.05, 1.02, 5.62, 0.14, 0.3, 2.32, 0.51, 1.01]} \ No newline at end of file diff --git a/annotations_filtered/dkAv65bo8a8_filtered.json b/annotations_filtered/dkAv65bo8a8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e58b75c16c39f7656119fba999026c350e5e7ecb --- /dev/null +++ b/annotations_filtered/dkAv65bo8a8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 18.25], [19.0, 21.49], [24.0, 24.88], [28.0, 28.75], [29.0, 30.84], [32.0, 33.25], [36.0, 37.71], [41.0, 41.49], [46.0, 46.06], [49.0, 50.06], [51.0, 52.41], [53.0, 53.97], [55.0, 55.85], [58.0, 59.97], [61.0, 61.16], [62.0, 64.47], [67.0, 68.42], [69.0, 70.29], [71.0, 71.39], [75.0, 75.44], [77.0, 77.9], [80.0, 80.76], [84.0, 88.05], [88.0, 91.52], [93.0, 96.03], [98.0, 100.18], [101.0, 103.0], [105.0, 107.5], [108.0, 112.67], [114.0, 115.79], [117.0, 118.96], [120.0, 123.58], [127.0, 127.67], [130.0, 132.14], [134.0, 136.09], [137.0, 137.27], [138.0, 139.99], [143.0, 144.36], [146.0, 149.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [51.44, 57.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.51, 77.03, 73.06, 91.3, 67.89, 56.48, 65.55, 0.0, 0.0, 49.68, 0.0, 57.48, 55.25, 0.0, 0.0, 0.0, 84.8], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 47.42], ["didgeridoo", 22.54], ["musical instrument", 2.65]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 48.86], ["musical instrument", 6.07], ["hum", 6.03]], null, null, null, null, null, null, null], "duration": [2.25, 2.49, 0.88, 0.75, 1.84, 1.25, 1.71, 0.49, 0.06, 1.06, 1.41, 0.97, 0.85, 1.97, 0.16, 2.47, 1.42, 1.29, 0.39, 0.44, 0.9, 0.76, 4.05, 3.52, 3.03, 2.18, 2.0, 2.5, 4.67, 1.79, 1.96, 3.58, 0.67, 2.14, 2.09, 0.27, 1.99, 1.36, 3.69]} \ No newline at end of file diff --git a/annotations_filtered/dkCUjz7I36M_filtered.json b/annotations_filtered/dkCUjz7I36M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/dkCUjz7I36M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/dkErNkX2HKM_filtered.json b/annotations_filtered/dkErNkX2HKM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..248fdef03a31f115d34c526e89328b1b6441bc4d --- /dev/null +++ b/annotations_filtered/dkErNkX2HKM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 22.2], [31.0, 38.87], [44.0, 44.52], [48.0, 50.75], [52.0, 51.85], [53.0, 53.57], [57.0, 60.91], [63.0, 80.49], [93.0, 93.63], [104.0, 104.3], [105.0, 119.57]], "keep_status": [true, true, false, true, false, false, true, true, false, false, false], "silence_prob": [31.43, 31.67, 0.0, 31.9, 0.0, 0.0, 31.29, 31.44, 0.0, 0.0, 32.92], "audiomae_on_audioset": [[["speech", 27.98], ["hum", 15.78], ["vehicle", 11.57]], [["music", 20.42], ["didgeridoo", 15.14], ["speech", 11.45]], null, [["music", 30.47], ["speech", 19.62], ["hum", 15.46]], null, null, [["vehicle", 21.62], ["speech", 11.91], ["motorcycle", 6.72]], [["speech", 42.72], ["vehicle", 10.8], ["car", 6.29]], null, null, [["speech", 69.13], ["music", 7.0], ["vehicle", 4.61]]], "duration": [12.2, 7.87, 0.52, 2.75, -0.15, 0.57, 3.91, 17.49, 0.63, 0.3, 14.57]} \ No newline at end of file diff --git a/annotations_filtered/dkcsqI6hZz8_filtered.json b/annotations_filtered/dkcsqI6hZz8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..846aeb4c9a345e4c30dd2538e8fa1c3be0aebe90 --- /dev/null +++ b/annotations_filtered/dkcsqI6hZz8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.31], [3.0, 4.29], [5.0, 6.78], [7.0, 8.24], [9.0, 11.5], [12.0, 13.04], [14.0, 15.23], [16.0, 18.08], [20.0, 21.69], [22.0, 22.92], [24.0, 25.1], [28.0, 29.05], [29.0, 35.83], [37.0, 37.52], [41.0, 41.42], [44.0, 46.6], [51.0, 51.71], [57.0, 57.23], [59.0, 63.59], [65.0, 65.21], [67.0, 67.05], [72.0, 73.25], [75.0, 77.57], [78.0, 78.46], [79.0, 81.23], [83.0, 83.79], [84.0, 86.14], [88.0, 88.25], [90.0, 91.88], [93.0, 94.8], [97.0, 113.02], [113.0, 117.17], [119.0, 119.21], [128.0, 128.34], [130.0, 130.55], [134.0, 134.54], [136.0, 137.0], [139.0, 148.81], [151.0, 154.2], [154.0, 163.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 78.89, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 95.91, 0.0, 66.63, 0.0, 92.48, 0.0, 0.0, 0.0, 69.88, 45.82, 0.0, 0.0, 0.0, 0.0, 0.0, 42.0, 43.08, 42.55], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 38.93], ["didgeridoo", 20.63], ["foghorn", 5.93]], null, null, null, null, null, [["animal", 16.11], ["goose", 15.65], ["honk", 13.93]], [["music", 59.58], ["effects unit", 6.29], ["musical instrument", 5.17]], [["music", 20.01], ["foghorn", 13.04], ["livestock, farm animals, working animals", 12.97]]], "duration": [0.31, 1.29, 1.78, 1.24, 2.5, 1.04, 1.23, 2.08, 1.69, 0.92, 1.1, 1.05, 6.83, 0.52, 0.42, 2.6, 0.71, 0.23, 4.59, 0.21, 0.05, 1.25, 2.57, 0.46, 2.23, 0.79, 2.14, 0.25, 1.88, 1.8, 16.02, 4.17, 0.21, 0.34, 0.55, 0.54, 1.0, 9.81, 3.2, 9.41]} \ No newline at end of file diff --git a/annotations_filtered/dkdrbg4EwGA_filtered.json b/annotations_filtered/dkdrbg4EwGA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..655442a7938b3554fb70bb752c2c61eb1552382a --- /dev/null +++ b/annotations_filtered/dkdrbg4EwGA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.21], [19.0, 35.99], [39.0, 42.8], [43.0, 68.99], [71.0, 79.51], [85.0, 89.83], [96.0, 100.41], [101.0, 102.46], [106.0, 119.72]], "keep_status": [false, true, false, false, true, true, true, false, true], "silence_prob": [33.5, 33.74, 39.96, 35.72, 33.57, 34.44, 31.97, 0.0, 31.78], "audiomae_on_audioset": [[["music", 65.53], ["synthesizer", 5.38], ["musical instrument", 4.03]], [["music", 33.65], ["didgeridoo", 11.88], ["throbbing", 9.29]], [["music", 68.28], ["synthesizer", 9.18], ["throbbing", 6.09]], [["music", 70.48], ["throbbing", 11.2], ["hum", 5.85]], [["music", 59.21], ["boing", 5.87], ["whack, thwack", 3.9]], [["music", 49.46], ["synthesizer", 6.47], ["throbbing", 5.39]], [["music", 51.21], ["brass instrument", 8.36], ["synthesizer", 7.86]], null, [["music", 24.89], ["hum", 22.68], ["mains hum", 14.31]]], "duration": [2.21, 16.99, 3.8, 25.99, 8.51, 4.83, 4.41, 1.46, 13.72]} \ No newline at end of file diff --git a/annotations_filtered/dkjBBdHZNUs_filtered.json b/annotations_filtered/dkjBBdHZNUs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2470e5b53de23f2591fa6faaa7012578bd02760d --- /dev/null +++ b/annotations_filtered/dkjBBdHZNUs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 33.24], [34.0, 35.46], [40.0, 40.74], [44.0, 46.21], [69.0, 69.23], [70.0, 70.01], [70.0, 73.11], [81.0, 83.88]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 56.78, 0.0, 0.0, 46.72, 68.54], "audiomae_on_audioset": [null, null, null, null, null, null, [["theremin", 38.32], ["wind instrument, woodwind instrument", 29.04], ["music", 9.26]], null], "duration": [1.24, 1.46, 0.74, 2.21, 0.23, 0.01, 3.11, 2.88]} \ No newline at end of file diff --git a/annotations_filtered/dl1X9j-9Lbg_filtered.json b/annotations_filtered/dl1X9j-9Lbg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad5fde2279de67afba9a8aae12e47c5a97239792 --- /dev/null +++ b/annotations_filtered/dl1X9j-9Lbg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.81], [8.0, 15.16], [19.0, 19.85], [22.0, 22.45], [23.0, 24.26], [27.0, 47.02], [48.0, 49.15], [52.0, 52.37], [53.0, 54.03], [56.0, 57.06], [58.0, 58.45], [64.0, 64.52], [67.0, 67.69], [69.0, 70.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 40.45, 0.0, 0.0, 0.0, 45.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 64.91], ["music", 24.03], ["synthesizer", 1.53]], null, null, null, [["music", 63.48], ["speech", 17.61], ["didgeridoo", 4.85]], null, null, null, null, null, null, null, null], "duration": [0.81, 7.16, 0.85, 0.45, 1.26, 20.02, 1.15, 0.37, 1.03, 1.06, 0.45, 0.52, 0.69, 1.06]} \ No newline at end of file diff --git a/annotations_filtered/dl2NG3vkMTk_filtered.json b/annotations_filtered/dl2NG3vkMTk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..10aed6d609ee126513dab5afc1da689288b7af06 --- /dev/null +++ b/annotations_filtered/dl2NG3vkMTk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.73], [4.0, 5.75], [11.0, 11.99], [14.0, 14.69], [16.0, 17.98], [20.0, 23.14], [24.0, 28.51], [30.0, 30.25], [32.0, 34.25], [35.0, 36.21], [37.0, 38.11]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 85.35, 41.81, 0.0, 52.62, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["whale vocalization", 35.35], ["mains hum", 19.07], ["speech", 9.98]], null, null, null, null], "duration": [0.73, 1.75, 0.99, 0.69, 1.98, 3.14, 4.51, 0.25, 2.25, 1.21, 1.11]} \ No newline at end of file diff --git a/annotations_filtered/dlYo5IHqD80_filtered.json b/annotations_filtered/dlYo5IHqD80_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1de81688320939522b1b43930d3c1d80b22b06f8 --- /dev/null +++ b/annotations_filtered/dlYo5IHqD80_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 11.94], [15.0, 18.5], [21.0, 26.86], [31.0, 34.28], [39.0, 108.45]], "keep_status": [false, true, true, true, false], "silence_prob": [53.22, 42.96, 45.3, 47.82, 0.0], "audiomae_on_audioset": [null, [["music", 31.99], ["singing bowl", 9.04], ["gong", 8.61]], [["music", 51.01], ["theremin", 8.72], ["hum", 5.37]], [["music", 40.52], ["mantra", 16.26], ["didgeridoo", 6.39]], null], "duration": [9.94, 3.5, 5.86, 3.28, 69.45]} \ No newline at end of file diff --git a/annotations_filtered/dm3xv5sosng_filtered.json b/annotations_filtered/dm3xv5sosng_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da9c8c629185c1d38affc88a704df4aa24e0b89b --- /dev/null +++ b/annotations_filtered/dm3xv5sosng_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.24], [26.0, 38.45], [39.0, 40.37], [42.0, 42.6], [43.0, 47.29], [47.0, 49.54], [74.0, 73.99], [75.0, 76.69]], "keep_status": [false, true, false, false, false, true, false, false], "silence_prob": [0.0, 35.87, 0.0, 0.0, 34.9, 39.02, 0.0, 0.0], "audiomae_on_audioset": [null, [["sidetone", 21.34], ["fly, housefly", 18.86], ["speech", 17.48]], null, null, [["speech", 70.01], ["music", 7.9], ["outside, urban or manmade", 1.45]], [["speech", 36.94], ["music", 20.29], ["sidetone", 10.54]], null, null], "duration": [0.24, 12.45, 1.37, 0.6, 4.29, 2.54, -0.01, 1.69]} \ No newline at end of file diff --git a/annotations_filtered/dm61r3qnPKQ_filtered.json b/annotations_filtered/dm61r3qnPKQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b130291ab2b3491dd9ce87ed554601329020787 --- /dev/null +++ b/annotations_filtered/dm61r3qnPKQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.29], [7.0, 8.31], [13.0, 13.64], [16.0, 18.15], [20.0, 20.7], [22.0, 26.15], [27.0, 27.55], [28.0, 28.73], [31.0, 31.43], [32.0, 33.45], [35.0, 36.12], [39.0, 39.9], [41.0, 42.3], [44.0, 45.01], [46.0, 60.29], [64.0, 64.77], [66.0, 67.93], [71.0, 72.33], [73.0, 80.49], [108.0, 108.21], [109.0, 113.09], [116.0, 116.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 63.74, 0.0, 84.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.47, 0.0, 0.0, 0.0, 32.93, 0.0, 36.47, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 54.27], ["theremin", 9.0], ["synthesizer", 7.04]], null, null, null, [["music", 65.07], ["musical instrument", 5.41], ["didgeridoo", 3.48]], null, [["music", 50.31], ["theremin", 17.56], ["synthesizer", 6.52]], null], "duration": [1.29, 1.31, 0.64, 2.15, 0.7, 4.15, 0.55, 0.73, 0.43, 1.45, 1.12, 0.9, 1.3, 1.01, 14.29, 0.77, 1.93, 1.33, 7.49, 0.21, 4.09, 0.16]} \ No newline at end of file diff --git a/annotations_filtered/dmASD5tRwV4_filtered.json b/annotations_filtered/dmASD5tRwV4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f584b9f4ca3f00d21cae564340aa049cb625cc7 --- /dev/null +++ b/annotations_filtered/dmASD5tRwV4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 10.35], [11.0, 21.44], [23.0, 23.6], [24.0, 27.04], [28.0, 29.13], [30.0, 30.77], [33.0, 49.2], [51.0, 57.99], [59.0, 61.15], [66.0, 66.63], [68.0, 69.62], [71.0, 75.54], [77.0, 77.35], [79.0, 118.25], [118.0, 118.3], [118.0, 118.44], [118.0, 164.94]], "keep_status": [false, true, false, false, false, false, true, true, false, false, false, true, false, false, false, false, false], "silence_prob": [29.48, 30.14, 0.0, 39.17, 0.0, 0.0, 33.64, 33.48, 32.91, 0.0, 0.0, 31.8, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["whale vocalization", 47.23], ["music", 22.59], ["rumble", 6.55]], [["speech", 51.45], ["rumble", 12.66], ["hum", 5.12]], null, [["speech", 61.85], ["whale vocalization", 11.68], ["sidetone", 7.99]], null, null, [["whale vocalization", 30.65], ["insect", 13.97], ["fly, housefly", 13.29]], [["whale vocalization", 23.54], ["rumble", 21.51], ["hum", 14.53]], [["music", 63.03], ["hum", 6.07], ["electronic music", 1.93]], null, null, [["rumble", 19.71], ["hum", 19.53], ["music", 9.79]], null, null, null, null, null], "duration": [9.35, 10.44, 0.6, 3.04, 1.13, 0.77, 16.2, 6.99, 2.15, 0.63, 1.62, 4.54, 0.35, 39.25, 0.3, 0.44, 46.94]} \ No newline at end of file diff --git a/annotations_filtered/dmL4e3jljy4_filtered.json b/annotations_filtered/dmL4e3jljy4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56b6c4af6b6d2131091d7152a6b19d988226eb14 --- /dev/null +++ b/annotations_filtered/dmL4e3jljy4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[44.0, 103.38], [104.0, 104.57], [108.0, 113.17], [117.0, 118.35], [121.0, 126.69], [129.0, 129.83]], "keep_status": [false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 41.42, 0.0, 99.91, 0.0], "audiomae_on_audioset": [null, null, [["speech", 45.64], ["animal", 9.17], ["boing", 6.68]], null, null, null], "duration": [59.38, 0.57, 5.17, 1.35, 5.69, 0.83]} \ No newline at end of file diff --git a/annotations_filtered/dmqo-EuR8Cw_filtered.json b/annotations_filtered/dmqo-EuR8Cw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c03b5ac9856b9238a948c7580869273018b36e33 --- /dev/null +++ b/annotations_filtered/dmqo-EuR8Cw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.1], [9.0, 12.65], [13.0, 15.35], [17.0, 19.35], [27.0, 35.5], [36.0, 38.15], [39.0, 40.96], [42.0, 42.31], [42.0, 42.5], [44.0, 44.12], [45.0, 48.42], [49.0, 51.41], [59.0, 59.09], [61.0, 62.5], [69.0, 73.08], [75.0, 82.49], [85.0, 86.8], [89.0, 104.72], [109.0, 109.12]], "keep_status": [false, true, false, true, true, true, false, false, false, false, false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 29.74, 33.24, 32.55, 29.72, 29.59, 0.0, 0.0, 0.0, 0.0, 30.78, 31.56, 0.0, 0.0, 33.4, 30.45, 0.0, 29.9, 0.0], "audiomae_on_audioset": [null, [["music", 46.04], ["hum", 6.83], ["noise", 6.36]], [["music", 31.21], ["throbbing", 22.13], ["hum", 22.01]], [["speech", 32.95], ["music", 18.82], ["croak", 8.14]], [["music", 48.18], ["groan", 7.77], ["throbbing", 5.66]], [["music", 47.24], ["tabla", 9.1], ["musical instrument", 6.21]], null, null, null, null, [["boing", 55.34], ["music", 14.54], ["speech", 5.48]], [["music", 28.93], ["crowd", 7.46], ["speech", 6.94]], null, null, [["music", 42.26], ["livestock, farm animals, working animals", 15.52], ["cattle, bovinae", 5.23]], [["music", 49.94], ["throbbing", 17.3], ["cacophony", 6.07]], null, [["music", 52.71], ["whack, thwack", 18.09], ["smash, crash", 6.57]], null], "duration": [0.1, 3.65, 2.35, 2.35, 8.5, 2.15, 1.96, 0.31, 0.5, 0.12, 3.42, 2.41, 0.09, 1.5, 4.08, 7.49, 1.8, 15.72, 0.12]} \ No newline at end of file diff --git a/annotations_filtered/dmy8Lcf_TiE_filtered.json b/annotations_filtered/dmy8Lcf_TiE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..94fc5fb8186489c5048c3881b2ed28207698fa19 --- /dev/null +++ b/annotations_filtered/dmy8Lcf_TiE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.94], [10.0, 10.0], [11.0, 11.69], [14.0, 15.11], [15.0, 15.3], [15.0, 15.33], [16.0, 16.5], [17.0, 16.68], [17.0, 17.91], [19.0, 19.79], [23.0, 23.26], [25.0, 25.3], [30.0, 30.91], [32.0, 36.41], [37.0, 38.55], [40.0, 41.23], [42.0, 42.82], [45.0, 45.01], [46.0, 48.96], [58.0, 59.09], [60.0, 61.18], [64.0, 64.81], [70.0, 71.85], [75.0, 75.98], [81.0, 81.18], [83.0, 82.88], [88.0, 88.11], [96.0, 96.79], [101.0, 101.28], [102.0, 104.73], [105.0, 104.77], [109.0, 109.95], [113.0, 112.89], [116.0, 116.23], [118.0, 118.62], [120.0, 126.18], [129.0, 129.81], [131.0, 140.9], [147.0, 149.01], [152.0, 161.25], [164.0, 166.04], [168.0, 168.24], [173.0, 173.06], [174.0, 174.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.25, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.13, 0.0, 0.0, 0.0, 0.0, 0.0, 64.63, 0.0, 30.72, 38.47, 29.12, 41.3, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 56.07], ["fart", 5.51], ["crackle", 4.88]], null, null, null, null, null, null, null, [["speech", 64.14], ["whack, thwack", 9.88], ["smash, crash", 8.54]], [["music", 14.34], ["beatboxing", 13.12], ["boing", 9.45]], [["speech", 38.29], ["vehicle", 14.14], ["car", 8.72]], [["speech", 42.74], ["music", 21.33], ["boing", 14.98]], null, null, null], "duration": [1.94, 0.0, 0.69, 1.11, 0.3, 0.33, 0.5, -0.32, 0.91, 0.79, 0.26, 0.3, 0.91, 4.41, 1.55, 1.23, 0.82, 0.01, 2.96, 1.09, 1.18, 0.81, 1.85, 0.98, 0.18, -0.12, 0.11, 0.79, 0.28, 2.73, -0.23, 0.95, -0.11, 0.23, 0.62, 6.18, 0.81, 9.9, 2.01, 9.25, 2.04, 0.24, 0.06, 0.45]} \ No newline at end of file diff --git a/annotations_filtered/dnIPfZIKYPc_filtered.json b/annotations_filtered/dnIPfZIKYPc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3713331e0105ab8a2261ad56d8bd1f0bb5ee99c5 --- /dev/null +++ b/annotations_filtered/dnIPfZIKYPc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.55], [6.0, 14.32], [15.0, 39.01]], "keep_status": [false, false, false], "silence_prob": [0.0, 31.49, 31.54], "audiomae_on_audioset": [null, [["music", 58.74], ["speech", 7.2], ["throbbing", 6.84]], [["music", 62.03], ["hum", 9.57], ["throbbing", 4.26]]], "duration": [1.55, 8.32, 24.01]} \ No newline at end of file diff --git a/annotations_filtered/dnRxQ3dcaQk_filtered.json b/annotations_filtered/dnRxQ3dcaQk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..402c98ee48cf3e0f3e4c63f0c4ccc93bc9c91502 --- /dev/null +++ b/annotations_filtered/dnRxQ3dcaQk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 16.92], [17.0, 31.4], [32.0, 55.9], [57.0, 101.22], [104.0, 137.12], [139.0, 167.41], [168.0, 168.44]], "keep_status": [false, true, true, false, false, true, false], "silence_prob": [40.79, 34.46, 48.61, 0.0, 0.0, 31.31, 0.0], "audiomae_on_audioset": [[["sidetone", 58.2], ["speech", 29.47], ["music", 2.8]], [["sound effect", 16.98], ["fart", 14.71], ["animal", 9.66]], [["music", 38.76], ["synthesizer", 15.05], ["speech", 7.93]], null, null, [["electric shaver, electric razor", 20.24], ["hum", 13.24], ["music", 9.77]], null], "duration": [14.92, 14.4, 23.9, 44.22, 33.12, 28.41, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/dnThWk9ib1c_filtered.json b/annotations_filtered/dnThWk9ib1c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0ed8b05ee25748122596f927f2294d66f6cec4ac --- /dev/null +++ b/annotations_filtered/dnThWk9ib1c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 19.52], [20.0, 20.71], [24.0, 24.85], [26.0, 30.47], [32.0, 31.83], [33.0, 33.74], [35.0, 35.63], [38.0, 44.02], [45.0, 46.82], [49.0, 49.55], [51.0, 51.36], [58.0, 58.95]], "keep_status": [false, false, false, true, false, false, false, true, false, false, false, false], "silence_prob": [29.82, 0.0, 0.0, 30.02, 0.0, 0.0, 0.0, 31.47, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 35.63], ["music", 23.57], ["throbbing", 21.32]], null, null, [["speech", 16.94], ["fart", 8.39], ["didgeridoo", 7.84]], null, null, null, [["music", 38.42], ["didgeridoo", 12.89], ["speech", 12.81]], null, null, null, null], "duration": [13.52, 0.71, 0.85, 4.47, -0.17, 0.74, 0.63, 6.02, 1.82, 0.55, 0.36, 0.95]} \ No newline at end of file diff --git a/annotations_filtered/dnnrhhZjTh8_filtered.json b/annotations_filtered/dnnrhhZjTh8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f71d6a2c6f950ac1e7c419ba6379a95a85b65297 --- /dev/null +++ b/annotations_filtered/dnnrhhZjTh8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 24.93], [27.0, 51.78], [53.0, 57.32], [59.0, 59.7], [61.0, 86.9], [87.0, 99.72], [100.0, 109.39]], "keep_status": [false, false, true, false, false, false, false], "silence_prob": [0.0, 29.75, 30.96, 0.0, 29.94, 29.52, 30.04], "audiomae_on_audioset": [null, [["music", 55.36], ["throbbing", 15.69], ["hum", 6.97]], [["music", 46.0], ["speech", 10.49], ["electronic music", 8.18]], null, [["music", 40.6], ["throbbing", 33.36], ["hum", 8.62]], [["music", 45.86], ["speech", 17.83], ["throbbing", 8.26]], [["music", 60.92], ["speech", 19.62], ["throbbing", 5.02]]], "duration": [0.93, 24.78, 4.32, 0.7, 25.9, 12.72, 9.39]} \ No newline at end of file diff --git a/annotations_filtered/dnrJELv76n4_filtered.json b/annotations_filtered/dnrJELv76n4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c6ead8c25989442fc7becb410b87015421d4dae3 --- /dev/null +++ b/annotations_filtered/dnrJELv76n4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.34], [10.0, 10.13], [19.0, 18.98], [31.0, 35.43], [44.0, 45.1], [45.0, 61.48], [75.0, 76.71], [84.0, 86.17], [93.0, 93.5], [95.0, 97.88], [111.0, 115.13], [119.0, 120.85], [127.0, 127.67], [134.0, 134.57], [135.0, 135.09], [135.0, 138.2], [143.0, 147.04], [151.0, 156.09], [168.0, 167.91], [172.0, 172.0], [178.0, 179.15], [180.0, 180.49], [187.0, 188.38], [194.0, 194.22], [194.0, 194.36], [200.0, 200.48], [205.0, 206.9], [209.0, 214.41], [218.0, 221.68], [224.0, 225.61]], "keep_status": [false, false, false, true, false, false, false, true, false, true, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 30.61, 0.0, 33.49, 0.0, 35.65, 0.0, 30.93, 34.74, 0.0, 0.0, 0.0, 0.0, 31.74, 30.03, 29.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.78, 31.71, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 57.54], ["synthesizer", 4.35], ["musical instrument", 2.2]], null, [["music", 69.53], ["quack", 3.14], ["buzz", 2.38]], null, [["music", 57.55], ["synthesizer", 4.1], ["musical instrument", 3.58]], null, [["music", 46.81], ["speech", 11.5], ["electronic music", 4.83]], [["speech", 28.03], ["music", 26.18], ["bleat", 5.64]], null, null, null, null, [["speech", 49.69], ["music", 28.75], ["throbbing", 5.54]], [["music", 70.18], ["synthesizer", 7.69], ["musical instrument", 3.61]], [["speech", 37.19], ["music", 19.22], ["sound effect", 5.47]], null, null, null, null, null, null, null, null, null, [["groan", 40.93], ["speech", 13.92], ["music", 9.46]], [["didgeridoo", 25.94], ["livestock, farm animals, working animals", 16.11], ["cattle, bovinae", 13.05]], null], "duration": [0.34, 0.13, -0.02, 4.43, 1.1, 16.48, 1.71, 2.17, 0.5, 2.88, 4.13, 1.85, 0.67, 0.57, 0.09, 3.2, 4.04, 5.09, -0.09, 0.0, 1.15, 0.49, 1.38, 0.22, 0.36, 0.48, 1.9, 5.41, 3.68, 1.61]} \ No newline at end of file diff --git a/annotations_filtered/doKP3Il9R1k_filtered.json b/annotations_filtered/doKP3Il9R1k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..16e7769c03b0e77897126353984b43b355f8a460 --- /dev/null +++ b/annotations_filtered/doKP3Il9R1k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.65], [4.0, 4.28], [5.0, 6.29], [7.0, 8.34], [10.0, 10.13], [12.0, 15.6], [17.0, 17.12], [24.0, 23.99], [24.0, 25.1], [26.0, 26.25], [28.0, 28.46], [34.0, 34.28], [35.0, 36.02], [37.0, 37.57], [56.0, 56.22], [66.0, 66.28], [68.0, 68.01], [73.0, 73.04], [78.0, 78.04], [78.0, 78.27], [78.0, 79.47], [80.0, 81.11], [92.0, 91.94], [95.0, 95.0], [95.0, 97.23], [105.0, 105.9]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 35.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.14, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["radio", 15.39], ["speech", 11.67], ["moo", 7.43]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 39.13], ["speech", 25.58], ["beatboxing", 5.37]], null], "duration": [0.65, 0.28, 1.29, 1.34, 0.13, 3.6, 0.12, -0.01, 1.1, 0.25, 0.46, 0.28, 1.02, 0.57, 0.22, 0.28, 0.01, 0.04, 0.04, 0.27, 1.47, 1.11, -0.06, 0.0, 2.23, 0.9]} \ No newline at end of file diff --git a/annotations_filtered/doLHipw196I_filtered.json b/annotations_filtered/doLHipw196I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..498bfb98b2f59a397e7d1e91732b730617920e5a --- /dev/null +++ b/annotations_filtered/doLHipw196I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 20.31], [25.0, 42.87], [48.0, 69.7], [70.0, 71.71], [72.0, 108.19]], "keep_status": [false, false, false, false, false], "silence_prob": [47.23, 34.83, 31.08, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 42.39], ["throbbing", 32.65], ["mains hum", 13.47]], [["music", 62.69], ["theremin", 10.22], ["hum", 5.7]], [["music", 67.7], ["hum", 7.45], ["throbbing", 5.2]], null, null], "duration": [15.31, 17.87, 21.7, 1.71, 36.19]} \ No newline at end of file diff --git a/annotations_filtered/doVYFjIJcfU_filtered.json b/annotations_filtered/doVYFjIJcfU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/doVYFjIJcfU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/dobHtRTf5rY_filtered.json b/annotations_filtered/dobHtRTf5rY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f6a27ee4fd3a6d9fcaed1225b57577bee76b94b --- /dev/null +++ b/annotations_filtered/dobHtRTf5rY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.62], [4.0, 5.59], [6.0, 22.99], [23.0, 25.89], [28.0, 38.2]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.46, 32.65, 30.96], "audiomae_on_audioset": [null, null, [["speech", 45.76], ["music", 34.77], ["smash, crash", 2.38]], [["music", 49.07], ["throbbing", 24.07], ["cacophony", 5.03]], [["hum", 36.79], ["music", 22.44], ["throbbing", 18.62]]], "duration": [0.62, 1.59, 16.99, 2.89, 10.2]} \ No newline at end of file diff --git a/annotations_filtered/dofECCtTfaM_filtered.json b/annotations_filtered/dofECCtTfaM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..992c75ea6bd8acae15d56dc92beb0acdeae379d7 --- /dev/null +++ b/annotations_filtered/dofECCtTfaM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.39], [4.0, 5.48], [6.0, 29.19], [30.0, 33.69], [35.0, 38.47]], "keep_status": [false, false, false, true, false], "silence_prob": [0.0, 0.0, 50.31, 32.92, 34.68], "audiomae_on_audioset": [null, null, null, [["speech", 19.84], ["music", 19.63], ["foghorn", 18.94]], [["brass instrument", 36.62], ["trombone", 20.65], ["music", 19.74]]], "duration": [1.39, 1.48, 23.19, 3.69, 3.47]} \ No newline at end of file diff --git a/annotations_filtered/dp2MR9fswWk_filtered.json b/annotations_filtered/dp2MR9fswWk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3024bd13c986cc4a72c17bb4f6120eac1d7cd6a2 --- /dev/null +++ b/annotations_filtered/dp2MR9fswWk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 5.7], [7.0, 8.21], [13.0, 14.2], [36.0, 36.54], [38.0, 42.2], [47.0, 46.92], [54.0, 54.28], [56.0, 55.92], [69.0, 69.13], [75.0, 76.13], [85.0, 85.73], [89.0, 89.16], [108.0, 108.08], [128.0, 129.61], [131.0, 130.86], [133.0, 133.73], [135.0, 137.46], [138.0, 139.18], [147.0, 147.11], [156.0, 156.37], [161.0, 161.22], [163.0, 170.87], [171.0, 179.76]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [37.88, 0.0, 0.0, 0.0, 83.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.06, 0.0, 0.0, 0.0, 0.0, 80.82, 48.39], "audiomae_on_audioset": [[["speech", 38.38], ["music", 25.01], ["hum", 3.74]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 59.91], ["arrow", 7.05], ["thunk", 6.38]]], "duration": [4.7, 1.21, 1.2, 0.54, 4.2, -0.08, 0.28, -0.08, 0.13, 1.13, 0.73, 0.16, 0.08, 1.61, -0.14, 0.73, 2.46, 1.18, 0.11, 0.37, 0.22, 7.87, 8.76]} \ No newline at end of file diff --git a/annotations_filtered/dp4qnnVSk8Y_filtered.json b/annotations_filtered/dp4qnnVSk8Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..606571b3c4e870a476c95ae4f9dd12950843ee9b --- /dev/null +++ b/annotations_filtered/dp4qnnVSk8Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 16.73], [18.0, 18.81], [20.0, 20.61], [21.0, 24.71], [27.0, 40.73], [44.0, 44.86], [67.0, 68.07], [70.0, 71.54], [72.0, 75.39], [76.0, 76.64], [80.0, 79.62], [80.0, 82.61], [85.0, 85.68], [86.0, 86.27], [86.0, 86.53], [87.0, 93.12], [94.0, 95.13], [95.0, 96.2], [99.0, 100.2]], "keep_status": [true, false, false, true, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [34.0, 0.0, 0.0, 32.17, 30.58, 0.0, 0.0, 0.0, 67.25, 0.0, 0.0, 34.27, 0.0, 0.0, 0.0, 33.99, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 37.39], ["mains hum", 19.93], ["whale vocalization", 11.81]], null, null, [["breaking", 24.04], ["fart", 8.01], ["whack, thwack", 6.47]], [["music", 62.81], ["throbbing", 10.85], ["hum", 8.39]], null, null, null, null, null, null, [["speech", 15.31], ["hum", 8.5], ["dog", 8.35]], null, null, null, [["speech", 32.88], ["groan", 15.57], ["whimper", 5.16]], null, null, null], "duration": [12.73, 0.81, 0.61, 3.71, 13.73, 0.86, 1.07, 1.54, 3.39, 0.64, -0.38, 2.61, 0.68, 0.27, 0.53, 6.12, 1.13, 1.2, 1.2]} \ No newline at end of file diff --git a/annotations_filtered/dpAoVOU-q60_filtered.json b/annotations_filtered/dpAoVOU-q60_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..254bdf95a6dd4984e42579899dd4d42e34ec55b5 --- /dev/null +++ b/annotations_filtered/dpAoVOU-q60_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 13.12], [27.0, 30.27], [31.0, 31.48], [32.0, 32.78], [34.0, 34.38], [35.0, 36.49], [42.0, 42.6], [43.0, 44.34], [47.0, 47.75], [49.0, 50.46], [53.0, 54.24], [58.0, 62.06], [63.0, 64.56], [66.0, 68.5], [69.0, 70.77], [71.0, 72.82], [75.0, 76.23], [77.0, 77.3], [80.0, 80.69], [83.0, 83.08], [84.0, 83.93], [87.0, 87.64], [92.0, 95.17], [97.0, 100.4], [101.0, 102.78], [104.0, 109.54], [110.0, 113.91]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, true, true, false, true, true], "silence_prob": [31.13, 35.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.79, 0.0, 37.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.92, 38.14, 0.0, 34.63, 37.78], "audiomae_on_audioset": [[["speech", 56.98], ["civil defense siren", 18.05], ["music", 6.31]], [["hum", 21.09], ["mains hum", 20.22], ["speech", 11.65]], null, null, null, null, null, null, null, null, null, [["didgeridoo", 9.18], ["noise", 8.21], ["whale vocalization", 7.43]], null, [["mains hum", 16.87], ["hum", 11.99], ["music", 5.86]], null, null, null, null, null, null, null, null, [["fly, housefly", 11.69], ["speech", 8.12], ["bee, wasp, etc.", 8.12]], [["speech", 24.51], ["aircraft", 21.73], ["fixed-wing aircraft, airplane", 14.09]], null, [["hum", 14.63], ["eruption", 7.34], ["mains hum", 7.13]], [["speech", 42.01], ["hum", 13.29], ["mains hum", 7.06]]], "duration": [3.12, 3.27, 0.48, 0.78, 0.38, 1.49, 0.6, 1.34, 0.75, 1.46, 1.24, 4.06, 1.56, 2.5, 1.77, 1.82, 1.23, 0.3, 0.69, 0.08, -0.07, 0.64, 3.17, 3.4, 1.78, 5.54, 3.91]} \ No newline at end of file diff --git a/annotations_filtered/dpg077fR9Mc_filtered.json b/annotations_filtered/dpg077fR9Mc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..768ed6f95b3149f2c73eafd7dbf98e7f38108982 --- /dev/null +++ b/annotations_filtered/dpg077fR9Mc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.61], [18.0, 34.74], [37.0, 37.3], [39.0, 44.81], [46.0, 51.38], [56.0, 88.94], [91.0, 96.7], [98.0, 98.47], [102.0, 123.11], [124.0, 142.72], [143.0, 143.18], [144.0, 143.72], [144.0, 143.75], [144.0, 158.23]], "keep_status": [false, false, false, false, false, false, true, false, true, true, false, false, false, false], "silence_prob": [0.0, 64.52, 0.0, 70.58, 73.82, 0.0, 40.24, 0.0, 33.83, 35.83, 0.0, 0.0, 0.0, 36.42], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 63.0], ["musical instrument", 2.28], ["cattle, bovinae", 2.12]], null, [["music", 34.39], ["speech", 10.44], ["fireworks", 5.16]], [["hum", 21.59], ["music", 12.09], ["buzz", 11.85]], null, null, null, [["buzz", 70.22], ["speech", 6.33], ["electric shaver, electric razor", 4.7]]], "duration": [1.61, 16.74, 0.3, 5.81, 5.38, 32.94, 5.7, 0.47, 21.11, 18.72, 0.18, -0.28, -0.25, 14.23]} \ No newline at end of file diff --git a/annotations_filtered/dq_RCN3esGk_filtered.json b/annotations_filtered/dq_RCN3esGk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bcddc91619aaf29da3708f7b29c46e047428aa38 --- /dev/null +++ b/annotations_filtered/dq_RCN3esGk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.25], [7.0, 7.65], [12.0, 26.65], [38.0, 43.06], [49.0, 49.01], [52.0, 85.9], [92.0, 99.93]], "keep_status": [true, false, false, false, false, false, false], "silence_prob": [48.1, 0.0, 44.69, 29.72, 0.0, 0.0, 29.93], "audiomae_on_audioset": [[["fly, housefly", 27.28], ["insect", 11.14], ["bee, wasp, etc.", 7.33]], null, [["cattle, bovinae", 48.08], ["livestock, farm animals, working animals", 30.9], ["moo", 20.11]], [["cattle, bovinae", 50.52], ["moo", 30.79], ["livestock, farm animals, working animals", 12.5]], null, null, [["cattle, bovinae", 35.4], ["moo", 34.09], ["livestock, farm animals, working animals", 12.46]]], "duration": [2.25, 0.65, 14.65, 5.06, 0.01, 33.9, 7.93]} \ No newline at end of file diff --git a/annotations_filtered/drTH0CDFgx8_filtered.json b/annotations_filtered/drTH0CDFgx8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..563d83af71bb74be2e156f67a6d19e0399d1c220 --- /dev/null +++ b/annotations_filtered/drTH0CDFgx8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [4.0, 6.0], [8.0, 9.12], [10.0, 11.08], [14.0, 14.61], [16.0, 16.07], [22.0, 22.99], [23.0, 24.0], [27.0, 28.24], [29.0, 30.21], [31.0, 30.79], [31.0, 36.63], [42.0, 44.69], [46.0, 46.63], [51.0, 52.25], [53.0, 54.6], [57.0, 57.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 55.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.52, 95.37, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 2.0, 1.12, 1.08, 0.61, 0.07, 0.99, 1.0, 1.24, 1.21, -0.21, 5.63, 2.69, 0.63, 1.25, 1.6, 0.43]} \ No newline at end of file diff --git a/annotations_filtered/droww43JVyA_filtered.json b/annotations_filtered/droww43JVyA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9664ee3479f2993bcf3a75c2b404a971762df9f4 --- /dev/null +++ b/annotations_filtered/droww43JVyA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.48], [4.0, 9.17], [14.0, 15.16], [16.0, 17.39], [18.0, 18.37], [21.0, 21.52], [23.0, 23.52], [24.0, 25.49], [26.0, 29.37], [30.0, 33.34], [36.0, 37.07], [40.0, 40.54], [41.0, 41.69], [43.0, 44.54], [46.0, 47.11], [48.0, 49.47], [51.0, 51.93], [52.0, 53.5], [54.0, 55.32], [64.0, 66.23], [71.0, 73.08], [74.0, 76.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 50.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 89.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.48, 5.17, 1.16, 1.39, 0.37, 0.52, 0.52, 1.49, 3.37, 3.34, 1.07, 0.54, 0.69, 1.54, 1.11, 1.47, 0.93, 1.5, 1.32, 2.23, 2.08, 2.69]} \ No newline at end of file diff --git a/annotations_filtered/dry7kY2BMlk_filtered.json b/annotations_filtered/dry7kY2BMlk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..67348b1af2ca6d4de0efc3c25d7fee39e0ab580c --- /dev/null +++ b/annotations_filtered/dry7kY2BMlk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.51], [8.0, 10.57], [12.0, 24.88], [25.0, 57.15], [59.0, 65.65], [67.0, 67.53], [70.0, 75.42], [77.0, 77.94], [88.0, 89.34], [91.0, 91.64], [93.0, 94.17], [95.0, 97.16], [100.0, 100.52], [102.0, 103.69], [105.0, 107.52], [110.0, 110.61], [112.0, 114.49], [122.0, 123.18], [137.0, 146.62], [148.0, 155.28], [156.0, 159.81], [160.0, 161.25], [164.0, 164.61]], "keep_status": [false, true, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 37.53, 31.56, 0.0, 36.79, 0.0, 48.44, 0.0, 0.0, 0.0, 0.0, 50.11, 0.0, 0.0, 41.28, 0.0, 35.92, 0.0, 30.04, 36.25, 43.4, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 27.78], ["music", 25.78], ["didgeridoo", 6.07]], [["music", 72.97], ["hum", 6.52], ["throbbing", 3.88]], null, [["speech", 43.19], ["music", 5.47], ["car", 4.96]], null, [["music", 36.39], ["speech", 23.88], ["hum", 10.02]], null, null, null, null, null, null, null, [["music", 35.38], ["throbbing", 9.24], ["hum", 7.63]], null, [["music", 65.4], ["throbbing", 6.75], ["electronic music", 3.81]], null, [["speech", 41.79], ["machine gun", 23.22], ["music", 15.33]], [["music", 54.03], ["hum", 9.0], ["throbbing", 6.35]], [["music", 55.07], ["speech", 17.75], ["didgeridoo", 9.92]], null, null], "duration": [0.51, 2.57, 12.88, 32.15, 6.65, 0.53, 5.42, 0.94, 1.34, 0.64, 1.17, 2.16, 0.52, 1.69, 2.52, 0.61, 2.49, 1.18, 9.62, 7.28, 3.81, 1.25, 0.61]} \ No newline at end of file diff --git a/annotations_filtered/dsCzZE_y0so_filtered.json b/annotations_filtered/dsCzZE_y0so_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5326abf21c354b1b109847947cd6c7f84c29e8b6 --- /dev/null +++ b/annotations_filtered/dsCzZE_y0so_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.12], [7.0, 7.59], [10.0, 10.22], [13.0, 46.33], [47.0, 49.38], [52.0, 67.59], [69.0, 71.41], [72.0, 74.8], [77.0, 77.7], [80.0, 86.63], [89.0, 96.35], [99.0, 101.75], [104.0, 122.54], [123.0, 124.51], [127.0, 127.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 100.0, 99.56, 96.29, 99.71, 0.0, 99.93, 99.94, 99.98, 88.83, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.12, 0.59, 0.22, 33.33, 2.38, 15.59, 2.41, 2.8, 0.7, 6.63, 7.35, 2.75, 18.54, 1.51, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/dsONBwWtAts_filtered.json b/annotations_filtered/dsONBwWtAts_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e122b1e5dda5c66e48b9b432c259e73a3d92cb3c --- /dev/null +++ b/annotations_filtered/dsONBwWtAts_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 18.05], [20.0, 21.05], [24.0, 23.9], [25.0, 25.17], [34.0, 34.16], [36.0, 36.42], [42.0, 42.16], [46.0, 48.07], [49.0, 53.76], [54.0, 74.63], [76.0, 85.33], [86.0, 87.08], [88.0, 98.2], [99.0, 109.48], [110.0, 114.34], [116.0, 123.82], [124.0, 123.85]], "keep_status": [false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, true, false], "silence_prob": [56.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.26, 30.44, 32.35, 37.61, 0.0, 32.56, 57.17, 66.03, 35.54, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 44.17], ["whack, thwack", 14.69], ["boing", 7.24]], [["music", 49.5], ["speech", 20.12], ["breaking", 3.07]], [["music", 24.04], ["gong", 9.59], ["whack, thwack", 8.5]], [["speech", 71.86], ["explosion", 9.46], ["burst, pop", 2.11]], null, [["speech", 53.5], ["music", 19.59], ["door", 4.83]], null, null, [["speech", 32.58], ["hum", 18.71], ["music", 11.43]], null], "duration": [3.05, 1.05, -0.1, 0.17, 0.16, 0.42, 0.16, 2.07, 4.76, 20.63, 9.33, 1.08, 10.2, 10.48, 4.34, 7.82, -0.15]} \ No newline at end of file diff --git a/annotations_filtered/dsRTzhbsAmQ_filtered.json b/annotations_filtered/dsRTzhbsAmQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c76c171301a82a7d8fc1c2604bb43f1c5368304 --- /dev/null +++ b/annotations_filtered/dsRTzhbsAmQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.76], [60.0, 60.13], [60.0, 60.96], [62.0, 61.99], [63.0, 62.9], [63.0, 63.9], [64.0, 65.13], [67.0, 68.57], [73.0, 74.51]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [1.76, 0.13, 0.96, -0.01, -0.1, 0.9, 1.13, 1.57, 1.51]} \ No newline at end of file diff --git a/annotations_filtered/dsTyKFkGPuM_filtered.json b/annotations_filtered/dsTyKFkGPuM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c955b8b19bf6d41c377861bfe7ddee8a84ecd4e1 --- /dev/null +++ b/annotations_filtered/dsTyKFkGPuM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.79], [4.0, 5.21], [6.0, 6.98], [8.0, 8.8], [10.0, 10.59], [11.0, 11.92], [13.0, 65.77], [67.0, 72.89], [75.0, 75.73]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.53, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 30.2], ["hum", 24.6], ["mains hum", 20.09]], null], "duration": [1.79, 1.21, 0.98, 0.8, 0.59, 0.92, 52.77, 5.89, 0.73]} \ No newline at end of file diff --git a/annotations_filtered/dshJG5PEOqY_filtered.json b/annotations_filtered/dshJG5PEOqY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b7cfa17f4ebf2d11bd17efc1d9e3881d4c1bfbb --- /dev/null +++ b/annotations_filtered/dshJG5PEOqY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.97], [9.0, 18.3], [20.0, 22.91], [23.0, 24.66], [25.0, 25.98], [26.0, 27.36], [28.0, 29.54], [30.0, 33.25], [34.0, 35.18], [36.0, 36.69], [40.0, 41.18], [42.0, 42.85], [44.0, 45.33], [50.0, 51.14], [52.0, 52.3], [55.0, 56.3], [58.0, 58.62], [60.0, 61.52], [63.0, 64.69], [66.0, 66.58], [69.0, 69.84], [72.0, 78.54], [80.0, 81.24], [82.0, 86.95], [92.0, 95.0], [95.0, 98.29], [99.0, 100.6], [103.0, 104.46], [105.0, 106.57], [107.0, 108.26], [109.0, 109.61], [111.0, 113.31], [116.0, 116.38], [122.0, 123.97], [124.0, 125.95], [127.0, 128.29], [129.0, 130.74], [134.0, 134.42], [138.0, 140.73], [141.0, 141.74], [143.0, 143.83], [145.0, 145.22], [147.0, 148.07], [149.0, 149.44], [150.0, 150.77], [154.0, 156.93], [158.0, 158.25], [159.0, 159.29], [169.0, 169.2], [170.0, 173.84], [181.0, 181.03], [189.0, 192.1], [195.0, 195.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 91.64, 99.97, 0.0, 0.0, 0.0, 0.0, 96.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.99, 0.0, 90.08, 100.0, 84.8, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.01, 0.0, 0.0, 0.0, 52.98, 0.0, 96.29, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.97, 9.3, 2.91, 1.66, 0.98, 1.36, 1.54, 3.25, 1.18, 0.69, 1.18, 0.85, 1.33, 1.14, 0.3, 1.3, 0.62, 1.52, 1.69, 0.58, 0.84, 6.54, 1.24, 4.95, 3.0, 3.29, 1.6, 1.46, 1.57, 1.26, 0.61, 2.31, 0.38, 1.97, 1.95, 1.29, 1.74, 0.42, 2.73, 0.74, 0.83, 0.22, 1.07, 0.44, 0.77, 2.93, 0.25, 0.29, 0.2, 3.84, 0.03, 3.1, 0.24]} \ No newline at end of file diff --git a/annotations_filtered/dshmyllg2HE_filtered.json b/annotations_filtered/dshmyllg2HE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..64ec1b9e279920e84e63d8464d719eb1dd1c27b6 --- /dev/null +++ b/annotations_filtered/dshmyllg2HE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.22], [9.0, 9.07], [33.0, 32.73], [33.0, 34.01], [34.0, 34.67], [37.0, 44.96], [49.0, 50.09], [54.0, 57.25], [58.0, 63.96], [64.0, 65.53], [74.0, 74.33], [97.0, 97.23], [99.0, 98.64], [103.0, 108.48], [131.0, 131.41], [133.0, 132.81], [140.0, 151.93], [154.0, 154.55], [158.0, 158.16], [166.0, 166.31]], "keep_status": [false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 36.31, 0.0, 38.76, 32.93, 0.0, 0.0, 0.0, 0.0, 86.45, 0.0, 0.0, 31.9, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 48.26], ["whale vocalization", 8.3], ["sonar", 3.97]], null, [["music", 20.61], ["synthesizer", 17.46], ["theremin", 7.01]], [["music", 64.25], ["speech", 8.18], ["boing", 2.23]], null, null, null, null, null, null, null, [["music", 78.93], ["synthesizer", 2.86], ["didgeridoo", 2.08]], null, null, null], "duration": [0.22, 0.07, -0.27, 1.01, 0.67, 7.96, 1.09, 3.25, 5.96, 1.53, 0.33, 0.23, -0.36, 5.48, 0.41, -0.19, 11.93, 0.55, 0.16, 0.31]} \ No newline at end of file diff --git a/annotations_filtered/dslpHxTuA-w_filtered.json b/annotations_filtered/dslpHxTuA-w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f306ea001b68f9320a5e1aeb98d25061be63ba90 --- /dev/null +++ b/annotations_filtered/dslpHxTuA-w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.03], [21.0, 22.4], [28.0, 29.35], [32.0, 32.95], [38.0, 38.62], [48.0, 49.49], [50.0, 58.43], [62.0, 62.65], [64.0, 64.91], [67.0, 68.99], [75.0, 75.25], [76.0, 76.71], [79.0, 79.68], [85.0, 85.45], [92.0, 92.84], [94.0, 96.04], [98.0, 98.59], [101.0, 104.53], [113.0, 114.67], [133.0, 133.52], [149.0, 154.94], [156.0, 174.29], [175.0, 175.54], [176.0, 193.55], [194.0, 195.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.49, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.94, 0.0, 60.7, 0.0, 0.0, 31.58, 30.71, 0.0, 29.72, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 73.93], ["theremin", 3.33], ["musical instrument", 2.53]], null, null, null, null, null, null, null, null, [["music", 48.59], ["musical instrument", 7.91], ["cello", 6.8]], null, null, null, null, [["music", 76.91], ["singing", 4.42], ["male singing", 1.66]], [["music", 89.41], ["yodeling", 1.5], ["singing", 1.17]], null, [["music", 61.43], ["singing", 4.97], ["yodeling", 4.31]], null], "duration": [1.03, 1.4, 1.35, 0.95, 0.62, 1.49, 8.43, 0.65, 0.91, 1.99, 0.25, 0.71, 0.68, 0.45, 0.84, 2.04, 0.59, 3.53, 1.67, 0.52, 5.94, 18.29, 0.54, 17.55, 1.47]} \ No newline at end of file diff --git a/annotations_filtered/dso8WOrSRSQ_filtered.json b/annotations_filtered/dso8WOrSRSQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92b8571c984bf30b280334d983757de584c13734 --- /dev/null +++ b/annotations_filtered/dso8WOrSRSQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 23.55], [29.0, 29.96], [35.0, 35.58], [37.0, 42.25], [43.0, 49.65], [53.0, 54.58], [55.0, 61.05], [62.0, 161.03], [162.0, 161.87], [162.0, 195.03]], "keep_status": [false, false, false, true, false, false, false, false, false, false], "silence_prob": [77.53, 0.0, 0.0, 38.41, 33.69, 0.0, 32.28, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 46.28], ["singing bowl", 11.69], ["musical instrument", 6.82]], [["gong", 72.79], ["music", 6.78], ["synthesizer", 3.42]], null, [["gong", 83.86], ["effects unit", 2.08], ["tuning fork", 1.77]], null, null, null], "duration": [2.55, 0.96, 0.58, 5.25, 6.65, 1.58, 6.05, 99.03, -0.13, 33.03]} \ No newline at end of file diff --git a/annotations_filtered/dtOaXCoryQo_filtered.json b/annotations_filtered/dtOaXCoryQo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bf0782a7ec55adff164a771eac39522f5d445c8b --- /dev/null +++ b/annotations_filtered/dtOaXCoryQo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[48.0, 60.61], [63.0, 74.83], [76.0, 101.17]], "keep_status": [false, false, false], "silence_prob": [30.89, 30.55, 31.34], "audiomae_on_audioset": [[["hum", 51.32], ["throbbing", 28.24], ["music", 10.18]], [["music", 36.94], ["throbbing", 26.21], ["hum", 25.96]], [["music", 62.14], ["hum", 13.51], ["throbbing", 11.16]]], "duration": [12.61, 11.83, 25.17]} \ No newline at end of file diff --git a/annotations_filtered/dtgOzzBMl2o_filtered.json b/annotations_filtered/dtgOzzBMl2o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..67fbc3ee17dfccfe3e421c0c392ba45a8e620894 --- /dev/null +++ b/annotations_filtered/dtgOzzBMl2o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.42], [14.0, 14.72], [16.0, 16.11], [20.0, 20.73], [22.0, 22.82], [23.0, 25.2], [31.0, 31.55], [37.0, 38.42], [39.0, 41.55], [43.0, 42.97], [48.0, 48.34], [50.0, 51.0], [53.0, 54.21], [55.0, 60.03], [68.0, 68.89], [72.0, 72.22], [73.0, 75.37], [78.0, 78.36], [83.0, 82.63], [84.0, 86.04], [109.0, 109.53], [128.0, 128.98], [130.0, 131.31], [132.0, 131.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 80.82, 0.0, 0.0, 80.82, 0.0, 0.0, 0.0, 0.0, 99.76, 0.0, 0.0, 78.55, 0.0, 0.0, 72.16, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.42, 0.72, 0.11, 0.73, 0.82, 2.2, 0.55, 1.42, 2.55, -0.03, 0.34, 1.0, 1.21, 5.03, 0.89, 0.22, 2.37, 0.36, -0.37, 2.04, 0.53, 0.98, 1.31, -0.13]} \ No newline at end of file diff --git a/annotations_filtered/dtwfZd9KGpo_filtered.json b/annotations_filtered/dtwfZd9KGpo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b2ea7fc832e6a84e6fe7e5f30d4f67dc22404a4 --- /dev/null +++ b/annotations_filtered/dtwfZd9KGpo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.1], [4.0, 6.1], [7.0, 9.1], [10.0, 11.38], [12.0, 14.28], [17.0, 18.52], [23.0, 24.29], [25.0, 26.92], [27.0, 28.68], [29.0, 29.51], [31.0, 31.94], [34.0, 36.98], [38.0, 39.87], [42.0, 42.9], [44.0, 44.95], [57.0, 57.32], [59.0, 63.61]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 57.72, 37.55, 0.0, 52.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.43, 0.0, 0.0, 0.0, 0.0, 53.47], "audiomae_on_audioset": [null, null, [["speech", 26.28], ["crow", 14.44], ["caw", 10.59]], null, null, null, null, null, null, null, null, [["throbbing", 12.92], ["hum", 6.37], ["skateboard", 5.42]], null, null, null, null, null], "duration": [1.1, 2.1, 2.1, 1.38, 2.28, 1.52, 1.29, 1.92, 1.68, 0.51, 0.94, 2.98, 1.87, 0.9, 0.95, 0.32, 4.61]} \ No newline at end of file diff --git a/annotations_filtered/du22ttQhRhA_filtered.json b/annotations_filtered/du22ttQhRhA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a87448b6cd81c4ba3f87eb16deb96fcae1898ed7 --- /dev/null +++ b/annotations_filtered/du22ttQhRhA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.39], [7.0, 8.21], [8.0, 9.36], [11.0, 11.45], [12.0, 27.48], [33.0, 35.16], [36.0, 37.39], [39.0, 41.81], [43.0, 53.11], [55.0, 60.1], [62.0, 62.65], [64.0, 64.44], [65.0, 66.92], [68.0, 70.17], [71.0, 107.86], [124.0, 124.65], [135.0, 136.66], [149.0, 150.09], [152.0, 152.63], [155.0, 155.56], [165.0, 165.35], [168.0, 168.56], [171.0, 171.75], [187.0, 186.9], [191.0, 191.59], [197.0, 197.33], [199.0, 200.01], [204.0, 204.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [72.16, 0.0, 0.0, 0.0, 52.8, 65.44, 0.0, 80.64, 81.71, 77.2, 0.0, 0.0, 0.0, 81.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.39, 1.21, 1.36, 0.45, 15.48, 2.16, 1.39, 2.81, 10.11, 5.1, 0.65, 0.44, 1.92, 2.17, 36.86, 0.65, 1.66, 1.09, 0.63, 0.56, 0.35, 0.56, 0.75, -0.1, 0.59, 0.33, 1.01, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/duEErwP8eds_filtered.json b/annotations_filtered/duEErwP8eds_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d74072edad544c61be2d4a295635a8eb0bb5dd0e --- /dev/null +++ b/annotations_filtered/duEErwP8eds_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 31.68], [33.0, 46.79], [49.0, 54.38], [56.0, 59.24], [62.0, 79.57], [83.0, 89.94], [93.0, 115.97], [118.0, 118.89], [119.0, 120.09]], "keep_status": [true, true, false, false, false, false, true, false, false], "silence_prob": [37.72, 38.16, 70.02, 48.78, 33.83, 33.01, 36.82, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 7.26], ["music", 6.52], ["whale vocalization", 5.35]], [["groan", 25.89], ["speech", 21.78], ["grunt", 18.38]], null, [["music", 53.75], ["electronic music", 14.79], ["hum", 5.84]], [["mains hum", 27.26], ["music", 21.72], ["hum", 21.5]], [["fly, housefly", 55.67], ["insect", 27.61], ["mosquito", 5.63]], [["speech", 27.97], ["buzz", 27.59], ["hum", 8.89]], null, null], "duration": [3.68, 13.79, 5.38, 3.24, 17.57, 6.94, 22.97, 0.89, 1.09]} \ No newline at end of file diff --git a/annotations_filtered/duT6QvbGAls_filtered.json b/annotations_filtered/duT6QvbGAls_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..969e904ea22fc7f11b10ad755235d162b1116ae2 --- /dev/null +++ b/annotations_filtered/duT6QvbGAls_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.29], [14.0, 21.02], [24.0, 24.14], [25.0, 26.05], [28.0, 32.32], [36.0, 36.29], [37.0, 37.44], [42.0, 42.63], [49.0, 49.74], [54.0, 54.46], [56.0, 57.92], [60.0, 61.92], [63.0, 63.76], [66.0, 66.56], [68.0, 69.4], [70.0, 71.86], [75.0, 75.68], [76.0, 82.78], [84.0, 94.85], [95.0, 96.23], [98.0, 98.83], [100.0, 100.87], [104.0, 104.48], [106.0, 106.81], [110.0, 109.95], [114.0, 114.32], [119.0, 119.55], [121.0, 121.9], [124.0, 124.38], [126.0, 126.66], [128.0, 128.83], [129.0, 131.28], [133.0, 132.97], [136.0, 136.76]], "keep_status": [false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 32.1, 0.0, 0.0, 36.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.64, 31.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.51, 0.0, 0.0], "audiomae_on_audioset": [null, [["mains hum", 29.54], ["hum", 16.89], ["speech", 12.57]], null, null, [["hum", 16.67], ["noise", 14.52], ["mains hum", 12.88]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 26.63], ["mains hum", 18.51], ["hum", 18.23]], [["music", 42.42], ["theremin", 26.28], ["musical instrument", 5.16]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 29.1], ["speech", 15.2], ["musical instrument", 5.09]], null, null], "duration": [0.29, 7.02, 0.14, 1.05, 4.32, 0.29, 0.44, 0.63, 0.74, 0.46, 1.92, 1.92, 0.76, 0.56, 1.4, 1.86, 0.68, 6.78, 10.85, 1.23, 0.83, 0.87, 0.48, 0.81, -0.05, 0.32, 0.55, 0.9, 0.38, 0.66, 0.83, 2.28, -0.03, 0.76]} \ No newline at end of file diff --git a/annotations_filtered/duU5cdQtpSE_filtered.json b/annotations_filtered/duU5cdQtpSE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b57f536be37306121ce725a7729efd82503b2fea --- /dev/null +++ b/annotations_filtered/duU5cdQtpSE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 12.85], [18.0, 26.45], [27.0, 32.09], [36.0, 36.44], [36.0, 40.24], [41.0, 41.17], [43.0, 43.48], [44.0, 44.31], [45.0, 45.79], [47.0, 48.9], [52.0, 52.34], [57.0, 62.75], [64.0, 80.67], [84.0, 84.37], [86.0, 93.56], [97.0, 96.9], [98.0, 99.3], [101.0, 101.36], [104.0, 104.52], [106.0, 106.17], [107.0, 107.79], [109.0, 109.92], [111.0, 120.65], [121.0, 121.42], [122.0, 122.77], [123.0, 126.01], [126.0, 130.64], [131.0, 132.41]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [99.21, 81.53, 89.36, 0.0, 45.24, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.23, 40.77, 0.0, 29.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.64, 0.0, 0.0, 54.76, 38.09, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 30.82], ["radio", 13.0], ["noise", 5.96]], null, null, null, null, null, null, [["music", 35.91], ["hum", 14.53], ["throbbing", 10.45]], [["hum", 49.76], ["mains hum", 33.11], ["throbbing", 6.81]], null, [["speech", 49.08], ["music", 31.91], ["synthesizer", 5.26]], null, null, null, null, null, null, null, null, null, null, null, [["frog", 43.02], ["speech", 11.07], ["croak", 10.38]], null], "duration": [3.85, 8.45, 5.09, 0.44, 4.24, 0.17, 0.48, 0.31, 0.79, 1.9, 0.34, 5.75, 16.67, 0.37, 7.56, -0.1, 1.3, 0.36, 0.52, 0.17, 0.79, 0.92, 9.65, 0.42, 0.77, 3.01, 4.64, 1.41]} \ No newline at end of file diff --git a/annotations_filtered/duZLaW_6qLc_filtered.json b/annotations_filtered/duZLaW_6qLc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e7ec67aa9b0b4dbdd1327167947f80ecd72d4c1 --- /dev/null +++ b/annotations_filtered/duZLaW_6qLc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.86], [9.0, 9.93], [12.0, 12.87], [17.0, 17.09], [19.0, 19.67], [25.0, 25.76], [26.0, 27.65], [31.0, 31.21], [32.0, 32.39], [33.0, 34.32], [39.0, 39.72], [42.0, 41.82], [50.0, 50.25], [51.0, 51.66], [53.0, 52.73], [54.0, 54.99], [56.0, 55.93], [59.0, 59.44], [61.0, 61.79], [64.0, 65.8], [66.0, 66.45], [68.0, 70.78], [73.0, 73.9]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [33.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.22, 0.0], "audiomae_on_audioset": [[["speech", 10.79], ["vehicle", 9.87], ["car", 9.74]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 25.71], ["boing", 7.4], ["fart", 6.22]], null], "duration": [2.86, 0.93, 0.87, 0.09, 0.67, 0.76, 1.65, 0.21, 0.39, 1.32, 0.72, -0.18, 0.25, 0.66, -0.27, 0.99, -0.07, 0.44, 0.79, 1.8, 0.45, 2.78, 0.9]} \ No newline at end of file diff --git a/annotations_filtered/dudDh8KZiTE_filtered.json b/annotations_filtered/dudDh8KZiTE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9af911d3071ab8141c4b9e33bded11a0a5f1a828 --- /dev/null +++ b/annotations_filtered/dudDh8KZiTE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.71], [10.0, 9.75], [11.0, 13.41], [22.0, 22.38], [28.0, 28.16], [42.0, 42.08], [44.0, 51.27], [52.0, 52.66], [56.0, 56.46], [62.0, 61.94], [66.0, 67.32], [71.0, 71.19], [72.0, 72.35], [75.0, 75.25], [86.0, 86.21], [88.0, 88.72], [90.0, 90.68], [99.0, 100.77], [102.0, 103.13], [105.0, 106.14], [108.0, 109.04], [113.0, 114.35], [116.0, 116.48], [122.0, 122.98], [124.0, 124.7], [131.0, 131.82], [134.0, 134.59], [136.0, 137.07], [138.0, 139.06], [140.0, 140.8], [142.0, 143.4], [146.0, 146.87], [157.0, 157.17], [160.0, 160.32], [168.0, 168.71], [169.0, 172.0], [173.0, 173.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 50.16, 0.0, 0.0, 0.0, 99.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.06, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.71, -0.25, 2.41, 0.38, 0.16, 0.08, 7.27, 0.66, 0.46, -0.06, 1.32, 0.19, 0.35, 0.25, 0.21, 0.72, 0.68, 1.77, 1.13, 1.14, 1.04, 1.35, 0.48, 0.98, 0.7, 0.82, 0.59, 1.07, 1.06, 0.8, 1.4, 0.87, 0.17, 0.32, 0.71, 3.0, 0.79]} \ No newline at end of file diff --git a/annotations_filtered/dvIzAdqrb4U_filtered.json b/annotations_filtered/dvIzAdqrb4U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d85554c4874b0486f40501a5e88288da78f2a15 --- /dev/null +++ b/annotations_filtered/dvIzAdqrb4U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.59], [26.0, 26.59], [50.0, 50.63], [64.0, 65.18], [66.0, 66.28], [78.0, 79.1], [84.0, 84.33], [93.0, 94.17], [102.0, 102.24], [109.0, 109.14], [111.0, 113.07], [119.0, 120.09], [128.0, 128.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.28, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.59, 0.59, 0.63, 1.18, 0.28, 1.1, 0.33, 1.17, 0.24, 0.14, 2.07, 1.09, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/dvJqm3PFKLk_filtered.json b/annotations_filtered/dvJqm3PFKLk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3bb9b3b76fb55dc144be1fcaa0fdaf03e73ab46f --- /dev/null +++ b/annotations_filtered/dvJqm3PFKLk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.48], [6.0, 6.99], [9.0, 9.56], [12.0, 12.39], [14.0, 14.86], [17.0, 17.05], [21.0, 21.96], [24.0, 24.83], [30.0, 30.18], [31.0, 31.63], [33.0, 33.44], [52.0, 52.56], [55.0, 55.54], [58.0, 58.11], [60.0, 62.55], [71.0, 71.39], [72.0, 72.33], [73.0, 72.99], [74.0, 74.34], [75.0, 75.22], [76.0, 76.62], [79.0, 79.64], [80.0, 80.18], [82.0, 84.32], [89.0, 89.78], [95.0, 96.21], [98.0, 99.23], [101.0, 101.36], [103.0, 104.25], [106.0, 106.17], [108.0, 109.32], [111.0, 111.5], [112.0, 113.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.48, 0.99, 0.56, 0.39, 0.86, 0.05, 0.96, 0.83, 0.18, 0.63, 0.44, 0.56, 0.54, 0.11, 2.55, 0.39, 0.33, -0.01, 0.34, 0.22, 0.62, 0.64, 0.18, 2.32, 0.78, 1.21, 1.23, 0.36, 1.25, 0.17, 1.32, 0.5, 1.31]} \ No newline at end of file diff --git a/annotations_filtered/dvT333RoCrw_filtered.json b/annotations_filtered/dvT333RoCrw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..519e09b177976ad76cdda9bd3e1a4562a0cff3db --- /dev/null +++ b/annotations_filtered/dvT333RoCrw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.34], [13.0, 15.69], [17.0, 18.72], [20.0, 22.28], [25.0, 42.08], [43.0, 46.84], [49.0, 49.84], [51.0, 53.79], [55.0, 57.0], [58.0, 59.56], [61.0, 78.16], [80.0, 83.17], [84.0, 91.4], [92.0, 102.68], [103.0, 106.98], [108.0, 109.92], [110.0, 111.1], [112.0, 113.44], [114.0, 114.83], [115.0, 115.67], [117.0, 117.42], [120.0, 121.78], [122.0, 125.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 98.44, 0.0, 100.0, 100.0, 100.0, 0.0, 100.0, 100.0, 0.0, 100.0, 99.97, 99.98, 98.1, 99.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.44], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.34, 2.69, 1.72, 2.28, 17.08, 3.84, 0.84, 2.79, 2.0, 1.56, 17.16, 3.17, 7.4, 10.68, 3.98, 1.92, 1.1, 1.44, 0.83, 0.67, 0.42, 1.78, 3.15]} \ No newline at end of file diff --git a/annotations_filtered/dvloIUSHogs_filtered.json b/annotations_filtered/dvloIUSHogs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3c90cc37abd00c16b9fb9b9c3c5cb7096ad42d3 --- /dev/null +++ b/annotations_filtered/dvloIUSHogs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.53], [15.0, 20.65], [22.0, 26.16], [28.0, 28.44], [29.0, 32.71], [35.0, 38.42], [43.0, 44.85], [46.0, 48.15], [53.0, 53.16], [57.0, 63.93], [64.0, 65.96], [67.0, 70.5], [74.0, 74.76], [84.0, 89.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 31.02, 31.77, 0.0, 31.82, 32.3, 0.0, 34.6, 0.0, 38.21, 0.0, 36.9, 0.0, 34.65], "audiomae_on_audioset": [null, [["music", 72.62], ["speech", 8.89], ["electronic music", 4.36]], [["music", 67.26], ["throbbing", 7.04], ["electronic music", 5.95]], null, [["music", 86.52], ["electronic music", 2.51], ["throbbing", 2.26]], [["music", 64.94], ["speech", 9.13], ["didgeridoo", 6.57]], null, [["music", 77.55], ["throbbing", 5.22], ["electronic music", 4.64]], null, [["music", 43.0], ["speech", 17.65], ["throbbing", 16.13]], null, [["music", 70.53], ["electronic music", 6.4], ["techno", 4.86]], null, [["music", 85.39], ["electronic music", 4.41], ["techno", 2.97]]], "duration": [1.53, 5.65, 4.16, 0.44, 3.71, 3.42, 1.85, 2.15, 0.16, 6.93, 1.96, 3.5, 0.76, 5.41]} \ No newline at end of file diff --git a/annotations_filtered/dvm7mLmAtTM_filtered.json b/annotations_filtered/dvm7mLmAtTM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..050685224dcae430347bb9c0fe83252a514bd368 --- /dev/null +++ b/annotations_filtered/dvm7mLmAtTM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 22.0], [23.0, 23.7], [24.0, 24.44], [26.0, 25.93], [29.0, 30.37], [31.0, 34.01], [35.0, 36.12], [38.0, 40.39], [43.0, 44.04], [45.0, 45.37], [45.0, 45.45], [47.0, 47.83], [48.0, 48.93], [50.0, 52.39], [54.0, 55.98], [60.0, 60.37], [61.0, 62.34], [63.0, 64.54], [68.0, 70.78], [73.0, 74.16], [81.0, 81.3], [84.0, 85.82], [86.0, 88.84], [89.0, 91.54], [92.0, 96.35], [100.0, 101.46], [106.0, 107.81], [114.0, 117.09], [120.0, 145.99], [148.0, 148.63], [154.0, 154.6], [155.0, 156.76], [162.0, 162.41], [163.0, 164.47], [166.0, 179.49]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, true, true, true, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 43.3, 0.0, 36.54, 0.0, 0.0, 0.0, 0.0, 0.0, 40.33, 0.0, 0.0, 0.0, 0.0, 38.03, 0.0, 0.0, 0.0, 41.2, 41.28, 39.54, 0.0, 0.0, 40.71, 29.27, 0.0, 0.0, 0.0, 0.0, 0.0, 29.44], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 26.31], ["mains hum", 13.08], ["music", 12.5]], null, [["music", 70.73], ["synthesizer", 3.36], ["singing bowl", 2.4]], null, null, null, null, null, [["music", 44.08], ["speech", 11.16], ["musical instrument", 5.37]], null, null, null, null, [["music", 38.41], ["guitar", 12.32], ["musical instrument", 11.89]], null, null, null, [["music", 42.71], ["speech", 14.52], ["synthesizer", 8.01]], [["hum", 17.0], ["mains hum", 13.24], ["speech", 9.57]], [["music", 51.58], ["mains hum", 9.33], ["synthesizer", 8.36]], null, null, [["music", 38.25], ["musical instrument", 7.86], ["guitar", 6.6]], [["music", 78.38], ["hum", 4.15], ["mains hum", 2.27]], null, null, null, null, null, [["music", 76.84], ["musical instrument", 6.7], ["drum", 1.65]]], "duration": [1.0, 0.7, 0.44, -0.07, 1.37, 3.01, 1.12, 2.39, 1.04, 0.37, 0.45, 0.83, 0.93, 2.39, 1.98, 0.37, 1.34, 1.54, 2.78, 1.16, 0.3, 1.82, 2.84, 2.54, 4.35, 1.46, 1.81, 3.09, 25.99, 0.63, 0.6, 1.76, 0.41, 1.47, 13.49]} \ No newline at end of file diff --git a/annotations_filtered/dvodASNU58U_filtered.json b/annotations_filtered/dvodASNU58U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c3ae91aa99686a37c9cd918a598397a83647a20e --- /dev/null +++ b/annotations_filtered/dvodASNU58U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 33.42], [34.0, 35.68], [39.0, 40.0], [41.0, 64.5], [65.0, 68.28], [73.0, 73.57], [76.0, 76.65], [77.0, 78.27], [84.0, 91.44], [92.0, 92.96], [95.0, 104.77], [107.0, 124.68]], "keep_status": [true, false, false, true, true, false, false, false, true, false, false, true], "silence_prob": [31.47, 0.0, 0.0, 31.57, 32.38, 0.0, 0.0, 0.0, 35.71, 0.0, 34.17, 30.97], "audiomae_on_audioset": [[["music", 25.57], ["cattle, bovinae", 16.63], ["livestock, farm animals, working animals", 16.37]], null, null, [["music", 31.25], ["speech", 28.83], ["smash, crash", 8.18]], [["fart", 38.43], ["whale vocalization", 11.89], ["music", 9.68]], null, null, null, [["music", 41.57], ["speech", 15.4], ["crushing", 11.19]], null, [["music", 61.94], ["didgeridoo", 13.43], ["synthesizer", 4.94]], [["music", 36.13], ["mosquito", 4.7], ["insect", 4.66]]], "duration": [25.42, 1.68, 1.0, 23.5, 3.28, 0.57, 0.65, 1.27, 7.44, 0.96, 9.77, 17.68]} \ No newline at end of file diff --git a/annotations_filtered/dw2jrtR9Px4_filtered.json b/annotations_filtered/dw2jrtR9Px4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..05a70b065fdb682e83034f753d0b34e52ce969af --- /dev/null +++ b/annotations_filtered/dw2jrtR9Px4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.83], [9.0, 10.89], [13.0, 13.59], [18.0, 26.32], [29.0, 33.18], [35.0, 35.99], [38.0, 38.48], [41.0, 46.53], [47.0, 48.41], [49.0, 53.42], [56.0, 56.91], [62.0, 65.91], [68.0, 69.55], [71.0, 70.95], [72.0, 75.37], [77.0, 78.29], [84.0, 84.16], [85.0, 87.15], [88.0, 89.43], [90.0, 91.2], [93.0, 95.18], [95.0, 104.48], [105.0, 106.83], [111.0, 113.91], [117.0, 117.22], [119.0, 129.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 93.29, 97.11, 0.0, 0.0, 95.51, 0.0, 67.25, 0.0, 80.82, 0.0, 0.0, 58.38, 0.0, 0.0, 96.17, 0.0, 0.0, 86.09, 80.64, 0.0, 99.65, 0.0, 90.78], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.83, 1.89, 0.59, 8.32, 4.18, 0.99, 0.48, 5.53, 1.41, 4.42, 0.91, 3.91, 1.55, -0.05, 3.37, 1.29, 0.16, 2.15, 1.43, 1.2, 2.18, 9.48, 1.83, 2.91, 0.22, 10.88]} \ No newline at end of file diff --git a/annotations_filtered/dw95Qsj59NA_filtered.json b/annotations_filtered/dw95Qsj59NA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bfe3398ec46fe30f79db049be0244341feadaa5e --- /dev/null +++ b/annotations_filtered/dw95Qsj59NA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 12.46], [15.0, 17.64], [19.0, 37.05], [40.0, 95.49], [98.0, 143.26], [149.0, 150.26]], "keep_status": [true, false, false, false, false, false], "silence_prob": [28.84, 30.7, 28.72, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 35.85], ["hum", 12.42], ["music", 11.83]], [["music", 31.43], ["throbbing", 26.4], ["hum", 22.26]], [["hum", 36.96], ["music", 18.94], ["mains hum", 18.63]], null, null, null], "duration": [8.46, 2.64, 18.05, 55.49, 45.26, 1.26]} \ No newline at end of file diff --git a/annotations_filtered/dwD4JZsAuew_filtered.json b/annotations_filtered/dwD4JZsAuew_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6357763f77bec9548e12c51cbc30b0d7d705d1f --- /dev/null +++ b/annotations_filtered/dwD4JZsAuew_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 16.71], [18.0, 18.08], [19.0, 29.57], [30.0, 37.02], [40.0, 41.99], [43.0, 43.44], [47.0, 71.54], [82.0, 94.31], [95.0, 95.59], [97.0, 97.7], [105.0, 104.75], [106.0, 106.05], [107.0, 109.21], [110.0, 111.65], [113.0, 116.72], [119.0, 122.52], [124.0, 125.07], [125.0, 125.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 47.54, 83.88, 0.0, 0.0, 68.28, 42.53, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 98.86, 94.81, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 57.85], ["musical instrument", 10.17], ["harp", 10.08]], null, null, null, null, [["music", 47.99], ["speech", 17.48], ["piano", 5.9]], null, null, null, null, null, null, null, null, null, null], "duration": [-0.29, 0.08, 10.57, 7.02, 1.99, 0.44, 24.54, 12.31, 0.59, 0.7, -0.25, 0.05, 2.21, 1.65, 3.72, 3.52, 1.07, 0.39]} \ No newline at end of file diff --git a/annotations_filtered/dwK_rODYMrY_filtered.json b/annotations_filtered/dwK_rODYMrY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..30fe9dd2880fcae96e020bb1fe14d28c0f82f4f3 --- /dev/null +++ b/annotations_filtered/dwK_rODYMrY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.83], [11.0, 11.7], [12.0, 52.08], [54.0, 54.04], [56.0, 80.13], [83.0, 84.87], [85.0, 89.26], [90.0, 93.99], [96.0, 98.51], [100.0, 102.03], [106.0, 108.7], [110.0, 111.62], [115.0, 116.65], [120.0, 121.56], [126.0, 130.17], [131.0, 136.38], [140.0, 141.71], [146.0, 146.42], [147.0, 147.6], [149.0, 149.54], [152.0, 153.98], [159.0, 160.59], [162.0, 163.0], [165.0, 167.98], [170.0, 171.58], [173.0, 173.31], [175.0, 175.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [80.46, 0.0, 0.0, 0.0, 51.23, 0.0, 58.72, 56.55, 79.41, 76.86, 36.71, 0.0, 0.0, 0.0, 64.97, 52.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.98, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["hum", 30.96], ["speech", 11.73], ["throbbing", 9.18]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 26.88], ["gasp", 7.43], ["hum", 6.0]], null, null, null], "duration": [3.83, 0.7, 40.08, 0.04, 24.13, 1.87, 4.26, 3.99, 2.51, 2.03, 2.7, 1.62, 1.65, 1.56, 4.17, 5.38, 1.71, 0.42, 0.6, 0.54, 1.98, 1.59, 1.0, 2.98, 1.58, 0.31, 0.8]} \ No newline at end of file diff --git a/annotations_filtered/dwMoiBGmH_4_filtered.json b/annotations_filtered/dwMoiBGmH_4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..76ec44aacb238886df2123050a39cbf333ce7c0c --- /dev/null +++ b/annotations_filtered/dwMoiBGmH_4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [7.0, 7.35], [12.0, 12.95], [13.0, 13.95], [17.0, 17.63], [20.0, 19.97], [22.0, 24.48], [25.0, 46.82], [47.0, 62.75], [81.0, 81.36], [92.0, 92.28], [94.0, 94.37], [98.0, 103.92], [104.0, 104.01], [104.0, 104.06], [104.0, 104.09], [104.0, 104.13], [105.0, 105.02], [114.0, 113.83], [114.0, 113.86], [114.0, 122.55], [123.0, 124.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 60.6, 56.4, 0.0, 0.0, 0.0, 39.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.08, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 25.81], ["fly, housefly", 16.33], ["sidetone", 9.96]], null, null, null, null, null, null, null, [["speech", 70.29], ["boing", 3.79], ["sidetone", 2.4]], null], "duration": [0.5, 0.35, 0.95, 0.95, 0.63, -0.03, 2.48, 21.82, 15.75, 0.36, 0.28, 0.37, 5.92, 0.01, 0.06, 0.09, 0.13, 0.02, -0.17, -0.14, 8.55, 1.11]} \ No newline at end of file diff --git a/annotations_filtered/dwT9BEh7qZ0_filtered.json b/annotations_filtered/dwT9BEh7qZ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48d33802fd04249480408fc15ded10269ef826d1 --- /dev/null +++ b/annotations_filtered/dwT9BEh7qZ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 55.09]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [46.09]} \ No newline at end of file diff --git a/annotations_filtered/dwecZ5D3tFY_filtered.json b/annotations_filtered/dwecZ5D3tFY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6e017037497c7c4486a2f745e738d8982d072749 --- /dev/null +++ b/annotations_filtered/dwecZ5D3tFY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.93], [15.0, 17.22], [18.0, 22.98], [27.0, 29.17], [30.0, 32.51], [34.0, 51.48], [52.0, 66.68], [69.0, 80.47], [82.0, 83.66], [84.0, 85.13], [88.0, 90.24], [92.0, 94.39], [95.0, 99.87], [103.0, 115.05], [119.0, 123.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 93.76, 50.97, 99.84, 99.96, 36.06, 34.04, 97.64, 0.0, 0.0, 88.28, 87.92, 85.54, 84.43, 63.42], "audiomae_on_audioset": [null, null, null, null, null, [["animal", 41.46], ["roaring cats (lions, tigers)", 17.14], ["roar", 11.5]], [["whale vocalization", 70.58], ["animal", 11.91], ["wild animals", 3.47]], null, null, null, null, null, null, null, null], "duration": [1.93, 2.22, 4.98, 2.17, 2.51, 17.48, 14.68, 11.47, 1.66, 1.13, 2.24, 2.39, 4.87, 12.05, 4.48]} \ No newline at end of file diff --git a/annotations_filtered/dwh6SShhnVI_filtered.json b/annotations_filtered/dwh6SShhnVI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52e8ee994865c840946756885c99e65b71b3a103 --- /dev/null +++ b/annotations_filtered/dwh6SShhnVI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 26.55], [27.0, 41.99], [42.0, 51.12], [53.0, 53.54], [56.0, 56.13], [57.0, 61.11], [62.0, 63.07], [65.0, 66.63], [67.0, 82.11], [84.0, 84.52], [85.0, 85.99], [87.0, 87.69], [94.0, 94.63], [96.0, 99.17], [100.0, 101.43], [102.0, 108.06], [110.0, 110.84], [112.0, 116.63], [120.0, 125.25], [127.0, 133.84], [136.0, 146.55], [147.0, 150.33], [154.0, 157.94]], "keep_status": [true, false, false, false, false, true, false, false, true, false, false, false, false, true, false, false, false, true, true, false, true, true, true], "silence_prob": [29.32, 30.62, 32.14, 0.0, 0.0, 30.41, 0.0, 0.0, 29.25, 0.0, 0.0, 0.0, 0.0, 30.41, 0.0, 54.97, 0.0, 29.75, 29.79, 29.68, 29.7, 29.4, 29.46], "audiomae_on_audioset": [[["vehicle", 41.22], ["music", 15.56], ["car", 11.36]], [["music", 63.31], ["theremin", 4.19], ["hum", 4.13]], [["hum", 43.68], ["throbbing", 19.25], ["mains hum", 16.58]], null, null, [["moo", 12.4], ["music", 12.08], ["fly, housefly", 10.6]], null, null, [["livestock, farm animals, working animals", 14.39], ["cattle, bovinae", 12.8], ["fly, housefly", 11.44]], null, null, null, null, [["fly, housefly", 12.23], ["livestock, farm animals, working animals", 11.94], ["roar", 6.72]], null, null, null, [["whack, thwack", 27.6], ["grunt", 26.28], ["sound effect", 9.14]], [["music", 31.52], ["speech", 20.94], ["fart", 6.17]], [["music", 40.22], ["speech", 29.91], ["whip", 3.68]], [["music", 52.65], ["theremin", 6.56], ["sound effect", 5.57]], [["music", 21.07], ["hum", 17.98], ["mains hum", 17.69]], [["music", 24.52], ["buzz", 11.49], ["vehicle", 9.51]]], "duration": [9.55, 14.99, 9.12, 0.54, 0.13, 4.11, 1.07, 1.63, 15.11, 0.52, 0.99, 0.69, 0.63, 3.17, 1.43, 6.06, 0.84, 4.63, 5.25, 6.84, 10.55, 3.33, 3.94]} \ No newline at end of file diff --git a/annotations_filtered/dwufX9GKI_4_filtered.json b/annotations_filtered/dwufX9GKI_4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c8b0c432feb699890fc9e9ca1f24d203dd0ccf2c --- /dev/null +++ b/annotations_filtered/dwufX9GKI_4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 13.07], [19.0, 19.47], [20.0, 26.33], [26.0, 26.69], [30.0, 29.78], [32.0, 34.48], [39.0, 38.94], [40.0, 40.32], [40.0, 40.47], [40.0, 50.97], [66.0, 67.59], [68.0, 69.26], [71.0, 70.71], [93.0, 93.11], [95.0, 95.54], [98.0, 98.22], [101.0, 102.81], [105.0, 105.97], [108.0, 124.5], [132.0, 133.22], [135.0, 137.66], [144.0, 148.32], [152.0, 151.77], [154.0, 159.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [51.44, 0.0, 34.48, 0.0, 0.0, 42.19, 0.0, 0.0, 0.0, 34.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.14, 0.0, 33.38, 35.26, 0.0, 36.57], "audiomae_on_audioset": [null, null, [["speech", 61.89], ["fart", 8.07], ["boing", 4.13]], null, null, [["music", 36.77], ["speech", 31.59], ["didgeridoo", 14.27]], null, null, null, [["music", 61.04], ["speech", 9.57], ["synthesizer", 2.48]], null, null, null, null, null, null, null, null, [["music", 65.2], ["speech", 10.34], ["didgeridoo", 3.1]], null, [["music", 45.05], ["boing", 9.57], ["speech", 9.08]], [["music", 38.21], ["fly, housefly", 11.48], ["mosquito", 7.59]], null, [["music", 52.45], ["didgeridoo", 27.17], ["hum", 1.74]]], "duration": [3.07, 0.47, 6.33, 0.69, -0.22, 2.48, -0.06, 0.32, 0.47, 10.97, 1.59, 1.26, -0.29, 0.11, 0.54, 0.22, 1.81, 0.97, 16.5, 1.22, 2.66, 4.32, -0.23, 5.43]} \ No newline at end of file diff --git a/annotations_filtered/dwykptqZBj0_filtered.json b/annotations_filtered/dwykptqZBj0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b5c011c0b169e81976c4cbb9a7465e304c5e8937 --- /dev/null +++ b/annotations_filtered/dwykptqZBj0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.49], [3.0, 3.89], [5.0, 5.48], [7.0, 8.56], [17.0, 17.95], [21.0, 22.59], [25.0, 25.95], [27.0, 26.96], [28.0, 28.24], [29.0, 29.91], [32.0, 32.27], [36.0, 37.15], [39.0, 39.72], [41.0, 42.15], [45.0, 46.82], [48.0, 48.95], [50.0, 50.58], [51.0, 52.51], [61.0, 62.61], [64.0, 65.91], [67.0, 67.47], [68.0, 69.08], [70.0, 70.58], [76.0, 83.34], [84.0, 96.04], [97.0, 99.08], [100.0, 102.44], [103.0, 104.55], [107.0, 107.0], [109.0, 109.81], [112.0, 114.54], [115.0, 116.16], [119.0, 119.2], [122.0, 123.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.01, 31.57, 47.27, 45.43, 0.0, 0.0, 0.0, 52.8, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.5], ["theremin", 27.01], ["hum", 2.77]], [["theremin", 83.68], ["music", 13.4], ["musical instrument", 0.39]], [["hum", 25.01], ["mains hum", 19.17], ["speech", 15.66]], [["hiccup", 28.27], ["speech", 15.53], ["dog", 6.32]], null, null, null, null, null, null, null], "duration": [0.49, 0.89, 0.48, 1.56, 0.95, 1.59, 0.95, -0.04, 0.24, 0.91, 0.27, 1.15, 0.72, 1.15, 1.82, 0.95, 0.58, 1.51, 1.61, 1.91, 0.47, 1.08, 0.58, 7.34, 12.04, 2.08, 2.44, 1.55, 0.0, 0.81, 2.54, 1.16, 0.2, 1.43]} \ No newline at end of file diff --git a/annotations_filtered/dwzoyEaHxSM_filtered.json b/annotations_filtered/dwzoyEaHxSM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9eca81f9597d0524946d3d8617ac7b9226ee5730 --- /dev/null +++ b/annotations_filtered/dwzoyEaHxSM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.5], [7.0, 7.72], [18.0, 18.45], [19.0, 18.93], [21.0, 21.59], [24.0, 24.46], [26.0, 26.57], [28.0, 29.13], [30.0, 30.75], [34.0, 34.23], [36.0, 38.03], [39.0, 40.17], [42.0, 43.43], [45.0, 45.5], [47.0, 47.44], [50.0, 50.4], [51.0, 52.56], [61.0, 61.2], [63.0, 65.01], [65.0, 66.99], [68.0, 69.97], [71.0, 73.16], [74.0, 75.27], [77.0, 78.41], [80.0, 81.84], [83.0, 83.98], [89.0, 90.02], [93.0, 93.8], [94.0, 95.74], [98.0, 98.05], [99.0, 100.6], [102.0, 104.04], [105.0, 107.01], [108.0, 108.65], [109.0, 110.2], [113.0, 114.03], [115.0, 116.31], [120.0, 121.73], [124.0, 125.79], [127.0, 128.33], [132.0, 133.22], [136.0, 137.56], [140.0, 141.08], [141.0, 142.5], [144.0, 144.15], [147.0, 148.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.64, 0.0, 0.0, 67.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.11, 69.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 0.72, 0.45, -0.07, 0.59, 0.46, 0.57, 1.13, 0.75, 0.23, 2.03, 1.17, 1.43, 0.5, 0.44, 0.4, 1.56, 0.2, 2.01, 1.99, 1.97, 2.16, 1.27, 1.41, 1.84, 0.98, 1.02, 0.8, 1.74, 0.05, 1.6, 2.04, 2.01, 0.65, 1.2, 1.03, 1.31, 1.73, 1.79, 1.33, 1.22, 1.56, 1.08, 1.5, 0.15, 1.2]} \ No newline at end of file diff --git a/annotations_filtered/dx07n7Eov0o_filtered.json b/annotations_filtered/dx07n7Eov0o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b9b93f788a12656809f9dbeb71d33636d4efdf3 --- /dev/null +++ b/annotations_filtered/dx07n7Eov0o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.51], [5.0, 7.92], [12.0, 12.72], [14.0, 14.81], [19.0, 19.68], [23.0, 23.3], [28.0, 29.08], [33.0, 33.17], [35.0, 35.97], [38.0, 40.95], [44.0, 44.46], [47.0, 47.19], [50.0, 51.66], [67.0, 68.25], [70.0, 70.23], [72.0, 72.28], [85.0, 87.3], [94.0, 99.17], [105.0, 107.57], [110.0, 121.31], [123.0, 133.86], [135.0, 143.18], [151.0, 151.39], [155.0, 156.07], [160.0, 163.97], [167.0, 167.85], [170.0, 170.95], [172.0, 173.28], [175.0, 178.51], [179.0, 179.93], [187.0, 190.83], [191.0, 192.4], [194.0, 198.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, true, true, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 52.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.64, 54.3, 47.31, 35.22, 36.87, 44.72, 0.0, 0.0, 71.14, 0.0, 0.0, 0.0, 49.0, 0.0, 47.94, 0.0, 31.7], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 36.76], ["electric shaver, electric razor", 7.78], ["didgeridoo", 7.44]], null, [["music", 46.12], ["speech", 12.41], ["synthesizer", 5.47]], [["hum", 31.33], ["electric shaver, electric razor", 17.6], ["mains hum", 13.37]], [["buzz", 38.3], ["whimper", 17.98], ["hum", 9.95]], [["music", 25.9], ["singing bowl", 10.6], ["whale vocalization", 7.56]], null, null, null, null, null, null, [["speech", 31.11], ["music", 20.51], ["hum", 6.67]], null, [["hum", 36.52], ["throbbing", 36.28], ["mains hum", 11.84]], null, [["music", 22.85], ["speech", 14.0], ["fly, housefly", 9.05]]], "duration": [1.51, 2.92, 0.72, 0.81, 0.68, 0.3, 1.08, 0.17, 0.97, 2.95, 0.46, 0.19, 1.66, 1.25, 0.23, 0.28, 2.3, 5.17, 2.57, 11.31, 10.86, 8.18, 0.39, 1.07, 3.97, 0.85, 0.95, 1.28, 3.51, 0.93, 3.83, 1.4, 4.59]} \ No newline at end of file diff --git a/annotations_filtered/dxfqu-v68IM_filtered.json b/annotations_filtered/dxfqu-v68IM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae265411d4600940eaf787368f4970a33ca8c27e --- /dev/null +++ b/annotations_filtered/dxfqu-v68IM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.0], [8.0, 7.94], [15.0, 16.16], [24.0, 23.95], [29.0, 31.53], [33.0, 33.57], [37.0, 37.08], [40.0, 40.02], [44.0, 44.93], [48.0, 48.83], [52.0, 52.19], [56.0, 59.24], [61.0, 60.89], [63.0, 63.56], [74.0, 74.36], [76.0, 77.08], [79.0, 78.87], [85.0, 91.17], [93.0, 97.39], [104.0, 105.38], [109.0, 110.0], [112.0, 111.97], [124.0, 124.33], [137.0, 139.18], [141.0, 142.48], [145.0, 147.34], [148.0, 151.39], [152.0, 153.69], [154.0, 157.91], [158.0, 160.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 63.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.35, 0.0, 0.0, 0.0, 0.0, 0.0, 90.78, 48.65, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 56.25, 96.54, 0.0, 96.77, 65.32], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["mosquito", 66.92], ["fly, housefly", 21.75], ["insect", 5.78]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.0, -0.06, 1.16, -0.05, 2.53, 0.57, 0.08, 0.02, 0.93, 0.83, 0.19, 3.24, -0.11, 0.56, 0.36, 1.08, -0.13, 6.17, 4.39, 1.38, 1.0, -0.03, 0.33, 2.18, 1.48, 2.34, 3.39, 1.69, 3.91, 2.3]} \ No newline at end of file diff --git a/annotations_filtered/dxlbeqeGkQ8_filtered.json b/annotations_filtered/dxlbeqeGkQ8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ba78753cc6a30f187867214a3f4cee7d11db1a2 --- /dev/null +++ b/annotations_filtered/dxlbeqeGkQ8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.69], [15.0, 15.18], [18.0, 18.6], [19.0, 22.22], [23.0, 24.54], [25.0, 26.57], [36.0, 36.29], [37.0, 59.48], [70.0, 70.46], [78.0, 80.81], [83.0, 82.66], [83.0, 83.94], [87.0, 90.46], [91.0, 93.33], [94.0, 97.8], [98.0, 101.44], [114.0, 119.96], [120.0, 121.88], [123.0, 123.26], [124.0, 125.14], [127.0, 127.5], [128.0, 128.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 64.75, 0.0, 0.0, 0.0, 80.29, 0.0, 83.34, 0.0, 0.0, 78.72, 77.87, 86.82, 70.02, 58.13, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.69, 0.18, 0.6, 3.22, 1.54, 1.57, 0.29, 22.48, 0.46, 2.81, -0.34, 0.94, 3.46, 2.33, 3.8, 3.44, 5.96, 1.88, 0.26, 1.14, 0.5, 0.53]} \ No newline at end of file diff --git a/annotations_filtered/dy3yjv2YLh0_filtered.json b/annotations_filtered/dy3yjv2YLh0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a29cd97d7a6b915d2875a52e1c6cc30e16f7b44 --- /dev/null +++ b/annotations_filtered/dy3yjv2YLh0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.17], [15.0, 15.57], [21.0, 32.24], [49.0, 50.5], [55.0, 57.18], [76.0, 77.35], [83.0, 85.83], [95.0, 98.61], [100.0, 101.28], [103.0, 104.16], [108.0, 108.65], [116.0, 117.14], [123.0, 126.01], [127.0, 128.17], [130.0, 132.48], [134.0, 135.6], [139.0, 139.23], [141.0, 141.49], [143.0, 143.31]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 38.97, 0.0, 54.23, 0.0, 56.03, 52.74, 0.0, 0.0, 0.0, 0.0, 46.33, 0.0, 38.14, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["glass", 16.4], ["music", 15.42], ["coin (dropping)", 6.78]], null, null, null, null, null, null, null, null, null, [["speech", 24.85], ["music", 15.4], ["boing", 11.16]], null, [["music", 15.45], ["speech", 13.97], ["singing bowl", 6.0]], null, null, null, null], "duration": [1.17, 0.57, 11.24, 1.5, 2.18, 1.35, 2.83, 3.61, 1.28, 1.16, 0.65, 1.14, 3.01, 1.17, 2.48, 1.6, 0.23, 0.49, 0.31]} \ No newline at end of file diff --git a/annotations_filtered/dy9fKXNAhA0_filtered.json b/annotations_filtered/dy9fKXNAhA0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fab30beb1fe792da404cf360d7167e955fec1420 --- /dev/null +++ b/annotations_filtered/dy9fKXNAhA0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.3], [3.0, 3.65], [8.0, 8.41], [9.0, 9.15], [10.0, 10.47], [12.0, 12.29], [13.0, 15.04], [18.0, 19.33], [20.0, 20.82], [22.0, 22.52], [23.0, 24.11], [28.0, 28.36], [31.0, 31.94], [34.0, 34.65], [39.0, 39.24], [41.0, 41.88], [43.0, 44.0], [45.0, 46.28], [49.0, 51.43], [52.0, 52.91], [54.0, 55.71], [57.0, 56.98], [58.0, 58.72], [59.0, 60.39], [61.0, 62.45], [64.0, 65.01], [66.0, 68.35], [71.0, 71.79], [74.0, 74.95], [76.0, 80.82], [83.0, 85.56], [87.0, 90.09], [91.0, 92.5], [93.0, 97.63], [99.0, 108.21], [109.0, 112.31], [113.0, 114.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.78, 0.0, 0.0, 99.96, 100.0, 100.0, 0.0, 100.0, 98.93, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.3, 0.65, 0.41, 0.15, 0.47, 0.29, 2.04, 1.33, 0.82, 0.52, 1.11, 0.36, 0.94, 0.65, 0.24, 0.88, 1.0, 1.28, 2.43, 0.91, 1.71, -0.02, 0.72, 1.39, 1.45, 1.01, 2.35, 0.79, 0.95, 4.82, 2.56, 3.09, 1.5, 4.63, 9.21, 3.31, 1.98]} \ No newline at end of file diff --git a/annotations_filtered/dyCbGaYPSIY_filtered.json b/annotations_filtered/dyCbGaYPSIY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ef4d655a61dc08f66b39663e1ef80a1ec24e910 --- /dev/null +++ b/annotations_filtered/dyCbGaYPSIY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.6], [16.0, 18.06], [19.0, 28.58], [54.0, 64.44], [92.0, 99.54], [135.0, 147.72]], "keep_status": [false, true, false, false, false, false], "silence_prob": [0.0, 28.02, 28.08, 28.2, 28.01, 28.16], "audiomae_on_audioset": [null, [["music", 35.46], ["cacophony", 7.22], ["didgeridoo", 5.34]], [["music", 95.22], ["speech", 0.67], ["electronic music", 0.42]], [["music", 98.12], ["electronic music", 0.52], ["reverberation", 0.12]], [["music", 80.48], ["electronic music", 1.41], ["maraca", 1.14]], [["music", 70.85], ["speech", 15.04], ["electronic music", 2.29]]], "duration": [0.6, 2.06, 9.58, 10.44, 7.54, 12.72]} \ No newline at end of file diff --git a/annotations_filtered/dyXlsD7Gx0Y_filtered.json b/annotations_filtered/dyXlsD7Gx0Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ac8a2d63ace8872bde4eb515bc779ee1e2f34c1 --- /dev/null +++ b/annotations_filtered/dyXlsD7Gx0Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.38], [4.0, 7.21], [8.0, 15.35], [16.0, 68.62], [70.0, 71.73], [72.0, 75.05], [75.0, 76.72], [79.0, 81.04], [82.0, 90.32], [92.0, 105.22], [106.0, 106.66], [107.0, 111.47], [112.0, 112.65], [113.0, 128.76], [131.0, 131.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 89.19, 100.0, 0.0, 0.0, 99.92, 0.0, 100.0, 97.64, 97.11, 0.0, 91.3, 0.0, 84.98, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.38, 3.21, 7.35, 52.62, 1.73, 3.05, 1.72, 2.04, 8.32, 13.22, 0.66, 4.47, 0.65, 15.76, 0.8]} \ No newline at end of file diff --git a/annotations_filtered/dyqDd8esYdc_filtered.json b/annotations_filtered/dyqDd8esYdc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c1f853ce045dc74ffd430162563d82ffa27be0d6 --- /dev/null +++ b/annotations_filtered/dyqDd8esYdc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 16.21], [19.0, 20.97], [25.0, 30.11], [34.0, 35.85], [40.0, 40.59], [41.0, 41.42], [44.0, 44.59], [45.0, 47.19], [47.0, 47.28], [47.0, 47.75], [51.0, 53.7], [59.0, 59.29], [60.0, 68.47], [69.0, 72.3], [74.0, 75.32], [77.0, 78.21], [79.0, 80.37], [82.0, 86.41], [88.0, 90.17], [90.0, 95.5], [97.0, 98.32], [99.0, 111.64]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [57.25, 0.0, 66.15, 0.0, 0.0, 0.0, 0.0, 45.33, 0.0, 0.0, 68.02, 0.0, 74.29, 93.91, 0.0, 0.0, 0.0, 73.82, 69.2, 64.75, 0.0, 85.17], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["mains hum", 33.01], ["hum", 13.25], ["vehicle", 5.2]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.21, 1.97, 5.11, 1.85, 0.59, 0.42, 0.59, 2.19, 0.28, 0.75, 2.7, 0.29, 8.47, 3.3, 1.32, 1.21, 1.37, 4.41, 2.17, 5.5, 1.32, 12.64]} \ No newline at end of file diff --git a/annotations_filtered/dyxcQ4FV6KM_filtered.json b/annotations_filtered/dyxcQ4FV6KM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/dyxcQ4FV6KM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/dzbazAbjk8w_filtered.json b/annotations_filtered/dzbazAbjk8w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8f02b3af8ccbb95ed54fe499ffe8603ce0f0bc8c --- /dev/null +++ b/annotations_filtered/dzbazAbjk8w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.1], [5.0, 5.91], [8.0, 8.11], [12.0, 12.9], [15.0, 16.21], [22.0, 22.28], [33.0, 35.56], [37.0, 37.67], [39.0, 39.73], [43.0, 43.9], [46.0, 46.41], [49.0, 49.44], [50.0, 52.12], [53.0, 53.94], [55.0, 54.77], [56.0, 59.17], [61.0, 62.06], [64.0, 64.84], [68.0, 68.49], [70.0, 70.7], [73.0, 73.6], [75.0, 75.34], [76.0, 78.26], [80.0, 80.22], [90.0, 92.82], [94.0, 94.66], [98.0, 98.17], [101.0, 102.51], [104.0, 105.04], [106.0, 107.2], [109.0, 109.92], [114.0, 114.22], [122.0, 122.81], [124.0, 124.58], [125.0, 127.97], [131.0, 131.73]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.92, 0.0, 0.0, 0.0, 0.0, 0.0, 33.32, 0.0, 0.0, 34.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.88, 0.0, 36.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.7, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["whale vocalization", 20.85], ["fly, housefly", 15.41], ["music", 13.4]], null, null, null, null, null, [["music", 37.25], ["musical instrument", 5.94], ["theremin", 4.21]], null, null, [["fly, housefly", 13.6], ["music", 10.96], ["mosquito", 5.32]], null, null, null, null, null, null, [["music", 11.95], ["didgeridoo", 7.81], ["fly, housefly", 5.38]], null, [["music", 24.58], ["speech", 5.96], ["hum", 4.9]], null, null, null, null, null, null, null, null, null, [["radio", 51.28], ["speech", 10.95], ["didgeridoo", 8.76]], null], "duration": [0.1, 0.91, 0.11, 0.9, 1.21, 0.28, 2.56, 0.67, 0.73, 0.9, 0.41, 0.44, 2.12, 0.94, -0.23, 3.17, 1.06, 0.84, 0.49, 0.7, 0.6, 0.34, 2.26, 0.22, 2.82, 0.66, 0.17, 1.51, 1.04, 1.2, 0.92, 0.22, 0.81, 0.58, 2.97, 0.73]} \ No newline at end of file diff --git a/annotations_filtered/dzkjnPSbxJw_filtered.json b/annotations_filtered/dzkjnPSbxJw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8b753f80049ba194d3024b434b2164a32dfef5cb --- /dev/null +++ b/annotations_filtered/dzkjnPSbxJw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.69], [9.0, 9.48], [10.0, 15.52], [17.0, 18.84], [26.0, 27.19], [33.0, 35.95], [38.0, 38.7], [39.0, 41.37], [50.0, 50.55], [52.0, 52.29], [55.0, 56.15], [64.0, 64.1], [68.0, 67.86], [69.0, 70.44], [76.0, 77.01], [87.0, 88.4], [90.0, 91.5], [97.0, 96.94], [100.0, 108.09], [109.0, 109.54], [112.0, 112.19], [116.0, 117.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 96.42, 0.0, 0.0, 100.0, 0.0, 99.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.69, 0.48, 5.52, 1.84, 1.19, 2.95, 0.7, 2.37, 0.55, 0.29, 1.15, 0.1, -0.14, 1.44, 1.01, 1.4, 1.5, -0.06, 8.09, 0.54, 0.19, 1.64]} \ No newline at end of file diff --git a/annotations_filtered/dzvTHhWDjIg_filtered.json b/annotations_filtered/dzvTHhWDjIg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f73294217e2e06033fc36c1bcab1c1c700cd346b --- /dev/null +++ b/annotations_filtered/dzvTHhWDjIg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.12], [4.0, 21.95]], "keep_status": [false, false], "silence_prob": [0.0, 30.22], "audiomae_on_audioset": [null, [["music", 88.65], ["drum machine", 1.53], ["drum and bass", 1.19]]], "duration": [1.12, 17.95]} \ No newline at end of file diff --git a/annotations_filtered/dzzijuZof1w_filtered.json b/annotations_filtered/dzzijuZof1w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..46ce546f63bcd3b24d2072b9d8a62bb1dfc32cfb --- /dev/null +++ b/annotations_filtered/dzzijuZof1w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 23.48], [28.0, 28.66], [29.0, 29.98], [31.0, 40.42], [41.0, 52.64], [59.0, 78.14], [79.0, 103.65], [105.0, 113.24], [114.0, 114.78], [116.0, 132.75], [135.0, 139.6], [143.0, 144.29], [148.0, 148.58]], "keep_status": [false, false, false, true, false, true, true, true, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 29.43, 29.18, 28.88, 29.03, 29.09, 0.0, 28.84, 28.97, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 24.37], ["speech", 22.91], ["hum", 21.42]], [["throbbing", 39.55], ["music", 30.28], ["hum", 15.94]], [["music", 28.51], ["speech", 15.98], ["hum", 9.39]], [["music", 27.05], ["machine gun", 20.18], ["hum", 11.68]], [["music", 27.45], ["rumble", 11.59], ["gong", 9.81]], null, [["music", 43.81], ["hum", 10.74], ["mains hum", 6.94]], [["music", 30.02], ["hum", 19.1], ["mains hum", 10.97]], null, null], "duration": [0.48, 0.66, 0.98, 9.42, 11.64, 19.14, 24.65, 8.24, 0.78, 16.75, 4.6, 1.29, 0.58]} \ No newline at end of file