diff --git a/annotations_filtered/q-1DREuXwjc_filtered.json b/annotations_filtered/q-1DREuXwjc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..878dee1383200e004a89e780017d0ff1a895525f --- /dev/null +++ b/annotations_filtered/q-1DREuXwjc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.24], [3.0, 2.83], [3.0, 7.64], [10.0, 10.2], [13.0, 13.76], [15.0, 18.27], [21.0, 21.07], [22.0, 22.17], [23.0, 23.45], [25.0, 26.55], [32.0, 32.41], [39.0, 39.73], [41.0, 41.45], [44.0, 44.51], [48.0, 48.95]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 38.84, 0.0, 0.0, 45.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["hum", 32.53], ["mains hum", 15.74], ["speech", 15.25]], null, null, [["speech", 40.42], ["sine wave", 30.86], ["chirp tone", 8.52]], null, null, null, null, null, null, null, null, null], "duration": [1.24, -0.17, 4.64, 0.2, 0.76, 3.27, 0.07, 0.17, 0.45, 1.55, 0.41, 0.73, 0.45, 0.51, 0.95]} \ No newline at end of file diff --git a/annotations_filtered/q-H62GgHjeg_filtered.json b/annotations_filtered/q-H62GgHjeg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3c3d957135dd3ea4595c9334185fc7c1c726f572 --- /dev/null +++ b/annotations_filtered/q-H62GgHjeg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.43], [17.0, 17.58], [29.0, 30.48], [55.0, 55.76], [59.0, 60.18], [71.0, 72.47], [74.0, 75.73], [76.0, 77.6], [78.0, 78.22], [81.0, 81.01], [83.0, 83.62], [94.0, 94.78], [105.0, 105.85], [110.0, 114.35], [115.0, 115.37], [122.0, 123.42], [126.0, 126.52], [128.0, 128.97], [130.0, 133.51], [138.0, 137.86], [139.0, 145.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.89, 0.0, 0.0, 0.0, 0.0, 32.84, 0.0, 31.65], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["fart", 34.47], ["speech", 29.46], ["music", 6.12]], null, null, null, null, [["cattle, bovinae", 23.0], ["music", 19.66], ["moo", 17.99]], null, [["speech", 26.02], ["cattle, bovinae", 24.3], ["moo", 17.48]]], "duration": [0.43, 0.58, 1.48, 0.76, 1.18, 1.47, 1.73, 1.6, 0.22, 0.01, 0.62, 0.78, 0.85, 4.35, 0.37, 1.42, 0.52, 0.97, 3.51, -0.14, 6.69]} \ No newline at end of file diff --git a/annotations_filtered/q-StMfE8NrA_filtered.json b/annotations_filtered/q-StMfE8NrA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3367e3c1c4632b915949d4f9e2ed3fd0a34b33bc --- /dev/null +++ b/annotations_filtered/q-StMfE8NrA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 7.21], [8.0, 49.08], [51.0, 85.87]], "keep_status": [false, false, false], "silence_prob": [32.37, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 34.28], ["music", 33.27], ["throbbing", 12.38]], null, null], "duration": [6.21, 41.08, 34.87]} \ No newline at end of file diff --git a/annotations_filtered/q-kLlfq4JpU_filtered.json b/annotations_filtered/q-kLlfq4JpU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b1399a9551f5d71c74e99f9a10561b0382f32c1b --- /dev/null +++ b/annotations_filtered/q-kLlfq4JpU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 33.89], [42.0, 42.69], [44.0, 43.78]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [-0.11, 0.69, -0.22]} \ No newline at end of file diff --git a/annotations_filtered/q-nQtR-WbIs_filtered.json b/annotations_filtered/q-nQtR-WbIs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..859d5bd8a8db60b8a5bc926d9f78d290652f5aa1 --- /dev/null +++ b/annotations_filtered/q-nQtR-WbIs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 10.99], [15.0, 16.09], [17.0, 18.67], [20.0, 21.05], [23.0, 24.83], [25.0, 27.5], [31.0, 31.35], [33.0, 33.89], [36.0, 42.15], [44.0, 45.4], [49.0, 53.2], [55.0, 57.52], [60.0, 61.84], [63.0, 65.65], [68.0, 70.68], [72.0, 91.34], [93.0, 97.53], [98.0, 101.28], [102.0, 109.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [61.87, 0.0, 0.0, 0.0, 0.0, 60.42, 0.0, 0.0, 63.64, 0.0, 58.3, 80.11, 0.0, 73.51, 46.36, 53.22, 71.57, 53.4, 57.48], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.09], ["musical instrument", 12.16], ["guitar", 5.93]], null, null, null, null], "duration": [4.99, 1.09, 1.67, 1.05, 1.83, 2.5, 0.35, 0.89, 6.15, 1.4, 4.2, 2.52, 1.84, 2.65, 2.68, 19.34, 4.53, 3.28, 7.75]} \ No newline at end of file diff --git a/annotations_filtered/q-y6JBpCFtI_filtered.json b/annotations_filtered/q-y6JBpCFtI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..91d8a9f29f5c18341099019084a9d5c556d1ec55 --- /dev/null +++ b/annotations_filtered/q-y6JBpCFtI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.1], [22.0, 23.14], [30.0, 31.24], [33.0, 34.59], [36.0, 37.62], [39.0, 40.53], [46.0, 47.65], [53.0, 53.43], [56.0, 57.03], [60.0, 63.61], [67.0, 68.25], [69.0, 70.36], [79.0, 80.13], [88.0, 99.45], [101.0, 101.01], [106.0, 106.32], [107.0, 107.69], [118.0, 120.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.62, 0.0, 0.0, 0.0, 97.83, 0.0, 0.0, 0.0, 93.13], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.1, 1.14, 1.24, 1.59, 1.62, 1.53, 1.65, 0.43, 1.03, 3.61, 1.25, 1.36, 1.13, 11.45, 0.01, 0.32, 0.69, 2.75]} \ No newline at end of file diff --git a/annotations_filtered/q06t8RTLqMQ_filtered.json b/annotations_filtered/q06t8RTLqMQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2fda730f465461b60b72a11f8fe98f5b3b24e514 --- /dev/null +++ b/annotations_filtered/q06t8RTLqMQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.34], [10.0, 12.26], [15.0, 15.63], [17.0, 17.69], [25.0, 35.95], [36.0, 40.68], [41.0, 42.42], [43.0, 44.79], [47.0, 47.33], [50.0, 55.59], [57.0, 60.35], [62.0, 64.05], [66.0, 67.36], [71.0, 71.63], [74.0, 75.02], [83.0, 86.0], [88.0, 90.17], [92.0, 98.39], [102.0, 105.43], [107.0, 108.75], [110.0, 109.95], [113.0, 114.2], [115.0, 115.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [92.64, 84.25, 0.0, 0.0, 33.39, 32.21, 0.0, 0.0, 0.0, 73.06, 40.99, 40.93, 0.0, 0.0, 0.0, 59.42, 46.61, 80.11, 41.28, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["dial tone", 47.99], ["speech", 28.52], ["sidetone", 8.24]], [["cattle, bovinae", 48.9], ["moo", 33.44], ["livestock, farm animals, working animals", 10.75]], null, null, null, null, [["dial tone", 19.85], ["chirp tone", 19.43], ["sine wave", 14.41]], [["cattle, bovinae", 38.64], ["moo", 36.11], ["livestock, farm animals, working animals", 4.39]], null, null, null, null, [["chirp tone", 53.41], ["sine wave", 17.39], ["busy signal", 3.8]], null, [["speech", 51.68], ["noise", 11.67], ["sidetone", 8.07]], null, null, null, null], "duration": [4.34, 2.26, 0.63, 0.69, 10.95, 4.68, 1.42, 1.79, 0.33, 5.59, 3.35, 2.05, 1.36, 0.63, 1.02, 3.0, 2.17, 6.39, 3.43, 1.75, -0.05, 1.2, 0.67]} \ No newline at end of file diff --git a/annotations_filtered/q0vvYHuA10U_filtered.json b/annotations_filtered/q0vvYHuA10U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd97b3c18332424f494adc80beafa473fe2e8284 --- /dev/null +++ b/annotations_filtered/q0vvYHuA10U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.32], [11.0, 21.81], [22.0, 21.9], [22.0, 39.26], [40.0, 46.63], [48.0, 56.4], [59.0, 76.94], [81.0, 85.7], [88.0, 91.1], [94.0, 106.15], [108.0, 108.85], [113.0, 117.41]], "keep_status": [true, true, false, true, true, false, true, true, true, false, false, false], "silence_prob": [29.39, 29.98, 0.0, 29.38, 29.85, 60.05, 32.6, 36.74, 33.44, 29.85, 0.0, 60.14], "audiomae_on_audioset": [[["speech", 56.75], ["explosion", 6.39], ["burst, pop", 4.82]], [["buzz", 37.02], ["hum", 11.18], ["music", 6.94]], null, [["music", 25.82], ["hum", 13.13], ["cacophony", 10.18]], [["speech", 57.7], ["vehicle", 4.2], ["explosion", 3.51]], null, [["music", 57.44], ["theremin", 9.18], ["electronic music", 2.88]], [["music", 46.44], ["brass instrument", 7.49], ["trombone", 4.7]], [["music", 37.71], ["speech", 15.08], ["didgeridoo", 4.84]], [["music", 50.91], ["buzz", 16.01], ["didgeridoo", 3.53]], null, null], "duration": [2.32, 10.81, -0.1, 17.26, 6.63, 8.4, 17.94, 4.7, 3.1, 12.15, 0.85, 4.41]} \ No newline at end of file diff --git a/annotations_filtered/q0yFqlPrLyE_filtered.json b/annotations_filtered/q0yFqlPrLyE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b4669189fe00db6f9f23bfc4e9034a194fc61ad --- /dev/null +++ b/annotations_filtered/q0yFqlPrLyE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.43], [8.0, 15.52], [18.0, 18.47], [19.0, 22.17], [23.0, 29.94], [31.0, 39.31], [45.0, 52.56], [56.0, 61.28], [62.0, 63.34], [65.0, 65.8], [74.0, 74.58], [75.0, 78.41], [80.0, 80.28], [83.0, 82.9], [95.0, 95.32], [98.0, 99.87], [100.0, 100.79], [104.0, 105.78], [108.0, 109.17], [113.0, 113.9], [115.0, 115.42], [116.0, 117.24], [118.0, 119.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.85, 93.29, 0.0, 74.6, 41.98, 38.23, 35.42, 36.6, 0.0, 0.0, 0.0, 63.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["boing", 58.0], ["music", 28.85], ["speech", 6.57]], [["music", 75.79], ["musical instrument", 4.69], ["brass instrument", 2.0]], [["music", 66.78], ["speech", 7.5], ["livestock, farm animals, working animals", 3.17]], [["music", 82.57], ["singing", 1.21], ["musical instrument", 0.93]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.43, 7.52, 0.47, 3.17, 6.94, 8.31, 7.56, 5.28, 1.34, 0.8, 0.58, 3.41, 0.28, -0.1, 0.32, 1.87, 0.79, 1.78, 1.17, 0.9, 0.42, 1.24, 1.79]} \ No newline at end of file diff --git a/annotations_filtered/q15Yv0rZXqs_filtered.json b/annotations_filtered/q15Yv0rZXqs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0bb4b410aad287521586b32d360df6b802d92e45 --- /dev/null +++ b/annotations_filtered/q15Yv0rZXqs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.78], [9.0, 11.82], [14.0, 15.75], [36.0, 36.64], [41.0, 43.06], [46.0, 56.37], [60.0, 80.72], [83.0, 90.31], [92.0, 104.9], [108.0, 108.16]], "keep_status": [false, true, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 46.12, 0.0, 0.0, 86.64, 43.85, 37.11, 35.41, 32.44, 0.0], "audiomae_on_audioset": [null, [["music", 52.11], ["brass instrument", 6.08], ["clarinet", 6.06]], null, null, null, [["speech", 52.36], ["music", 22.95], ["musical instrument", 5.35]], [["music", 69.08], ["didgeridoo", 16.59], ["musical instrument", 2.19]], [["music", 37.52], ["didgeridoo", 18.35], ["speech", 6.39]], [["cattle, bovinae", 41.85], ["moo", 30.65], ["livestock, farm animals, working animals", 14.96]], null], "duration": [1.78, 2.82, 1.75, 0.64, 2.06, 10.37, 20.72, 7.31, 12.9, 0.16]} \ No newline at end of file diff --git a/annotations_filtered/q1D9i-d1m4Y_filtered.json b/annotations_filtered/q1D9i-d1m4Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..489d8ea175a4dad6014677ce5797bd1549aa654e --- /dev/null +++ b/annotations_filtered/q1D9i-d1m4Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.02], [26.0, 25.93], [38.0, 38.47], [43.0, 45.25], [55.0, 59.07], [61.0, 76.32]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 44.96, 46.97, 43.74], "audiomae_on_audioset": [null, null, null, [["music", 92.01], ["speech", 0.89], ["musical instrument", 0.63]], [["music", 71.98], ["didgeridoo", 3.05], ["musical instrument", 2.5]], [["music", 76.88], ["trombone", 3.96], ["didgeridoo", 3.76]]], "duration": [1.02, -0.07, 0.47, 2.25, 4.07, 15.32]} \ No newline at end of file diff --git a/annotations_filtered/q1Pz7ppcuJc_filtered.json b/annotations_filtered/q1Pz7ppcuJc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..33b109dee9ee2902e71303671c5ecef79d065a52 --- /dev/null +++ b/annotations_filtered/q1Pz7ppcuJc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.37], [6.0, 8.75], [9.0, 12.21], [13.0, 15.96], [20.0, 22.1], [23.0, 24.04], [26.0, 25.98], [28.0, 28.51], [29.0, 30.55], [32.0, 35.99], [37.0, 38.18], [40.0, 41.03], [44.0, 45.89], [47.0, 62.24], [63.0, 64.81], [66.0, 66.19], [67.0, 68.72], [69.0, 70.56], [74.0, 75.09], [77.0, 77.45], [78.0, 78.88], [80.0, 81.33], [83.0, 83.51], [87.0, 87.51], [88.0, 93.56], [96.0, 96.67], [97.0, 100.84], [103.0, 104.58], [105.0, 106.96], [111.0, 111.52], [112.0, 115.52], [117.0, 123.72], [129.0, 129.69]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [91.47, 84.98, 49.22, 85.72, 44.34, 0.0, 0.0, 0.0, 0.0, 48.06, 0.0, 0.0, 0.0, 41.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.71, 0.0, 51.82, 0.0, 0.0, 0.0, 54.04, 51.71, 0.0], "audiomae_on_audioset": [null, null, [["speech", 52.06], ["telephone", 13.12], ["sidetone", 7.11]], null, [["speech", 43.81], ["cat", 5.86], ["inside, small room", 3.66]], null, null, null, null, [["thunk", 15.77], ["noise", 14.97], ["crushing", 13.75]], null, null, null, [["music", 51.39], ["electric shaver, electric razor", 7.36], ["hum", 5.36]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.37, 2.75, 3.21, 2.96, 2.1, 1.04, -0.02, 0.51, 1.55, 3.99, 1.18, 1.03, 1.89, 15.24, 1.81, 0.19, 1.72, 1.56, 1.09, 0.45, 0.88, 1.33, 0.51, 0.51, 5.56, 0.67, 3.84, 1.58, 1.96, 0.52, 3.52, 6.72, 0.69]} \ No newline at end of file diff --git a/annotations_filtered/q1SFvQhjK5I_filtered.json b/annotations_filtered/q1SFvQhjK5I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..00e18a206fc89cde1e872484411cd86ffe61c352 --- /dev/null +++ b/annotations_filtered/q1SFvQhjK5I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 41.28], [42.0, 42.26], [43.0, 43.68], [45.0, 45.15], [50.0, 50.8], [53.0, 54.06], [55.0, 56.54], [58.0, 58.8], [65.0, 65.67], [66.0, 67.54], [69.0, 69.52], [70.0, 71.07], [73.0, 73.72], [80.0, 81.82], [84.0, 84.94], [101.0, 101.95], [103.0, 104.45], [105.0, 106.68], [108.0, 109.07], [111.0, 111.54], [112.0, 112.97], [114.0, 114.64], [116.0, 118.1], [129.0, 130.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [37.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.43, 0.0], "audiomae_on_audioset": [[["music", 77.7], ["theremin", 2.9], ["throbbing", 1.33]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [17.28, 0.26, 0.68, 0.15, 0.8, 1.06, 1.54, 0.8, 0.67, 1.54, 0.52, 1.07, 0.72, 1.82, 0.94, 0.95, 1.45, 1.68, 1.07, 0.54, 0.97, 0.64, 2.1, 1.01]} \ No newline at end of file diff --git a/annotations_filtered/q1bV-D8cSz8_filtered.json b/annotations_filtered/q1bV-D8cSz8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9fdb1cc4765a78d247937cae11041ba0de172c80 --- /dev/null +++ b/annotations_filtered/q1bV-D8cSz8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 37.77], [39.0, 44.68], [49.0, 71.68], [72.0, 72.62], [77.0, 77.25], [79.0, 79.62], [81.0, 82.07], [83.0, 96.45], [96.0, 115.42]], "keep_status": [false, false, false, false, false, false, false, true, false], "silence_prob": [80.11, 86.82, 72.75, 0.0, 0.0, 0.0, 0.0, 32.66, 33.61], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 23.95], ["speech", 16.88], ["hum", 14.72]], [["music", 37.04], ["speech", 24.19], ["smash, crash", 9.74]]], "duration": [22.77, 5.68, 22.68, 0.62, 0.25, 0.62, 1.07, 13.45, 19.42]} \ No newline at end of file diff --git a/annotations_filtered/q254XDNZ2Ao_filtered.json b/annotations_filtered/q254XDNZ2Ao_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e5d0e85225e0deb22a9b6bd08b2029452826d02a --- /dev/null +++ b/annotations_filtered/q254XDNZ2Ao_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 30.75], [36.0, 38.52], [44.0, 48.05], [49.0, 50.36], [51.0, 85.09], [87.0, 116.95], [117.0, 117.02], [118.0, 117.78]], "keep_status": [true, true, true, false, false, true, false, false], "silence_prob": [31.56, 32.37, 39.41, 0.0, 0.0, 30.1, 0.0, 0.0], "audiomae_on_audioset": [[["music", 20.43], ["didgeridoo", 9.59], ["theremin", 6.52]], [["speech", 25.4], ["race car, auto racing", 8.76], ["vehicle", 5.75]], [["music", 34.53], ["fly, housefly", 7.43], ["mosquito", 5.22]], null, null, [["music", 15.18], ["fart", 14.86], ["whack, thwack", 10.16]], null, null], "duration": [16.75, 2.52, 4.05, 1.36, 34.09, 29.95, 0.02, -0.22]} \ No newline at end of file diff --git a/annotations_filtered/q289a8P8Ht8_filtered.json b/annotations_filtered/q289a8P8Ht8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c2d827271413ff968398496b2f7db9db8586bd01 --- /dev/null +++ b/annotations_filtered/q289a8P8Ht8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 116.88], [118.0, 149.82]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [82.88, 31.82]} \ No newline at end of file diff --git a/annotations_filtered/q292IDwEWZ0_filtered.json b/annotations_filtered/q292IDwEWZ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7380f13ffe2262ea5f8ae6e42d3ae3265b9d61c8 --- /dev/null +++ b/annotations_filtered/q292IDwEWZ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 19.99], [22.0, 22.94], [24.0, 25.79], [27.0, 30.15], [31.0, 43.44], [44.0, 44.31], [44.0, 44.37], [44.0, 46.87], [50.0, 83.42], [86.0, 101.17], [102.0, 102.41], [109.0, 109.85], [110.0, 118.83], [121.0, 134.59]], "keep_status": [false, false, false, true, false, false, false, true, false, false, false, false, true, true], "silence_prob": [29.32, 0.0, 0.0, 29.09, 29.06, 0.0, 0.0, 29.17, 0.0, 31.86, 0.0, 0.0, 29.92, 28.79], "audiomae_on_audioset": [[["music", 38.93], ["speech", 35.7], ["thunk", 2.42]], null, null, [["theremin", 31.87], ["music", 27.32], ["crowd", 3.77]], [["cattle, bovinae", 33.73], ["moo", 20.29], ["livestock, farm animals, working animals", 18.62]], null, null, [["whack, thwack", 30.92], ["throbbing", 15.67], ["whip", 9.01]], null, [["music", 44.22], ["theremin", 21.93], ["ambient music", 5.12]], null, null, [["music", 22.35], ["fly, housefly", 22.3], ["insect", 7.58]], [["livestock, farm animals, working animals", 13.56], ["music", 12.15], ["cattle, bovinae", 6.67]]], "duration": [18.99, 0.94, 1.79, 3.15, 12.44, 0.31, 0.37, 2.87, 33.42, 15.17, 0.41, 0.85, 8.83, 13.59]} \ No newline at end of file diff --git a/annotations_filtered/q2EU-k9I5yg_filtered.json b/annotations_filtered/q2EU-k9I5yg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf33f8ca162013533cbc139e174d7cf73ac3292f --- /dev/null +++ b/annotations_filtered/q2EU-k9I5yg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.48], [4.0, 4.45], [10.0, 10.39], [12.0, 12.04], [13.0, 13.61], [19.0, 19.57], [45.0, 45.6], [48.0, 48.61], [58.0, 59.19], [97.0, 97.12], [101.0, 101.33], [102.0, 102.1], [106.0, 107.32], [111.0, 111.91], [113.0, 113.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [92.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.48, 0.45, 0.39, 0.04, 0.61, 0.57, 0.6, 0.61, 1.19, 0.12, 0.33, 0.1, 1.32, 0.91, 0.64]} \ No newline at end of file diff --git a/annotations_filtered/q2YwvMc96VY_filtered.json b/annotations_filtered/q2YwvMc96VY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed5fb815cca7de6d97ce2ead61b5a59dd07f0238 --- /dev/null +++ b/annotations_filtered/q2YwvMc96VY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.3], [5.0, 6.02], [7.0, 7.05], [9.0, 9.81], [11.0, 11.53], [14.0, 14.57], [16.0, 16.44], [20.0, 20.17], [22.0, 64.52], [65.0, 67.37], [68.0, 69.6], [70.0, 72.82], [73.0, 75.36], [76.0, 77.63], [79.0, 79.44], [80.0, 80.76], [83.0, 83.24], [85.0, 86.07], [87.0, 90.54], [91.0, 100.33], [103.0, 104.14], [107.0, 108.8], [109.0, 111.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.9, 0.0, 57.48, 64.07, 0.0, 0.0, 0.0, 0.0, 0.0, 92.8, 33.63, 0.0, 0.0, 52.1], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 47.18], ["speech", 15.51], ["sidetone", 5.07]], null, null, null], "duration": [1.3, 1.02, 0.05, 0.81, 0.53, 0.57, 0.44, 0.17, 42.52, 2.37, 1.6, 2.82, 2.36, 1.63, 0.44, 0.76, 0.24, 1.07, 3.54, 9.33, 1.14, 1.8, 2.92]} \ No newline at end of file diff --git a/annotations_filtered/q2pzOimT9so_filtered.json b/annotations_filtered/q2pzOimT9so_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73b97c0f386b259b0e423b708d584ef2a7890c33 --- /dev/null +++ b/annotations_filtered/q2pzOimT9so_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 26.87], [27.0, 27.67], [29.0, 32.16], [34.0, 43.5], [44.0, 48.93], [51.0, 52.79], [55.0, 57.23], [58.0, 63.71], [68.0, 69.31]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [73.97, 0.0, 96.42, 99.97, 97.11, 0.0, 84.43, 99.44, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [18.87, 0.67, 3.16, 9.5, 4.93, 1.79, 2.23, 5.71, 1.31]} \ No newline at end of file diff --git a/annotations_filtered/q30Pl1M6_DE_filtered.json b/annotations_filtered/q30Pl1M6_DE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eaac6bf946caee7a2f3fd1483ee6423e6145e19b --- /dev/null +++ b/annotations_filtered/q30Pl1M6_DE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 110.42], [113.0, 112.9], [114.0, 136.07]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 29.54], "audiomae_on_audioset": [null, null, [["music", 69.57], ["hum", 9.74], ["mains hum", 4.53]]], "duration": [92.42, -0.1, 22.07]} \ No newline at end of file diff --git a/annotations_filtered/q3JlGPF4Ko8_filtered.json b/annotations_filtered/q3JlGPF4Ko8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf919baa064f6f602b512ef0040070c07b94f745 --- /dev/null +++ b/annotations_filtered/q3JlGPF4Ko8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.06], [5.0, 5.68], [6.0, 8.14], [10.0, 10.89], [12.0, 13.42], [14.0, 18.84], [22.0, 29.89], [34.0, 35.33], [39.0, 47.58], [49.0, 50.01], [52.0, 53.5], [56.0, 58.6], [61.0, 63.51], [65.0, 65.89], [72.0, 115.67], [117.0, 118.32], [120.0, 121.95]], "keep_status": [true, false, true, false, false, false, false, false, true, false, false, true, true, false, false, false, false], "silence_prob": [30.41, 0.0, 39.24, 0.0, 0.0, 42.3, 54.1, 0.0, 41.64, 0.0, 0.0, 49.36, 35.68, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["sound effect", 10.76], ["music", 9.96], ["trombone", 8.21]], null, [["hum", 22.74], ["sidetone", 20.33], ["mains hum", 19.7]], null, null, [["speech", 46.75], ["radio", 26.61], ["hum", 4.39]], null, null, [["hum", 26.72], ["mains hum", 25.87], ["vehicle", 8.24]], null, null, [["hum", 6.52], ["vehicle", 6.36], ["creak", 5.51]], [["speech", 18.55], ["radio", 11.12], ["frog", 7.68]], null, null, null, null], "duration": [2.06, 0.68, 2.14, 0.89, 1.42, 4.84, 7.89, 1.33, 8.58, 1.01, 1.5, 2.6, 2.51, 0.89, 43.67, 1.32, 1.95]} \ No newline at end of file diff --git a/annotations_filtered/q3NI5sE3KeY_filtered.json b/annotations_filtered/q3NI5sE3KeY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eef57e27ec11cf537d802c6082a87417d4314f4a --- /dev/null +++ b/annotations_filtered/q3NI5sE3KeY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.23], [16.0, 17.61], [22.0, 22.77], [26.0, 26.47], [30.0, 30.91], [41.0, 41.64], [58.0, 59.07], [60.0, 61.59], [63.0, 64.66], [78.0, 78.58], [80.0, 80.11], [83.0, 90.98], [93.0, 94.41], [96.0, 97.39], [102.0, 104.58], [106.0, 107.2], [112.0, 112.77], [117.0, 117.04], [122.0, 122.91], [127.0, 126.86], [132.0, 134.25], [138.0, 137.74], [143.0, 143.67], [158.0, 159.87], [164.0, 164.25], [181.0, 181.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.88, 0.0, 0.0, 56.03, 0.0, 0.0, 0.0, 0.0, 0.0, 48.35, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["didgeridoo", 46.53], ["music", 29.43], ["mains hum", 4.95]], null, null, null, null, null], "duration": [0.23, 1.61, 0.77, 0.47, 0.91, 0.64, 1.07, 1.59, 1.66, 0.58, 0.11, 7.98, 1.41, 1.39, 2.58, 1.2, 0.77, 0.04, 0.91, -0.14, 2.25, -0.26, 0.67, 1.87, 0.25, 0.28]} \ No newline at end of file diff --git a/annotations_filtered/q3OTEdZkBaQ_filtered.json b/annotations_filtered/q3OTEdZkBaQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..12b4343b9c74f0131a6b98707f01002e8c585b11 --- /dev/null +++ b/annotations_filtered/q3OTEdZkBaQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 15.7], [27.0, 31.75], [33.0, 35.41], [36.0, 37.18], [53.0, 54.16], [56.0, 56.61], [70.0, 70.33], [73.0, 78.49], [80.0, 80.57], [82.0, 82.32]], "keep_status": [true, false, false, false, false, false, false, true, false, false], "silence_prob": [32.69, 34.04, 32.52, 0.0, 0.0, 0.0, 0.0, 30.5, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 25.18], ["fly, housefly", 17.96], ["music", 13.51]], [["hum", 43.48], ["mains hum", 25.16], ["whale vocalization", 7.12]], [["mains hum", 32.88], ["whale vocalization", 23.9], ["hum", 17.33]], null, null, null, null, [["music", 41.53], ["speech", 16.67], ["fart", 6.5]], null, null], "duration": [3.7, 4.75, 2.41, 1.18, 1.16, 0.61, 0.33, 5.49, 0.57, 0.32]} \ No newline at end of file diff --git a/annotations_filtered/q3Vvto0REuc_filtered.json b/annotations_filtered/q3Vvto0REuc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5f24b32a11034a4bb60f4b37641d5be338fa1fe5 --- /dev/null +++ b/annotations_filtered/q3Vvto0REuc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 22.05], [28.0, 39.77], [41.0, 41.91], [44.0, 46.67], [48.0, 50.04], [51.0, 52.05], [53.0, 54.06], [56.0, 56.49], [57.0, 58.23], [63.0, 63.83], [65.0, 65.74], [67.0, 70.12], [71.0, 72.1], [73.0, 73.99], [75.0, 75.95], [77.0, 77.53], [79.0, 79.88], [81.0, 82.31], [83.0, 83.47], [85.0, 85.77], [88.0, 91.86], [93.0, 94.86], [97.0, 97.16], [99.0, 99.03], [101.0, 101.61], [102.0, 103.25], [104.0, 104.38], [105.0, 104.94], [107.0, 107.76], [109.0, 109.93], [111.0, 112.24], [115.0, 115.08], [116.0, 117.42], [119.0, 119.57], [122.0, 123.16], [124.0, 124.78], [126.0, 126.69], [128.0, 128.73], [130.0, 130.98], [133.0, 133.32], [134.0, 135.01], [136.0, 137.03], [139.0, 143.16], [148.0, 149.88], [150.0, 152.56], [153.0, 154.75], [156.0, 157.17], [158.0, 160.1], [161.0, 162.08], [164.0, 166.53], [168.0, 168.89], [172.0, 193.24], [194.0, 195.61], [197.0, 197.46], [200.0, 202.95], [204.0, 205.43], [208.0, 215.89], [217.0, 219.06], [219.0, 221.97], [222.0, 224.14], [225.0, 228.33]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 30.57, 0.0, 49.68, 98.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.91, 0.0, 56.18, 0.0, 0.0, 53.84, 0.0, 99.76, 0.0, 94.95, 0.0, 0.0, 78.55, 0.0, 99.88, 62.78, 49.27, 39.63, 99.16], "audiomae_on_audioset": [null, [["fly, housefly", 15.2], ["hum", 15.1], ["music", 13.9]], null, [["speech", 11.13], ["hum", 10.58], ["sneeze", 9.63]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 49.07], ["sidetone", 24.02], ["hum", 3.63]], [["speech", 31.75], ["sidetone", 19.56], ["dial tone", 12.14]], null], "duration": [1.05, 11.77, 0.91, 2.67, 2.04, 1.05, 1.06, 0.49, 1.23, 0.83, 0.74, 3.12, 1.1, 0.99, 0.95, 0.53, 0.88, 1.31, 0.47, 0.77, 3.86, 1.86, 0.16, 0.03, 0.61, 1.25, 0.38, -0.06, 0.76, 0.93, 1.24, 0.08, 1.42, 0.57, 1.16, 0.78, 0.69, 0.73, 0.98, 0.32, 1.01, 1.03, 4.16, 1.88, 2.56, 1.75, 1.17, 2.1, 1.08, 2.53, 0.89, 21.24, 1.61, 0.46, 2.95, 1.43, 7.89, 2.06, 2.97, 2.14, 3.33]} \ No newline at end of file diff --git a/annotations_filtered/q3a5wxfm13Q_filtered.json b/annotations_filtered/q3a5wxfm13Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e25fea28303080f8b195d25570a8ecc8e21153d --- /dev/null +++ b/annotations_filtered/q3a5wxfm13Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.66], [7.0, 10.94], [12.0, 11.87], [17.0, 17.61], [18.0, 18.67], [20.0, 20.92], [22.0, 22.28], [26.0, 26.65], [31.0, 31.13], [37.0, 36.85], [37.0, 38.23], [40.0, 40.58], [42.0, 42.21], [43.0, 43.39], [46.0, 46.75], [49.0, 49.17], [52.0, 52.03], [57.0, 56.86], [58.0, 58.75], [63.0, 62.99], [65.0, 65.92], [68.0, 70.95], [71.0, 71.71], [72.0, 72.6], [83.0, 83.02], [85.0, 98.31], [99.0, 99.4], [101.0, 101.46], [103.0, 107.49], [109.0, 111.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 84.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.56, 0.0, 0.0, 0.0, 91.13, 0.0, 0.0, 31.23, 57.56], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 82.45], ["radio", 10.48], ["speech synthesizer", 1.65]], null, null, null, null, null, null, [["speech", 84.17], ["radio", 8.92], ["speech synthesizer", 1.88]], null], "duration": [0.66, 3.94, -0.13, 0.61, 0.67, 0.92, 0.28, 0.65, 0.13, -0.15, 1.23, 0.58, 0.21, 0.39, 0.75, 0.17, 0.03, -0.14, 0.75, -0.01, 0.92, 2.95, 0.71, 0.6, 0.02, 13.31, 0.4, 0.46, 4.49, 2.91]} \ No newline at end of file diff --git a/annotations_filtered/q42thgSKkpo_filtered.json b/annotations_filtered/q42thgSKkpo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..71cdd813712ecf42a270c7d28116d0ab2cd15ca6 --- /dev/null +++ b/annotations_filtered/q42thgSKkpo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 64.52], [67.0, 75.03], [76.0, 81.19], [83.0, 83.44], [84.0, 83.61], [84.0, 99.37], [103.0, 110.79], [116.0, 118.81], [122.0, 132.19], [133.0, 153.87], [155.0, 158.97]], "keep_status": [false, true, true, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 29.06, 30.16, 0.0, 0.0, 29.37, 42.19, 36.52, 35.61, 38.9, 29.26], "audiomae_on_audioset": [null, [["music", 26.49], ["speech", 23.9], ["mains hum", 13.67]], [["music", 25.8], ["mains hum", 6.93], ["foghorn", 6.43]], null, null, [["music", 65.23], ["didgeridoo", 7.31], ["speech", 3.64]], [["music", 41.02], ["speech", 15.76], ["whale vocalization", 7.68]], [["theremin", 36.28], ["music", 31.47], ["wind instrument, woodwind instrument", 4.54]], [["music", 46.12], ["theremin", 25.52], ["whale vocalization", 4.7]], [["didgeridoo", 43.17], ["music", 34.13], ["musical instrument", 2.84]], [["music", 45.52], ["musical instrument", 9.54], ["sound effect", 6.44]]], "duration": [56.52, 8.03, 5.19, 0.44, -0.39, 15.37, 7.79, 2.81, 10.19, 20.87, 3.97]} \ No newline at end of file diff --git a/annotations_filtered/q437KEcmwmM_filtered.json b/annotations_filtered/q437KEcmwmM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2dea49a350f20ddb7348aefed2574a9395b02b62 --- /dev/null +++ b/annotations_filtered/q437KEcmwmM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 37.13], [43.0, 43.48], [44.0, 49.01], [52.0, 85.55], [88.0, 93.88], [95.0, 96.89], [97.0, 104.48]], "keep_status": [true, false, true, false, false, false, false], "silence_prob": [35.0, 0.0, 30.58, 0.0, 70.72, 0.0, 46.05], "audiomae_on_audioset": [[["music", 9.82], ["vehicle", 6.77], ["eruption", 5.16]], null, [["music", 34.67], ["speech", 20.6], ["eruption", 11.35]], null, null, null, [["music", 67.71], ["hum", 4.34], ["electronic music", 3.81]]], "duration": [4.13, 0.48, 5.01, 33.55, 5.88, 1.89, 7.48]} \ No newline at end of file diff --git a/annotations_filtered/q4G5hUvL-wI_filtered.json b/annotations_filtered/q4G5hUvL-wI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b793fce6f2685c5d7a444544bcbf92984502f5d --- /dev/null +++ b/annotations_filtered/q4G5hUvL-wI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 32.09], [33.0, 39.65], [42.0, 48.54], [49.0, 49.4], [50.0, 72.47], [75.0, 87.45], [88.0, 96.13], [96.0, 113.88]], "keep_status": [false, false, false, false, false, true, false, true], "silence_prob": [33.76, 32.35, 37.9, 0.0, 36.35, 34.87, 34.6, 34.0], "audiomae_on_audioset": [[["music", 64.56], ["synthesizer", 10.34], ["musical instrument", 4.38]], [["music", 59.36], ["musical instrument", 12.59], ["synthesizer", 5.86]], [["music", 68.37], ["effects unit", 9.12], ["guitar", 5.57]], null, [["music", 63.74], ["synthesizer", 4.78], ["musical instrument", 2.77]], [["music", 49.96], ["clarinet", 12.2], ["saxophone", 7.81]], [["music", 58.76], ["saxophone", 9.59], ["musical instrument", 4.51]], [["music", 55.42], ["saxophone", 7.38], ["harmonica", 7.17]]], "duration": [11.09, 6.65, 6.54, 0.4, 22.47, 12.45, 8.13, 17.88]} \ No newline at end of file diff --git a/annotations_filtered/q4Qlk7sfZfQ_filtered.json b/annotations_filtered/q4Qlk7sfZfQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..28902b04769abbb0f2ffddabe514050bfaf9549f --- /dev/null +++ b/annotations_filtered/q4Qlk7sfZfQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.39], [11.0, 14.98], [15.0, 25.84], [27.0, 32.75], [36.0, 43.77], [49.0, 76.6], [79.0, 82.76], [84.0, 83.91], [89.0, 89.56], [90.0, 89.82], [90.0, 90.95], [91.0, 92.16], [92.0, 95.84], [96.0, 96.82], [101.0, 117.51], [119.0, 123.97], [127.0, 127.36]], "keep_status": [true, true, true, true, true, true, true, false, false, false, false, false, false, false, true, true, false], "silence_prob": [39.25, 44.37, 31.19, 31.03, 30.41, 30.86, 43.13, 0.0, 0.0, 0.0, 0.0, 0.0, 52.05, 0.0, 30.36, 30.33, 0.0], "audiomae_on_audioset": [[["music", 16.67], ["effects unit", 9.06], ["musical instrument", 6.95]], [["effects unit", 22.56], ["distortion", 13.1], ["noise", 6.49]], [["speech", 9.02], ["echo", 7.98], ["boing", 7.29]], [["noise", 12.4], ["hum", 11.83], ["buzz", 11.35]], [["car", 15.08], ["vehicle", 14.31], ["crowd", 9.19]], [["animal", 18.12], ["fly, housefly", 14.96], ["insect", 13.04]], [["fly, housefly", 24.15], ["noise", 17.64], ["insect", 11.4]], null, null, null, null, null, null, null, [["car", 12.76], ["echo", 10.57], ["vehicle", 10.23]], [["speech", 32.39], ["cacophony", 16.01], ["radio", 6.05]], null], "duration": [2.39, 3.98, 10.84, 5.75, 7.77, 27.6, 3.76, -0.09, 0.56, -0.18, 0.95, 1.16, 3.84, 0.82, 16.51, 4.97, 0.36]} \ No newline at end of file diff --git a/annotations_filtered/q4RbzjuXB6E_filtered.json b/annotations_filtered/q4RbzjuXB6E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dae6a3f778bed2b4883100dd86f8982f39b1d7fe --- /dev/null +++ b/annotations_filtered/q4RbzjuXB6E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 31.16], [33.0, 37.44], [40.0, 45.69], [46.0, 69.31], [82.0, 82.95], [84.0, 85.94], [88.0, 113.26], [114.0, 115.16]], "keep_status": [true, false, false, false, false, false, false, false], "silence_prob": [34.6, 47.2, 40.43, 35.36, 0.0, 0.0, 33.36, 0.0], "audiomae_on_audioset": [[["music", 31.26], ["speech", 20.23], ["electric shaver, electric razor", 9.69]], [["music", 48.4], ["didgeridoo", 15.03], ["speech", 10.6]], [["speech", 60.1], ["music", 23.52], ["fly, housefly", 2.28]], [["music", 64.08], ["throbbing", 5.84], ["hum", 3.34]], null, null, [["music", 48.63], ["speech", 26.18], ["electric shaver, electric razor", 3.78]], null], "duration": [26.16, 4.44, 5.69, 23.31, 0.95, 1.94, 25.26, 1.16]} \ No newline at end of file diff --git a/annotations_filtered/q4VIMzhfeYc_filtered.json b/annotations_filtered/q4VIMzhfeYc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84423ee56833c836d879bb9c5b0a5b1f4b602ec3 --- /dev/null +++ b/annotations_filtered/q4VIMzhfeYc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.09], [10.0, 16.53], [28.0, 29.56], [30.0, 38.58], [39.0, 49.77], [51.0, 51.41], [53.0, 54.23], [55.0, 56.56], [57.0, 65.74], [67.0, 68.12], [70.0, 70.66], [73.0, 72.89], [73.0, 73.06], [74.0, 74.9], [79.0, 82.53], [83.0, 82.95], [83.0, 83.17], [84.0, 84.2], [86.0, 86.93], [88.0, 88.89], [90.0, 98.1], [99.0, 103.47], [104.0, 105.56], [106.0, 107.03], [108.0, 108.94], [110.0, 111.42], [112.0, 113.04], [116.0, 116.61], [118.0, 118.5], [122.0, 123.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [96.54, 87.0, 0.0, 99.91, 100.0, 0.0, 0.0, 0.0, 78.55, 0.0, 0.0, 0.0, 0.0, 0.0, 85.72, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 97.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.09, 6.53, 1.56, 8.58, 10.77, 0.41, 1.23, 1.56, 8.74, 1.12, 0.66, -0.11, 0.06, 0.9, 3.53, -0.05, 0.17, 0.2, 0.93, 0.89, 8.1, 4.47, 1.56, 1.03, 0.94, 1.42, 1.04, 0.61, 0.5, 1.42]} \ No newline at end of file diff --git a/annotations_filtered/q5BzDVDotzI_filtered.json b/annotations_filtered/q5BzDVDotzI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8a6d3b5bdc21d821dd322d9c38390a5e10f58b01 --- /dev/null +++ b/annotations_filtered/q5BzDVDotzI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.3], [4.0, 5.05], [5.0, 6.39], [7.0, 7.7], [10.0, 10.47], [13.0, 13.27], [14.0, 15.35], [20.0, 21.36], [23.0, 23.62], [26.0, 27.43], [28.0, 29.17], [30.0, 31.13], [32.0, 33.4], [35.0, 35.01], [36.0, 36.54], [38.0, 38.58], [39.0, 40.26], [44.0, 44.1], [47.0, 47.73], [48.0, 49.25], [51.0, 51.66], [56.0, 55.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.3, 1.05, 1.39, 0.7, 0.47, 0.27, 1.35, 1.36, 0.62, 1.43, 1.17, 1.13, 1.4, 0.01, 0.54, 0.58, 1.26, 0.1, 0.73, 1.25, 0.66, -0.07]} \ No newline at end of file diff --git a/annotations_filtered/q5K1fm56gI8_filtered.json b/annotations_filtered/q5K1fm56gI8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ff3078db431de730c671e12bff8985b66e58e3f8 --- /dev/null +++ b/annotations_filtered/q5K1fm56gI8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.29], [6.0, 6.66], [8.0, 10.29], [12.0, 12.07], [13.0, 17.36], [22.0, 23.11], [29.0, 30.11], [35.0, 36.12], [39.0, 39.85], [45.0, 45.76], [48.0, 61.45], [62.0, 62.85], [65.0, 66.53], [68.0, 70.16], [73.0, 117.76], [119.0, 119.84], [123.0, 171.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 45.72, 0.0, 37.31, 0.0, 0.0, 0.0, 0.0, 0.0, 30.54, 0.0, 0.0, 30.08, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["sidetone", 69.18], ["speech", 18.74], ["chirp tone", 2.29]], null, [["speech", 56.16], ["sidetone", 12.94], ["hum", 4.17]], null, null, null, null, null, [["music", 53.88], ["synthesizer", 8.64], ["effects unit", 4.6]], null, null, [["music", 23.68], ["hum", 15.37], ["noise", 11.27]], null, null, null], "duration": [0.29, 0.66, 2.29, 0.07, 4.36, 1.11, 1.11, 1.12, 0.85, 0.76, 13.45, 0.85, 1.53, 2.16, 44.76, 0.84, 48.17]} \ No newline at end of file diff --git a/annotations_filtered/q5RSKejDWo8_filtered.json b/annotations_filtered/q5RSKejDWo8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b668e559887e787248df620dda7a746e3cab9f3 --- /dev/null +++ b/annotations_filtered/q5RSKejDWo8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.24], [5.0, 5.07], [7.0, 9.42], [11.0, 17.31], [26.0, 27.53], [31.0, 31.41], [32.0, 32.49], [33.0, 33.79], [41.0, 40.86], [42.0, 42.82], [44.0, 44.1], [47.0, 48.25], [53.0, 54.24], [55.0, 56.94], [58.0, 60.0], [62.0, 65.6], [69.0, 69.01], [76.0, 76.4], [77.0, 77.06], [80.0, 79.95], [81.0, 81.48], [82.0, 83.07], [83.0, 83.59], [84.0, 87.07], [88.0, 88.64], [89.0, 90.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 85.72, 60.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.88, 99.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.72, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.24, 0.07, 2.42, 6.31, 1.53, 0.41, 0.49, 0.79, -0.14, 0.82, 0.1, 1.25, 1.24, 1.94, 2.0, 3.6, 0.01, 0.4, 0.06, -0.05, 0.48, 1.07, 0.59, 3.07, 0.64, 1.17]} \ No newline at end of file diff --git a/annotations_filtered/q5eGg_CgBPk_filtered.json b/annotations_filtered/q5eGg_CgBPk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45bb471648d9e6d024c7cf48e62ce7ef59e4ec6c --- /dev/null +++ b/annotations_filtered/q5eGg_CgBPk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.0], [14.0, 15.08], [20.0, 36.95], [59.0, 61.13], [65.0, 79.03], [79.0, 79.07], [79.0, 79.1], [79.0, 79.41], [79.0, 79.44], [85.0, 85.11], [92.0, 98.17], [100.0, 102.29], [113.0, 120.5], [128.0, 130.54], [133.0, 148.44]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 32.51, 32.22, 32.7, 0.0, 0.0, 0.0, 0.0, 0.0, 32.88, 34.17, 33.75, 31.01, 35.3], "audiomae_on_audioset": [null, null, [["music", 23.97], ["speech", 18.5], ["breaking", 15.7]], [["speech", 41.2], ["music", 32.48], ["boing", 3.31]], [["speech", 48.29], ["music", 35.28], ["explosion", 2.42]], null, null, null, null, null, [["music", 45.03], ["didgeridoo", 14.62], ["speech", 11.91]], [["music", 41.47], ["theremin", 4.79], ["musical instrument", 4.75]], [["speech", 45.67], ["music", 35.79], ["sidetone", 6.72]], [["music", 41.66], ["trombone", 8.49], ["speech", 7.33]], [["whale vocalization", 40.86], ["theremin", 20.63], ["music", 16.89]]], "duration": [0.0, 1.08, 16.95, 2.13, 14.03, 0.07, 0.1, 0.41, 0.44, 0.11, 6.17, 2.29, 7.5, 2.54, 15.44]} \ No newline at end of file diff --git a/annotations_filtered/q5v5DOEF45E_filtered.json b/annotations_filtered/q5v5DOEF45E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f592ad45b43988152ef8143326d6aa1b73b18a2e --- /dev/null +++ b/annotations_filtered/q5v5DOEF45E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.51], [8.0, 9.15], [12.0, 12.97], [14.0, 15.4], [20.0, 20.73], [25.0, 26.5], [41.0, 44.22], [54.0, 55.16], [59.0, 61.92], [66.0, 66.8], [68.0, 69.21], [70.0, 77.53], [78.0, 82.97], [84.0, 89.45], [92.0, 94.95], [110.0, 111.3], [112.0, 118.88], [120.0, 121.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 44.49, 63.74, 53.84, 54.97, 0.0, 40.41, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 39.46], ["music", 25.58], ["whale vocalization", 7.14]], null, null, null, null, [["livestock, farm animals, working animals", 17.36], ["hum", 16.68], ["speech", 14.08]], null], "duration": [1.51, 1.15, 0.97, 1.4, 0.73, 1.5, 3.22, 1.16, 2.92, 0.8, 1.21, 7.53, 4.97, 5.45, 2.95, 1.3, 6.88, 1.15]} \ No newline at end of file diff --git a/annotations_filtered/q6ObhNBURyY_filtered.json b/annotations_filtered/q6ObhNBURyY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d7baf5e21a6979e8c05ab339e8bdfcbd6f46fc15 --- /dev/null +++ b/annotations_filtered/q6ObhNBURyY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 74.87], [76.0, 143.33], [144.0, 143.95], [144.0, 166.08]], "keep_status": [false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 28.5], "audiomae_on_audioset": [null, null, null, [["music", 19.68], ["vehicle", 13.41], ["car", 11.03]]], "duration": [45.87, 67.33, -0.05, 22.08]} \ No newline at end of file diff --git a/annotations_filtered/q6XF66xysgQ_filtered.json b/annotations_filtered/q6XF66xysgQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9aa5443be0b421bb40b78b53446196b0ed95edf6 --- /dev/null +++ b/annotations_filtered/q6XF66xysgQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.17], [7.0, 9.39], [11.0, 14.76], [16.0, 19.97], [22.0, 26.91], [27.0, 32.1], [39.0, 40.93], [42.0, 44.79], [46.0, 48.27], [52.0, 53.7], [57.0, 59.0], [60.0, 65.53], [67.0, 68.72], [76.0, 79.54], [81.0, 82.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [87.37, 93.29, 99.76, 98.66, 99.26, 97.33, 0.0, 97.92, 99.84, 0.0, 99.84, 99.71, 0.0, 99.76, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.17, 2.39, 3.76, 3.97, 4.91, 5.1, 1.93, 2.79, 2.27, 1.7, 2.0, 5.53, 1.72, 3.54, 1.41]} \ No newline at end of file diff --git a/annotations_filtered/q6j_0vS_NNM_filtered.json b/annotations_filtered/q6j_0vS_NNM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3222a58d5681c35fa936845350d7bdedd05d8a6c --- /dev/null +++ b/annotations_filtered/q6j_0vS_NNM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.58], [16.0, 18.57], [21.0, 22.17], [23.0, 27.63], [30.0, 36.73], [40.0, 41.08], [45.0, 49.71], [54.0, 54.53], [56.0, 58.04], [60.0, 64.32], [66.0, 76.3], [78.0, 81.97], [85.0, 85.72], [87.0, 99.3], [102.0, 109.26], [114.0, 113.86], [114.0, 113.9], [114.0, 117.98], [126.0, 127.23], [135.0, 136.34], [138.0, 144.41], [146.0, 152.27], [153.0, 154.09], [158.0, 161.25], [162.0, 163.02], [165.0, 173.42], [177.0, 177.04], [180.0, 182.07]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 47.27, 0.0, 47.12, 39.63, 0.0, 36.55, 0.0, 35.52, 38.93, 36.99, 39.83, 0.0, 35.77, 38.97, 0.0, 0.0, 41.89, 0.0, 0.0, 36.27, 35.59, 0.0, 34.88, 0.0, 37.05, 0.0, 46.64], "audiomae_on_audioset": [null, [["music", 56.9], ["fly, housefly", 5.47], ["insect", 2.84]], null, [["music", 63.09], ["bass guitar", 4.08], ["double bass", 2.84]], [["music", 74.2], ["bass guitar", 2.43], ["double bass", 2.09]], null, [["music", 77.85], ["musical instrument", 1.82], ["mantra", 1.59]], null, [["music", 73.24], ["humming", 3.63], ["carnatic music", 2.71]], [["music", 83.24], ["sad music", 1.23], ["musical instrument", 1.17]], [["music", 67.54], ["double bass", 7.28], ["cello", 5.9]], [["music", 69.54], ["mantra", 3.72], ["carnatic music", 2.64]], null, [["music", 79.48], ["sad music", 3.12], ["cello", 1.98]], [["music", 57.86], ["double bass", 11.95], ["cello", 9.96]], null, null, [["music", 62.64], ["theremin", 6.0], ["cello", 4.46]], null, null, [["music", 78.74], ["guitar", 3.5], ["plucked string instrument", 2.71]], [["music", 81.57], ["mantra", 1.87], ["musical instrument", 1.33]], null, [["music", 73.93], ["mantra", 2.11], ["vocal music", 1.46]], null, [["music", 79.52], ["double bass", 3.29], ["cello", 1.47]], null, [["music", 73.25], ["musical instrument", 1.8], ["scary music", 1.51]]], "duration": [0.58, 2.57, 1.17, 4.63, 6.73, 1.08, 4.71, 0.53, 2.04, 4.32, 10.3, 3.97, 0.72, 12.3, 7.26, -0.14, -0.1, 3.98, 1.23, 1.34, 6.41, 6.27, 1.09, 3.25, 1.02, 8.42, 0.04, 2.07]} \ No newline at end of file diff --git a/annotations_filtered/q6zi7XGjQQw_filtered.json b/annotations_filtered/q6zi7XGjQQw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..814416653c0a837383d0563dbdd0e676bec094d9 --- /dev/null +++ b/annotations_filtered/q6zi7XGjQQw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 24.51], [25.0, 25.84], [28.0, 28.26], [30.0, 30.13], [31.0, 32.83], [35.0, 35.7], [36.0, 36.59], [47.0, 47.78], [51.0, 51.06], [52.0, 52.34], [53.0, 53.47], [55.0, 55.43], [56.0, 56.69], [61.0, 61.33], [70.0, 70.87], [79.0, 78.75], [80.0, 80.77], [86.0, 87.51], [88.0, 88.99], [90.0, 90.63], [91.0, 92.03], [95.0, 95.86], [108.0, 108.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.51, 0.84, 0.26, 0.13, 1.83, 0.7, 0.59, 0.78, 0.06, 0.34, 0.47, 0.43, 0.69, 0.33, 0.87, -0.25, 0.77, 1.51, 0.99, 0.63, 1.03, 0.86, 0.4]} \ No newline at end of file diff --git a/annotations_filtered/q74RKOmIjC8_filtered.json b/annotations_filtered/q74RKOmIjC8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bfcfe5c7a66ee14eb8ec1483555dd26b456b328e --- /dev/null +++ b/annotations_filtered/q74RKOmIjC8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.49], [3.0, 3.47], [5.0, 6.4], [7.0, 7.86], [14.0, 14.32], [16.0, 16.68], [21.0, 22.57], [24.0, 25.61], [26.0, 39.18], [43.0, 43.28], [46.0, 48.36], [50.0, 50.92], [54.0, 55.38], [57.0, 59.07], [61.0, 62.01], [65.0, 65.8], [68.0, 68.96], [69.0, 70.39], [73.0, 73.68], [75.0, 75.91], [76.0, 77.3], [79.0, 79.81], [80.0, 80.5], [83.0, 83.39], [84.0, 87.05], [87.0, 89.58], [92.0, 92.72], [95.0, 95.98], [99.0, 99.13], [100.0, 100.82], [103.0, 104.26], [107.0, 110.27], [113.0, 113.8]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.45, 0.0, 99.31, 0.0, 0.0, 84.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.36, 43.13, 0.0, 0.0, 0.0, 0.0, 0.0, 83.16, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["fart", 23.88], ["fly, housefly", 14.05], ["speech", 10.05]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["whale vocalization", 42.51], ["speech", 6.36], ["dog", 5.23]], null, null, null, null, null, null, null], "duration": [1.49, 0.47, 1.4, 0.86, 0.32, 0.68, 1.57, 1.61, 13.18, 0.28, 2.36, 0.92, 1.38, 2.07, 1.01, 0.8, 0.96, 1.39, 0.68, 0.91, 1.3, 0.81, 0.5, 0.39, 3.05, 2.58, 0.72, 0.98, 0.13, 0.82, 1.26, 3.27, 0.8]} \ No newline at end of file diff --git a/annotations_filtered/q7CX_5D6y6E_filtered.json b/annotations_filtered/q7CX_5D6y6E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e5bc3977eb98fbe5a6073edc365b5594c950bb2 --- /dev/null +++ b/annotations_filtered/q7CX_5D6y6E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[47.0, 52.2]], "keep_status": [false], "silence_prob": [34.25], "audiomae_on_audioset": [[["music", 52.01], ["flute", 17.82], ["theremin", 14.7]]], "duration": [5.2]} \ No newline at end of file diff --git a/annotations_filtered/q7DHkw_5Wzw_filtered.json b/annotations_filtered/q7DHkw_5Wzw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d6c8c6ccf0c47539d3675d55538c04e5d1c3ec2 --- /dev/null +++ b/annotations_filtered/q7DHkw_5Wzw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.08], [9.0, 15.35], [15.0, 15.4], [15.0, 15.45], [15.0, 15.99], [16.0, 18.77], [19.0, 19.87], [23.0, 23.06], [24.0, 25.96], [28.0, 28.73], [30.0, 30.67], [31.0, 32.39], [33.0, 33.37], [36.0, 41.96], [45.0, 46.13], [47.0, 50.14], [53.0, 53.16], [56.0, 57.03], [59.0, 62.29], [63.0, 64.44], [66.0, 67.0], [69.0, 75.78], [77.0, 77.16], [81.0, 81.87], [83.0, 85.21], [88.0, 89.72], [93.0, 94.56], [103.0, 103.65], [112.0, 111.89], [114.0, 114.47], [118.0, 118.32], [122.0, 125.61], [126.0, 127.82], [130.0, 132.17], [134.0, 137.69], [138.0, 140.43], [145.0, 146.85], [149.0, 149.98], [152.0, 152.41], [154.0, 154.36], [155.0, 156.27], [160.0, 168.32], [170.0, 170.8], [172.0, 178.44], [179.0, 179.24], [181.0, 181.01], [182.0, 187.91], [189.0, 190.21], [192.0, 193.82], [198.0, 198.61], [202.0, 204.31], [206.0, 208.47], [209.0, 209.75], [211.0, 212.04], [213.0, 214.64], [216.0, 242.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [84.25, 59.07, 0.0, 0.0, 0.0, 73.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.72, 0.0, 100.0, 0.0, 0.0, 99.68, 0.0, 0.0, 99.05, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 100.0, 0.0, 0.0, 99.73, 0.0, 0.0, 0.0, 98.99, 99.59, 0.0, 0.0, 0.0, 99.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.08, 6.35, 0.4, 0.45, 0.99, 2.77, 0.87, 0.06, 1.96, 0.73, 0.67, 1.39, 0.37, 5.96, 1.13, 3.14, 0.16, 1.03, 3.29, 1.44, 1.0, 6.78, 0.16, 0.87, 2.21, 1.72, 1.56, 0.65, -0.11, 0.47, 0.32, 3.61, 1.82, 2.17, 3.69, 2.43, 1.85, 0.98, 0.41, 0.36, 1.27, 8.32, 0.8, 6.44, 0.24, 0.01, 5.91, 1.21, 1.82, 0.61, 2.31, 2.47, 0.75, 1.04, 1.64, 26.4]} \ No newline at end of file diff --git a/annotations_filtered/q7QxVddVEW0_filtered.json b/annotations_filtered/q7QxVddVEW0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..82f4eb7763a06ceaf8215be1efe82e3e6cb6bd2e --- /dev/null +++ b/annotations_filtered/q7QxVddVEW0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.38], [6.0, 6.2], [8.0, 10.18], [11.0, 11.89], [15.0, 16.01], [17.0, 18.55], [21.0, 21.61], [25.0, 25.0], [28.0, 30.3], [34.0, 35.58], [40.0, 40.47], [50.0, 64.32], [65.0, 82.36], [84.0, 88.69], [89.0, 94.71], [97.0, 96.8], [97.0, 109.85], [110.0, 112.99], [114.0, 114.4], [116.0, 117.64], [119.0, 119.45], [121.0, 121.66], [123.0, 123.26], [125.0, 127.6], [130.0, 132.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 89.72, 0.0, 0.0, 0.0, 0.0, 0.0, 98.8, 0.0, 0.0, 34.23, 44.2, 99.97, 99.94, 0.0, 79.41, 63.96, 0.0, 0.0, 0.0, 0.0, 0.0, 98.86, 99.85], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 46.94], ["smash, crash", 20.03], ["speech", 16.66]], [["music", 45.63], ["speech", 28.74], ["hum", 5.21]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.38, 0.2, 2.18, 0.89, 1.01, 1.55, 0.61, 0.0, 2.3, 1.58, 0.47, 14.32, 17.36, 4.69, 5.71, -0.2, 12.85, 2.99, 0.4, 1.64, 0.45, 0.66, 0.26, 2.6, 2.19]} \ No newline at end of file diff --git a/annotations_filtered/q7S2ckr4IkM_filtered.json b/annotations_filtered/q7S2ckr4IkM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b00bd6ab8f5f647a9f73bb1b0739f6b3ffb48350 --- /dev/null +++ b/annotations_filtered/q7S2ckr4IkM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 27.23], [29.0, 29.34], [32.0, 35.02], [35.0, 35.06], [35.0, 35.61], [37.0, 38.16], [45.0, 45.23], [48.0, 48.32], [53.0, 53.32], [54.0, 56.4], [62.0, 62.43], [69.0, 70.39], [71.0, 72.01], [75.0, 75.88], [77.0, 78.12], [80.0, 80.13], [82.0, 82.68], [86.0, 86.56], [89.0, 90.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 53.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.23, 0.34, 3.02, 0.06, 0.61, 1.16, 0.23, 0.32, 0.32, 2.4, 0.43, 1.39, 1.01, 0.88, 1.12, 0.13, 0.68, 0.56, 1.59]} \ No newline at end of file diff --git a/annotations_filtered/q7V1sM0VNaw_filtered.json b/annotations_filtered/q7V1sM0VNaw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b7635076f4d1842f95547a154cdf524d161e0b6 --- /dev/null +++ b/annotations_filtered/q7V1sM0VNaw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 14.25], [20.0, 26.97], [28.0, 28.56], [32.0, 33.72], [35.0, 35.51], [37.0, 38.28], [39.0, 39.92], [47.0, 48.24], [49.0, 49.98], [51.0, 52.05], [54.0, 54.5], [56.0, 56.47], [58.0, 59.64], [61.0, 63.48], [64.0, 64.84], [66.0, 67.56], [71.0, 71.96], [76.0, 77.26], [84.0, 84.47], [86.0, 86.49], [89.0, 92.13], [93.0, 93.33], [101.0, 101.97], [105.0, 105.51], [106.0, 106.54], [108.0, 111.92], [113.0, 113.78], [116.0, 115.6], [117.0, 118.64], [120.0, 124.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [35.86, 31.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.42, 0.0, 0.0, 0.0, 0.0, 58.98, 0.0, 0.0, 0.0, 29.84], "audiomae_on_audioset": [[["music", 54.8], ["sidetone", 11.94], ["speech", 9.01]], [["music", 78.58], ["throbbing", 3.97], ["musical instrument", 2.13]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 68.68], ["speech", 12.16], ["applause", 4.75]]], "duration": [4.25, 6.97, 0.56, 1.72, 0.51, 1.28, 0.92, 1.24, 0.98, 1.05, 0.5, 0.47, 1.64, 2.48, 0.84, 1.56, 0.96, 1.26, 0.47, 0.49, 3.13, 0.33, 0.97, 0.51, 0.54, 3.92, 0.78, -0.4, 1.64, 4.77]} \ No newline at end of file diff --git a/annotations_filtered/q7heVIEyvQ4_filtered.json b/annotations_filtered/q7heVIEyvQ4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..11ba8a28d1f8e52b40061657394934d335dbff82 --- /dev/null +++ b/annotations_filtered/q7heVIEyvQ4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 44.25], [47.0, 48.27]], "keep_status": [true, false], "silence_prob": [34.88, 0.0], "audiomae_on_audioset": [[["music", 52.21], ["didgeridoo", 4.22], ["throbbing", 3.6]], null], "duration": [3.25, 1.27]} \ No newline at end of file diff --git a/annotations_filtered/q7qwqVbZSqE_filtered.json b/annotations_filtered/q7qwqVbZSqE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/q7qwqVbZSqE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/q7tLJC4pC14_filtered.json b/annotations_filtered/q7tLJC4pC14_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba25ec36e7b1909c02a59ffce3ee332923263227 --- /dev/null +++ b/annotations_filtered/q7tLJC4pC14_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.34], [13.0, 14.03], [16.0, 23.46], [24.0, 31.4], [33.0, 33.76], [34.0, 35.18], [36.0, 36.34], [37.0, 40.46], [42.0, 43.12], [45.0, 46.43], [49.0, 49.59], [52.0, 53.28], [54.0, 55.0], [56.0, 59.1], [60.0, 61.3], [64.0, 65.7], [68.0, 68.39], [85.0, 85.72], [86.0, 87.0], [89.0, 93.73], [95.0, 95.62], [96.0, 96.57], [98.0, 107.25]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 32.29, 78.38, 0.0, 0.0, 0.0, 52.51, 0.0, 0.0, 0.0, 0.0, 0.0, 43.51, 0.0, 0.0, 0.0, 0.0, 0.0, 49.54, 0.0, 0.0, 31.69], "audiomae_on_audioset": [null, null, [["music", 54.84], ["electronic music", 4.13], ["speech", 2.56]], null, null, null, null, null, null, null, null, null, null, [["music", 31.79], ["speech", 15.51], ["fart", 9.13]], null, null, null, null, null, [["speech", 23.04], ["hum", 16.89], ["mains hum", 8.45]], null, null, [["speech", 16.6], ["animal", 12.71], ["beatboxing", 6.29]]], "duration": [0.34, 1.03, 7.46, 7.4, 0.76, 1.18, 0.34, 3.46, 1.12, 1.43, 0.59, 1.28, 1.0, 3.1, 1.3, 1.7, 0.39, 0.72, 1.0, 4.73, 0.62, 0.57, 9.25]} \ No newline at end of file diff --git a/annotations_filtered/q7vtWB4owdE_filtered.json b/annotations_filtered/q7vtWB4owdE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bf569dd718c629164de5246afee42e9cc7774835 --- /dev/null +++ b/annotations_filtered/q7vtWB4owdE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.29], [8.0, 7.89], [10.0, 10.25], [12.0, 13.09], [15.0, 16.73], [19.0, 19.5], [22.0, 21.78], [26.0, 26.97], [27.0, 28.17], [29.0, 29.59], [31.0, 31.6], [37.0, 37.93], [38.0, 39.5], [41.0, 41.55], [44.0, 44.1], [46.0, 47.43], [51.0, 52.98], [56.0, 56.27], [59.0, 71.88], [74.0, 75.86], [77.0, 79.37], [81.0, 84.55], [87.0, 88.01], [90.0, 90.9], [108.0, 109.11], [110.0, 111.33], [112.0, 112.95], [114.0, 116.09], [118.0, 120.02], [121.0, 121.78], [124.0, 124.82], [127.0, 126.94], [129.0, 129.57], [130.0, 131.92], [134.0, 134.79], [137.0, 138.55], [142.0, 142.74], [144.0, 143.87], [149.0, 149.74], [151.0, 157.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.55, 0.0, 44.37, 44.09, 0.0, 0.0, 0.0, 0.0, 0.0, 46.4, 70.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.26], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 33.9], ["chime", 19.31], ["ding", 5.66]], null, [["music", 43.85], ["timpani", 15.33], ["musical instrument", 12.42]], [["music", 39.94], ["timpani", 15.82], ["musical instrument", 9.96]], null, null, null, null, null, [["speech", 25.19], ["music", 19.12], ["theremin", 15.23]], null, null, null, null, null, null, null, null, null, null, null, [["foghorn", 31.57], ["music", 18.49], ["speech", 11.26]]], "duration": [1.29, -0.11, 0.25, 1.09, 1.73, 0.5, -0.22, 0.97, 1.17, 0.59, 0.6, 0.93, 1.5, 0.55, 0.1, 1.43, 1.98, 0.27, 12.88, 1.86, 2.37, 3.55, 1.01, 0.9, 1.11, 1.33, 0.95, 2.09, 2.02, 0.78, 0.82, -0.06, 0.57, 1.92, 0.79, 1.55, 0.74, -0.13, 0.74, 6.01]} \ No newline at end of file diff --git a/annotations_filtered/q8-xQspXFag_filtered.json b/annotations_filtered/q8-xQspXFag_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c5e56e219ebbf2aaf766295263bef28b529d6b44 --- /dev/null +++ b/annotations_filtered/q8-xQspXFag_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.85], [8.0, 10.37], [11.0, 11.69], [14.0, 14.99], [18.0, 18.91], [19.0, 22.22], [24.0, 45.0], [47.0, 48.09], [49.0, 53.38], [55.0, 56.1], [56.0, 143.45], [144.0, 143.72], [144.0, 143.75], [144.0, 143.82], [145.0, 147.04], [150.0, 153.52], [155.0, 155.98], [157.0, 164.89], [168.0, 171.39], [174.0, 175.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [98.8, 96.54, 0.0, 0.0, 0.0, 87.92, 79.07, 0.0, 35.54, 0.0, 0.0, 0.0, 0.0, 0.0, 62.47, 47.5, 0.0, 52.27, 61.87, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["whale vocalization", 57.46], ["music", 17.03], ["pigeon, dove", 2.64]], null, null, null, null, null, null, [["thunk", 52.54], ["fart", 4.97], ["hum", 3.99]], null, null, null, null], "duration": [2.85, 2.37, 0.69, 0.99, 0.91, 3.22, 21.0, 1.09, 4.38, 1.1, 87.45, -0.28, -0.25, -0.18, 2.04, 3.52, 0.98, 7.89, 3.39, 1.14]} \ No newline at end of file diff --git a/annotations_filtered/q85fsxWYG6A_filtered.json b/annotations_filtered/q85fsxWYG6A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..75d66b18e294f9093eb762172bbd4c76c52da5f5 --- /dev/null +++ b/annotations_filtered/q85fsxWYG6A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.3], [5.0, 5.85], [7.0, 7.8], [12.0, 12.31], [13.0, 13.81], [15.0, 21.47], [24.0, 25.14], [27.0, 28.73], [31.0, 31.58], [33.0, 33.57], [37.0, 37.35], [39.0, 39.97], [42.0, 42.89], [45.0, 45.76], [48.0, 48.2], [51.0, 52.02], [54.0, 54.58], [57.0, 57.82], [59.0, 59.95], [62.0, 64.03], [67.0, 67.9], [70.0, 70.73], [71.0, 71.69], [73.0, 80.23], [88.0, 89.6], [90.0, 91.27], [94.0, 94.69], [112.0, 113.19], [115.0, 116.19], [121.0, 121.71], [122.0, 122.44], [123.0, 123.4], [124.0, 124.65], [125.0, 125.44], [126.0, 126.35], [131.0, 131.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 63.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.94, 0.0, 0.0, 0.0, 47.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fart", 59.69], ["animal", 4.18], ["sheep", 2.24]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.3, 0.85, 0.8, 0.31, 0.81, 6.47, 1.14, 1.73, 0.58, 0.57, 0.35, 0.97, 0.89, 0.76, 0.2, 1.02, 0.58, 0.82, 0.95, 2.03, 0.9, 0.73, 0.69, 7.23, 1.6, 1.27, 0.69, 1.19, 1.19, 0.71, 0.44, 0.4, 0.65, 0.44, 0.35, 0.94]} \ No newline at end of file diff --git a/annotations_filtered/q8CXKTH5950_filtered.json b/annotations_filtered/q8CXKTH5950_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ff960e976b397f3a5032771e06cac57b6aa70737 --- /dev/null +++ b/annotations_filtered/q8CXKTH5950_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.71], [9.0, 10.86], [13.0, 13.96], [16.0, 16.71], [17.0, 18.15], [20.0, 22.57], [24.0, 24.56], [25.0, 30.3], [32.0, 32.49], [33.0, 33.61], [34.0, 35.45], [38.0, 38.18], [47.0, 64.32], [65.0, 68.72], [72.0, 88.18], [88.0, 89.51], [95.0, 104.99]], "keep_status": [true, false, false, false, false, true, false, true, false, false, false, false, false, true, false, false, true], "silence_prob": [43.03, 0.0, 0.0, 0.0, 0.0, 48.65, 0.0, 48.48, 0.0, 0.0, 0.0, 0.0, 33.82, 42.04, 35.89, 0.0, 35.25], "audiomae_on_audioset": [[["music", 46.11], ["musical instrument", 5.04], ["speech", 3.91]], null, null, null, null, [["music", 46.37], ["effects unit", 7.98], ["synthesizer", 5.03]], null, [["music", 44.56], ["synthesizer", 12.62], ["effects unit", 3.66]], null, null, null, null, [["music", 66.99], ["effects unit", 3.83], ["animal", 3.44]], [["music", 18.28], ["harp", 7.93], ["marimba, xylophone", 5.23]], [["music", 58.58], ["effects unit", 17.03], ["guitar", 5.51]], null, [["music", 42.25], ["effects unit", 18.89], ["musical instrument", 7.17]]], "duration": [3.71, 1.86, 0.96, 0.71, 1.15, 2.57, 0.56, 5.3, 0.49, 0.61, 1.45, 0.18, 17.32, 3.72, 16.18, 1.51, 9.99]} \ No newline at end of file diff --git a/annotations_filtered/q8HcMk_IimM_filtered.json b/annotations_filtered/q8HcMk_IimM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dedbc2fd564897c6352557516b9cf0dd779a902b --- /dev/null +++ b/annotations_filtered/q8HcMk_IimM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.06], [1.0, 2.44], [5.0, 18.81], [21.0, 42.99], [47.0, 50.14], [51.0, 55.24], [57.0, 57.5], [58.0, 58.87], [61.0, 61.08], [70.0, 77.8], [78.0, 78.07], [79.0, 79.35], [81.0, 81.3], [82.0, 83.03], [84.0, 85.21], [86.0, 86.75], [88.0, 88.13], [91.0, 91.47], [94.0, 99.89], [100.0, 136.7], [137.0, 138.59], [148.0, 172.3]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 30.59, 29.98, 31.63, 29.13, 0.0, 0.0, 0.0, 29.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.08, 0.0, 0.0, 28.58], "audiomae_on_audioset": [null, null, [["music", 61.76], ["didgeridoo", 6.31], ["whack, thwack", 5.87]], [["music", 29.07], ["whack, thwack", 29.02], ["whip", 11.75]], [["music", 79.78], ["boing", 2.78], ["electronic music", 2.75]], [["speech", 37.46], ["music", 30.38], ["burst, pop", 6.86]], null, null, null, [["music", 54.43], ["speech", 13.05], ["radio", 5.79]], null, null, null, null, null, null, null, null, [["music", 75.85], ["didgeridoo", 4.16], ["musical instrument", 2.06]], null, null, [["music", 61.05], ["music of latin america", 6.22], ["funny music", 2.37]]], "duration": [0.06, 1.44, 13.81, 21.99, 3.14, 4.24, 0.5, 0.87, 0.08, 7.8, 0.07, 0.35, 0.3, 1.03, 1.21, 0.75, 0.13, 0.47, 5.89, 36.7, 1.59, 24.3]} \ No newline at end of file diff --git a/annotations_filtered/q8RTGMsDTiw_filtered.json b/annotations_filtered/q8RTGMsDTiw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0383154f21893b18e6f27bf6a6d8c5c186d67fcd --- /dev/null +++ b/annotations_filtered/q8RTGMsDTiw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.82], [7.0, 13.96], [20.0, 22.79], [25.0, 29.88], [36.0, 104.67], [106.0, 124.43], [126.0, 125.98]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 66.27, 71.72, 62.99, 0.0, 30.57, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 46.14], ["livestock, farm animals, working animals", 19.66], ["crowd", 4.43]], null], "duration": [0.82, 6.96, 2.79, 4.88, 68.67, 18.43, -0.02]} \ No newline at end of file diff --git a/annotations_filtered/q8Wj4buHUtE_filtered.json b/annotations_filtered/q8Wj4buHUtE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b696a0508b4bd2ad34b5a20496f890b4dc45a6b4 --- /dev/null +++ b/annotations_filtered/q8Wj4buHUtE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.4], [4.0, 3.94], [5.0, 5.27], [8.0, 8.77], [10.0, 13.02], [15.0, 16.55], [19.0, 20.95], [25.0, 27.73], [29.0, 28.85], [32.0, 32.37], [33.0, 35.77], [38.0, 39.02], [41.0, 40.91], [45.0, 45.86], [47.0, 47.43], [50.0, 52.79], [54.0, 55.83], [58.0, 62.24], [64.0, 65.08], [66.0, 67.78], [68.0, 71.02], [73.0, 78.12], [79.0, 79.61], [83.0, 90.19], [92.0, 102.78], [104.0, 108.14], [114.0, 115.86], [119.0, 121.31], [124.0, 143.67], [146.0, 146.42], [147.0, 157.87]], "keep_status": [false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 54.17, 0.0, 0.0, 49.97, 0.0, 0.0, 36.24, 0.0, 0.0, 0.0, 0.0, 71.29, 0.0, 67.0, 0.0, 0.0, 43.79, 59.15, 0.0, 60.05, 57.64, 75.39, 0.0, 63.1, 54.63, 0.0, 42.42], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 26.0], ["mosquito", 5.93], ["synthesizer", 5.08]], null, null, [["music", 25.13], ["hum", 22.25], ["throbbing", 9.87]], null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 24.17], ["hum", 15.32], ["fly, housefly", 12.26]], null, null, null, null, null, null, null, null, null, [["music", 51.08], ["hum", 17.7], ["mains hum", 6.03]]], "duration": [1.4, -0.06, 0.27, 0.77, 3.02, 1.55, 1.95, 2.73, -0.15, 0.37, 2.77, 1.02, -0.09, 0.86, 0.43, 2.79, 1.83, 4.24, 1.08, 1.78, 3.02, 5.12, 0.61, 7.19, 10.78, 4.14, 1.86, 2.31, 19.67, 0.42, 10.87]} \ No newline at end of file diff --git a/annotations_filtered/q8nzGlXDvO8_filtered.json b/annotations_filtered/q8nzGlXDvO8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3a612c06193b9ca8d5fd1ca7e40c47565bffbcb6 --- /dev/null +++ b/annotations_filtered/q8nzGlXDvO8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 22.82], [24.0, 24.65], [26.0, 26.42], [27.0, 26.92], [28.0, 28.66], [29.0, 31.89], [33.0, 33.1], [40.0, 39.88], [43.0, 44.69], [47.0, 47.7], [53.0, 53.89], [57.0, 56.96], [58.0, 58.26], [60.0, 62.41], [69.0, 80.32], [82.0, 84.97], [87.0, 105.88], [108.0, 114.08], [117.0, 117.63], [118.0, 124.09]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 43.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.3, 51.6, 87.19, 47.54, 74.76, 0.0, 55.04], "audiomae_on_audioset": [null, null, null, null, null, [["music", 30.24], ["speech", 22.55], ["burping, eructation", 7.23]], null, null, null, null, null, null, null, null, null, null, [["music", 81.3], ["guitar", 2.01], ["drum machine", 1.41]], null, null, null], "duration": [1.82, 0.65, 0.42, -0.08, 0.66, 2.89, 0.1, -0.12, 1.69, 0.7, 0.89, -0.04, 0.26, 2.41, 11.32, 2.97, 18.88, 6.08, 0.63, 6.09]} \ No newline at end of file diff --git a/annotations_filtered/q8woScnBklo_filtered.json b/annotations_filtered/q8woScnBklo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef28657ad8231fd2a538d5b3c51ff4d2aee8dee8 --- /dev/null +++ b/annotations_filtered/q8woScnBklo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 8.85], [10.0, 10.93], [11.0, 14.2], [15.0, 16.39], [18.0, 18.3], [20.0, 34.26], [45.0, 52.89], [59.0, 59.97], [61.0, 62.33], [66.0, 65.77], [68.0, 71.51], [75.0, 84.62], [88.0, 88.4], [89.0, 92.4], [95.0, 100.03], [100.0, 101.49], [103.0, 103.89], [105.0, 105.83], [107.0, 111.43], [113.0, 112.89], [113.0, 113.93], [115.0, 115.13], [116.0, 121.66]], "keep_status": [false, false, true, false, false, true, true, false, false, false, true, true, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 34.52, 0.0, 0.0, 31.53, 30.65, 0.0, 0.0, 0.0, 46.64, 33.69, 0.0, 43.1, 72.75, 0.0, 0.0, 0.0, 67.89, 0.0, 0.0, 0.0, 57.72], "audiomae_on_audioset": [null, null, [["music", 34.39], ["foghorn", 21.29], ["musical instrument", 7.78]], null, null, [["music", 35.93], ["musical instrument", 7.83], ["foghorn", 4.61]], [["music", 41.17], ["foghorn", 11.23], ["quack", 8.46]], null, null, null, [["music", 44.16], ["theremin", 6.76], ["musical instrument", 5.01]], [["music", 46.94], ["musical instrument", 10.55], ["theremin", 8.52]], null, [["music", 53.88], ["theremin", 7.92], ["hum", 4.27]], null, null, null, null, null, null, null, null, null], "duration": [-0.15, 0.93, 3.2, 1.39, 0.3, 14.26, 7.89, 0.97, 1.33, -0.23, 3.51, 9.62, 0.4, 3.4, 5.03, 1.49, 0.89, 0.83, 4.43, -0.11, 0.93, 0.13, 5.66]} \ No newline at end of file diff --git a/annotations_filtered/q928Wa_h_gg_filtered.json b/annotations_filtered/q928Wa_h_gg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc94ab59cb9b93ac30371f48148164bed49be384 --- /dev/null +++ b/annotations_filtered/q928Wa_h_gg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 29.29], [31.0, 30.82], [31.0, 30.89], [31.0, 40.51], [56.0, 60.88], [68.0, 72.52], [74.0, 75.79], [81.0, 81.57], [87.0, 91.4], [94.0, 95.88]], "keep_status": [false, false, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 31.85, 30.07, 32.84, 0.0, 0.0, 30.54, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 49.63], ["hum", 15.33], ["mains hum", 8.21]], [["fly, housefly", 46.03], ["mosquito", 32.07], ["insect", 15.72]], [["breaking", 20.63], ["gunshot, gunfire", 10.41], ["clang", 9.49]], null, null, [["music", 24.16], ["speech", 17.1], ["whack, thwack", 10.06]], null], "duration": [0.29, -0.18, -0.11, 9.51, 4.88, 4.52, 1.79, 0.57, 4.4, 1.88]} \ No newline at end of file diff --git a/annotations_filtered/q9FYBjSc3cU_filtered.json b/annotations_filtered/q9FYBjSc3cU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2b9e63352ae464b4ad76a70f7629c1c37599cfd --- /dev/null +++ b/annotations_filtered/q9FYBjSc3cU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.74], [16.0, 18.47], [20.0, 21.49], [23.0, 23.06], [27.0, 29.59], [34.0, 54.55], [56.0, 74.73], [75.0, 94.04], [97.0, 100.23], [102.0, 102.54], [103.0, 107.6], [109.0, 111.86], [113.0, 115.38], [117.0, 118.4], [121.0, 124.11], [126.0, 126.57], [129.0, 129.34], [132.0, 132.48], [134.0, 134.96], [137.0, 137.56], [143.0, 145.84], [148.0, 148.12], [152.0, 151.95], [163.0, 165.05], [170.0, 171.27], [172.0, 174.73], [176.0, 177.2], [178.0, 179.1], [180.0, 180.57]], "keep_status": [false, true, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 37.45, 0.0, 0.0, 38.91, 46.86, 32.24, 31.15, 33.2, 0.0, 32.5, 70.02, 93.6, 0.0, 62.58, 0.0, 0.0, 0.0, 0.0, 0.0, 76.86, 0.0, 0.0, 57.4, 0.0, 42.06, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 36.92], ["speech", 14.2], ["hum", 8.52]], null, null, [["hum", 41.94], ["mains hum", 12.28], ["throbbing", 11.41]], [["music", 59.53], ["throbbing", 13.08], ["hum", 11.12]], [["music", 57.79], ["throbbing", 17.4], ["hum", 4.98]], [["music", 64.34], ["throbbing", 9.35], ["electronic music", 3.6]], [["speech", 26.25], ["music", 24.69], ["smash, crash", 8.67]], null, [["speech", 70.16], ["fart", 8.9], ["music", 6.12]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 49.3], ["ambient music", 10.99], ["hum", 5.41]], null, null, null], "duration": [0.74, 2.47, 1.49, 0.06, 2.59, 20.55, 18.73, 19.04, 3.23, 0.54, 4.6, 2.86, 2.38, 1.4, 3.11, 0.57, 0.34, 0.48, 0.96, 0.56, 2.84, 0.12, -0.05, 2.05, 1.27, 2.73, 1.2, 1.1, 0.57]} \ No newline at end of file diff --git a/annotations_filtered/q9OUIk4Oaq4_filtered.json b/annotations_filtered/q9OUIk4Oaq4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0c2da18d6c1fb4cbf9d1af520cfca83f3aa4e31a --- /dev/null +++ b/annotations_filtered/q9OUIk4Oaq4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.5], [21.0, 21.71], [23.0, 24.51], [26.0, 27.19], [47.0, 48.41], [54.0, 55.22], [58.0, 58.67], [59.0, 68.81], [73.0, 76.72], [77.0, 110.25], [111.0, 111.3], [115.0, 120.18], [127.0, 132.97], [135.0, 135.5], [136.0, 137.62], [139.0, 143.83], [151.0, 153.23], [155.0, 162.7], [167.0, 169.18], [171.0, 173.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.03, 41.22, 0.0, 0.0, 33.95, 45.62, 0.0, 0.0, 38.11, 38.88, 32.36, 40.14, 34.03], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["radio", 28.71], ["mains hum", 22.51], ["hum", 20.52]], [["fly, housefly", 46.07], ["insect", 14.65], ["mosquito", 14.51]], null, null, [["frog", 81.68], ["croak", 3.98], ["animal", 2.19]], [["hum", 41.27], ["mains hum", 40.64], ["throbbing", 5.56]], null, null, [["mains hum", 47.82], ["hum", 27.58], ["noise", 12.28]], [["hum", 30.32], ["throbbing", 22.78], ["radio", 13.09]], [["whistling", 92.59], ["whistle", 3.67], ["theremin", 1.13]], [["beatboxing", 17.26], ["music", 15.78], ["radio", 9.66]], [["speech", 41.14], ["radio", 15.75], ["dog", 3.96]]], "duration": [1.5, 0.71, 1.51, 1.19, 1.41, 1.22, 0.67, 9.81, 3.72, 33.25, 0.3, 5.18, 5.97, 0.5, 1.62, 4.83, 2.23, 7.7, 2.18, 2.43]} \ No newline at end of file diff --git a/annotations_filtered/q9QJ_S62yVo_filtered.json b/annotations_filtered/q9QJ_S62yVo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1251faa9727e0d5681c17ba1fef2c5b0131a7721 --- /dev/null +++ b/annotations_filtered/q9QJ_S62yVo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 14.76], [20.0, 26.38], [28.0, 44.17], [45.0, 44.68], [45.0, 109.19], [110.0, 118.34], [119.0, 121.66], [122.0, 122.62]], "keep_status": [false, true, true, false, false, true, true, false], "silence_prob": [31.19, 37.81, 34.69, 0.0, 0.0, 30.72, 37.23, 0.0], "audiomae_on_audioset": [[["speech", 39.25], ["music", 34.9], ["didgeridoo", 6.43]], [["speech", 22.06], ["music", 15.46], ["hum", 7.77]], [["music", 25.36], ["theremin", 12.66], ["whale vocalization", 11.44]], null, null, [["speech", 34.58], ["music", 27.82], ["explosion", 7.13]], [["music", 19.15], ["speech", 12.49], ["whale vocalization", 4.29]], null], "duration": [7.76, 6.38, 16.17, -0.32, 64.19, 8.34, 2.66, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/q9Wip3v8h40_filtered.json b/annotations_filtered/q9Wip3v8h40_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8fa2575a6a8cfb235c65b6cca86bba6cf1bb7bf7 --- /dev/null +++ b/annotations_filtered/q9Wip3v8h40_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.85], [15.0, 15.15], [17.0, 17.56], [18.0, 17.76], [22.0, 24.73], [29.0, 29.51], [30.0, 29.62], [34.0, 40.58], [43.0, 46.23], [48.0, 48.95], [65.0, 65.96], [67.0, 67.12], [68.0, 70.56], [76.0, 79.71], [84.0, 84.45]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 35.61, 0.0, 0.0, 32.74, 33.9, 0.0, 0.0, 0.0, 34.99, 55.89, 0.0], "audiomae_on_audioset": [null, null, null, null, [["boing", 70.77], ["fly, housefly", 4.33], ["music", 3.48]], null, null, [["music", 68.48], ["musical instrument", 3.57], ["speech", 3.29]], [["music", 26.2], ["speech", 21.96], ["boing", 14.84]], null, null, null, [["cattle, bovinae", 29.44], ["moo", 17.85], ["livestock, farm animals, working animals", 10.88]], null, null], "duration": [1.85, 0.15, 0.56, -0.24, 2.73, 0.51, -0.38, 6.58, 3.23, 0.95, 0.96, 0.12, 2.56, 3.71, 0.45]} \ No newline at end of file diff --git a/annotations_filtered/q9X6tpvxZyE_filtered.json b/annotations_filtered/q9X6tpvxZyE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b1b01ebdf274dd86ad58c47910653989bfc6d22b --- /dev/null +++ b/annotations_filtered/q9X6tpvxZyE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.27], [11.0, 13.49], [24.0, 24.44], [27.0, 29.64], [39.0, 40.05], [46.0, 47.66], [49.0, 53.92], [55.0, 55.73], [59.0, 60.54], [61.0, 61.99], [63.0, 63.0], [63.0, 67.36], [69.0, 77.19], [78.0, 83.51], [85.0, 86.7], [89.0, 89.18], [89.0, 90.63], [102.0, 101.92], [117.0, 117.83], [126.0, 126.82], [128.0, 129.46], [130.0, 132.36], [133.0, 133.66], [135.0, 136.36], [142.0, 142.25], [144.0, 144.58], [157.0, 157.0], [158.0, 158.63], [159.0, 163.65], [165.0, 173.53], [174.0, 176.42], [178.0, 181.92], [183.0, 185.4], [186.0, 186.65], [187.0, 188.11], [192.0, 192.97], [193.0, 194.56], [195.0, 195.62], [196.0, 228.8], [230.0, 232.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.36, 0.0, 93.91, 0.0, 0.0, 85.72, 0.0, 0.0, 0.0, 0.0, 60.79, 99.59, 99.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 94.95, 80.64, 73.67, 93.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.78], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["boing", 31.51], ["speech", 26.87], ["music", 14.32]]], "duration": [0.27, 2.49, 0.44, 2.64, 1.05, 1.66, 4.92, 0.73, 1.54, 0.99, 0.0, 4.36, 8.19, 5.51, 1.7, 0.18, 1.63, -0.08, 0.83, 0.82, 1.46, 2.36, 0.66, 1.36, 0.25, 0.58, 0.0, 0.63, 4.65, 8.53, 2.42, 3.92, 2.4, 0.65, 1.11, 0.97, 1.56, 0.62, 32.8, 2.71]} \ No newline at end of file diff --git a/annotations_filtered/q9iIgRYUyA0_filtered.json b/annotations_filtered/q9iIgRYUyA0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..118bf95ba770ccd166720280ed3aa12f4017dc29 --- /dev/null +++ b/annotations_filtered/q9iIgRYUyA0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[62.0, 62.83], [65.0, 66.33], [67.0, 68.47], [70.0, 71.37], [73.0, 74.01], [77.0, 78.46], [80.0, 85.68], [87.0, 93.29], [95.0, 95.57], [99.0, 99.03], [103.0, 114.05], [114.0, 115.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.97, 85.35, 0.0, 0.0, 46.9, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 59.23], ["synthesizer", 8.25], ["musical instrument", 6.96]], null], "duration": [0.83, 1.33, 1.47, 1.37, 1.01, 1.46, 5.68, 6.29, 0.57, 0.03, 11.05, 1.89]} \ No newline at end of file diff --git a/annotations_filtered/q9sjo2J6hIk_filtered.json b/annotations_filtered/q9sjo2J6hIk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4395663414ad1c72b4a224fc5940e13c49f1a8ee --- /dev/null +++ b/annotations_filtered/q9sjo2J6hIk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 13.07], [15.0, 107.87], [111.0, 111.47], [113.0, 113.59]], "keep_status": [false, false, false, false], "silence_prob": [38.47, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 30.52], ["cattle, bovinae", 20.28], ["moo", 20.09]], null, null, null], "duration": [9.07, 92.87, 0.47, 0.59]} \ No newline at end of file diff --git a/annotations_filtered/qA73y2w3WUc_filtered.json b/annotations_filtered/qA73y2w3WUc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..50319b8ed927370dbe6b3ab15dba0cc495db4b3a --- /dev/null +++ b/annotations_filtered/qA73y2w3WUc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.77], [8.0, 9.0], [21.0, 21.91], [24.0, 25.37], [28.0, 30.62], [33.0, 33.99], [37.0, 38.94], [42.0, 42.4], [45.0, 46.09], [47.0, 49.03], [54.0, 54.6], [56.0, 56.88], [59.0, 59.02], [62.0, 62.63], [64.0, 64.94], [68.0, 68.94], [70.0, 71.56], [72.0, 73.99], [75.0, 75.61], [77.0, 80.91], [85.0, 85.41], [88.0, 88.69], [90.0, 90.75], [91.0, 92.01], [95.0, 95.07], [96.0, 96.48], [97.0, 97.63], [100.0, 100.03], [103.0, 104.65]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.94, 0.0, 0.0, 0.0, 0.0, 55.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 56.19], ["throbbing", 8.1], ["hum", 5.21]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 25.23], ["music", 19.91], ["hum", 11.29]], null, null, null, null, null, null, null, null, null], "duration": [-0.23, 1.0, 0.91, 1.37, 2.62, 0.99, 1.94, 0.4, 1.09, 2.03, 0.6, 0.88, 0.02, 0.63, 0.94, 0.94, 1.56, 1.99, 0.61, 3.91, 0.41, 0.69, 0.75, 1.01, 0.07, 0.48, 0.63, 0.03, 1.65]} \ No newline at end of file diff --git a/annotations_filtered/qA7XKmC5QbQ_filtered.json b/annotations_filtered/qA7XKmC5QbQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b3b916ae24ff47cfb0c1df7623606133647dd24a --- /dev/null +++ b/annotations_filtered/qA7XKmC5QbQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.52], [5.0, 5.22], [19.0, 19.41], [26.0, 26.33], [39.0, 71.68], [91.0, 94.07], [111.0, 114.62], [116.0, 117.07], [120.0, 125.79], [132.0, 133.05]], "keep_status": [false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 37.16, 60.42, 0.0, 90.08, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 43.16], ["chant", 15.48], ["mantra", 7.59]], null, null, null, null], "duration": [0.52, 0.22, 0.41, 0.33, 32.68, 3.07, 3.62, 1.07, 5.79, 1.05]} \ No newline at end of file diff --git a/annotations_filtered/qAFgj8mqPk0_filtered.json b/annotations_filtered/qAFgj8mqPk0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d593a382c7e5ee8f100501c8b39373c662bc4dd8 --- /dev/null +++ b/annotations_filtered/qAFgj8mqPk0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.64], [3.0, 4.7], [7.0, 10.67], [16.0, 17.47], [18.0, 18.33], [20.0, 20.41], [21.0, 22.3], [29.0, 33.51], [41.0, 42.42], [43.0, 43.8], [44.0, 44.9], [48.0, 49.49], [50.0, 50.92], [55.0, 55.58], [62.0, 62.29], [62.0, 63.69], [64.0, 66.53], [67.0, 67.88], [69.0, 69.36], [70.0, 70.01], [70.0, 70.73], [71.0, 71.37], [73.0, 76.06], [83.0, 87.78], [94.0, 95.35], [96.0, 96.62], [103.0, 104.68], [109.0, 110.25], [118.0, 121.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.44, 0.0, 0.0, 0.0, 0.0, 77.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.4, 0.0, 0.0, 0.0, 0.0, 0.0, 42.91, 57.72, 0.0, 0.0, 0.0, 0.0, 64.86], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 51.01], ["guitar", 8.03], ["effects unit", 6.01]], null, null, null, null, null, [["music", 54.45], ["theremin", 6.74], ["marimba, xylophone", 3.82]], null, null, null, null, null, null], "duration": [0.64, 1.7, 3.67, 1.47, 0.33, 0.41, 1.3, 4.51, 1.42, 0.8, 0.9, 1.49, 0.92, 0.58, 0.29, 1.69, 2.53, 0.88, 0.36, 0.01, 0.73, 0.37, 3.06, 4.78, 1.35, 0.62, 1.68, 1.25, 3.66]} \ No newline at end of file diff --git a/annotations_filtered/qA_zzk2c7G8_filtered.json b/annotations_filtered/qA_zzk2c7G8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6984c2e263016dc5faa08cd39d77e0e015ec3c31 --- /dev/null +++ b/annotations_filtered/qA_zzk2c7G8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.36], [11.0, 20.11], [28.0, 28.07], [29.0, 28.98], [31.0, 31.62], [34.0, 34.18], [38.0, 38.87], [40.0, 43.75], [44.0, 44.42], [44.0, 51.06], [57.0, 57.77], [60.0, 63.22], [66.0, 66.66], [68.0, 68.28], [69.0, 69.21], [73.0, 74.43], [77.0, 101.51], [103.0, 103.44], [103.0, 103.52], [104.0, 104.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [89.9, 61.18, 0.0, 0.0, 0.0, 0.0, 0.0, 91.47, 0.0, 42.74, 0.0, 49.82, 0.0, 0.0, 0.0, 0.0, 57.56, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 54.19], ["speech", 10.43], ["mosquito", 8.44]], null, [["music", 43.92], ["speech", 8.82], ["boing", 5.34]], null, null, null, null, null, null, null, null], "duration": [2.36, 9.11, 0.07, -0.02, 0.62, 0.18, 0.87, 3.75, 0.42, 7.06, 0.77, 3.22, 0.66, 0.28, 0.21, 1.43, 24.51, 0.44, 0.52, 0.04]} \ No newline at end of file diff --git a/annotations_filtered/qAdNnZqKGiQ_filtered.json b/annotations_filtered/qAdNnZqKGiQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3aee94c8a3fb54209260938aa5ccd361b450a7de --- /dev/null +++ b/annotations_filtered/qAdNnZqKGiQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.06], [12.0, 16.71], [17.0, 19.21], [20.0, 20.41], [22.0, 22.87], [27.0, 26.82], [29.0, 29.07], [31.0, 31.92], [33.0, 33.07], [34.0, 35.43], [38.0, 39.18], [41.0, 43.21], [44.0, 45.82], [48.0, 54.53], [55.0, 56.79], [60.0, 59.93], [69.0, 69.92], [76.0, 77.94], [78.0, 79.73], [81.0, 80.7], [83.0, 85.31], [86.0, 86.66], [88.0, 88.72]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [35.16, 93.13, 66.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.93, 0.0, 62.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.9, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 54.6], ["music", 7.01], ["arrow", 5.06]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.06, 4.71, 2.21, 0.41, 0.87, -0.18, 0.07, 0.92, 0.07, 1.43, 1.18, 2.21, 1.82, 6.53, 1.79, -0.07, 0.92, 1.94, 1.73, -0.3, 2.31, 0.66, 0.72]} \ No newline at end of file diff --git a/annotations_filtered/qAfsU2gI408_filtered.json b/annotations_filtered/qAfsU2gI408_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..20d897ac60e0eecf4505fd2eab878ddc38e54f31 --- /dev/null +++ b/annotations_filtered/qAfsU2gI408_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.91], [5.0, 5.37], [7.0, 7.21], [10.0, 10.89], [12.0, 12.66], [14.0, 13.66], [15.0, 16.63], [18.0, 21.84], [23.0, 24.16], [25.0, 27.03], [28.0, 29.51], [30.0, 30.77], [32.0, 32.53], [34.0, 34.99], [35.0, 35.78], [36.0, 39.97], [41.0, 42.15], [44.0, 44.22], [44.0, 51.48], [52.0, 53.64], [54.0, 55.27], [58.0, 61.2], [62.0, 62.65], [64.0, 64.59], [65.0, 101.36], [102.0, 106.41], [109.0, 150.18], [152.0, 159.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.37, 0.0, 0.0, 99.88, 0.0, 0.0, 73.21, 0.0, 0.0, 0.0, 46.36, 0.0, 99.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 46.06], ["throbbing", 17.95], ["mains hum", 14.39]], null, null], "duration": [1.91, 0.37, 0.21, 0.89, 0.66, -0.34, 1.63, 3.84, 1.16, 2.03, 1.51, 0.77, 0.53, 0.99, 0.78, 3.97, 1.15, 0.22, 7.48, 1.64, 1.27, 3.2, 0.65, 0.59, 36.36, 4.41, 41.18, 7.24]} \ No newline at end of file diff --git a/annotations_filtered/qAhaYHHcYyk_filtered.json b/annotations_filtered/qAhaYHHcYyk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f57b8510088196b7a594e516238e469c371b18e0 --- /dev/null +++ b/annotations_filtered/qAhaYHHcYyk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.73], [4.0, 4.26], [8.0, 9.44], [21.0, 21.51], [28.0, 28.61], [30.0, 31.14], [36.0, 37.77], [41.0, 41.2]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.73, 0.26, 1.44, 0.51, 0.61, 1.14, 1.77, 0.2]} \ No newline at end of file diff --git a/annotations_filtered/qAw0VczZGC8_filtered.json b/annotations_filtered/qAw0VczZGC8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f355bcf8b1c57edcc55dab1c0481d06e2f14909b --- /dev/null +++ b/annotations_filtered/qAw0VczZGC8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.0], [1.0, 1.41], [1.0, 1.56], [2.0, 4.11], [6.0, 6.18], [8.0, 10.56], [12.0, 13.96], [14.0, 35.82], [38.0, 84.27]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 52.98, 0.0, 68.41, 0.0, 32.57, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 79.34], ["throbbing", 6.54], ["hum", 3.14]], null], "duration": [0.0, 0.41, 0.56, 2.11, 0.18, 2.56, 1.96, 21.82, 46.27]} \ No newline at end of file diff --git a/annotations_filtered/qB2H-Gp0nlE_filtered.json b/annotations_filtered/qB2H-Gp0nlE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aaa2a3390c57d8f7bef5f780136806c1d6eee7ae --- /dev/null +++ b/annotations_filtered/qB2H-Gp0nlE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.78], [10.0, 11.67], [29.0, 30.23], [34.0, 36.14]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 71.72], "audiomae_on_audioset": [null, null, null, null], "duration": [-0.22, 1.67, 1.23, 2.14]} \ No newline at end of file diff --git a/annotations_filtered/qB311wvyggM_filtered.json b/annotations_filtered/qB311wvyggM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d4eb1898d36ed96e54fa2e130763dc83759e9281 --- /dev/null +++ b/annotations_filtered/qB311wvyggM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 38.01], [39.0, 39.65], [41.0, 55.07], [57.0, 66.8], [68.0, 71.0], [72.0, 92.21]], "keep_status": [false, false, true, false, true, true], "silence_prob": [35.08, 0.0, 41.62, 53.04, 34.69, 33.21], "audiomae_on_audioset": [[["speech", 57.19], ["sidetone", 11.27], ["hum", 6.95]], null, [["speech", 19.4], ["mains hum", 7.7], ["vehicle", 6.73]], null, [["music", 35.53], ["electronic music", 13.64], ["synthesizer", 6.38]], [["hum", 32.82], ["mains hum", 25.34], ["speech", 9.67]]], "duration": [2.01, 0.65, 14.07, 9.8, 3.0, 20.21]} \ No newline at end of file diff --git a/annotations_filtered/qB78U2aWihU_filtered.json b/annotations_filtered/qB78U2aWihU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..30002c4fad8833226b2abcb5c64a3592049ebab7 --- /dev/null +++ b/annotations_filtered/qB78U2aWihU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.2], [7.0, 7.59], [9.0, 9.53], [14.0, 14.5], [15.0, 64.84], [68.0, 71.09], [101.0, 106.0], [107.0, 108.09], [112.0, 127.79], [132.0, 135.09], [138.0, 153.35], [155.0, 164.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 76.37, 100.0, 0.0, 48.35, 57.25, 82.61, 59.15], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 54.83], ["music", 21.1], ["thunk", 3.94]], null, null, null], "duration": [0.2, 0.59, 0.53, 0.5, 49.84, 3.09, 5.0, 1.09, 15.79, 3.09, 15.35, 9.56]} \ No newline at end of file diff --git a/annotations_filtered/qB93c2JU4uQ_filtered.json b/annotations_filtered/qB93c2JU4uQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1ea77281ad3289bcba8a9aac58e3f779ac9843b --- /dev/null +++ b/annotations_filtered/qB93c2JU4uQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.96], [22.0, 22.84], [51.0, 50.92], [57.0, 57.55], [62.0, 65.69], [66.0, 67.78], [68.0, 68.52], [71.0, 70.95], [78.0, 78.43], [79.0, 79.57], [81.0, 105.22], [105.0, 106.42], [111.0, 111.3], [113.0, 136.9], [138.0, 144.02], [146.0, 179.05], [182.0, 199.94], [204.0, 205.43], [206.0, 206.52], [208.0, 209.97], [216.0, 225.96], [227.0, 234.25], [241.0, 243.43]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.7, 0.0, 0.0, 0.0, 0.0, 0.0, 31.42, 0.0, 0.0, 30.01, 30.46, 0.0, 29.95, 0.0, 0.0, 0.0, 30.16, 31.6, 43.48], "audiomae_on_audioset": [null, null, null, null, [["fly, housefly", 34.32], ["music", 12.6], ["insect", 11.09]], null, null, null, null, null, [["mains hum", 36.25], ["hum", 32.72], ["music", 16.55]], null, null, [["throbbing", 27.29], ["hum", 26.7], ["music", 23.85]], [["music", 54.36], ["throbbing", 21.51], ["hum", 10.9]], null, [["music", 44.56], ["speech", 24.95], ["groan", 5.42]], null, null, null, [["music", 40.83], ["boing", 12.0], ["smash, crash", 5.39]], [["music", 52.22], ["throbbing", 15.17], ["hum", 7.9]], [["music", 58.53], ["boing", 5.78], ["musical instrument", 4.11]]], "duration": [0.96, 0.84, -0.08, 0.55, 3.69, 1.78, 0.52, -0.05, 0.43, 0.57, 24.22, 1.42, 0.3, 23.9, 6.02, 33.05, 17.94, 1.43, 0.52, 1.97, 9.96, 7.25, 2.43]} \ No newline at end of file diff --git a/annotations_filtered/qBFSCbptrJk_filtered.json b/annotations_filtered/qBFSCbptrJk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..298e9f25bced97b6de098be4df2564e35595bd77 --- /dev/null +++ b/annotations_filtered/qBFSCbptrJk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.19], [11.0, 12.01], [13.0, 15.13], [16.0, 17.68], [20.0, 21.69], [23.0, 22.84], [26.0, 25.79], [27.0, 28.46], [30.0, 30.47], [32.0, 34.6], [44.0, 52.52], [56.0, 57.32], [61.0, 63.02], [64.0, 65.23], [66.0, 67.91], [69.0, 69.62], [82.0, 89.43], [91.0, 95.91], [98.0, 98.17], [100.0, 104.45], [105.0, 105.11], [105.0, 106.22], [111.0, 113.41], [114.0, 126.22], [136.0, 136.22], [141.0, 141.42], [142.0, 153.13], [155.0, 167.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [53.34, 0.0, 37.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.42, 39.31, 0.0, 36.76, 0.0, 0.0, 0.0, 76.2, 57.48, 0.0, 40.9, 0.0, 0.0, 35.97, 33.87, 0.0, 0.0, 31.07, 33.12], "audiomae_on_audioset": [null, null, [["speech", 87.78], ["radio", 3.82], ["telephone", 1.56]], null, null, null, null, null, null, null, [["telephone", 44.7], ["sidetone", 25.17], ["speech", 17.7]], null, [["speech", 26.05], ["hum", 18.64], ["mains hum", 16.94]], null, null, null, null, null, null, [["music", 49.54], ["theremin", 27.26], ["wind instrument, woodwind instrument", 4.44]], null, null, [["music", 32.37], ["theremin", 10.46], ["musical instrument", 8.19]], [["music", 65.29], ["theremin", 10.57], ["musical instrument", 8.99]], null, null, [["music", 59.47], ["theremin", 7.83], ["musical instrument", 5.14]], [["speech", 54.17], ["music", 24.8], ["fart", 4.31]]], "duration": [5.19, 1.01, 2.13, 1.68, 1.69, -0.16, -0.21, 1.46, 0.47, 2.6, 8.52, 1.32, 2.02, 1.23, 1.91, 0.62, 7.43, 4.91, 0.17, 4.45, 0.11, 1.22, 2.41, 12.22, 0.22, 0.42, 11.13, 12.07]} \ No newline at end of file diff --git a/annotations_filtered/qBWbxMv6v_s_filtered.json b/annotations_filtered/qBWbxMv6v_s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..54bce7ee21591231ab17336a636d3532741ae293 --- /dev/null +++ b/annotations_filtered/qBWbxMv6v_s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 30.16], [32.0, 31.68], [34.0, 37.44], [38.0, 41.5], [42.0, 42.65], [44.0, 45.27], [49.0, 49.08], [50.0, 59.17], [62.0, 62.73], [64.0, 64.91], [67.0, 67.85], [70.0, 72.76], [73.0, 73.06], [73.0, 74.19], [76.0, 77.16], [83.0, 84.69], [90.0, 91.1], [95.0, 95.0], [95.0, 95.25], [98.0, 101.55], [103.0, 103.71], [104.0, 111.21], [113.0, 129.3]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [41.62, 0.0, 40.66, 61.97, 0.0, 0.0, 0.0, 58.05, 0.0, 0.0, 0.0, 53.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.07, 0.0, 65.67, 54.9], "audiomae_on_audioset": [[["speech", 21.9], ["vehicle", 12.44], ["mains hum", 9.22]], null, [["whale vocalization", 24.88], ["vehicle", 9.35], ["fly, housefly", 5.66]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.16, -0.32, 3.44, 3.5, 0.65, 1.27, 0.08, 9.17, 0.73, 0.91, 0.85, 2.76, 0.06, 1.19, 1.16, 1.69, 1.1, 0.0, 0.25, 3.55, 0.71, 7.21, 16.3]} \ No newline at end of file diff --git a/annotations_filtered/qBdgJs4tf60_filtered.json b/annotations_filtered/qBdgJs4tf60_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8f8f6632ed65374cad07ea342e6b951ab6096e31 --- /dev/null +++ b/annotations_filtered/qBdgJs4tf60_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[116.0, 118.08], [119.0, 120.68], [122.0, 122.86], [124.0, 125.14]], "keep_status": [false, false, false, false], "silence_prob": [38.79, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["sine wave", 43.04], ["speech", 39.77], ["chirp tone", 2.67]], null, null, null], "duration": [2.08, 1.68, 0.86, 1.14]} \ No newline at end of file diff --git a/annotations_filtered/qCYYMqHyPKk_filtered.json b/annotations_filtered/qCYYMqHyPKk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8f75dc67f97fdbdf8c2c2422a60b0fb6f265fa0e --- /dev/null +++ b/annotations_filtered/qCYYMqHyPKk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.64], [8.0, 24.63], [28.0, 33.59], [34.0, 38.6], [39.0, 40.66], [52.0, 57.21], [66.0, 69.21], [71.0, 72.67], [80.0, 100.94], [104.0, 124.39]], "keep_status": [false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 52.62, 64.18, 51.6, 0.0, 63.42, 50.61, 0.0, 63.21, 40.86], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 34.88], ["explosion", 13.29], ["hum", 7.61]]], "duration": [0.64, 16.63, 5.59, 4.6, 1.66, 5.21, 3.21, 1.67, 20.94, 20.39]} \ No newline at end of file diff --git a/annotations_filtered/qC_pkxnYQfk_filtered.json b/annotations_filtered/qC_pkxnYQfk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..360d701b4fe3700ca0a876bdd8e74508967cb5cf --- /dev/null +++ b/annotations_filtered/qC_pkxnYQfk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 44.47], [48.0, 51.76], [52.0, 96.7]], "keep_status": [true, false, false], "silence_prob": [43.9, 28.36, 0.0], "audiomae_on_audioset": [[["music", 56.03], ["hum", 7.02], ["ambient music", 6.41]], [["livestock, farm animals, working animals", 42.48], ["cattle, bovinae", 23.25], ["moo", 15.27]], null], "duration": [26.47, 3.76, 44.7]} \ No newline at end of file diff --git a/annotations_filtered/qCjSApp2o1E_filtered.json b/annotations_filtered/qCjSApp2o1E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..89d1871fe56ade197c01ae79967949a86ef6a1e9 --- /dev/null +++ b/annotations_filtered/qCjSApp2o1E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.26], [24.0, 24.33], [28.0, 29.02], [31.0, 33.49], [37.0, 46.04], [51.0, 52.73], [54.0, 57.65], [60.0, 61.21], [64.0, 65.94], [72.0, 72.25], [74.0, 74.56], [78.0, 80.33], [82.0, 81.73], [84.0, 92.4], [96.0, 96.69], [99.0, 99.52], [100.0, 99.55]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 85.9, 31.92, 0.0, 44.72, 0.0, 0.0, 0.0, 0.0, 44.96, 0.0, 28.66, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 47.33], ["sidetone", 22.48], ["music", 11.55]], null, [["hum", 22.74], ["music", 20.05], ["throbbing", 17.06]], null, null, null, null, [["hum", 22.15], ["mains hum", 9.31], ["music", 7.24]], null, [["mains hum", 32.13], ["hum", 21.98], ["music", 19.88]], null, null, null], "duration": [1.26, 0.33, 1.02, 2.49, 9.04, 1.73, 3.65, 1.21, 1.94, 0.25, 0.56, 2.33, -0.27, 8.4, 0.69, 0.52, -0.45]} \ No newline at end of file diff --git a/annotations_filtered/qCpDKjDMo6Y_filtered.json b/annotations_filtered/qCpDKjDMo6Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4651428f12296e86c07d68ed5cceb3108f6f7021 --- /dev/null +++ b/annotations_filtered/qCpDKjDMo6Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.27], [5.0, 5.59], [7.0, 8.77], [9.0, 11.89], [14.0, 14.89], [17.0, 17.95], [19.0, 20.76], [26.0, 29.1], [30.0, 34.43], [37.0, 38.06], [38.0, 39.28], [41.0, 42.15], [45.0, 45.96], [49.0, 49.59], [53.0, 53.25], [55.0, 55.76], [58.0, 58.28], [61.0, 61.3], [61.0, 63.0], [65.0, 66.51], [67.0, 68.93], [70.0, 72.01], [83.0, 83.61], [96.0, 97.95], [101.0, 105.17], [121.0, 122.12], [124.0, 124.43], [127.0, 129.27], [133.0, 134.32], [135.0, 135.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 59.42, 0.0, 0.0, 0.0, 81.0, 75.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.69, 0.0, 0.0, 39.05, 0.0, 0.0, 58.72, 0.0, 0.0, 38.97, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 35.49], ["speech", 17.46], ["didgeridoo", 13.14]], null, null, [["music", 59.98], ["theremin", 6.94], ["musical instrument", 5.57]], null, null, null, null, null, [["music", 37.97], ["speech", 32.95], ["boing", 3.57]], null, null], "duration": [0.27, 0.59, 1.77, 2.89, 0.89, 0.95, 1.76, 3.1, 4.43, 1.06, 1.28, 1.15, 0.96, 0.59, 0.25, 0.76, 0.28, 0.3, 2.0, 1.51, 1.93, 2.01, 0.61, 1.95, 4.17, 1.12, 0.43, 2.27, 1.32, 0.18]} \ No newline at end of file diff --git a/annotations_filtered/qCq0IXXi_2U_filtered.json b/annotations_filtered/qCq0IXXi_2U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f3b85eb5d22a97b4dd060f272b8bcb20f6aa1689 --- /dev/null +++ b/annotations_filtered/qCq0IXXi_2U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 49.92], [52.0, 52.89], [53.0, 59.0], [61.0, 61.59], [62.0, 62.46], [64.0, 64.67], [65.0, 76.47], [77.0, 96.28], [100.0, 102.37], [105.0, 104.79], [105.0, 105.66], [108.0, 111.64], [114.0, 120.12]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 37.91, 0.0, 0.0, 0.0, 43.18, 91.3, 84.25, 0.0, 0.0, 87.92, 64.07], "audiomae_on_audioset": [null, null, [["livestock, farm animals, working animals", 26.49], ["cattle, bovinae", 16.45], ["moo", 10.23]], null, null, null, [["speech", 32.08], ["hum", 25.65], ["mains hum", 15.2]], null, null, null, null, null, null], "duration": [49.92, 0.89, 6.0, 0.59, 0.46, 0.67, 11.47, 19.28, 2.37, -0.21, 0.66, 3.64, 6.12]} \ No newline at end of file diff --git a/annotations_filtered/qCv3989nvog_filtered.json b/annotations_filtered/qCv3989nvog_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..522768fbe88e2c78cd6271a73359b9d75ea6168c --- /dev/null +++ b/annotations_filtered/qCv3989nvog_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.26], [21.0, 25.84], [26.0, 26.96], [28.0, 28.75], [29.0, 29.39], [34.0, 34.82], [36.0, 55.88], [56.0, 56.54], [62.0, 65.45], [67.0, 67.39], [69.0, 69.85], [76.0, 77.25], [79.0, 80.86], [97.0, 98.85], [105.0, 108.24], [113.0, 114.91], [119.0, 119.31]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.26, 0.0, 0.0, 0.0, 0.0, 34.2, 0.0, 31.52, 0.0, 0.0, 0.0, 0.0, 0.0, 98.44, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 54.3], ["hum", 10.72], ["electronic music", 7.29]], null, [["music", 36.67], ["speech", 23.47], ["electronic music", 3.32]], null, null, null, null, null, null, null, null], "duration": [0.26, 4.84, 0.96, 0.75, 0.39, 0.82, 19.88, 0.54, 3.45, 0.39, 0.85, 1.25, 1.86, 1.85, 3.24, 1.91, 0.31]} \ No newline at end of file diff --git a/annotations_filtered/qD6IXIE0cok_filtered.json b/annotations_filtered/qD6IXIE0cok_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3027e2bfa846f826374684130ba415ccfabff93c --- /dev/null +++ b/annotations_filtered/qD6IXIE0cok_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 20.87], [21.0, 152.15], [153.0, 169.42]], "keep_status": [false, false, true], "silence_prob": [0.0, 0.0, 32.52], "audiomae_on_audioset": [null, null, [["music", 43.61], ["throbbing", 9.78], ["hum", 8.4]]], "duration": [-0.13, 131.15, 16.42]} \ No newline at end of file diff --git a/annotations_filtered/qDFzVZklg1Q_filtered.json b/annotations_filtered/qDFzVZklg1Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6a08a60e3d4c821678d03745bceaa47a38f8a031 --- /dev/null +++ b/annotations_filtered/qDFzVZklg1Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[55.0, 105.71], [107.0, 115.16]], "keep_status": [false, false], "silence_prob": [0.0, 33.12], "audiomae_on_audioset": [null, [["music", 66.41], ["hum", 7.55], ["throbbing", 3.7]]], "duration": [50.71, 8.16]} \ No newline at end of file diff --git a/annotations_filtered/qDR_yTik_xo_filtered.json b/annotations_filtered/qDR_yTik_xo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ce9497c38c065b68e2e72fa4e3a53d7637d9df5 --- /dev/null +++ b/annotations_filtered/qDR_yTik_xo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 21.05], [32.0, 35.18], [36.0, 36.76], [38.0, 39.23], [40.0, 40.61], [42.0, 42.96], [44.0, 44.42], [49.0, 50.03], [53.0, 53.7], [55.0, 55.88], [58.0, 59.81], [67.0, 67.34], [69.0, 69.82], [72.0, 72.33], [73.0, 73.6], [84.0, 84.37], [89.0, 89.07], [96.0, 96.4], [116.0, 116.45], [120.0, 121.85], [124.0, 124.68], [126.0, 126.62], [127.0, 127.72], [130.0, 130.35], [132.0, 132.51], [137.0, 140.12], [143.0, 149.13], [154.0, 154.01], [154.0, 155.85], [164.0, 171.14], [172.0, 172.44]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [32.26, 31.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.66, 35.68, 0.0, 0.0, 35.25, 0.0], "audiomae_on_audioset": [[["music", 32.31], ["whack, thwack", 14.66], ["speech", 12.23]], [["speech", 31.7], ["fart", 30.18], ["music", 10.32]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 72.23], ["sidetone", 6.05], ["busy signal", 2.02]], [["hum", 14.87], ["car", 13.9], ["mains hum", 12.27]], null, null, [["thunk", 13.56], ["music", 7.51], ["hum", 6.74]], null], "duration": [10.05, 3.18, 0.76, 1.23, 0.61, 0.96, 0.42, 1.03, 0.7, 0.88, 1.81, 0.34, 0.82, 0.33, 0.6, 0.37, 0.07, 0.4, 0.45, 1.85, 0.68, 0.62, 0.72, 0.35, 0.51, 3.12, 6.13, 0.01, 1.85, 7.14, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/qDTmyJdVAF0_filtered.json b/annotations_filtered/qDTmyJdVAF0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c852fe672a09f9e22b74c11c87b293328e4230ba --- /dev/null +++ b/annotations_filtered/qDTmyJdVAF0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.64], [8.0, 9.31], [15.0, 15.57], [17.0, 17.34], [20.0, 23.9], [31.0, 32.43], [35.0, 37.17], [38.0, 39.61], [40.0, 44.27], [47.0, 51.09], [54.0, 67.02], [68.0, 85.67], [86.0, 89.75]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 43.9, 0.0, 33.11, 0.0, 32.64, 31.84, 33.82, 32.92, 32.83], "audiomae_on_audioset": [null, null, null, null, [["music", 53.24], ["musical instrument", 10.22], ["speech", 6.6]], null, [["music", 60.23], ["musical instrument", 4.44], ["guitar", 2.57]], null, [["music", 70.05], ["musical instrument", 2.18], ["synthesizer", 1.6]], [["music", 74.3], ["didgeridoo", 4.08], ["funk", 1.71]], [["music", 82.46], ["musical instrument", 3.07], ["sitar", 1.9]], [["music", 72.97], ["didgeridoo", 10.92], ["musical instrument", 1.65]], [["music", 32.87], ["carnatic music", 16.21], ["tabla", 13.51]]], "duration": [0.64, 1.31, 0.57, 0.34, 3.9, 1.43, 2.17, 1.61, 4.27, 4.09, 13.02, 17.67, 3.75]} \ No newline at end of file diff --git a/annotations_filtered/qDc-OGF_NJ0_filtered.json b/annotations_filtered/qDc-OGF_NJ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..31b28c8c4f39f8497d6f4b02264201fa0840aa1f --- /dev/null +++ b/annotations_filtered/qDc-OGF_NJ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.16], [5.0, 8.5], [9.0, 10.07], [11.0, 12.45], [13.0, 13.64], [14.0, 16.19], [17.0, 17.69], [18.0, 18.98], [23.0, 23.94], [30.0, 38.89], [40.0, 40.71], [41.0, 52.2], [53.0, 54.67]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 54.36, 0.0, 0.0, 0.0, 45.11, 0.0, 0.0, 0.0, 57.01, 0.0, 53.22, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 26.02], ["music", 23.06], ["musical instrument", 8.21]], null, null, null, null, null, null, null], "duration": [0.16, 3.5, 1.07, 1.45, 0.64, 2.19, 0.69, 0.98, 0.94, 8.89, 0.71, 11.2, 1.67]} \ No newline at end of file diff --git a/annotations_filtered/qDjmN1TyJAU_filtered.json b/annotations_filtered/qDjmN1TyJAU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cde8d0ef8d7547a8ad1dd5e025823d140313a07c --- /dev/null +++ b/annotations_filtered/qDjmN1TyJAU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 15.23], [18.0, 38.5], [45.0, 49.64], [54.0, 60.83], [62.0, 63.14], [66.0, 66.21], [69.0, 69.43], [70.0, 73.08], [74.0, 74.83], [76.0, 75.74], [77.0, 79.69], [84.0, 84.45], [87.0, 90.49], [93.0, 94.46], [96.0, 97.23], [99.0, 100.16], [102.0, 102.59], [104.0, 105.04], [106.0, 108.36], [111.0, 111.35], [117.0, 119.26]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.47, 31.13, 36.52, 91.47, 0.0, 0.0, 0.0, 46.47, 0.0, 0.0, 97.83, 0.0, 99.96, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0], "audiomae_on_audioset": [[["speech", 25.88], ["hum", 21.65], ["throbbing", 13.02]], [["vehicle", 35.33], ["boat, water vehicle", 9.01], ["motorboat, speedboat", 7.88]], [["hum", 39.59], ["mains hum", 36.4], ["throbbing", 9.31]], null, null, null, null, [["speech", 71.58], ["sidetone", 11.53], ["dial tone", 3.29]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.23, 20.5, 4.64, 6.83, 1.14, 0.21, 0.43, 3.08, 0.83, -0.26, 2.69, 0.45, 3.49, 1.46, 1.23, 1.16, 0.59, 1.04, 2.36, 0.35, 2.26]} \ No newline at end of file diff --git a/annotations_filtered/qEH9lnYIndY_filtered.json b/annotations_filtered/qEH9lnYIndY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..82f707bd6804c93d51ec00cd057e84890b3c1541 --- /dev/null +++ b/annotations_filtered/qEH9lnYIndY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 13.91], [15.0, 15.52], [24.0, 26.32], [36.0, 39.99], [41.0, 43.73], [45.0, 44.98], [46.0, 50.26], [52.0, 100.6], [105.0, 112.31], [113.0, 114.02], [116.0, 144.44], [147.0, 150.13], [150.0, 152.58], [157.0, 158.45]], "keep_status": [false, false, false, true, true, false, true, false, false, false, true, false, true, false], "silence_prob": [42.26, 0.0, 39.6, 49.09, 40.95, 0.0, 39.49, 0.0, 30.05, 0.0, 29.6, 31.48, 32.23, 0.0], "audiomae_on_audioset": [[["throbbing", 60.41], ["music", 14.57], ["hum", 13.51]], null, [["throbbing", 69.52], ["hum", 12.53], ["music", 5.75]], [["music", 27.6], ["hum", 22.69], ["throbbing", 12.38]], [["hum", 33.51], ["throbbing", 23.85], ["mains hum", 11.8]], null, [["synthesizer", 24.21], ["music", 22.99], ["hum", 12.16]], null, [["speech", 68.23], ["music", 6.34], ["eruption", 4.13]], null, [["speech", 46.97], ["music", 10.1], ["whip", 4.98]], [["music", 73.58], ["synthesizer", 4.19], ["musical instrument", 3.42]], [["speech", 31.34], ["music", 23.03], ["hum", 9.47]], null], "duration": [5.91, 0.52, 2.32, 3.99, 2.73, -0.02, 4.26, 48.6, 7.31, 1.02, 28.44, 3.13, 2.58, 1.45]} \ No newline at end of file diff --git a/annotations_filtered/qEJNox8TCOw_filtered.json b/annotations_filtered/qEJNox8TCOw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7dac5f49f0128ff53aa81d83cacc52af7ba12904 --- /dev/null +++ b/annotations_filtered/qEJNox8TCOw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 14.45], [21.0, 21.36], [23.0, 25.93], [32.0, 35.94], [40.0, 43.95], [49.0, 82.78], [83.0, 82.88], [83.0, 135.99], [136.0, 136.02], [138.0, 143.23], [145.0, 145.79], [146.0, 146.31]], "keep_status": [false, false, true, false, false, false, false, false, false, true, false, false], "silence_prob": [32.18, 0.0, 31.73, 29.86, 30.38, 0.0, 0.0, 0.0, 0.0, 36.2, 0.0, 0.0], "audiomae_on_audioset": [[["music", 75.6], ["bass guitar", 3.3], ["guitar", 1.58]], null, [["music", 49.62], ["musical instrument", 6.74], ["guitar", 6.56]], [["music", 71.75], ["bass guitar", 2.35], ["musical instrument", 1.31]], [["music", 69.6], ["guitar", 3.96], ["musical instrument", 3.29]], null, null, null, null, [["music", 50.18], ["synthesizer", 7.88], ["electric piano", 7.08]], null, null], "duration": [3.45, 0.36, 2.93, 3.94, 3.95, 33.78, -0.12, 52.99, 0.02, 5.23, 0.79, 0.31]} \ No newline at end of file diff --git a/annotations_filtered/qEb51O12XFw_filtered.json b/annotations_filtered/qEb51O12XFw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bdad4ff76927b08faf4023e31e0a72af855b40ad --- /dev/null +++ b/annotations_filtered/qEb51O12XFw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 24.8], [32.0, 31.8], [32.0, 32.61], [35.0, 37.84], [39.0, 41.2], [42.0, 42.84], [45.0, 45.96], [48.0, 64.98], [70.0, 74.75], [79.0, 106.95], [108.0, 108.53]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 50.81, 49.18, 0.0, 0.0, 29.05, 51.99, 29.44, 0.0], "audiomae_on_audioset": [null, null, null, null, [["sidetone", 49.69], ["speech", 12.28], ["music", 8.38]], null, null, [["music", 65.3], ["throbbing", 10.91], ["electronic music", 5.42]], null, [["music", 46.18], ["throbbing", 8.14], ["electronic music", 6.81]], null], "duration": [0.8, -0.2, 0.61, 2.84, 2.2, 0.84, 0.96, 16.98, 4.75, 27.95, 0.53]} \ No newline at end of file diff --git a/annotations_filtered/qF0CMv413PA_filtered.json b/annotations_filtered/qF0CMv413PA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..678c86ef258cf5dd6b9c56502c584a6e87df7023 --- /dev/null +++ b/annotations_filtered/qF0CMv413PA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.5], [6.0, 7.62], [9.0, 16.24], [18.0, 20.29], [21.0, 22.27], [23.0, 28.36]], "keep_status": [false, false, true, false, false, false], "silence_prob": [99.52, 0.0, 36.07, 98.93, 0.0, 99.59], "audiomae_on_audioset": [null, null, [["speech", 37.98], ["sidetone", 12.31], ["music", 10.08]], null, null, null], "duration": [2.5, 1.62, 7.24, 2.29, 1.27, 5.36]} \ No newline at end of file diff --git a/annotations_filtered/qFH0mR6eVLg_filtered.json b/annotations_filtered/qFH0mR6eVLg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd0360000ddf0c5fb9bf1f60f3021ce27ae03773 --- /dev/null +++ b/annotations_filtered/qFH0mR6eVLg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 11.87], [12.0, 20.71], [21.0, 22.0], [22.0, 28.16], [29.0, 33.24], [34.0, 36.14], [41.0, 42.18], [43.0, 43.95], [44.0, 46.58], [48.0, 52.08], [52.0, 56.98], [58.0, 59.31], [61.0, 63.0], [63.0, 66.02], [67.0, 68.54], [69.0, 118.79], [120.0, 120.19], [126.0, 129.1]], "keep_status": [false, false, false, true, true, true, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [80.82, 69.74, 0.0, 47.23, 40.62, 41.46, 0.0, 0.0, 55.74, 57.48, 51.82, 0.0, 76.2, 42.67, 0.0, 0.0, 0.0, 37.77], "audiomae_on_audioset": [null, null, null, [["hum", 37.04], ["speech", 25.56], ["throbbing", 5.74]], [["speech", 48.85], ["sidetone", 14.54], ["music", 6.1]], [["speech", 28.86], ["music", 23.67], ["sidetone", 6.78]], null, null, null, null, null, null, null, [["speech", 39.88], ["sidetone", 9.67], ["music", 9.45]], null, null, null, [["whack, thwack", 12.43], ["mosquito", 7.42], ["fly, housefly", 6.96]]], "duration": [5.87, 8.71, 1.0, 6.16, 4.24, 2.14, 1.18, 0.95, 2.58, 4.08, 4.98, 1.31, 2.0, 3.02, 1.54, 49.79, 0.19, 3.1]} \ No newline at end of file diff --git a/annotations_filtered/qFL0bfzriR0_filtered.json b/annotations_filtered/qFL0bfzriR0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8f0af4abc940de48c1e02effc4fbc446f8fcc36d --- /dev/null +++ b/annotations_filtered/qFL0bfzriR0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 10.57], [14.0, 13.95], [16.0, 22.54], [23.0, 23.38], [26.0, 26.05], [30.0, 30.69], [39.0, 39.72], [42.0, 42.57], [45.0, 45.5], [46.0, 46.21], [62.0, 63.02], [71.0, 70.88], [81.0, 81.73], [85.0, 88.03], [91.0, 91.64]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [46.94, 0.0, 32.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.31, 0.0], "audiomae_on_audioset": [[["music", 31.11], ["speech", 16.98], ["fly, housefly", 7.16]], null, [["music", 65.59], ["synthesizer", 7.29], ["speech", 5.71]], null, null, null, null, null, null, null, null, null, null, [["speech", 30.65], ["music", 17.09], ["hum", 8.25]], null], "duration": [4.57, -0.05, 6.54, 0.38, 0.05, 0.69, 0.72, 0.57, 0.5, 0.21, 1.02, -0.12, 0.73, 3.03, 0.64]} \ No newline at end of file diff --git a/annotations_filtered/qFNBUs7O-h4_filtered.json b/annotations_filtered/qFNBUs7O-h4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2efe040392699595c7b2038f5f895f72eff8d13f --- /dev/null +++ b/annotations_filtered/qFNBUs7O-h4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.5], [27.0, 103.44], [104.0, 174.68]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [0.5, 76.44, 70.68]} \ No newline at end of file diff --git a/annotations_filtered/qFOp7gSiC0I_filtered.json b/annotations_filtered/qFOp7gSiC0I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6579e9cd8e940b84fea291b44b5c20b096c07873 --- /dev/null +++ b/annotations_filtered/qFOp7gSiC0I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.68], [2.0, 2.54], [3.0, 4.43], [6.0, 6.03], [7.0, 7.69], [9.0, 8.99], [10.0, 10.12], [11.0, 11.2], [13.0, 13.24], [15.0, 15.62], [17.0, 17.29], [19.0, 19.84], [20.0, 22.22], [26.0, 43.26], [45.0, 44.96], [50.0, 50.62], [51.0, 51.88], [53.0, 53.38], [54.0, 55.04], [56.0, 56.22], [57.0, 58.06], [60.0, 60.59], [63.0, 63.81], [66.0, 66.53], [67.0, 78.04], [81.0, 81.77], [85.0, 85.4], [86.0, 86.53], [88.0, 89.04], [94.0, 94.63], [96.0, 97.33], [98.0, 99.22], [106.0, 106.74], [107.0, 108.6], [109.0, 109.75], [111.0, 112.78], [115.0, 116.01], [118.0, 118.84], [119.0, 119.85], [123.0, 128.31], [131.0, 132.29], [134.0, 135.31], [136.0, 136.78], [137.0, 139.46], [140.0, 142.47], [143.0, 144.88], [146.0, 147.26], [150.0, 151.41], [152.0, 153.2], [155.0, 155.85], [158.0, 161.03], [162.0, 164.29], [167.0, 168.24], [170.0, 170.38], [172.0, 172.93], [181.0, 181.55], [182.0, 183.19], [184.0, 184.91], [189.0, 190.12], [193.0, 193.24], [195.0, 195.34], [198.0, 202.34], [203.0, 203.3], [204.0, 204.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.76, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 99.36, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 95.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.16, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.68, 0.54, 1.43, 0.03, 0.69, -0.01, 0.12, 0.2, 0.24, 0.62, 0.29, 0.84, 2.22, 17.26, -0.04, 0.62, 0.88, 0.38, 1.04, 0.22, 1.06, 0.59, 0.81, 0.53, 11.04, 0.77, 0.4, 0.53, 1.04, 0.63, 1.33, 1.22, 0.74, 1.6, 0.75, 1.78, 1.01, 0.84, 0.85, 5.31, 1.29, 1.31, 0.78, 2.46, 2.47, 1.88, 1.26, 1.41, 1.2, 0.85, 3.03, 2.29, 1.24, 0.38, 0.93, 0.55, 1.19, 0.91, 1.12, 0.24, 0.34, 4.34, 0.3, 0.25]} \ No newline at end of file diff --git a/annotations_filtered/qFUISvEZ3aw_filtered.json b/annotations_filtered/qFUISvEZ3aw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..997d8571a9318ee97b09a33810438e873cd35317 --- /dev/null +++ b/annotations_filtered/qFUISvEZ3aw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.28], [8.0, 8.33], [14.0, 17.71], [19.0, 28.14], [31.0, 40.34], [41.0, 52.52], [54.0, 54.01]], "keep_status": [false, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 42.74, 33.4, 32.85, 34.89, 0.0], "audiomae_on_audioset": [null, null, [["echo", 34.72], ["speech", 26.18], ["boing", 5.73]], [["speech", 64.74], ["fart", 3.35], ["livestock, farm animals, working animals", 2.81]], [["livestock, farm animals, working animals", 26.79], ["music", 18.77], ["animal", 9.76]], [["livestock, farm animals, working animals", 37.33], ["animal", 21.85], ["cowbell", 14.43]], null], "duration": [0.28, 0.33, 3.71, 9.14, 9.34, 11.52, 0.01]} \ No newline at end of file diff --git a/annotations_filtered/qFWptPtHG78_filtered.json b/annotations_filtered/qFWptPtHG78_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e29c7d76a145aafd13482bc3b49a9d69ffb184b --- /dev/null +++ b/annotations_filtered/qFWptPtHG78_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.3], [5.0, 5.22], [6.0, 6.05], [7.0, 8.06], [15.0, 15.31], [17.0, 17.81], [20.0, 20.97], [22.0, 22.74], [27.0, 28.0], [29.0, 29.91], [33.0, 33.74], [34.0, 34.37], [35.0, 35.8], [36.0, 37.23], [38.0, 38.18], [39.0, 41.05], [41.0, 41.62], [46.0, 51.0], [55.0, 55.14], [58.0, 58.67], [62.0, 63.14], [71.0, 72.4], [81.0, 82.36], [83.0, 83.32], [84.0, 86.24], [95.0, 97.29], [100.0, 101.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.02, 0.0, 49.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.02, 39.75, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["radio", 33.96], ["rowboat, canoe, kayak", 13.54], ["speech", 13.19]], null, [["boat, water vehicle", 32.8], ["rowboat, canoe, kayak", 14.42], ["vehicle", 7.54]], null, null, null, null, null, null, [["whale vocalization", 22.88], ["splash, splatter", 19.26], ["speech", 11.5]], [["rowboat, canoe, kayak", 35.89], ["splash, splatter", 16.35], ["boat, water vehicle", 12.41]], null], "duration": [1.3, 0.22, 0.05, 1.06, 0.31, 0.81, 0.97, 0.74, 1.0, 0.91, 0.74, 0.37, 0.8, 1.23, 0.18, 2.05, 0.62, 5.0, 0.14, 0.67, 1.14, 1.4, 1.36, 0.32, 2.24, 2.29, 1.31]} \ No newline at end of file diff --git a/annotations_filtered/qFprLPWDd-Y_filtered.json b/annotations_filtered/qFprLPWDd-Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0554cf4ee5ad16801d0e52b717b245c5f7ca7581 --- /dev/null +++ b/annotations_filtered/qFprLPWDd-Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.36], [13.0, 13.86], [14.0, 14.94], [20.0, 21.83]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [0.36, 0.86, 0.94, 1.83]} \ No newline at end of file diff --git a/annotations_filtered/qG-B9IzugQM_filtered.json b/annotations_filtered/qG-B9IzugQM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fde0d22012ee350941dfdc4ebec0c7e5740f69a7 --- /dev/null +++ b/annotations_filtered/qG-B9IzugQM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 18.18], [27.0, 28.22], [30.0, 30.32], [31.0, 31.89], [36.0, 37.3], [39.0, 39.12], [40.0, 41.59], [43.0, 46.89], [48.0, 50.68], [53.0, 55.05], [56.0, 57.11], [58.0, 59.88], [62.0, 62.67], [64.0, 66.85], [70.0, 71.0], [72.0, 73.04], [75.0, 76.1], [78.0, 80.38], [82.0, 100.58], [103.0, 112.36], [114.0, 114.93], [116.0, 116.5], [117.0, 121.59], [124.0, 125.59], [128.0, 129.39], [132.0, 131.77], [138.0, 137.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false], "silence_prob": [64.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.67, 69.07, 75.72, 0.0, 0.0, 0.0, 76.2, 0.0, 0.0, 0.0, 78.55, 49.4, 30.9, 0.0, 0.0, 66.63, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 28.71], ["insect", 9.5], ["fly, housefly", 7.36]], [["music", 26.38], ["didgeridoo", 13.8], ["explosion", 9.21]], null, null, null, null, null, null, null], "duration": [3.18, 1.22, 0.32, 0.89, 1.3, 0.12, 1.59, 3.89, 2.68, 2.05, 1.11, 1.88, 0.67, 2.85, 1.0, 1.04, 1.1, 2.38, 18.58, 9.36, 0.93, 0.5, 4.59, 1.59, 1.39, -0.23, -0.14]} \ No newline at end of file diff --git a/annotations_filtered/qG8YoqrNMEA_filtered.json b/annotations_filtered/qG8YoqrNMEA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..737011f44b94a86a88e0cee0ab441eef65b24bb6 --- /dev/null +++ b/annotations_filtered/qG8YoqrNMEA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.35], [12.0, 13.68], [16.0, 16.63], [18.0, 22.94], [25.0, 27.95], [31.0, 71.04], [73.0, 100.62]], "keep_status": [false, false, false, false, true, false, true], "silence_prob": [34.25, 0.0, 0.0, 49.97, 48.78, 0.0, 31.84], "audiomae_on_audioset": [[["throbbing", 47.76], ["music", 17.68], ["hum", 15.89]], null, null, [["music", 56.93], ["theremin", 11.04], ["musical instrument", 3.52]], [["music", 58.8], ["cello", 6.4], ["double bass", 4.78]], null, [["music", 17.12], ["race car, auto racing", 5.73], ["cacophony", 4.79]]], "duration": [3.35, 1.68, 0.63, 4.94, 2.95, 40.04, 27.62]} \ No newline at end of file diff --git a/annotations_filtered/qGf3--y_rcQ_filtered.json b/annotations_filtered/qGf3--y_rcQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..820349a5b5267619441a8de4750079b28dfdb4e1 --- /dev/null +++ b/annotations_filtered/qGf3--y_rcQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 26.18], [31.0, 31.58], [33.0, 33.52], [35.0, 36.98], [40.0, 41.64], [45.0, 46.28], [51.0, 51.46], [52.0, 52.32], [53.0, 53.92], [55.0, 71.96], [73.0, 101.41], [102.0, 118.17], [119.0, 123.7], [124.0, 133.54], [136.0, 145.32]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [35.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.28, 95.09, 41.64, 37.2, 31.26, 59.68], "audiomae_on_audioset": [[["music", 33.52], ["speech", 18.11], ["sound effect", 5.87]], null, null, null, null, null, null, null, null, [["breaking", 42.74], ["speech", 14.46], ["glass", 13.29]], null, [["speech", 49.53], ["theremin", 11.32], ["howl", 6.67]], [["music", 56.12], ["theremin", 8.22], ["scary music", 7.28]], [["speech", 40.17], ["music", 32.48], ["groan", 5.73]], null], "duration": [3.18, 0.58, 0.52, 1.98, 1.64, 1.28, 0.46, 0.32, 0.92, 16.96, 28.41, 16.17, 4.7, 9.54, 9.32]} \ No newline at end of file diff --git a/annotations_filtered/qGrKwxglKJ0_filtered.json b/annotations_filtered/qGrKwxglKJ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ddf41938860ec2d2470377a5252bd91bf615d2cb --- /dev/null +++ b/annotations_filtered/qGrKwxglKJ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.57], [9.0, 9.61], [11.0, 11.65], [12.0, 15.21], [19.0, 25.57], [28.0, 28.9], [32.0, 47.75], [49.0, 49.49], [51.0, 52.79], [55.0, 71.47], [73.0, 77.11], [83.0, 84.82], [86.0, 94.9], [100.0, 101.09], [102.0, 104.65], [106.0, 111.94], [115.0, 121.26], [123.0, 123.45], [123.0, 127.08], [130.0, 130.4]], "keep_status": [false, false, false, false, true, false, false, false, false, false, true, false, true, false, false, false, true, false, true, false], "silence_prob": [36.23, 0.0, 0.0, 39.44, 36.59, 0.0, 34.83, 0.0, 0.0, 30.33, 36.69, 0.0, 30.4, 0.0, 35.35, 34.52, 29.83, 0.0, 29.68, 0.0], "audiomae_on_audioset": [[["music", 35.98], ["speech", 19.01], ["didgeridoo", 17.24]], null, null, [["speech", 34.69], ["music", 30.35], ["didgeridoo", 6.26]], [["music", 33.29], ["theremin", 12.05], ["didgeridoo", 10.01]], null, [["music", 42.54], ["speech", 19.96], ["theremin", 19.74]], null, null, [["music", 56.08], ["buzz", 13.73], ["sound effect", 3.17]], [["speech", 35.42], ["music", 19.21], ["synthesizer", 10.53]], null, [["music", 39.62], ["musical instrument", 9.11], ["synthesizer", 8.78]], null, [["music", 40.69], ["didgeridoo", 25.81], ["musical instrument", 8.91]], [["music", 75.57], ["didgeridoo", 6.79], ["musical instrument", 3.67]], [["music", 40.82], ["synthesizer", 9.24], ["musical instrument", 8.34]], null, [["music", 54.19], ["brass instrument", 5.72], ["musical instrument", 4.22]], null], "duration": [2.57, 0.61, 0.65, 3.21, 6.57, 0.9, 15.75, 0.49, 1.79, 16.47, 4.11, 1.82, 8.9, 1.09, 2.65, 5.94, 6.26, 0.45, 4.08, 0.4]} \ No newline at end of file diff --git a/annotations_filtered/qHA5R-Q1Od8_filtered.json b/annotations_filtered/qHA5R-Q1Od8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4ec00b83607f66ea1fd7654f7d87788d8a8aef4b --- /dev/null +++ b/annotations_filtered/qHA5R-Q1Od8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.76], [16.0, 15.96], [20.0, 21.09], [22.0, 23.87], [24.0, 27.06], [30.0, 30.03], [30.0, 30.38], [35.0, 36.32], [41.0, 41.05], [42.0, 46.23], [48.0, 47.97], [50.0, 50.23], [54.0, 54.85], [57.0, 58.99], [64.0, 64.4], [67.0, 67.81], [74.0, 82.0], [83.0, 86.71], [88.0, 90.69], [91.0, 93.04], [97.0, 98.24], [99.0, 100.97], [102.0, 102.9], [106.0, 106.95], [110.0, 112.45], [113.0, 115.28], [116.0, 118.32], [119.0, 125.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.36, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 85.9, 96.04, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.76, -0.04, 1.09, 1.87, 3.06, 0.03, 0.38, 1.32, 0.05, 4.23, -0.03, 0.23, 0.85, 1.99, 0.4, 0.81, 8.0, 3.71, 2.69, 2.04, 1.24, 1.97, 0.9, 0.95, 2.45, 2.28, 2.32, 6.61]} \ No newline at end of file diff --git a/annotations_filtered/qHisKG66fLI_filtered.json b/annotations_filtered/qHisKG66fLI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e0d252ccf403986400b92ce1184f588be0adfaa2 --- /dev/null +++ b/annotations_filtered/qHisKG66fLI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.45], [5.0, 20.87], [25.0, 25.79], [30.0, 31.99], [33.0, 34.25], [35.0, 36.09], [39.0, 42.74], [44.0, 44.42], [45.0, 48.88], [51.0, 51.51], [54.0, 59.31], [64.0, 72.17], [78.0, 91.12], [95.0, 96.16], [98.0, 98.52], [100.0, 103.65], [105.0, 107.96], [110.0, 128.8], [130.0, 131.41], [133.0, 137.49], [139.0, 141.25], [143.0, 144.29], [146.0, 147.23], [149.0, 149.07], [151.0, 153.22], [154.0, 154.6], [156.0, 163.75], [166.0, 169.42], [171.0, 171.58], [173.0, 175.86]], "keep_status": [false, true, false, false, false, false, true, false, true, false, true, false, true, false, false, false, true, true, false, true, true, false, false, false, false, false, false, true, false, false], "silence_prob": [39.66, 30.27, 0.0, 0.0, 0.0, 0.0, 36.11, 0.0, 48.56, 0.0, 29.86, 30.27, 29.8, 0.0, 0.0, 53.16, 29.71, 29.11, 0.0, 30.07, 29.39, 0.0, 0.0, 0.0, 47.01, 0.0, 35.3, 48.1, 0.0, 39.77], "audiomae_on_audioset": [[["music", 58.26], ["hum", 11.27], ["singing bowl", 5.72]], [["grunt", 19.16], ["music", 15.51], ["animal", 14.62]], null, null, null, null, [["music", 28.04], ["gong", 18.6], ["hum", 11.89]], null, [["music", 49.86], ["foghorn", 11.51], ["ambient music", 5.47]], null, [["grunt", 39.23], ["music", 12.32], ["wild animals", 6.92]], [["music", 84.06], ["roaring cats (lions, tigers)", 1.99], ["wild animals", 1.74]], [["music", 40.99], ["sound effect", 5.5], ["hum", 5.23]], null, null, null, [["music", 27.42], ["speech", 20.33], ["carnatic music", 6.72]], [["music", 46.15], ["sound effect", 3.43], ["groan", 3.42]], null, [["speech", 28.9], ["music", 20.93], ["didgeridoo", 6.2]], [["hum", 22.7], ["music", 17.88], ["sonar", 8.24]], null, null, null, [["hum", 41.1], ["music", 25.36], ["throbbing", 6.38]], null, [["music", 73.66], ["ambient music", 6.29], ["synthesizer", 4.6]], [["music", 62.33], ["singing bowl", 3.45], ["ambient music", 3.13]], null, [["music", 50.09], ["theremin", 16.36], ["musical instrument", 3.58]]], "duration": [2.45, 15.87, 0.79, 1.99, 1.25, 1.09, 3.74, 0.42, 3.88, 0.51, 5.31, 8.17, 13.12, 1.16, 0.52, 3.65, 2.96, 18.8, 1.41, 4.49, 2.25, 1.29, 1.23, 0.07, 2.22, 0.6, 7.75, 3.42, 0.58, 2.86]} \ No newline at end of file diff --git a/annotations_filtered/qIOC-6zluBQ_filtered.json b/annotations_filtered/qIOC-6zluBQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..06688366f6eca73e9a7ee44b31c2279790b2e7f4 --- /dev/null +++ b/annotations_filtered/qIOC-6zluBQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.01], [6.0, 6.34], [8.0, 11.06], [12.0, 15.85], [18.0, 20.28], [23.0, 24.87], [26.0, 25.76], [28.0, 28.21], [31.0, 31.29], [34.0, 34.65], [37.0, 36.96], [39.0, 39.28], [41.0, 41.07], [43.0, 43.29], [48.0, 49.3], [51.0, 51.27], [54.0, 55.56], [58.0, 61.45], [63.0, 65.01], [66.0, 66.48], [68.0, 69.55], [74.0, 74.65], [78.0, 81.03], [87.0, 90.14], [92.0, 93.45], [95.0, 99.33], [102.0, 102.02], [102.0, 103.76], [104.0, 105.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 98.51, 98.44, 99.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.73, 90.95, 0.0, 0.0, 0.0, 76.2, 97.64, 0.0, 99.94, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.01, 0.34, 3.06, 3.85, 2.28, 1.87, -0.24, 0.21, 0.29, 0.65, -0.04, 0.28, 0.07, 0.29, 1.3, 0.27, 1.56, 3.45, 2.01, 0.48, 1.55, 0.65, 3.03, 3.14, 1.45, 4.33, 0.02, 1.76, 1.9]} \ No newline at end of file diff --git a/annotations_filtered/qIalODmFrZk_filtered.json b/annotations_filtered/qIalODmFrZk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..23456326960c6fbf43ac86964edef763ff5448b2 --- /dev/null +++ b/annotations_filtered/qIalODmFrZk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.51], [12.0, 20.06], [28.0, 28.05], [37.0, 37.22], [40.0, 41.01], [46.0, 47.68], [53.0, 53.28], [61.0, 61.37], [67.0, 70.09], [76.0, 82.61], [92.0, 92.31], [93.0, 94.32], [95.0, 96.7], [110.0, 114.4], [128.0, 128.83], [136.0, 136.49], [139.0, 144.04], [150.0, 157.77], [158.0, 159.56], [165.0, 172.96], [181.0, 182.19], [185.0, 186.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 37.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.05, 42.15, 0.0, 0.0, 0.0, 31.0, 0.0, 0.0, 36.08, 36.27, 0.0, 37.17, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 63.53], ["door", 10.11], ["throbbing", 6.08]], null, null, null, null, null, null, [["music", 61.68], ["throbbing", 11.64], ["hum", 8.36]], [["music", 37.87], ["throbbing", 24.8], ["speech", 8.25]], null, null, null, [["music", 43.42], ["speech", 12.76], ["fusillade", 5.97]], null, null, [["music", 29.7], ["shuffling cards", 29.07], ["speech", 15.24]], [["music", 49.91], ["speech", 29.26], ["synthesizer", 3.57]], null, [["music", 68.35], ["chink, clink", 7.55], ["glass", 5.65]], null, null], "duration": [1.51, 8.06, 0.05, 0.22, 1.01, 1.68, 0.28, 0.37, 3.09, 6.61, 0.31, 1.32, 1.7, 4.4, 0.83, 0.49, 5.04, 7.77, 1.56, 7.96, 1.19, 1.11]} \ No newline at end of file diff --git a/annotations_filtered/qIis4kiGo6Q_filtered.json b/annotations_filtered/qIis4kiGo6Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56747b4c981ac7757f0a703f0b213efddc82d849 --- /dev/null +++ b/annotations_filtered/qIis4kiGo6Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.71], [12.0, 13.46], [14.0, 16.38]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 33.5], "audiomae_on_audioset": [null, null, [["music", 67.26], ["synthesizer", 7.9], ["musical instrument", 2.64]]], "duration": [1.71, 1.46, 2.38]} \ No newline at end of file diff --git a/annotations_filtered/qIleHfrMWWE_filtered.json b/annotations_filtered/qIleHfrMWWE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..89427749ef4506210333b608c5305ccee70575a9 --- /dev/null +++ b/annotations_filtered/qIleHfrMWWE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.49], [2.0, 1.97], [11.0, 12.06], [15.0, 17.61], [20.0, 23.09], [31.0, 30.99], [33.0, 33.83], [36.0, 36.39], [37.0, 38.57], [42.0, 42.48], [44.0, 45.03], [48.0, 48.93], [50.0, 51.51], [52.0, 53.3], [54.0, 54.8], [55.0, 55.58], [62.0, 61.86], [63.0, 63.9], [65.0, 66.75], [68.0, 70.56], [71.0, 72.91], [75.0, 78.61], [90.0, 90.69], [95.0, 95.0], [95.0, 95.96], [98.0, 98.34], [99.0, 99.62], [100.0, 101.58], [104.0, 104.26], [105.0, 105.46], [108.0, 109.0], [113.0, 112.87], [117.0, 122.66], [123.0, 123.45], [124.0, 125.17], [126.0, 127.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 44.46, 60.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.92, 0.0, 54.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.48, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 64.55], ["throbbing", 2.87], ["hum", 2.75]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 44.2], ["moo", 34.62], ["livestock, farm animals, working animals", 4.75]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.49, -0.03, 1.06, 2.61, 3.09, -0.01, 0.83, 0.39, 1.57, 0.48, 1.03, 0.93, 1.51, 1.3, 0.8, 0.58, -0.14, 0.9, 1.75, 2.56, 1.91, 3.61, 0.69, 0.0, 0.96, 0.34, 0.62, 1.58, 0.26, 0.46, 1.0, -0.13, 5.66, 0.45, 1.17, 1.21]} \ No newline at end of file diff --git a/annotations_filtered/qIp_8RNNX4k_filtered.json b/annotations_filtered/qIp_8RNNX4k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c4ca4f277a01e97a1f817e81a2d857d2f227cee4 --- /dev/null +++ b/annotations_filtered/qIp_8RNNX4k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 29.56], [31.0, 34.23], [36.0, 71.69], [77.0, 91.12], [95.0, 95.47], [102.0, 102.19], [106.0, 120.09], [120.0, 125.44], [127.0, 130.3], [135.0, 136.8], [138.0, 143.16], [147.0, 150.08], [151.0, 153.03], [154.0, 154.14], [157.0, 159.95], [161.0, 161.23]], "keep_status": [true, true, false, true, false, false, false, false, true, false, true, true, true, false, false, false], "silence_prob": [46.94, 36.11, 0.0, 33.53, 0.0, 0.0, 30.21, 34.14, 33.79, 0.0, 35.6, 39.09, 33.94, 0.0, 36.04, 0.0], "audiomae_on_audioset": [[["music", 36.06], ["hum", 6.61], ["mains hum", 6.26]], [["mains hum", 24.0], ["hum", 17.63], ["music", 15.68]], null, [["music", 43.17], ["hum", 16.28], ["throbbing", 8.96]], null, null, [["music", 61.92], ["ambient music", 5.8], ["synthesizer", 5.46]], [["hum", 26.9], ["music", 26.66], ["mains hum", 21.71]], [["music", 32.56], ["mains hum", 11.47], ["hum", 9.58]], null, [["music", 36.97], ["speech", 14.45], ["hum", 6.58]], [["music", 40.16], ["effects unit", 8.46], ["hum", 6.2]], [["music", 14.7], ["mains hum", 13.77], ["hum", 11.15]], null, [["hum", 46.89], ["mains hum", 24.14], ["music", 14.46]], null], "duration": [2.56, 3.23, 35.69, 14.12, 0.47, 0.19, 14.09, 5.44, 3.3, 1.8, 5.16, 3.08, 2.03, 0.14, 2.95, 0.23]} \ No newline at end of file diff --git a/annotations_filtered/qIs2PMXvAmQ_filtered.json b/annotations_filtered/qIs2PMXvAmQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f007e1ec6bf553bca64f78bcd2c9ddc1b24cf56 --- /dev/null +++ b/annotations_filtered/qIs2PMXvAmQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.56], [6.0, 6.61], [7.0, 6.81], [7.0, 6.94], [7.0, 8.04], [13.0, 13.76], [19.0, 23.43], [23.0, 23.5], [24.0, 23.73], [24.0, 23.79], [24.0, 23.82], [26.0, 25.74], [28.0, 27.77], [42.0, 43.29], [44.0, 44.71], [46.0, 54.94], [57.0, 57.47], [61.0, 65.18], [66.0, 81.33], [88.0, 93.36], [96.0, 114.49], [118.0, 120.72], [122.0, 123.08], [128.0, 133.12]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, true, true, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.26, 0.0, 30.84, 31.36, 30.94, 31.16, 32.25, 0.0, 31.32], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 44.15], ["speech", 23.65], ["vehicle", 2.09]], null, null, null, null, null, null, null, null, [["music", 69.89], ["synthesizer", 3.37], ["throbbing", 2.45]], null, [["music", 54.92], ["electronic music", 4.55], ["boing", 4.15]], [["speech", 27.07], ["music", 23.96], ["hum", 20.29]], [["music", 46.49], ["speech", 11.78], ["cacophony", 7.78]], [["music", 23.76], ["speech", 23.08], ["buzz", 6.37]], [["music", 34.69], ["speech", 14.1], ["mains hum", 8.26]], null, [["music", 22.53], ["speech", 13.29], ["vehicle", 7.87]]], "duration": [0.56, 0.61, -0.19, -0.06, 1.04, 0.76, 4.43, 0.5, -0.27, -0.21, -0.18, -0.26, -0.23, 1.29, 0.71, 8.94, 0.47, 4.18, 15.33, 5.36, 18.49, 2.72, 1.08, 5.12]} \ No newline at end of file diff --git a/annotations_filtered/qItvl5cX4-A_filtered.json b/annotations_filtered/qItvl5cX4-A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3dd728891c42f4334b75e0c9537f73874508e852 --- /dev/null +++ b/annotations_filtered/qItvl5cX4-A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.39], [7.0, 8.41], [11.0, 19.18], [21.0, 21.86], [23.0, 26.35], [28.0, 31.28], [32.0, 33.76], [36.0, 37.47], [38.0, 39.8], [45.0, 45.39], [50.0, 55.12], [57.0, 57.87], [60.0, 63.48], [67.0, 68.1], [75.0, 76.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 71.0, 0.0, 65.09, 68.8, 0.0, 0.0, 0.0, 0.0, 66.27, 0.0, 64.29, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.39, 1.41, 8.18, 0.86, 3.35, 3.28, 1.76, 1.47, 1.8, 0.39, 5.12, 0.87, 3.48, 1.1, 1.2]} \ No newline at end of file diff --git a/annotations_filtered/qIxHb7cA6tg_filtered.json b/annotations_filtered/qIxHb7cA6tg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a533483b225b73db648dac76322898d94e4c471 --- /dev/null +++ b/annotations_filtered/qIxHb7cA6tg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.58], [16.0, 18.32], [20.0, 33.32], [38.0, 38.62]], "keep_status": [false, true, false, false], "silence_prob": [0.0, 32.73, 34.85, 0.0], "audiomae_on_audioset": [null, [["speech", 53.21], ["music", 7.06], ["livestock, farm animals, working animals", 2.49]], [["speech", 67.4], ["music", 5.42], ["throbbing", 3.51]], null], "duration": [0.58, 2.32, 13.32, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/qJKahA8B9Ro_filtered.json b/annotations_filtered/qJKahA8B9Ro_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba953164b0f8d9280f678dfd118dca5f613d981d --- /dev/null +++ b/annotations_filtered/qJKahA8B9Ro_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.14], [5.0, 9.26], [13.0, 12.95], [14.0, 14.42], [15.0, 22.99], [28.0, 31.53], [35.0, 35.23], [38.0, 38.99], [42.0, 44.15], [45.0, 50.43], [52.0, 56.47], [58.0, 64.86], [66.0, 66.88], [69.0, 70.71], [73.0, 75.22], [75.0, 76.79], [79.0, 81.73], [83.0, 85.5], [87.0, 92.64], [97.0, 98.52], [100.0, 101.26], [103.0, 112.16], [114.0, 118.13], [120.0, 123.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 36.58, 0.0, 0.0, 99.84, 99.71, 0.0, 0.0, 63.53, 98.66, 99.84, 89.36, 0.0, 0.0, 44.46, 0.0, 99.97, 73.06, 97.92, 0.0, 0.0, 99.36, 99.73, 99.76], "audiomae_on_audioset": [null, [["sidetone", 84.02], ["dial tone", 4.26], ["sine wave", 3.02]], null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 41.04], ["speech", 8.55], ["livestock, farm animals, working animals", 3.85]], null, null, null, null, null, null, null, null, null], "duration": [1.14, 4.26, -0.05, 0.42, 7.99, 3.53, 0.23, 0.99, 2.15, 5.43, 4.47, 6.86, 0.88, 1.71, 2.22, 1.79, 2.73, 2.5, 5.64, 1.52, 1.26, 9.16, 4.13, 3.42]} \ No newline at end of file diff --git a/annotations_filtered/qJ_EsjyYevs_filtered.json b/annotations_filtered/qJ_EsjyYevs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..562559befe527385a17875e32751314e74b510cf --- /dev/null +++ b/annotations_filtered/qJ_EsjyYevs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.62], [3.0, 4.97], [5.0, 8.67], [10.0, 12.21], [13.0, 13.42], [14.0, 18.12], [19.0, 49.91], [55.0, 55.36], [57.0, 56.89], [59.0, 73.65], [75.0, 75.02], [75.0, 96.97], [97.0, 97.88], [99.0, 102.17], [103.0, 118.56], [119.0, 120.29], [121.0, 121.22], [123.0, 125.29], [127.0, 126.67], [128.0, 129.68], [130.0, 130.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 60.7, 81.17, 0.0, 99.93, 0.0, 0.0, 0.0, 39.08, 0.0, 38.4, 0.0, 47.43, 75.72, 0.0, 0.0, 99.84, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 48.34], ["cello", 12.87], ["bowed string instrument", 9.48]], null, [["cello", 36.25], ["bowed string instrument", 20.24], ["double bass", 18.42]], null, [["cello", 34.3], ["double bass", 32.15], ["music", 10.47]], null, null, null, null, null, null, null], "duration": [0.62, 1.97, 3.67, 2.21, 0.42, 4.12, 30.91, 0.36, -0.11, 14.65, 0.02, 21.97, 0.88, 3.17, 15.56, 1.29, 0.22, 2.29, -0.33, 1.68, 0.33]} \ No newline at end of file diff --git a/annotations_filtered/qJznSue3tEs_filtered.json b/annotations_filtered/qJznSue3tEs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0ebd5b362adc804ffabcaac5d28c3e0d473fae39 --- /dev/null +++ b/annotations_filtered/qJznSue3tEs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.62], [3.0, 5.58], [7.0, 9.76], [11.0, 13.54], [17.0, 18.99], [20.0, 21.34], [22.0, 23.3], [24.0, 26.69], [27.0, 30.3], [32.0, 31.95], [33.0, 35.78], [37.0, 43.34], [45.0, 47.73], [51.0, 53.94], [57.0, 59.46], [61.0, 65.16], [66.0, 67.17], [68.0, 69.2], [69.0, 69.53], [70.0, 75.25], [76.0, 78.49], [79.0, 87.71], [89.0, 91.23], [92.0, 102.44], [106.0, 108.72], [110.0, 116.5], [118.0, 122.12], [124.0, 126.86], [128.0, 130.06], [131.0, 132.26], [135.0, 148.17], [152.0, 156.27], [157.0, 161.45], [165.0, 167.02], [168.0, 169.67], [171.0, 173.35]], "keep_status": [false, true, true, true, false, false, false, true, true, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 36.44, 35.1, 33.78, 0.0, 0.0, 0.0, 35.07, 35.75, 0.0, 35.88, 37.2, 35.0, 59.77, 100.0, 66.76, 0.0, 0.0, 0.0, 62.58, 66.03, 91.98, 70.86, 94.81, 100.0, 100.0, 98.99, 99.73, 97.33, 0.0, 77.2, 80.29, 99.65, 91.47, 0.0, 99.73], "audiomae_on_audioset": [null, [["music", 44.36], ["hum", 8.51], ["throbbing", 6.21]], [["music", 34.77], ["hum", 17.66], ["throbbing", 8.7]], [["music", 36.64], ["didgeridoo", 14.94], ["speech", 8.69]], null, null, null, [["music", 24.52], ["speech", 16.43], ["synthesizer", 11.47]], [["hum", 26.52], ["music", 21.65], ["throbbing", 19.05]], null, [["music", 54.34], ["electronic music", 9.13], ["ambient music", 6.85]], [["music", 32.6], ["ambient music", 9.89], ["speech", 9.6]], [["music", 29.76], ["hum", 27.58], ["mains hum", 9.15]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.38, 2.58, 2.76, 2.54, 1.99, 1.34, 1.3, 2.69, 3.3, -0.05, 2.78, 6.34, 2.73, 2.94, 2.46, 4.16, 1.17, 1.2, 0.53, 5.25, 2.49, 8.71, 2.23, 10.44, 2.72, 6.5, 4.12, 2.86, 2.06, 1.26, 13.17, 4.27, 4.45, 2.02, 1.67, 2.35]} \ No newline at end of file diff --git a/annotations_filtered/qKYRwuoqETc_filtered.json b/annotations_filtered/qKYRwuoqETc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..add63df631a4b9df958d44820abb9b9e0dc63c07 --- /dev/null +++ b/annotations_filtered/qKYRwuoqETc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 60.37]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [37.37]} \ No newline at end of file diff --git a/annotations_filtered/qKerIOG7jdI_filtered.json b/annotations_filtered/qKerIOG7jdI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..645e2011b77279eb792123b5504f0a7b1b315b50 --- /dev/null +++ b/annotations_filtered/qKerIOG7jdI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.0], [4.0, 5.22], [7.0, 8.45], [10.0, 10.61], [11.0, 17.51], [21.0, 21.57], [26.0, 56.37], [61.0, 65.16], [67.0, 67.05], [68.0, 70.34], [71.0, 74.43], [75.0, 83.05], [84.0, 87.03], [90.0, 90.76], [94.0, 94.56], [96.0, 97.55], [98.0, 110.93], [112.0, 112.45], [117.0, 118.1], [119.0, 119.11], [120.0, 121.07], [125.0, 125.51], [126.0, 126.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.79, 0.0, 0.0, 64.86, 0.0, 59.96, 57.4, 47.35, 84.07, 0.0, 0.0, 0.0, 97.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 72.43], ["sampler", 4.71], ["musical instrument", 3.52]], null, null, null, null, null, null, [["fly, housefly", 36.7], ["whack, thwack", 11.43], ["mosquito", 9.31]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.0, 1.22, 1.45, 0.61, 6.51, 0.57, 30.37, 4.16, 0.05, 2.34, 3.43, 8.05, 3.03, 0.76, 0.56, 1.55, 12.93, 0.45, 1.1, 0.11, 1.07, 0.51, 0.94]} \ No newline at end of file diff --git a/annotations_filtered/qKj2c67Ht98_filtered.json b/annotations_filtered/qKj2c67Ht98_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4987eccb5dcc3f65665b7a8605e596db9e0fda5e --- /dev/null +++ b/annotations_filtered/qKj2c67Ht98_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.94], [5.0, 5.0], [7.0, 7.08], [8.0, 8.07], [16.0, 28.0], [31.0, 31.29], [37.0, 37.05], [37.0, 38.2], [39.0, 39.93], [50.0, 50.14], [51.0, 51.98], [52.0, 55.61], [59.0, 64.2], [64.0, 64.25], [67.0, 68.0], [71.0, 71.24], [78.0, 80.6], [81.0, 83.22], [89.0, 95.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 36.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.41, 38.97, 0.0, 0.0, 0.0, 72.01, 68.67, 84.8], "audiomae_on_audioset": [null, null, null, null, [["music", 53.43], ["speech", 19.87], ["didgeridoo", 8.82]], null, null, null, null, null, null, null, [["speech", 49.43], ["music", 15.39], ["boing", 8.79]], null, null, null, null, null, null], "duration": [0.94, 0.0, 0.08, 0.07, 12.0, 0.29, 0.05, 1.2, 0.93, 0.14, 0.98, 3.61, 5.2, 0.25, 1.0, 0.24, 2.6, 2.22, 6.91]} \ No newline at end of file diff --git a/annotations_filtered/qL1WqN1XKK0_filtered.json b/annotations_filtered/qL1WqN1XKK0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..47f0156c2b4a8762ad6f537047042740c8a02f15 --- /dev/null +++ b/annotations_filtered/qL1WqN1XKK0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 19.62], [21.0, 21.24], [23.0, 25.05], [27.0, 28.58], [30.0, 29.61], [32.0, 31.97], [34.0, 35.11], [36.0, 36.85], [38.0, 38.57], [41.0, 42.21], [43.0, 44.61], [45.0, 46.04], [47.0, 47.83], [51.0, 53.16], [53.0, 55.61], [56.0, 56.84], [59.0, 59.43], [61.0, 61.65], [63.0, 64.18], [69.0, 69.74], [70.0, 70.56], [72.0, 74.92], [76.0, 77.38], [86.0, 109.93], [116.0, 118.83], [120.0, 120.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [59.51, 0.0, 70.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.86, 55.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 31.12, 98.36, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 13.35], ["hum", 12.31], ["electric shaver, electric razor", 12.27]], null, null], "duration": [2.62, 0.24, 2.05, 1.58, -0.39, -0.03, 1.11, 0.85, 0.57, 1.21, 1.61, 1.04, 0.83, 2.16, 2.61, 0.84, 0.43, 0.65, 1.18, 0.74, 0.56, 2.92, 1.38, 23.93, 2.83, 0.34]} \ No newline at end of file diff --git a/annotations_filtered/qL5_xmtFVDo_filtered.json b/annotations_filtered/qL5_xmtFVDo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dcbdf0820c53b11801c7c957c429cac2ef3c5c77 --- /dev/null +++ b/annotations_filtered/qL5_xmtFVDo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.95], [5.0, 5.53], [7.0, 8.7], [23.0, 23.87], [34.0, 34.75], [46.0, 46.21], [47.0, 48.57], [56.0, 60.1], [66.0, 67.12], [72.0, 72.2], [78.0, 78.26], [102.0, 101.7], [104.0, 104.3], [112.0, 112.11], [127.0, 127.99], [139.0, 139.19], [140.0, 140.31], [141.0, 140.9], [141.0, 141.03], [157.0, 157.81], [158.0, 158.38], [164.0, 164.02], [165.0, 165.99], [176.0, 177.42], [184.0, 184.05], [193.0, 193.36], [202.0, 201.7], [206.0, 206.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["whale vocalization", 96.87], ["stomach rumble", 0.36], ["liquid", 0.35]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.05, 0.53, 1.7, 0.87, 0.75, 0.21, 1.57, 4.1, 1.12, 0.2, 0.26, -0.3, 0.3, 0.11, 0.99, 0.19, 0.31, -0.1, 0.03, 0.81, 0.38, 0.02, 0.99, 1.42, 0.05, 0.36, -0.3, 0.22]} \ No newline at end of file diff --git a/annotations_filtered/qLCy66eZrQs_filtered.json b/annotations_filtered/qLCy66eZrQs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e823c94379300b751b325183678842fc1d6d02f --- /dev/null +++ b/annotations_filtered/qLCy66eZrQs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.01], [5.0, 6.37], [9.0, 34.45], [38.0, 38.35], [44.0, 45.82], [47.0, 48.2], [53.0, 55.68], [59.0, 59.88], [62.0, 64.25], [67.0, 67.31], [68.0, 69.04], [71.0, 71.74], [77.0, 81.06], [83.0, 84.13], [87.0, 88.16], [90.0, 91.08], [92.0, 95.23], [98.0, 99.08]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 37.09, 0.0, 0.0, 0.0, 87.92, 0.0, 96.04, 0.0, 0.0, 0.0, 71.14, 0.0, 0.0, 0.0, 62.07, 0.0], "audiomae_on_audioset": [null, null, [["music", 26.71], ["musical instrument", 11.07], ["speech", 9.19]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.01, 1.37, 25.45, 0.35, 1.82, 1.2, 2.68, 0.88, 2.25, 0.31, 1.04, 0.74, 4.06, 1.13, 1.16, 1.08, 3.23, 1.08]} \ No newline at end of file diff --git a/annotations_filtered/qLFrdv2R8ng_filtered.json b/annotations_filtered/qLFrdv2R8ng_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2120f34919e03ce354156c00b476adf61f456d --- /dev/null +++ b/annotations_filtered/qLFrdv2R8ng_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.75], [16.0, 19.53], [21.0, 22.94], [23.0, 25.05], [26.0, 26.87], [27.0, 28.86], [29.0, 32.64], [34.0, 34.33], [35.0, 39.8], [55.0, 55.44], [62.0, 64.15], [85.0, 85.89], [91.0, 92.53], [100.0, 101.58], [106.0, 106.34], [107.0, 109.16], [110.0, 122.34], [123.0, 124.11], [125.0, 126.71]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 61.57, 0.0, 67.38, 0.0, 0.0, 82.79, 0.0, 36.56, 0.0, 49.04, 0.0, 0.0, 0.0, 0.0, 100.0, 46.57, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 16.11], ["livestock, farm animals, working animals", 9.2], ["cattle, bovinae", 9.01]], null, [["fly, housefly", 32.49], ["sidetone", 29.3], ["insect", 22.03]], null, null, null, null, null, [["whoop", 15.64], ["speech", 11.33], ["crowd", 8.3]], null, null], "duration": [0.75, 3.53, 1.94, 2.05, 0.87, 1.86, 3.64, 0.33, 4.8, 0.44, 2.15, 0.89, 1.53, 1.58, 0.34, 2.16, 12.34, 1.11, 1.71]} \ No newline at end of file diff --git a/annotations_filtered/qLoufJLKN6Q_filtered.json b/annotations_filtered/qLoufJLKN6Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a98206dc19e313b223b3d2086def3d5e6d402b53 --- /dev/null +++ b/annotations_filtered/qLoufJLKN6Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.48], [4.0, 4.95], [6.0, 6.02], [8.0, 30.13], [31.0, 32.39], [34.0, 36.22], [38.0, 39.39], [40.0, 42.67], [48.0, 48.71], [49.0, 50.3], [51.0, 52.39], [57.0, 57.45], [58.0, 58.48], [59.0, 61.55], [66.0, 67.91], [70.0, 69.69], [71.0, 73.75], [75.0, 77.65], [78.0, 79.03], [80.0, 81.89], [85.0, 84.7], [86.0, 87.3], [94.0, 94.8], [104.0, 105.36], [106.0, 106.79], [107.0, 108.46], [111.0, 111.28], [112.0, 113.16], [114.0, 115.37], [116.0, 130.76], [132.0, 133.54], [134.0, 134.55], [135.0, 148.49], [150.0, 152.25], [154.0, 154.97], [156.0, 156.88], [158.0, 160.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 30.65, 0.0, 38.09, 0.0, 42.15, 0.0, 0.0, 0.0, 0.0, 0.0, 44.37, 0.0, 0.0, 50.91, 29.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.43, 0.0, 0.0, 29.6, 33.76, 0.0, 0.0, 35.18], "audiomae_on_audioset": [null, null, null, [["music", 45.35], ["speech", 27.55], ["hum", 7.14]], null, [["music", 52.55], ["hum", 13.76], ["throbbing", 4.12]], null, [["speech", 31.7], ["music", 30.39], ["hum", 8.61]], null, null, null, null, null, [["music", 48.14], ["didgeridoo", 9.46], ["musical instrument", 8.25]], null, null, null, [["mains hum", 26.94], ["music", 20.98], ["hum", 20.18]], null, null, null, null, null, null, null, null, null, null, null, [["hum", 47.56], ["throbbing", 29.01], ["mains hum", 9.68]], null, null, [["music", 53.57], ["electronic music", 5.37], ["hum", 5.21]], [["speech", 58.67], ["rumble", 23.3], ["music", 8.63]], null, null, [["music", 20.58], ["throbbing", 10.29], ["hum", 7.18]]], "duration": [0.48, 0.95, 0.02, 22.13, 1.39, 2.22, 1.39, 2.67, 0.71, 1.3, 1.39, 0.45, 0.48, 2.55, 1.91, -0.31, 2.75, 2.65, 1.03, 1.89, -0.3, 1.3, 0.8, 1.36, 0.79, 1.46, 0.28, 1.16, 1.37, 14.76, 1.54, 0.55, 13.49, 2.25, 0.97, 0.88, 2.07]} \ No newline at end of file diff --git a/annotations_filtered/qLvGnro4Cgw_filtered.json b/annotations_filtered/qLvGnro4Cgw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e4b7ef2ca7113f883f1d86530813cf3bf30d60d1 --- /dev/null +++ b/annotations_filtered/qLvGnro4Cgw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.15], [11.0, 15.08], [16.0, 17.22], [20.0, 22.33], [32.0, 33.78], [42.0, 44.22], [54.0, 54.78], [64.0, 68.94], [76.0, 81.78], [87.0, 87.57], [91.0, 102.32], [105.0, 105.02], [107.0, 111.72], [118.0, 118.47], [125.0, 126.91], [127.0, 126.94], [129.0, 130.71], [138.0, 140.58], [143.0, 142.79]], "keep_status": [false, true, false, false, false, true, false, true, true, false, true, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 31.2, 0.0, 31.12, 0.0, 31.45, 0.0, 32.49, 32.35, 0.0, 31.53, 0.0, 31.99, 0.0, 0.0, 0.0, 0.0, 46.75, 0.0], "audiomae_on_audioset": [null, [["moo", 17.81], ["insect", 14.16], ["cattle, bovinae", 11.52]], null, [["moo", 32.11], ["cattle, bovinae", 31.41], ["livestock, farm animals, working animals", 11.97]], null, [["groan", 15.3], ["speech", 12.82], ["sound effect", 11.55]], null, [["fly, housefly", 20.84], ["insect", 17.68], ["livestock, farm animals, working animals", 11.01]], [["whale vocalization", 18.39], ["livestock, farm animals, working animals", 13.68], ["didgeridoo", 9.68]], null, [["animal", 19.96], ["fly, housefly", 13.16], ["insect", 11.68]], null, [["livestock, farm animals, working animals", 35.57], ["cattle, bovinae", 20.94], ["moo", 18.35]], null, null, null, null, [["didgeridoo", 22.42], ["animal", 16.23], ["music", 6.06]], null], "duration": [1.15, 4.08, 1.22, 2.33, 1.78, 2.22, 0.78, 4.94, 5.78, 0.57, 11.32, 0.02, 4.72, 0.47, 1.91, -0.06, 1.71, 2.58, -0.21]} \ No newline at end of file diff --git a/annotations_filtered/qMaZAi73HDo_filtered.json b/annotations_filtered/qMaZAi73HDo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42c1adf22b5309154e462621788d6fec88e72c93 --- /dev/null +++ b/annotations_filtered/qMaZAi73HDo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.94], [13.0, 16.68], [18.0, 19.47], [24.0, 23.68], [26.0, 26.33], [30.0, 30.2], [34.0, 33.78], [88.0, 88.16], [91.0, 91.1], [92.0, 99.81], [103.0, 104.08], [105.0, 105.31], [115.0, 115.82]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.18, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 39.08], ["foghorn", 12.1], ["theremin", 10.89]], null, null, null, null, null, null, null, [["music", 62.72], ["musical instrument", 4.91], ["sidetone", 3.34]], null, null, null], "duration": [0.94, 3.68, 1.47, -0.32, 0.33, 0.2, -0.22, 0.16, 0.1, 7.81, 1.08, 0.31, 0.82]} \ No newline at end of file diff --git a/annotations_filtered/qMwvHLe5m3g_filtered.json b/annotations_filtered/qMwvHLe5m3g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0eabf5cefa7e632ac13cb314496c1d99624b416f --- /dev/null +++ b/annotations_filtered/qMwvHLe5m3g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.27], [3.0, 43.04], [45.0, 75.44], [77.0, 78.56], [79.0, 87.59], [89.0, 90.05], [91.0, 92.38], [93.0, 102.73], [105.0, 115.53], [117.0, 163.14]], "keep_status": [false, false, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 48.69, 0.0, 0.0, 47.05, 65.09, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 14.67], ["effects unit", 13.88], ["echo", 13.05]], null, null, [["throbbing", 35.75], ["hum", 23.01], ["music", 6.62]], null, null], "duration": [1.27, 40.04, 30.44, 1.56, 8.59, 1.05, 1.38, 9.73, 10.53, 46.14]} \ No newline at end of file diff --git a/annotations_filtered/qN-_cZNDy0w_filtered.json b/annotations_filtered/qN-_cZNDy0w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..01c605f68b1612094bc5c3077c3d1227d05f6309 --- /dev/null +++ b/annotations_filtered/qN-_cZNDy0w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.07], [6.0, 6.51], [8.0, 8.6], [10.0, 10.93], [15.0, 15.28], [18.0, 19.52], [23.0, 24.81], [31.0, 35.73], [38.0, 38.52], [41.0, 45.55]], "keep_status": [false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.1, 0.0, 72.9], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 51.82], ["didgeridoo", 5.19], ["groan", 4.02]], null, null], "duration": [0.07, 0.51, 0.6, 0.93, 0.28, 1.52, 1.81, 4.73, 0.52, 4.55]} \ No newline at end of file diff --git a/annotations_filtered/qNCFZLQOj_M_filtered.json b/annotations_filtered/qNCFZLQOj_M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f750b6f13f128557f9ac402bb4a9a279d6b55aaf --- /dev/null +++ b/annotations_filtered/qNCFZLQOj_M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.97], [7.0, 10.54], [16.0, 15.92], [30.0, 30.82], [32.0, 33.05], [35.0, 34.86], [38.0, 40.02], [41.0, 42.45], [44.0, 44.83], [47.0, 48.44], [50.0, 51.63], [53.0, 53.54], [55.0, 55.9], [57.0, 57.35], [65.0, 66.92], [75.0, 76.94], [78.0, 77.85], [85.0, 86.78], [88.0, 89.04], [97.0, 96.87], [97.0, 100.11], [121.0, 121.63], [124.0, 129.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.71, 0.0, 95.23], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 72.63], ["inside, small room", 2.25], ["boing", 1.93]], null, null], "duration": [2.97, 3.54, -0.08, 0.82, 1.05, -0.14, 2.02, 1.45, 0.83, 1.44, 1.63, 0.54, 0.9, 0.35, 1.92, 1.94, -0.15, 1.78, 1.04, -0.13, 3.11, 0.63, 5.91]} \ No newline at end of file diff --git a/annotations_filtered/qN_sGdVG0Yw_filtered.json b/annotations_filtered/qN_sGdVG0Yw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e8f4aff076cdd33b202e586bb28728ba51d5011 --- /dev/null +++ b/annotations_filtered/qN_sGdVG0Yw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 13.9], [24.0, 25.78], [30.0, 30.86], [33.0, 33.51], [34.0, 60.44], [61.0, 60.57], [62.0, 65.77], [66.0, 66.34], [75.0, 90.02], [92.0, 92.4], [94.0, 96.48], [97.0, 97.16], [99.0, 99.32], [106.0, 108.43], [112.0, 117.91], [118.0, 117.95], [120.0, 121.71], [123.0, 123.4], [127.0, 127.43], [133.0, 133.64]], "keep_status": [true, false, false, false, false, false, true, false, true, false, true, false, false, true, false, false, false, false, false, false], "silence_prob": [32.62, 0.0, 0.0, 0.0, 30.75, 0.0, 37.06, 0.0, 31.28, 0.0, 47.31, 0.0, 0.0, 30.31, 40.95, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 44.56], ["speech", 11.2], ["sidetone", 7.1]], null, null, null, [["tuning fork", 49.96], ["music", 24.07], ["breaking", 6.66]], null, [["hum", 14.71], ["fly, housefly", 12.66], ["throbbing", 11.81]], null, [["music", 41.42], ["noise", 10.97], ["hum", 8.81]], null, [["hum", 19.98], ["music", 17.82], ["mains hum", 16.06]], null, null, [["vehicle", 17.85], ["motorcycle", 12.49], ["speech", 10.3]], [["speech", 70.29], ["music", 2.56], ["eruption", 2.46]], null, null, null, null, null], "duration": [3.9, 1.78, 0.86, 0.51, 26.44, -0.43, 3.77, 0.34, 15.02, 0.4, 2.48, 0.16, 0.32, 2.43, 5.91, -0.05, 1.71, 0.4, 0.43, 0.64]} \ No newline at end of file diff --git a/annotations_filtered/qNk-kc0XH4A_filtered.json b/annotations_filtered/qNk-kc0XH4A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..329a24e5402f347ca0eda159b3c2e205c9c6160d --- /dev/null +++ b/annotations_filtered/qNk-kc0XH4A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[42.0, 43.63], [45.0, 45.23], [45.0, 47.04], [49.0, 52.03], [52.0, 54.26], [57.0, 58.18], [59.0, 60.74], [62.0, 62.33], [64.0, 65.67], [67.0, 68.01], [70.0, 72.06], [74.0, 73.77], [82.0, 82.32], [85.0, 85.08], [86.0, 86.14], [87.0, 90.1], [91.0, 92.74], [94.0, 95.39], [102.0, 107.0], [108.0, 110.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 61.87, 93.45, 45.24, 0.0, 0.0, 0.0, 0.0, 0.0, 86.64, 0.0, 0.0, 0.0, 0.0, 70.72, 0.0, 0.0, 51.07, 71.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 45.47], ["sidetone", 15.27], ["chirp tone", 11.15]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.63, 0.23, 2.04, 3.03, 2.26, 1.18, 1.74, 0.33, 1.67, 1.01, 2.06, -0.23, 0.32, 0.08, 0.14, 3.1, 1.74, 1.39, 5.0, 2.4]} \ No newline at end of file diff --git a/annotations_filtered/qNkP2Y5wme0_filtered.json b/annotations_filtered/qNkP2Y5wme0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f315728348db4240514d2ce6ac552299e844827 --- /dev/null +++ b/annotations_filtered/qNkP2Y5wme0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 32.1], [36.0, 36.14], [40.0, 41.03], [51.0, 54.09], [58.0, 62.45], [65.0, 65.43], [67.0, 67.85], [70.0, 71.76], [72.0, 72.72], [74.0, 76.74], [80.0, 81.19], [82.0, 83.08], [85.0, 86.12], [87.0, 87.71], [94.0, 94.19]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.42, 37.34, 0.0, 0.0, 0.0, 0.0, 79.41, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 28.59], ["theremin", 13.31], ["foghorn", 8.77]], [["hum", 32.79], ["mains hum", 32.65], ["music", 13.23]], null, null, null, null, null, null, null, null, null, null], "duration": [1.1, 0.14, 1.03, 3.09, 4.45, 0.43, 0.85, 1.76, 0.72, 2.74, 1.19, 1.08, 1.12, 0.71, 0.19]} \ No newline at end of file diff --git a/annotations_filtered/qNnfnI8ai6o_filtered.json b/annotations_filtered/qNnfnI8ai6o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb10a06868526aa4aeacf026a797be36e5591e3a --- /dev/null +++ b/annotations_filtered/qNnfnI8ai6o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 41.3], [44.0, 44.29], [45.0, 45.01], [46.0, 61.42], [62.0, 65.82], [68.0, 69.36], [71.0, 93.29], [94.0, 95.59], [97.0, 97.06], [98.0, 99.28], [101.0, 101.98], [103.0, 103.52], [106.0, 108.84], [111.0, 112.06], [113.0, 113.29], [114.0, 114.27], [115.0, 116.23], [117.0, 118.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [84.8, 0.0, 0.0, 100.0, 99.85, 0.0, 67.89, 0.0, 0.0, 0.0, 0.0, 0.0, 61.67, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [17.3, 0.29, 0.01, 15.42, 3.82, 1.36, 22.29, 1.59, 0.06, 1.28, 0.98, 0.52, 2.84, 1.06, 0.29, 0.27, 1.23, 1.96]} \ No newline at end of file diff --git a/annotations_filtered/qO1-at2DUGU_filtered.json b/annotations_filtered/qO1-at2DUGU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..34bbd5db0a713b7c01736d10da25fe73145138b0 --- /dev/null +++ b/annotations_filtered/qO1-at2DUGU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.95], [21.0, 22.6], [24.0, 27.11], [29.0, 29.98], [32.0, 32.95], [35.0, 36.41], [39.0, 39.78], [42.0, 42.3], [43.0, 43.8], [47.0, 56.13], [59.0, 58.82], [60.0, 61.16], [62.0, 63.59], [66.0, 67.22], [68.0, 69.75], [70.0, 74.01], [83.0, 83.89], [88.0, 88.2], [113.0, 113.93], [114.0, 116.53], [117.0, 119.04], [122.0, 122.54], [126.0, 126.84], [127.0, 128.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.48, 0.0, 0.0, 0.0, 80.29, 99.97, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.95, 1.6, 3.11, 0.98, 0.95, 1.41, 0.78, 0.3, 0.8, 9.13, -0.18, 1.16, 1.59, 1.22, 1.75, 4.01, 0.89, 0.2, 0.93, 2.53, 2.04, 0.54, 0.84, 1.65]} \ No newline at end of file diff --git a/annotations_filtered/qOKE4dxjayU_filtered.json b/annotations_filtered/qOKE4dxjayU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..80fc0e16a2f4665d2fc67ba1d39b30571dce2fac --- /dev/null +++ b/annotations_filtered/qOKE4dxjayU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 19.45], [26.0, 26.22], [29.0, 35.5], [37.0, 41.49], [47.0, 47.68], [50.0, 51.83], [55.0, 56.17], [58.0, 58.85], [61.0, 62.33], [63.0, 64.3], [65.0, 67.2], [68.0, 68.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.21, 0.0, 30.43, 31.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.89, 0.0], "audiomae_on_audioset": [[["music", 71.89], ["throbbing", 4.64], ["hum", 4.08]], null, [["music", 71.8], ["musical instrument", 4.95], ["synthesizer", 2.89]], [["music", 56.94], ["throbbing", 6.78], ["ambient music", 6.49]], null, null, null, null, null, null, [["music", 78.22], ["harmonic", 2.17], ["musical instrument", 1.63]], null], "duration": [13.45, 0.22, 6.5, 4.49, 0.68, 1.83, 1.17, 0.85, 1.33, 1.3, 2.2, 0.71]} \ No newline at end of file diff --git a/annotations_filtered/qOeZ9TL0wHs_filtered.json b/annotations_filtered/qOeZ9TL0wHs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eeba59d19251fe3fb45993930295e1e37c58272f --- /dev/null +++ b/annotations_filtered/qOeZ9TL0wHs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 16.51], [22.0, 25.14], [33.0, 35.87], [39.0, 40.19], [52.0, 54.11], [69.0, 69.21], [82.0, 83.27], [97.0, 103.77], [107.0, 107.49], [110.0, 111.81]], "keep_status": [true, true, true, false, false, false, false, false, false, false], "silence_prob": [42.0, 46.79, 40.71, 0.0, 32.88, 0.0, 0.0, 33.38, 0.0, 0.0], "audiomae_on_audioset": [[["music", 26.3], ["didgeridoo", 20.6], ["fly, housefly", 10.73]], [["music", 51.69], ["theremin", 8.38], ["musical instrument", 3.5]], [["music", 28.05], ["speech", 13.26], ["foghorn", 5.69]], null, [["cattle, bovinae", 41.06], ["moo", 39.08], ["livestock, farm animals, working animals", 19.18]], null, null, [["foghorn", 38.04], ["music", 35.35], ["echo", 3.41]], null, null], "duration": [4.51, 3.14, 2.87, 1.19, 2.11, 0.21, 1.27, 6.77, 0.49, 1.81]} \ No newline at end of file diff --git a/annotations_filtered/qPXny_mZ0iE_filtered.json b/annotations_filtered/qPXny_mZ0iE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..46d6c6acef8476ade6ab79b2dcc0a4253e10d2cc --- /dev/null +++ b/annotations_filtered/qPXny_mZ0iE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.23], [8.0, 8.19], [11.0, 10.89], [12.0, 12.5], [13.0, 14.71], [16.0, 16.92], [17.0, 18.76], [19.0, 20.19], [22.0, 22.37], [23.0, 25.41], [28.0, 28.73], [29.0, 30.23], [31.0, 31.77], [34.0, 34.99], [36.0, 36.96], [38.0, 40.46], [42.0, 43.33], [46.0, 46.95], [52.0, 53.27], [54.0, 54.33], [56.0, 56.42], [62.0, 67.26], [68.0, 68.45], [71.0, 72.5], [73.0, 74.61], [77.0, 76.99], [77.0, 85.08], [85.0, 85.77], [86.0, 87.17], [88.0, 87.88], [89.0, 89.29], [90.0, 91.27], [92.0, 92.84], [94.0, 93.9], [95.0, 95.59], [96.0, 96.47], [97.0, 97.41], [98.0, 98.41], [99.0, 98.88], [100.0, 100.68], [102.0, 102.03], [103.0, 103.37], [105.0, 105.63], [108.0, 109.56], [110.0, 111.86], [112.0, 112.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.25, 0.0, 0.0, 0.0, 0.0, 0.0, 75.72, 0.0, 0.0, 0.0, 0.0, 0.0, 74.92, 0.0, 0.0, 0.0, 0.0, 95.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.23, 0.19, -0.11, 0.5, 1.71, 0.92, 1.76, 1.19, 0.37, 2.41, 0.73, 1.23, 0.77, 0.99, 0.96, 2.46, 1.33, 0.95, 1.27, 0.33, 0.42, 5.26, 0.45, 1.5, 1.61, -0.01, 8.08, 0.77, 1.17, -0.12, 0.29, 1.27, 0.84, -0.1, 0.59, 0.47, 0.41, 0.41, -0.12, 0.68, 0.03, 0.37, 0.63, 1.56, 1.86, 0.83]} \ No newline at end of file diff --git a/annotations_filtered/qPZWb3abC9I_filtered.json b/annotations_filtered/qPZWb3abC9I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d4adc6851a8f6de5e3b4872b97c54673dc7e8f97 --- /dev/null +++ b/annotations_filtered/qPZWb3abC9I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.49], [3.0, 5.83], [9.0, 9.68], [14.0, 16.51], [18.0, 19.45], [23.0, 25.3], [26.0, 27.95], [32.0, 31.95], [33.0, 33.66], [35.0, 40.9], [44.0, 44.96], [45.0, 50.23], [55.0, 56.57], [67.0, 69.75], [72.0, 80.0], [81.0, 81.99], [83.0, 87.88], [94.0, 96.01], [97.0, 97.97], [105.0, 116.87], [118.0, 119.77], [128.0, 130.42], [131.0, 132.41]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 44.01, 0.0, 100.0, 0.0, 0.0, 0.0, 95.23, 0.0, 99.59, 0.0, 100.0, 99.26, 0.0, 99.82, 99.82, 0.0, 40.64, 0.0, 95.91, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 43.14], ["fart", 10.68], ["thunk", 3.43]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 29.73], ["music", 22.42], ["mains hum", 20.48]], null, null, null], "duration": [0.49, 2.83, 0.68, 2.51, 1.45, 2.3, 1.95, -0.05, 0.66, 5.9, 0.96, 5.23, 1.57, 2.75, 8.0, 0.99, 4.88, 2.01, 0.97, 11.87, 1.77, 2.42, 1.41]} \ No newline at end of file diff --git a/annotations_filtered/qPbOVPtdaZs_filtered.json b/annotations_filtered/qPbOVPtdaZs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ff99156c4f21fee4b3e547c9e86b070482a77695 --- /dev/null +++ b/annotations_filtered/qPbOVPtdaZs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 28.93], [35.0, 50.92], [56.0, 56.1], [58.0, 58.5], [60.0, 60.29], [64.0, 64.1], [68.0, 96.85], [99.0, 105.78], [111.0, 111.03], [111.0, 112.33], [115.0, 125.66], [127.0, 142.15]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [37.77, 34.44, 0.0, 0.0, 0.0, 0.0, 30.26, 28.68, 0.0, 0.0, 35.14, 40.64], "audiomae_on_audioset": [[["music", 84.38], ["synthesizer", 2.95], ["musical instrument", 2.07]], [["music", 74.69], ["throbbing", 6.09], ["hum", 5.72]], null, null, null, null, [["music", 55.91], ["throbbing", 6.01], ["vehicle", 5.53]], [["speech", 39.92], ["music", 32.31], ["whack, thwack", 4.29]], null, null, [["music", 61.31], ["speech", 18.03], ["musical instrument", 5.01]], [["music", 49.64], ["synthesizer", 14.12], ["speech", 7.99]]], "duration": [15.93, 15.92, 0.1, 0.5, 0.29, 0.1, 28.85, 6.78, 0.03, 1.33, 10.66, 15.15]} \ No newline at end of file diff --git a/annotations_filtered/qPfLNjGXa2M_filtered.json b/annotations_filtered/qPfLNjGXa2M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4fc583aca030474dccf51c76db4e37e1a5e15c7b --- /dev/null +++ b/annotations_filtered/qPfLNjGXa2M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.27], [4.0, 10.89], [12.0, 13.46], [14.0, 33.88], [36.0, 35.83], [46.0, 50.72], [51.0, 58.02], [59.0, 62.4], [63.0, 74.8], [75.0, 85.18], [87.0, 87.91], [93.0, 93.73], [102.0, 102.49], [106.0, 106.05], [108.0, 108.63], [111.0, 114.03]], "keep_status": [false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 75.39, 0.0, 46.72, 0.0, 41.64, 57.89, 65.2, 35.72, 29.63, 0.0, 0.0, 0.0, 0.0, 0.0, 68.02], "audiomae_on_audioset": [null, null, null, [["fly, housefly", 24.29], ["insect", 23.28], ["speech", 14.13]], null, [["hum", 36.91], ["mains hum", 16.83], ["burping, eructation", 4.75]], null, null, [["mains hum", 47.75], ["hum", 18.32], ["fly, housefly", 7.15]], [["speech", 82.26], ["screaming", 1.71], ["groan", 1.23]], null, null, null, null, null, null], "duration": [1.27, 6.89, 1.46, 19.88, -0.17, 4.72, 7.02, 3.4, 11.8, 10.18, 0.91, 0.73, 0.49, 0.05, 0.63, 3.03]} \ No newline at end of file diff --git a/annotations_filtered/qPkKjKAyJ8I_filtered.json b/annotations_filtered/qPkKjKAyJ8I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a525f939f6dc93b19bcecc29a61624a154e0289 --- /dev/null +++ b/annotations_filtered/qPkKjKAyJ8I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 23.14], [24.0, 25.27], [26.0, 38.74], [39.0, 39.48], [40.0, 41.13], [42.0, 42.84], [46.0, 46.97], [47.0, 59.41], [64.0, 99.64], [104.0, 108.18], [109.0, 128.9], [130.0, 131.94], [138.0, 144.19], [146.0, 152.29]], "keep_status": [false, false, true, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 31.51, 0.0, 0.0, 0.0, 0.0, 37.17, 0.0, 33.69, 31.65, 0.0, 30.65, 31.72], "audiomae_on_audioset": [null, null, [["music", 47.45], ["buzz", 7.71], ["fly, housefly", 7.04]], null, null, null, null, [["speech", 44.82], ["music", 31.55], ["throbbing", 3.85]], null, [["music", 70.76], ["hum", 6.41], ["electronic music", 4.76]], [["music", 44.55], ["noise", 6.58], ["hum", 6.34]], null, [["music", 24.29], ["mains hum", 19.51], ["hum", 18.63]], [["music", 74.14], ["throbbing", 3.51], ["hum", 3.37]]], "duration": [1.14, 1.27, 12.74, 0.48, 1.13, 0.84, 0.97, 12.41, 35.64, 4.18, 19.9, 1.94, 6.19, 6.29]} \ No newline at end of file diff --git a/annotations_filtered/qPtAocA3m2Y_filtered.json b/annotations_filtered/qPtAocA3m2Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f17da51e8fa4e096165640b00f19f274f0440385 --- /dev/null +++ b/annotations_filtered/qPtAocA3m2Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 36.58], [38.0, 39.45], [44.0, 48.14], [51.0, 61.4], [63.0, 66.46], [67.0, 83.0]], "keep_status": [false, false, false, false, false, false], "silence_prob": [66.15, 0.0, 66.51, 49.64, 80.29, 44.63], "audiomae_on_audioset": [null, null, null, [["music", 49.2], ["hum", 23.64], ["mains hum", 5.98]], null, [["hum", 47.2], ["mains hum", 20.78], ["noise", 20.02]]], "duration": [21.58, 1.45, 4.14, 10.4, 3.46, 16.0]} \ No newline at end of file diff --git a/annotations_filtered/qR9MgJkOFJ0_filtered.json b/annotations_filtered/qR9MgJkOFJ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eadbfffb010423d646f76cbcc744b806a015ea9b --- /dev/null +++ b/annotations_filtered/qR9MgJkOFJ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.81], [11.0, 12.09], [18.0, 18.74], [20.0, 21.98], [23.0, 26.11], [29.0, 31.26], [33.0, 33.22], [34.0, 35.53], [36.0, 41.18], [47.0, 47.95], [51.0, 51.04], [54.0, 56.1], [57.0, 61.53], [62.0, 67.09], [70.0, 71.34], [72.0, 78.31], [80.0, 80.6], [83.0, 87.79], [89.0, 97.34], [98.0, 104.65], [106.0, 106.81], [112.0, 111.67], [114.0, 115.33], [116.0, 117.78], [119.0, 125.95], [127.0, 137.84], [143.0, 148.73], [151.0, 154.65], [157.0, 158.58], [160.0, 162.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.96, 99.8, 0.0, 0.0, 99.96, 0.0, 0.0, 99.91, 99.91, 99.98, 0.0, 99.85, 0.0, 100.0, 100.0, 99.98, 0.0, 0.0, 0.0, 0.0, 100.0, 94.37, 84.43, 89.72, 0.0, 73.06], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.81, 1.09, 0.74, 1.98, 3.11, 2.26, 0.22, 1.53, 5.18, 0.95, 0.04, 2.1, 4.53, 5.09, 1.34, 6.31, 0.6, 4.79, 8.34, 6.65, 0.81, -0.33, 1.33, 1.78, 6.95, 10.84, 5.73, 3.65, 1.58, 2.13]} \ No newline at end of file diff --git a/annotations_filtered/qRAE0UOMyB8_filtered.json b/annotations_filtered/qRAE0UOMyB8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b82bed40fc8b61fff348fa0df0e28a7089777ab4 --- /dev/null +++ b/annotations_filtered/qRAE0UOMyB8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.55], [5.0, 7.25], [8.0, 8.77], [9.0, 10.29], [12.0, 12.7], [14.0, 14.91], [21.0, 21.76], [23.0, 25.51], [26.0, 28.61], [32.0, 34.86], [37.0, 38.45], [39.0, 41.15], [42.0, 49.5], [50.0, 51.66], [54.0, 54.36], [58.0, 59.63], [60.0, 61.38], [62.0, 62.48], [64.0, 66.29], [69.0, 69.55], [75.0, 75.56], [80.0, 80.62], [81.0, 81.75], [82.0, 83.71], [92.0, 93.31], [94.0, 95.15], [97.0, 100.09], [102.0, 105.87], [107.0, 108.35], [109.0, 112.63], [114.0, 118.34], [120.0, 121.24], [123.0, 126.28], [128.0, 128.28]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, true, true, false, true, false], "silence_prob": [85.54, 94.52, 0.0, 0.0, 0.0, 0.0, 0.0, 98.01, 37.99, 96.04, 0.0, 98.44, 79.41, 0.0, 0.0, 0.0, 0.0, 0.0, 60.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.18, 32.25, 0.0, 36.09, 37.84, 0.0, 37.81, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 34.39], ["didgeridoo", 13.39], ["speech", 6.15]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 35.53], ["fly, housefly", 8.4], ["synthesizer", 7.37]], [["music", 39.82], ["musical instrument", 8.31], ["guitar", 7.3]], null, [["music", 56.37], ["effects unit", 5.55], ["musical instrument", 5.25]], [["music", 42.97], ["theremin", 11.6], ["effects unit", 5.93]], null, [["music", 47.48], ["theremin", 9.49], ["speech", 4.86]], null], "duration": [3.55, 2.25, 0.77, 1.29, 0.7, 0.91, 0.76, 2.51, 2.61, 2.86, 1.45, 2.15, 7.5, 1.66, 0.36, 1.63, 1.38, 0.48, 2.29, 0.55, 0.56, 0.62, 0.75, 1.71, 1.31, 1.15, 3.09, 3.87, 1.35, 3.63, 4.34, 1.24, 3.28, 0.28]} \ No newline at end of file diff --git a/annotations_filtered/qRAQivSrtm0_filtered.json b/annotations_filtered/qRAQivSrtm0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..daef7e5e6017a7007aff261cf96392490a56c906 --- /dev/null +++ b/annotations_filtered/qRAQivSrtm0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.82], [8.0, 8.99], [13.0, 14.0], [17.0, 17.15], [19.0, 21.76], [26.0, 26.52], [27.0, 28.68], [31.0, 32.17]], "keep_status": [false, false, false, false, true, false, false, false], "silence_prob": [34.41, 0.0, 0.0, 0.0, 43.96, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["fly, housefly", 42.62], ["insect", 38.24], ["speech", 6.87]], null, null, null, [["creak", 13.25], ["noise", 13.16], ["radio", 8.42]], null, null, null], "duration": [4.82, 0.99, 1.0, 0.15, 2.76, 0.52, 1.68, 1.17]} \ No newline at end of file diff --git a/annotations_filtered/qRGre50eHbQ_filtered.json b/annotations_filtered/qRGre50eHbQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..214740462d0abe1ff7fe5806366a383815bc1eb5 --- /dev/null +++ b/annotations_filtered/qRGre50eHbQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 124.88]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [121.88]} \ No newline at end of file diff --git a/annotations_filtered/qRQu4tZF1GA_filtered.json b/annotations_filtered/qRQu4tZF1GA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..edeb12bd3eca077282b89e2b84c90aad1a8db517 --- /dev/null +++ b/annotations_filtered/qRQu4tZF1GA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.82], [16.0, 16.68], [21.0, 21.29], [22.0, 28.19], [34.0, 34.65], [38.0, 38.4], [39.0, 53.81], [57.0, 59.85], [61.0, 63.26], [68.0, 74.7], [80.0, 90.19], [91.0, 91.49], [92.0, 95.54], [103.0, 116.78], [119.0, 119.52], [132.0, 134.69], [136.0, 136.49], [141.0, 141.51]], "keep_status": [false, false, false, true, false, false, false, true, true, true, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 43.2, 0.0, 0.0, 29.94, 30.26, 32.97, 36.61, 30.8, 0.0, 35.84, 29.26, 0.0, 52.68, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 45.13], ["speech", 15.77], ["didgeridoo", 7.15]], null, null, [["throbbing", 46.87], ["music", 35.96], ["hum", 9.43]], [["music", 49.37], ["hum", 10.05], ["throbbing", 8.36]], [["music", 33.75], ["hum", 12.38], ["speech", 6.36]], [["music", 42.61], ["throbbing", 14.26], ["speech", 9.93]], [["speech", 35.04], ["music", 29.04], ["outside, rural or natural", 3.78]], null, [["music", 41.31], ["speech", 27.48], ["throbbing", 6.26]], [["music", 45.17], ["throbbing", 8.03], ["hum", 5.73]], null, null, null, null], "duration": [-0.18, 0.68, 0.29, 6.19, 0.65, 0.4, 14.81, 2.85, 2.26, 6.7, 10.19, 0.49, 3.54, 13.78, 0.52, 2.69, 0.49, 0.51]} \ No newline at end of file diff --git a/annotations_filtered/qRahFLj59bc_filtered.json b/annotations_filtered/qRahFLj59bc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c8afd6d35ac882ee7cdc75aec43d99fcd62c7ca0 --- /dev/null +++ b/annotations_filtered/qRahFLj59bc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.98], [20.0, 20.65], [34.0, 34.11], [40.0, 40.29], [44.0, 45.18], [46.0, 48.19], [54.0, 54.11], [68.0, 68.2], [69.0, 69.96], [77.0, 85.51], [89.0, 89.18], [90.0, 91.3], [91.0, 91.34], [91.0, 91.37], [91.0, 91.4], [104.0, 104.57], [106.0, 106.66], [107.0, 118.1], [126.0, 126.17], [132.0, 132.31], [133.0, 134.06], [140.0, 140.1], [141.0, 141.66], [143.0, 144.1], [145.0, 146.15], [147.0, 147.48], [154.0, 157.4], [166.0, 166.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 37.88, 0.0, 0.0, 0.0, 93.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.64, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 63.15], ["radio", 14.74], ["music", 2.72]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 41.59], ["music", 19.76], ["whale vocalization", 10.76]], null, null, null, null, null, null, null, null, null, null], "duration": [0.98, 0.65, 0.11, 0.29, 1.18, 2.19, 0.11, 0.2, 0.96, 8.51, 0.18, 1.3, 0.34, 0.37, 0.4, 0.57, 0.66, 11.1, 0.17, 0.31, 1.06, 0.1, 0.66, 1.1, 1.15, 0.48, 3.4, 0.06]} \ No newline at end of file diff --git a/annotations_filtered/qRnjswr1swo_filtered.json b/annotations_filtered/qRnjswr1swo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..55c95e9e6d6aef7338910a1c832fb3279e3d4eca --- /dev/null +++ b/annotations_filtered/qRnjswr1swo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 10.3], [12.0, 14.15], [14.0, 14.35], [15.0, 14.96], [18.0, 19.87], [21.0, 31.9], [34.0, 35.29], [36.0, 36.56], [38.0, 40.05], [42.0, 44.78], [47.0, 47.92], [51.0, 52.61], [55.0, 58.8], [60.0, 62.41], [64.0, 64.98], [65.0, 83.42], [85.0, 85.43], [88.0, 90.29], [91.0, 98.42], [107.0, 107.96], [110.0, 111.48], [113.0, 114.45], [118.0, 118.54]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, true, true, false, false, false, true, false, false, false, false, false], "silence_prob": [59.15, 59.15, 0.0, 0.0, 0.0, 33.92, 0.0, 0.0, 39.43, 35.4, 0.0, 0.0, 46.68, 48.52, 0.0, 29.34, 0.0, 28.95, 29.31, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["crushing", 8.82], ["thunk", 6.66], ["mains hum", 6.36]], null, null, [["mains hum", 48.36], ["hum", 39.26], ["rumble", 1.74]], [["crushing", 65.12], ["hum", 7.28], ["mains hum", 4.68]], null, null, [["chirp tone", 25.97], ["sine wave", 20.43], ["coin (dropping)", 10.48]], [["fly, housefly", 14.96], ["squish", 11.33], ["hum", 6.02]], null, [["hum", 32.92], ["mains hum", 29.04], ["sidetone", 20.21]], null, [["music", 28.49], ["hum", 15.66], ["theremin", 8.56]], [["hum", 39.21], ["mains hum", 35.42], ["speech", 10.47]], null, null, null, null], "duration": [7.3, 2.15, 0.35, -0.04, 1.87, 10.9, 1.29, 0.56, 2.05, 2.78, 0.92, 1.61, 3.8, 2.41, 0.98, 18.42, 0.43, 2.29, 7.42, 0.96, 1.48, 1.45, 0.54]} \ No newline at end of file diff --git a/annotations_filtered/qS2Np6zxXm0_filtered.json b/annotations_filtered/qS2Np6zxXm0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d6d889b4c09f8d109df9b89443f47efe833e053 --- /dev/null +++ b/annotations_filtered/qS2Np6zxXm0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.25], [3.0, 5.44], [7.0, 7.32], [8.0, 8.58], [9.0, 10.45], [15.0, 16.11], [19.0, 24.36], [26.0, 28.65], [31.0, 33.47], [34.0, 37.29], [40.0, 64.03], [66.0, 69.75], [71.0, 72.84], [76.0, 78.83], [86.0, 86.54], [88.0, 88.16], [97.0, 99.39], [100.0, 101.39], [104.0, 106.68], [107.0, 111.05], [113.0, 123.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.71, 99.8, 82.43, 72.31, 81.89, 0.0, 97.73, 0.0, 0.0, 95.37, 0.0, 99.4, 95.23, 93.76], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.25, 2.44, 0.32, 0.58, 1.45, 1.11, 5.36, 2.65, 2.47, 3.29, 24.03, 3.75, 1.84, 2.83, 0.54, 0.16, 2.39, 1.39, 2.68, 4.05, 10.11]} \ No newline at end of file diff --git a/annotations_filtered/qSE4dF_Feng_filtered.json b/annotations_filtered/qSE4dF_Feng_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c8872eb7577a2843abd567053bf3e718229c7733 --- /dev/null +++ b/annotations_filtered/qSE4dF_Feng_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.02], [17.0, 17.09], [17.0, 18.64], [22.0, 23.77]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [0.02, 0.09, 1.64, 1.77]} \ No newline at end of file diff --git a/annotations_filtered/qSabiG8q8-k_filtered.json b/annotations_filtered/qSabiG8q8-k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..972ce0f7b4c54f0520e655c1eec6e49b9ea8d129 --- /dev/null +++ b/annotations_filtered/qSabiG8q8-k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 22.18], [23.0, 23.87], [24.0, 26.59], [30.0, 33.84], [37.0, 37.13], [38.0, 38.96], [46.0, 46.36], [57.0, 57.67], [79.0, 79.22], [82.0, 82.43], [86.0, 86.64], [90.0, 91.08], [96.0, 96.53], [102.0, 102.68], [106.0, 105.92], [114.0, 114.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [73.51, 0.0, 33.33, 30.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 64.87], ["livestock, farm animals, working animals", 6.28], ["music", 4.16]], [["music", 66.18], ["theremin", 6.53], ["trombone", 5.36]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.18, 0.87, 2.59, 3.84, 0.13, 0.96, 0.36, 0.67, 0.22, 0.43, 0.64, 1.08, 0.53, 0.68, -0.08, 0.34]} \ No newline at end of file diff --git a/annotations_filtered/qSbI8KRB74M_filtered.json b/annotations_filtered/qSbI8KRB74M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73465dbb2c801b1dee420b2512c8f6af5b2e5958 --- /dev/null +++ b/annotations_filtered/qSbI8KRB74M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 9.8], [12.0, 12.83], [16.0, 16.83], [18.0, 19.38], [22.0, 23.16], [25.0, 24.93], [29.0, 28.76], [34.0, 34.05], [35.0, 34.94], [35.0, 38.15], [40.0, 46.58], [47.0, 50.5], [51.0, 51.8], [52.0, 54.09], [55.0, 57.48], [58.0, 61.59], [65.0, 66.75], [68.0, 69.74], [71.0, 72.13], [72.0, 80.81], [82.0, 85.78], [87.0, 87.94], [89.0, 90.17], [95.0, 94.81], [97.0, 98.51], [100.0, 105.34], [106.0, 108.13], [109.0, 110.54], [111.0, 112.97], [118.0, 117.96], [119.0, 121.69], [124.0, 126.44]], "keep_status": [true, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [38.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.03, 59.07, 60.42, 0.0, 41.85, 79.24, 59.33, 0.0, 0.0, 0.0, 55.81, 53.16, 0.0, 0.0, 0.0, 0.0, 44.66, 74.44, 0.0, 0.0, 0.0, 37.84, 50.21], "audiomae_on_audioset": [[["hum", 34.04], ["music", 24.09], ["mains hum", 9.13]], null, null, null, null, null, null, null, null, [["speech", 38.62], ["sine wave", 13.33], ["chirp tone", 10.49]], null, null, null, [["burping, eructation", 10.05], ["hum", 8.22], ["ping", 6.45]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 31.88], ["hum", 17.78], ["chirp tone", 11.72]], null, null, null, null, [["speech", 36.13], ["hum", 19.61], ["mains hum", 17.26]], null], "duration": [4.8, 0.83, 0.83, 1.38, 1.16, -0.07, -0.24, 0.05, -0.06, 3.15, 6.58, 3.5, 0.8, 2.09, 2.48, 3.59, 1.75, 1.74, 1.13, 8.81, 3.78, 0.94, 1.17, -0.19, 1.51, 5.34, 2.13, 1.54, 1.97, -0.04, 2.69, 2.44]} \ No newline at end of file diff --git a/annotations_filtered/qSd4Q3GY7dc_filtered.json b/annotations_filtered/qSd4Q3GY7dc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bf7fd7d148bd2cb53a28bd4a5502e0f53e85c14d --- /dev/null +++ b/annotations_filtered/qSd4Q3GY7dc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.16], [8.0, 8.23], [11.0, 11.72], [13.0, 13.42], [18.0, 17.76], [20.0, 20.48], [20.0, 20.51], [21.0, 21.86], [32.0, 33.35], [34.0, 34.15], [42.0, 44.51], [51.0, 51.71], [54.0, 53.92], [59.0, 59.31], [62.0, 64.64], [77.0, 82.39], [87.0, 87.99], [90.0, 90.96], [93.0, 97.75], [115.0, 114.64], [116.0, 117.78], [122.0, 122.61], [138.0, 139.08], [144.0, 144.22], [145.0, 147.31], [148.0, 151.26], [164.0, 164.05], [166.0, 165.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.37, 0.0, 0.0, 0.0, 97.54, 99.59, 0.0, 0.0, 73.36, 0.0, 0.0, 0.0, 0.0, 0.0, 50.11, 64.29, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.16, 0.23, 0.72, 0.42, -0.24, 0.48, 0.51, 0.86, 1.35, 0.15, 2.51, 0.71, -0.08, 0.31, 2.64, 5.39, 0.99, 0.96, 4.75, -0.36, 1.78, 0.61, 1.08, 0.22, 2.31, 3.26, 0.05, -0.09]} \ No newline at end of file diff --git a/annotations_filtered/qSnUywWS9xs_filtered.json b/annotations_filtered/qSnUywWS9xs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..11bb5ed555cd041f1b64d73c44cd8148a26758cd --- /dev/null +++ b/annotations_filtered/qSnUywWS9xs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 22.5], [27.0, 51.58], [54.0, 54.73], [59.0, 70.83], [73.0, 87.44], [88.0, 87.94], [91.0, 92.47], [95.0, 99.5], [101.0, 107.69], [111.0, 111.87], [114.0, 114.61], [117.0, 117.39]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [32.47, 30.04, 0.0, 29.83, 30.51, 0.0, 0.0, 55.6, 57.32, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 58.29], ["vehicle", 13.7], ["music", 8.96]], [["music", 57.39], ["throbbing", 20.4], ["electronic music", 3.38]], null, [["speech", 56.66], ["vehicle", 18.86], ["car", 4.96]], [["music", 33.18], ["throbbing", 14.09], ["cattle, bovinae", 10.79]], null, null, null, null, null, null, null], "duration": [6.5, 24.58, 0.73, 11.83, 14.44, -0.06, 1.47, 4.5, 6.69, 0.87, 0.61, 0.39]} \ No newline at end of file diff --git a/annotations_filtered/qTIc6y5mojw_filtered.json b/annotations_filtered/qTIc6y5mojw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9422c33405774b39dab508aa1459910762da4a29 --- /dev/null +++ b/annotations_filtered/qTIc6y5mojw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.99], [14.0, 14.72], [15.0, 16.44], [18.0, 18.22], [19.0, 20.12], [25.0, 26.84], [28.0, 29.29], [30.0, 32.21], [33.0, 34.65], [35.0, 37.05], [38.0, 42.47], [43.0, 44.81], [46.0, 49.65], [50.0, 50.7], [53.0, 55.56], [57.0, 57.57], [58.0, 60.98], [62.0, 63.85], [66.0, 66.02], [68.0, 69.85], [74.0, 73.94], [76.0, 76.98], [79.0, 79.66], [81.0, 81.04], [82.0, 82.24], [84.0, 84.42], [85.0, 85.01], [87.0, 87.18], [94.0, 94.31], [98.0, 99.15], [100.0, 100.62], [116.0, 118.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.71, 0.0, 100.0, 100.0, 0.0, 86.09, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.99, 0.72, 1.44, 0.22, 1.12, 1.84, 1.29, 2.21, 1.65, 2.05, 4.47, 1.81, 3.65, 0.7, 2.56, 0.57, 2.98, 1.85, 0.02, 1.85, -0.06, 0.98, 0.66, 0.04, 0.24, 0.42, 0.01, 0.18, 0.31, 1.15, 0.62, 2.23]} \ No newline at end of file diff --git a/annotations_filtered/qTUcFhCim_A_filtered.json b/annotations_filtered/qTUcFhCim_A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e7c61e02d55774d97e3f201ce79a9d4c9fb5c774 --- /dev/null +++ b/annotations_filtered/qTUcFhCim_A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.9], [8.0, 9.61], [13.0, 13.31], [14.0, 14.96], [16.0, 16.01], [17.0, 18.6], [20.0, 19.87], [22.0, 22.89], [32.0, 33.39], [35.0, 35.23], [36.0, 36.64], [38.0, 38.62], [41.0, 42.21], [43.0, 43.93], [49.0, 49.69], [59.0, 59.95], [63.0, 64.66], [66.0, 67.04], [68.0, 68.07], [69.0, 70.04], [72.0, 73.53], [80.0, 79.78], [85.0, 88.84], [93.0, 92.99], [96.0, 98.1], [103.0, 105.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.52, 0.0, 63.74, 58.13], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 14.4], ["cattle, bovinae", 8.1], ["moo", 6.88]], null, null, null], "duration": [0.9, 1.61, 0.31, 0.96, 0.01, 1.6, -0.13, 0.89, 1.39, 0.23, 0.64, 0.62, 1.21, 0.93, 0.69, 0.95, 1.66, 1.04, 0.07, 1.04, 1.53, -0.22, 3.84, -0.01, 2.1, 2.09]} \ No newline at end of file diff --git a/annotations_filtered/qTa5iKsbAno_filtered.json b/annotations_filtered/qTa5iKsbAno_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..31ed0766a809beec1c60f48ce6c11a07010d515c --- /dev/null +++ b/annotations_filtered/qTa5iKsbAno_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.53], [6.0, 7.43], [9.0, 11.43], [14.0, 18.74], [20.0, 23.65], [25.0, 25.69], [50.0, 51.17], [52.0, 52.83], [54.0, 55.22], [57.0, 57.21], [58.0, 58.65], [63.0, 64.08], [69.0, 70.43], [72.0, 73.25], [76.0, 77.82], [79.0, 80.16], [81.0, 82.04], [83.0, 84.5], [86.0, 87.4], [91.0, 91.29], [92.0, 92.64], [95.0, 95.37], [98.0, 99.33], [111.0, 111.38], [113.0, 113.95], [118.0, 118.05], [119.0, 119.94], [121.0, 121.98], [123.0, 124.7], [126.0, 126.6], [128.0, 128.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 91.81, 98.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.53, 1.43, 2.43, 4.74, 3.65, 0.69, 1.17, 0.83, 1.22, 0.21, 0.65, 1.08, 1.43, 1.25, 1.82, 1.16, 1.04, 1.5, 1.4, 0.29, 0.64, 0.37, 1.33, 0.38, 0.95, 0.05, 0.94, 0.98, 1.7, 0.6, 0.78]} \ No newline at end of file diff --git a/annotations_filtered/qTey0qxMboA_filtered.json b/annotations_filtered/qTey0qxMboA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8bac3ba45ec362d58e7dd47e888fcd99eafe5fa2 --- /dev/null +++ b/annotations_filtered/qTey0qxMboA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[109.0, 134.32]], "keep_status": [true], "silence_prob": [33.69], "audiomae_on_audioset": [[["speech", 33.31], ["music", 18.75], ["sonar", 9.54]]], "duration": [25.32]} \ No newline at end of file diff --git a/annotations_filtered/qTj4aSPwTBk_filtered.json b/annotations_filtered/qTj4aSPwTBk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..329be6f1d4680ae41cdedaad63b4484d85ab4089 --- /dev/null +++ b/annotations_filtered/qTj4aSPwTBk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 75.74], [76.0, 79.49], [80.0, 81.09], [87.0, 126.28], [130.0, 130.79], [138.0, 149.22], [152.0, 157.37], [164.0, 164.61]], "keep_status": [false, true, false, false, false, false, false, false], "silence_prob": [0.0, 40.97, 0.0, 0.0, 0.0, 42.08, 36.74, 0.0], "audiomae_on_audioset": [null, [["music", 23.56], ["speech", 19.7], ["fly, housefly", 6.83]], null, null, null, [["music", 54.55], ["speech", 22.19], ["sidetone", 5.29]], [["speech", 33.72], ["music", 26.18], ["boing", 22.63]], null], "duration": [40.74, 3.49, 1.09, 39.28, 0.79, 11.22, 5.37, 0.61]} \ No newline at end of file diff --git a/annotations_filtered/qTpB6q-YJwM_filtered.json b/annotations_filtered/qTpB6q-YJwM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43299907a420e6128a3209e3652f8be3d8abc6e6 --- /dev/null +++ b/annotations_filtered/qTpB6q-YJwM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.02], [5.0, 5.26], [6.0, 7.21], [11.0, 12.39], [14.0, 16.36], [17.0, 17.42], [18.0, 18.35], [26.0, 26.99], [31.0, 36.69], [38.0, 38.72], [41.0, 43.02], [44.0, 46.45], [47.0, 53.08], [55.0, 56.03], [57.0, 57.25], [58.0, 59.73], [63.0, 63.49], [64.0, 64.98], [66.0, 66.31], [68.0, 70.51], [73.0, 73.7], [75.0, 76.11], [79.0, 85.16], [86.0, 86.32], [90.0, 90.21], [91.0, 92.47], [96.0, 97.7], [100.0, 100.21], [102.0, 102.61], [105.0, 106.1], [108.0, 121.63], [124.0, 125.74], [127.0, 128.21], [129.0, 129.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 66.39, 0.0, 0.0, 0.0, 32.8, 0.0, 33.33, 89.36, 80.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.67, 0.0, 0.0, 52.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.39, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 32.52], ["trombone", 29.79], ["brass instrument", 19.71]], null, [["foghorn", 26.35], ["music", 18.48], ["brass instrument", 13.66]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 59.96], ["theremin", 7.92], ["musical instrument", 5.32]], null, null, null], "duration": [0.02, 0.26, 1.21, 1.39, 2.36, 0.42, 0.35, 0.99, 5.69, 0.72, 2.02, 2.45, 6.08, 1.03, 0.25, 1.73, 0.49, 0.98, 0.31, 2.51, 0.7, 1.11, 6.16, 0.32, 0.21, 1.47, 1.7, 0.21, 0.61, 1.1, 13.63, 1.74, 1.21, 0.46]} \ No newline at end of file diff --git a/annotations_filtered/qTwXudZTWQA_filtered.json b/annotations_filtered/qTwXudZTWQA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f59857324afebf97add27eb034e25862419424d5 --- /dev/null +++ b/annotations_filtered/qTwXudZTWQA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.96], [14.0, 15.45], [16.0, 17.24], [19.0, 20.58], [23.0, 30.91], [31.0, 33.25], [37.0, 37.62], [40.0, 42.67], [44.0, 47.29], [48.0, 58.21], [60.0, 61.67], [78.0, 79.74], [81.0, 86.75], [87.0, 88.01], [99.0, 100.4], [102.0, 102.1], [102.0, 106.51], [107.0, 108.11], [109.0, 116.34], [117.0, 118.12], [121.0, 122.37], [126.0, 127.38]], "keep_status": [true, false, false, false, false, true, false, false, true, false, false, false, true, false, false, false, false, false, true, false, false, false], "silence_prob": [32.98, 0.0, 0.0, 0.0, 37.47, 31.28, 0.0, 85.72, 35.35, 54.43, 0.0, 0.0, 42.28, 0.0, 0.0, 0.0, 55.04, 0.0, 41.76, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 29.89], ["ding", 12.48], ["music", 11.87]], null, null, null, [["speech", 32.19], ["music", 32.12], ["sidetone", 6.91]], [["mains hum", 31.2], ["speech", 17.46], ["hum", 15.23]], null, null, [["didgeridoo", 38.42], ["cattle, bovinae", 10.69], ["music", 9.01]], null, null, null, [["music", 36.42], ["livestock, farm animals, working animals", 15.23], ["cattle, bovinae", 9.02]], null, null, null, null, null, [["grunt", 18.37], ["speech", 15.34], ["frog", 13.0]], null, null, null], "duration": [3.96, 1.45, 1.24, 1.58, 7.91, 2.25, 0.62, 2.67, 3.29, 10.21, 1.67, 1.74, 5.75, 1.01, 1.4, 0.1, 4.51, 1.11, 7.34, 1.12, 1.37, 1.38]} \ No newline at end of file diff --git a/annotations_filtered/qU0H2mmgsjM_filtered.json b/annotations_filtered/qU0H2mmgsjM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2d7d3361065136be53059297712b2ddb1a67f770 --- /dev/null +++ b/annotations_filtered/qU0H2mmgsjM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.2], [14.0, 14.0], [16.0, 16.83], [17.0, 18.12], [20.0, 21.07], [23.0, 23.28], [25.0, 25.76], [29.0, 29.78], [31.0, 41.05], [48.0, 48.2], [51.0, 53.64], [55.0, 56.02], [58.0, 58.56], [60.0, 61.92], [62.0, 63.41], [65.0, 65.33], [69.0, 69.69], [71.0, 71.27], [73.0, 72.77], [74.0, 74.14], [75.0, 77.52], [86.0, 90.75], [92.0, 93.73], [95.0, 95.05], [97.0, 97.01], [98.0, 97.93], [99.0, 99.22], [101.0, 102.25], [103.0, 103.79], [112.0, 112.23], [113.0, 113.88], [115.0, 117.21], [124.0, 124.23]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.33, 0.0, 58.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.6, 37.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.01, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["telephone bell ringing", 10.73], ["noise", 6.5], ["telephone", 6.41]], null, null, null, null, null, null, null, null, null, null, null, [["music", 29.22], ["effects unit", 15.87], ["musical instrument", 5.68]], [["sidetone", 31.59], ["speech", 18.01], ["radio", 11.72]], null, null, null, null, null, null, null, null, null, [["civil defense siren", 37.75], ["speech", 25.08], ["siren", 21.57]], null], "duration": [0.2, 0.0, 0.83, 1.12, 1.07, 0.28, 0.76, 0.78, 10.05, 0.2, 2.64, 1.02, 0.56, 1.92, 1.41, 0.33, 0.69, 0.27, -0.23, 0.14, 2.52, 4.75, 1.73, 0.05, 0.01, -0.07, 0.22, 1.25, 0.79, 0.23, 0.88, 2.21, 0.23]} \ No newline at end of file diff --git a/annotations_filtered/qU0Y6zo68t4_filtered.json b/annotations_filtered/qU0Y6zo68t4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..81794e0a9bca15c545763227153c472d5c594213 --- /dev/null +++ b/annotations_filtered/qU0Y6zo68t4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 20.83], [22.0, 56.2], [57.0, 58.16], [58.0, 64.0], [64.0, 64.44], [64.0, 66.5], [72.0, 75.3], [76.0, 76.47], [77.0, 78.98], [81.0, 81.84], [83.0, 97.19], [102.0, 102.61], [103.0, 104.09], [104.0, 106.93], [111.0, 112.5], [113.0, 114.02], [115.0, 116.43], [117.0, 118.05], [120.0, 125.61], [126.0, 126.98], [128.0, 134.22], [144.0, 147.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [58.89, 0.0, 0.0, 62.89, 0.0, 77.7, 96.54, 0.0, 0.0, 0.0, 35.3, 0.0, 0.0, 89.01, 0.0, 0.0, 0.0, 0.0, 98.86, 0.0, 94.95, 99.95], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 46.24], ["cattle, bovinae", 27.26], ["moo", 15.66]], null, null, null, null, null, null, null, null, null, null, null], "duration": [12.83, 34.2, 1.16, 6.0, 0.44, 2.5, 3.3, 0.47, 1.98, 0.84, 14.19, 0.61, 1.09, 2.93, 1.5, 1.02, 1.43, 1.05, 5.61, 0.98, 6.22, 3.72]} \ No newline at end of file diff --git a/annotations_filtered/qUDMInHr_wI_filtered.json b/annotations_filtered/qUDMInHr_wI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d52d9928efbe3c001cf5ec27b031346fee649bc --- /dev/null +++ b/annotations_filtered/qUDMInHr_wI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.21], [9.0, 11.64], [13.0, 14.62], [17.0, 19.01], [22.0, 23.43], [27.0, 27.35], [31.0, 31.87], [34.0, 34.6], [36.0, 38.31], [39.0, 40.27], [43.0, 44.44], [48.0, 49.62], [52.0, 52.79], [54.0, 55.31], [57.0, 58.68], [60.0, 61.94], [63.0, 64.37], [68.0, 70.09], [72.0, 73.5], [78.0, 78.02], [85.0, 85.33], [88.0, 88.35], [97.0, 97.85], [100.0, 103.49], [105.0, 106.78], [111.0, 112.09], [117.0, 117.46], [119.0, 119.62], [120.0, 123.99], [127.0, 128.04], [129.0, 128.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 94.81, 0.0, 69.07, 0.0, 0.0, 0.0, 0.0, 84.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.81, 0.0, 0.0, 0.0, 0.0, 0.0, 93.45, 0.0, 0.0, 0.0, 0.0, 54.17, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 30.1], ["speech", 28.26], ["sidetone", 4.17]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.21, 2.64, 1.62, 2.01, 1.43, 0.35, 0.87, 0.6, 2.31, 1.27, 1.44, 1.62, 0.79, 1.31, 1.68, 1.94, 1.37, 2.09, 1.5, 0.02, 0.33, 0.35, 0.85, 3.49, 1.78, 1.09, 0.46, 0.62, 3.99, 1.04, -0.07]} \ No newline at end of file diff --git a/annotations_filtered/qUKBDcMN7tg_filtered.json b/annotations_filtered/qUKBDcMN7tg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..07d7453a052ef8b96f9d31e4cfc63b747937dc39 --- /dev/null +++ b/annotations_filtered/qUKBDcMN7tg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.44], [3.0, 3.82], [4.0, 4.45], [6.0, 6.35], [25.0, 25.74], [26.0, 27.11], [29.0, 29.02], [39.0, 39.77], [44.0, 44.59], [45.0, 45.5], [49.0, 49.6], [53.0, 53.52], [63.0, 64.76], [71.0, 72.52], [76.0, 77.35], [79.0, 79.32], [80.0, 80.55], [83.0, 84.15], [96.0, 96.75], [103.0, 109.16], [114.0, 114.35], [115.0, 126.69], [128.0, 128.46], [129.0, 129.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.5, 0.0, 32.26, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 72.07], ["livestock, farm animals, working animals", 4.38], ["cattle, bovinae", 3.77]], null, [["music", 57.6], ["carnatic music", 10.64], ["tabla", 6.05]], null, null], "duration": [1.44, 0.82, 0.45, 0.35, 0.74, 1.11, 0.02, 0.77, 0.59, 0.5, 0.6, 0.52, 1.76, 1.52, 1.35, 0.32, 0.55, 1.15, 0.75, 6.16, 0.35, 11.69, 0.46, 0.3]} \ No newline at end of file diff --git a/annotations_filtered/qULQCbfqJm8_filtered.json b/annotations_filtered/qULQCbfqJm8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..08505f0292cf0bfc383813c3d059560b51409a36 --- /dev/null +++ b/annotations_filtered/qULQCbfqJm8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.92], [11.0, 12.24], [16.0, 17.15], [20.0, 24.17], [44.0, 45.59], [60.0, 61.1], [66.0, 65.97], [92.0, 93.55], [97.0, 97.66], [99.0, 100.53], [108.0, 112.51], [118.0, 118.45], [145.0, 148.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 39.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.23, 0.0, 37.26], "audiomae_on_audioset": [null, null, null, [["music", 76.29], ["musical instrument", 5.81], ["synthesizer", 5.4]], null, null, null, null, null, null, [["music", 68.37], ["synthesizer", 3.24], ["theremin", 2.97]], null, [["music", 65.62], ["speech", 6.51], ["flute", 2.75]]], "duration": [-0.08, 1.24, 1.15, 4.17, 1.59, 1.1, -0.03, 1.55, 0.66, 1.53, 4.51, 0.45, 3.42]} \ No newline at end of file diff --git a/annotations_filtered/qULlmr4lxb0_filtered.json b/annotations_filtered/qULlmr4lxb0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4d3f48f20ae69c840bccff7e5df841844287d984 --- /dev/null +++ b/annotations_filtered/qULlmr4lxb0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.69], [10.0, 13.31], [13.0, 13.59], [22.0, 23.01], [28.0, 28.51], [34.0, 36.93], [38.0, 37.79], [39.0, 40.22], [43.0, 43.55], [46.0, 48.24], [60.0, 60.89], [66.0, 66.29], [66.0, 67.64], [77.0, 80.91], [82.0, 85.45], [91.0, 94.64], [98.0, 97.82], [101.0, 100.99], [102.0, 109.65], [110.0, 110.59]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 38.03, 0.0, 0.0, 0.0, 39.31, 0.0, 0.0, 0.0, 34.7, 0.0, 0.0, 0.0, 30.81, 32.4, 33.72, 0.0, 0.0, 32.17, 0.0], "audiomae_on_audioset": [null, [["speech", 53.81], ["music", 19.98], ["sidetone", 12.63]], null, null, null, [["speech", 29.9], ["music", 26.22], ["television", 7.28]], null, null, null, [["speech", 30.51], ["music", 19.18], ["sidetone", 6.1]], null, null, null, [["speech", 56.69], ["music", 11.14], ["noise", 4.82]], [["speech", 71.34], ["mains hum", 5.69], ["music", 3.55]], [["speech", 34.07], ["music", 28.35], ["fart", 2.57]], null, null, [["hum", 35.79], ["mains hum", 21.36], ["throbbing", 16.81]], null], "duration": [0.69, 3.31, 0.59, 1.01, 0.51, 2.93, -0.21, 1.22, 0.55, 2.24, 0.89, 0.29, 1.64, 3.91, 3.45, 3.64, -0.18, -0.01, 7.65, 0.59]} \ No newline at end of file diff --git a/annotations_filtered/qUMSld6BwC0_filtered.json b/annotations_filtered/qUMSld6BwC0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..67b110c55c5e0aa1e96d4fd2ed78309267377372 --- /dev/null +++ b/annotations_filtered/qUMSld6BwC0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.17], [15.0, 17.0], [65.0, 64.93], [81.0, 81.03]], "keep_status": [true, false, false, false], "silence_prob": [41.36, 31.17, 0.0, 0.0], "audiomae_on_audioset": [[["throbbing", 10.99], ["hum", 10.34], ["fly, housefly", 6.83]], [["speech", 79.33], ["inside, small room", 1.85], ["chuckle, chortle", 1.73]], null, null], "duration": [3.17, 2.0, -0.07, 0.03]} \ No newline at end of file diff --git a/annotations_filtered/qUammhHxd1k_filtered.json b/annotations_filtered/qUammhHxd1k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e8b97fb81d721cbb8a7442ef05ecb1339ae8174 --- /dev/null +++ b/annotations_filtered/qUammhHxd1k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.14], [6.0, 9.69], [12.0, 12.43], [13.0, 13.68], [20.0, 19.82], [28.0, 30.4], [33.0, 33.54], [34.0, 34.89], [37.0, 37.66], [41.0, 45.79], [46.0, 48.63], [49.0, 50.53], [52.0, 63.91], [65.0, 64.94], [66.0, 71.02], [72.0, 82.65], [84.0, 88.5], [91.0, 94.83], [96.0, 126.89], [127.0, 126.98], [130.0, 203.32], [210.0, 212.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 44.99, 0.0, 0.0, 0.0, 86.27, 0.0, 0.0, 0.0, 83.34, 36.67, 0.0, 30.87, 0.0, 30.21, 29.79, 30.0, 30.47, 0.0, 0.0, 0.0, 30.7], "audiomae_on_audioset": [null, [["speech", 67.7], ["caw", 3.65], ["sine wave", 2.28]], null, null, null, null, null, null, null, null, [["music", 66.07], ["speech", 12.89], ["electronic music", 4.47]], null, [["music", 79.1], ["drum machine", 4.1], ["sampler", 3.81]], null, [["music", 71.58], ["sampler", 4.54], ["synthesizer", 3.31]], [["music", 82.37], ["sampler", 2.1], ["electronic music", 2.03]], [["music", 81.24], ["speech", 1.58], ["house music", 1.52]], [["music", 76.81], ["speech", 8.5], ["electronic music", 2.2]], null, null, null, [["music", 71.32], ["house music", 2.51], ["dance music", 1.94]]], "duration": [1.14, 3.69, 0.43, 0.68, -0.18, 2.4, 0.54, 0.89, 0.66, 4.79, 2.63, 1.53, 11.91, -0.06, 5.02, 10.65, 4.5, 3.83, 30.89, -0.02, 73.32, 2.53]} \ No newline at end of file diff --git a/annotations_filtered/qUiptlAJcyQ_filtered.json b/annotations_filtered/qUiptlAJcyQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e57f2224fd5047a1715c46f84b6374aebdd4321 --- /dev/null +++ b/annotations_filtered/qUiptlAJcyQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.81], [26.0, 26.97], [34.0, 34.59], [36.0, 36.04], [36.0, 36.9], [37.0, 37.69], [39.0, 39.07], [40.0, 41.49], [45.0, 45.84], [48.0, 48.07], [60.0, 61.42], [67.0, 69.38], [72.0, 74.71], [77.0, 123.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.71, 41.4, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 29.04], ["hum", 23.63], ["music", 13.34]], [["music", 23.58], ["theremin", 20.04], ["hum", 16.31]], null], "duration": [0.81, 0.97, 0.59, 0.04, 0.9, 0.69, 0.07, 1.49, 0.84, 0.07, 1.42, 2.38, 2.71, 46.36]} \ No newline at end of file diff --git a/annotations_filtered/qUqtwCfbjVw_filtered.json b/annotations_filtered/qUqtwCfbjVw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..36b0cad83fcc9e79e2e0a593e7a863282791a3a3 --- /dev/null +++ b/annotations_filtered/qUqtwCfbjVw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.81], [5.0, 6.78], [9.0, 8.95], [10.0, 14.52], [18.0, 17.95], [19.0, 20.07], [21.0, 25.71], [27.0, 28.49], [31.0, 31.77], [32.0, 32.66], [34.0, 34.13], [35.0, 35.43], [36.0, 36.71], [38.0, 38.3], [39.0, 42.96], [44.0, 44.04], [46.0, 47.55], [48.0, 48.49], [51.0, 52.54], [54.0, 54.4], [56.0, 56.91], [57.0, 58.23], [59.0, 59.73], [61.0, 61.1], [63.0, 64.79], [66.0, 66.78], [68.0, 69.58], [71.0, 71.69], [73.0, 75.83], [77.0, 78.53], [81.0, 82.81], [84.0, 90.22], [92.0, 92.55], [94.0, 103.74], [106.0, 107.43]], "keep_status": [false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 36.37, 0.0, 0.0, 48.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.05, 0.0, 0.0, 74.6, 0.0, 35.22, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 26.0], ["radio", 10.51], ["noise", 5.86]], null, null, [["mains hum", 10.1], ["busy signal", 7.41], ["sidetone", 7.38]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 72.7], ["sidetone", 9.54], ["radio", 7.88]], null], "duration": [1.81, 1.78, -0.05, 4.52, -0.05, 1.07, 4.71, 1.49, 0.77, 0.66, 0.13, 0.43, 0.71, 0.3, 3.96, 0.04, 1.55, 0.49, 1.54, 0.4, 0.91, 1.23, 0.73, 0.1, 1.79, 0.78, 1.58, 0.69, 2.83, 1.53, 1.81, 6.22, 0.55, 9.74, 1.43]} \ No newline at end of file diff --git a/annotations_filtered/qUu8VHynw40_filtered.json b/annotations_filtered/qUu8VHynw40_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7c22799eb5c6290d1c890cb3ffcdd556a82a49b5 --- /dev/null +++ b/annotations_filtered/qUu8VHynw40_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 10.61], [14.0, 14.91], [17.0, 19.63], [21.0, 21.14], [22.0, 23.04], [24.0, 25.34], [27.0, 28.27], [31.0, 32.39], [38.0, 40.88], [42.0, 42.72], [43.0, 44.69], [49.0, 51.98], [54.0, 56.34], [57.0, 57.33], [59.0, 58.72], [61.0, 62.51], [63.0, 63.48], [65.0, 70.24], [71.0, 73.25], [76.0, 80.16], [85.0, 85.89], [87.0, 87.27], [88.0, 88.72], [89.0, 90.53], [95.0, 95.17], [96.0, 97.7], [99.0, 99.57], [101.0, 100.68], [102.0, 102.17], [104.0, 104.23], [105.0, 105.51], [106.0, 108.23], [111.0, 111.13], [114.0, 114.54], [116.0, 116.33], [120.0, 121.41], [122.0, 123.15]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [31.58, 0.0, 36.95, 0.0, 0.0, 0.0, 0.0, 0.0, 34.98, 0.0, 0.0, 68.8, 55.96, 0.0, 0.0, 0.0, 0.0, 42.86, 84.25, 87.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.67, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 32.12], ["hum", 19.33], ["throbbing", 14.79]], null, [["hum", 24.45], ["music", 23.45], ["mains hum", 19.76]], null, null, null, null, null, [["music", 69.14], ["chink, clink", 6.33], ["brass instrument", 2.1]], null, null, null, null, null, null, null, null, [["speech", 57.5], ["music", 12.25], ["explosion", 6.7]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["bee, wasp, etc.", 21.54], ["speech", 17.29], ["insect", 15.46]], null, null, null, null, null], "duration": [5.61, 0.91, 2.63, 0.14, 1.04, 1.34, 1.27, 1.39, 2.88, 0.72, 1.69, 2.98, 2.34, 0.33, -0.28, 1.51, 0.48, 5.24, 2.25, 4.16, 0.89, 0.27, 0.72, 1.53, 0.17, 1.7, 0.57, -0.32, 0.17, 0.23, 0.51, 2.23, 0.13, 0.54, 0.33, 1.41, 1.15]} \ No newline at end of file diff --git a/annotations_filtered/qVDMu-erGtc_filtered.json b/annotations_filtered/qVDMu-erGtc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea346063ed788fa97ae868569ea13cdd8c1ba683 --- /dev/null +++ b/annotations_filtered/qVDMu-erGtc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 29.0], [32.0, 32.12], [38.0, 38.5], [41.0, 41.72], [48.0, 48.22], [49.0, 58.56], [64.0, 75.51], [80.0, 88.6], [90.0, 90.37], [92.0, 94.05], [97.0, 132.56], [134.0, 166.83], [170.0, 177.5], [179.0, 179.98], [181.0, 181.58], [183.0, 183.71], [184.0, 188.15], [189.0, 194.09], [198.0, 199.45], [200.0, 210.19], [213.0, 223.91]], "keep_status": [false, false, false, false, false, true, true, true, false, true, false, false, false, false, false, false, true, true, false, false, true], "silence_prob": [35.44, 0.0, 0.0, 0.0, 0.0, 29.12, 29.14, 29.48, 0.0, 29.86, 0.0, 0.0, 29.27, 0.0, 0.0, 0.0, 31.87, 29.57, 0.0, 29.59, 30.36], "audiomae_on_audioset": [[["music", 45.3], ["throbbing", 30.1], ["hum", 11.46]], null, null, null, null, [["music", 41.49], ["throbbing", 15.92], ["hum", 7.01]], [["music", 36.49], ["hum", 17.07], ["mains hum", 9.86]], [["music", 22.69], ["speech", 20.29], ["hum", 12.17]], null, [["music", 43.07], ["hum", 8.68], ["electronic music", 7.68]], null, null, [["machine gun", 40.5], ["music", 30.31], ["gunshot, gunfire", 6.14]], null, null, null, [["speech", 38.18], ["music", 19.42], ["hum", 6.23]], [["music", 16.91], ["speech", 11.48], ["mains hum", 11.34]], null, [["throbbing", 31.54], ["music", 31.01], ["hum", 13.63]], [["music", 26.78], ["siren", 7.51], ["vehicle", 6.71]]], "duration": [8.0, 0.12, 0.5, 0.72, 0.22, 9.56, 11.51, 8.6, 0.37, 2.05, 35.56, 32.83, 7.5, 0.98, 0.58, 0.71, 4.15, 5.09, 1.45, 10.19, 10.91]} \ No newline at end of file diff --git a/annotations_filtered/qVNAGVSKEBQ_filtered.json b/annotations_filtered/qVNAGVSKEBQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bdd8d80de869e791a132512fb48cffac6c72bc51 --- /dev/null +++ b/annotations_filtered/qVNAGVSKEBQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 15.5], [22.0, 30.32], [31.0, 33.44], [37.0, 41.84], [42.0, 42.62], [53.0, 72.71], [74.0, 84.82], [88.0, 87.91], [91.0, 92.26], [93.0, 95.08], [97.0, 97.39], [103.0, 104.68], [106.0, 111.16], [114.0, 115.38]], "keep_status": [false, false, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.32, 32.92, 32.02, 33.32, 0.0, 31.39, 41.87, 0.0, 0.0, 100.0, 0.0, 0.0, 98.27, 0.0], "audiomae_on_audioset": [[["music", 67.5], ["musical instrument", 7.53], ["theremin", 3.84]], [["speech", 65.49], ["music", 11.82], ["didgeridoo", 2.49]], [["music", 26.61], ["throbbing", 23.32], ["speech", 7.45]], [["music", 17.92], ["fly, housefly", 15.19], ["mains hum", 12.72]], null, [["speech", 42.21], ["music", 26.04], ["eruption", 5.23]], [["hum", 43.01], ["mains hum", 20.06], ["speech", 9.21]], null, null, null, null, null, null, null], "duration": [5.5, 8.32, 2.44, 4.84, 0.62, 19.71, 10.82, -0.09, 1.26, 2.08, 0.39, 1.68, 5.16, 1.38]} \ No newline at end of file diff --git a/annotations_filtered/qVS1E2L7DYg_filtered.json b/annotations_filtered/qVS1E2L7DYg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..71859fd2bef4f4005a92174df4250de373cb3d07 --- /dev/null +++ b/annotations_filtered/qVS1E2L7DYg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[71.0, 83.94], [84.0, 84.03], [84.0, 111.91], [116.0, 135.92], [136.0, 136.44]], "keep_status": [true, false, false, false, false], "silence_prob": [35.59, 0.0, 35.97, 98.44, 0.0], "audiomae_on_audioset": [[["throbbing", 24.67], ["hum", 23.04], ["speech", 16.33]], null, [["music", 40.96], ["eruption", 18.36], ["explosion", 12.19]], null, null], "duration": [12.94, 0.03, 27.91, 19.92, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/qVhCNgct9JQ_filtered.json b/annotations_filtered/qVhCNgct9JQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e1e8c6727623e3acd972940662ae1d8230f0470 --- /dev/null +++ b/annotations_filtered/qVhCNgct9JQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.38], [13.0, 13.91], [20.0, 20.38], [22.0, 22.52], [25.0, 25.79], [27.0, 27.57], [29.0, 29.76], [33.0, 32.86], [34.0, 34.33], [35.0, 36.19], [37.0, 37.76], [39.0, 39.63], [41.0, 41.07], [43.0, 44.32], [48.0, 51.7], [55.0, 55.93], [56.0, 58.8], [62.0, 65.01], [66.0, 72.79], [78.0, 78.48], [80.0, 80.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false], "silence_prob": [100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.13, 0.0, 36.97, 31.83, 36.97, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 15.47], ["foghorn", 13.41], ["didgeridoo", 10.66]], [["synthesizer", 21.11], ["effects unit", 13.3], ["sound effect", 10.23]], [["speech", 32.3], ["cattle, bovinae", 16.37], ["moo", 9.82]], null, null], "duration": [2.38, 0.91, 0.38, 0.52, 0.79, 0.57, 0.76, -0.14, 0.33, 1.19, 0.76, 0.63, 0.07, 1.32, 3.7, 0.93, 2.8, 3.01, 6.79, 0.48, 0.6]} \ No newline at end of file diff --git a/annotations_filtered/qVwoeNk9554_filtered.json b/annotations_filtered/qVwoeNk9554_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4875367620941301066e3fda4d59c3f771ce7195 --- /dev/null +++ b/annotations_filtered/qVwoeNk9554_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.73], [26.0, 27.18], [54.0, 55.8], [57.0, 58.19], [63.0, 63.39], [65.0, 68.23], [88.0, 88.33], [92.0, 93.33], [97.0, 99.79]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 32.99, 0.0, 0.0, 88.1], "audiomae_on_audioset": [null, null, null, null, null, [["music", 53.68], ["effects unit", 16.51], ["guitar", 6.23]], null, null, null], "duration": [0.73, 1.18, 1.8, 1.19, 0.39, 3.23, 0.33, 1.33, 2.79]} \ No newline at end of file diff --git a/annotations_filtered/qWEaCJlKZXs_filtered.json b/annotations_filtered/qWEaCJlKZXs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f09d2ecdae4ce66fc7a4d5f7671cfad16bb1b524 --- /dev/null +++ b/annotations_filtered/qWEaCJlKZXs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.27], [10.0, 13.14], [17.0, 18.23], [24.0, 24.61], [31.0, 31.51], [35.0, 34.67], [38.0, 38.8], [40.0, 40.19], [43.0, 43.68], [44.0, 46.53], [51.0, 54.45], [56.0, 56.54], [61.0, 61.32], [64.0, 64.61], [67.0, 67.47], [70.0, 70.95], [73.0, 74.78], [77.0, 82.22], [85.0, 88.1], [91.0, 91.37], [94.0, 95.0], [99.0, 99.45], [103.0, 104.04], [107.0, 106.86], [109.0, 109.51], [112.0, 112.29], [114.0, 115.18], [116.0, 116.9], [117.0, 118.17], [124.0, 124.14], [131.0, 139.67], [148.0, 148.49], [150.0, 151.24]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [99.87, 30.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.2, 37.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.7, 33.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.44, 0.0, 0.0], "audiomae_on_audioset": [null, [["explosion", 27.14], ["fly, housefly", 15.63], ["gunshot, gunfire", 9.91]], null, null, null, null, null, null, null, [["music", 68.98], ["speech", 3.98], ["electronic music", 3.53]], [["music", 32.59], ["boing", 25.5], ["speech", 14.01]], null, null, null, null, null, null, [["music", 47.13], ["speech", 24.32], ["electronic music", 3.28]], [["music", 44.41], ["speech", 19.75], ["whack, thwack", 7.8]], null, null, null, null, null, null, null, null, null, null, null, [["music", 36.28], ["hum", 19.89], ["speech", 10.38]], null, null], "duration": [3.27, 3.14, 1.23, 0.61, 0.51, -0.33, 0.8, 0.19, 0.68, 2.53, 3.45, 0.54, 0.32, 0.61, 0.47, 0.95, 1.78, 5.22, 3.1, 0.37, 1.0, 0.45, 1.04, -0.14, 0.51, 0.29, 1.18, 0.9, 1.17, 0.14, 8.67, 0.49, 1.24]} \ No newline at end of file diff --git a/annotations_filtered/qWOQp-rJ0Vc_filtered.json b/annotations_filtered/qWOQp-rJ0Vc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea1117882bff8cbe3add4e8d18788ed6a84718ac --- /dev/null +++ b/annotations_filtered/qWOQp-rJ0Vc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.42], [5.0, 31.33], [32.0, 34.74], [35.0, 36.66], [37.0, 81.63], [82.0, 82.86], [84.0, 85.06], [87.0, 87.78], [91.0, 164.22], [165.0, 165.48], [166.0, 167.56], [169.0, 168.76]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 44.57, 42.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["fly, housefly", 19.96], ["speech", 12.15], ["insect", 11.82]], [["music", 36.22], ["speech", 19.02], ["didgeridoo", 3.27]], null, null, null, null, null, null, null, null, null], "duration": [1.42, 26.33, 2.74, 1.66, 44.63, 0.86, 1.06, 0.78, 73.22, 0.48, 1.56, -0.24]} \ No newline at end of file diff --git a/annotations_filtered/qWiGcXSaKUc_filtered.json b/annotations_filtered/qWiGcXSaKUc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0517a789bcea190c43348dc6445ed284d438d0eb --- /dev/null +++ b/annotations_filtered/qWiGcXSaKUc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.31], [7.0, 9.75], [11.0, 12.65], [14.0, 19.28], [22.0, 22.99], [26.0, 27.13], [29.0, 30.4], [32.0, 34.16], [39.0, 42.28], [44.0, 45.98], [47.0, 48.24], [50.0, 51.19], [55.0, 55.54], [61.0, 64.61], [67.0, 69.94], [70.0, 71.81], [73.0, 78.27], [80.0, 79.83], [87.0, 92.31], [98.0, 98.93], [118.0, 119.11], [128.0, 128.55], [137.0, 137.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [100.0, 100.0, 0.0, 97.73, 0.0, 0.0, 0.0, 99.44, 100.0, 0.0, 0.0, 0.0, 0.0, 99.98, 97.92, 0.0, 68.41, 0.0, 29.74, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 33.93], ["hum", 5.29], ["fly, housefly", 4.94]], null, null, null, null], "duration": [2.31, 2.75, 1.65, 5.28, 0.99, 1.13, 1.4, 2.16, 3.28, 1.98, 1.24, 1.19, 0.54, 3.61, 2.94, 1.81, 5.27, -0.17, 5.31, 0.93, 1.11, 0.55, 0.15]} \ No newline at end of file diff --git a/annotations_filtered/qWsC4YHbOlw_filtered.json b/annotations_filtered/qWsC4YHbOlw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f35a8020804c0417f0c8ee46dc763110bcd9e9af --- /dev/null +++ b/annotations_filtered/qWsC4YHbOlw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 16.14], [18.0, 26.91], [31.0, 31.11], [33.0, 32.95], [35.0, 35.41], [37.0, 37.42], [39.0, 38.91], [40.0, 58.77], [65.0, 65.87], [66.0, 66.36], [70.0, 70.48], [83.0, 85.65], [88.0, 95.08], [96.0, 98.15], [100.0, 100.67], [101.0, 101.22], [104.0, 104.23], [105.0, 106.69], [108.0, 108.06], [109.0, 110.25], [115.0, 116.4], [117.0, 117.63], [118.0, 120.45], [125.0, 125.78], [128.0, 129.41], [130.0, 132.54], [133.0, 133.39], [144.0, 145.22], [150.0, 151.21], [152.0, 152.44], [153.0, 155.36], [156.0, 155.83], [163.0, 164.1], [168.0, 169.57], [171.0, 176.93], [185.0, 185.85]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [61.18, 42.76, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 99.96, 93.29, 99.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.1, 0.0, 0.0, 99.05, 0.0, 0.0, 0.0, 0.0, 98.59, 0.0, 0.0, 0.0, 97.11, 0.0], "audiomae_on_audioset": [null, [["emergency vehicle", 26.06], ["siren", 19.63], ["police car (siren)", 14.48]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.14, 8.91, 0.11, -0.05, 0.41, 0.42, -0.09, 18.77, 0.87, 0.36, 0.48, 2.65, 7.08, 2.15, 0.67, 0.22, 0.23, 1.69, 0.06, 1.25, 1.4, 0.63, 2.45, 0.78, 1.41, 2.54, 0.39, 1.22, 1.21, 0.44, 2.36, -0.17, 1.1, 1.57, 5.93, 0.85]} \ No newline at end of file diff --git a/annotations_filtered/qXKeIDlP-ys_filtered.json b/annotations_filtered/qXKeIDlP-ys_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1f5b18ba1b8b4f9bce5c0cc784d66e316a77455 --- /dev/null +++ b/annotations_filtered/qXKeIDlP-ys_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 20.56], [22.0, 22.01], [22.0, 29.71], [31.0, 36.12], [37.0, 36.95], [37.0, 50.6], [52.0, 58.95], [64.0, 67.47], [69.0, 70.23], [72.0, 72.72], [73.0, 75.78], [78.0, 78.98], [80.0, 80.28], [81.0, 94.74], [97.0, 97.88], [100.0, 103.65], [105.0, 105.58], [107.0, 108.85], [109.0, 110.67], [111.0, 161.52]], "keep_status": [true, false, false, true, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.94, 0.0, 43.66, 34.95, 0.0, 43.15, 41.95, 39.44, 0.0, 0.0, 56.93, 0.0, 0.0, 33.5, 0.0, 53.04, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 51.5], ["groan", 10.58], ["throbbing", 5.04]], null, [["didgeridoo", 38.53], ["music", 30.16], ["fart", 9.64]], [["music", 22.67], ["fly, housefly", 13.05], ["throbbing", 10.5]], null, [["music", 59.07], ["throbbing", 12.65], ["hum", 7.24]], [["mosquito", 37.99], ["fly, housefly", 19.93], ["insect", 5.68]], [["whale vocalization", 42.91], ["music", 10.65], ["mosquito", 9.61]], null, null, null, null, null, [["hum", 43.84], ["throbbing", 25.21], ["music", 13.15]], null, null, null, null, null, null], "duration": [15.56, 0.01, 7.71, 5.12, -0.05, 13.6, 6.95, 3.47, 1.23, 0.72, 2.78, 0.98, 0.28, 13.74, 0.88, 3.65, 0.58, 1.85, 1.67, 50.52]} \ No newline at end of file diff --git a/annotations_filtered/qXL3aXIGIKc_filtered.json b/annotations_filtered/qXL3aXIGIKc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3231da35501da4f9482e6933c531300c0ed3111 --- /dev/null +++ b/annotations_filtered/qXL3aXIGIKc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 34.38], [35.0, 35.28], [35.0, 45.77], [46.0, 49.96]], "keep_status": [true, false, true, false], "silence_prob": [30.35, 0.0, 47.16, 62.89], "audiomae_on_audioset": [[["music", 30.38], ["fireworks", 29.18], ["speech", 8.18]], null, [["music", 53.35], ["theremin", 6.08], ["hum", 5.99]], null], "duration": [2.38, 0.28, 10.77, 3.96]} \ No newline at end of file diff --git a/annotations_filtered/qXTTXNZucIU_filtered.json b/annotations_filtered/qXTTXNZucIU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f8b97a14b81c02721c32129c4d2645844254be0 --- /dev/null +++ b/annotations_filtered/qXTTXNZucIU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.14], [9.0, 32.46], [33.0, 33.2], [34.0, 37.98], [38.0, 40.02], [41.0, 43.83], [46.0, 46.75], [49.0, 50.16], [51.0, 52.54], [56.0, 58.02], [62.0, 71.47], [77.0, 99.22], [105.0, 106.27], [107.0, 107.03], [109.0, 110.91], [111.0, 113.48], [123.0, 124.5], [128.0, 129.36], [131.0, 131.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false], "silence_prob": [93.13, 72.75, 0.0, 40.66, 59.15, 79.94, 0.0, 0.0, 0.0, 65.91, 40.5, 40.97, 0.0, 0.0, 0.0, 41.48, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["sidetone", 89.26], ["whale vocalization", 4.81], ["noise", 1.18]], null, null, null, null, null, null, [["speech", 57.41], ["explosion", 6.35], ["sidetone", 4.97]], [["speech", 90.84], ["whack, thwack", 0.9], ["male speech, man speaking", 0.53]], null, null, null, [["speech", 39.42], ["whip", 19.81], ["sidetone", 4.85]], null, null, null], "duration": [2.14, 23.46, 0.2, 3.98, 2.02, 2.83, 0.75, 1.16, 1.54, 2.02, 9.47, 22.22, 1.27, 0.03, 1.91, 2.48, 1.5, 1.36, 0.46]} \ No newline at end of file diff --git a/annotations_filtered/qY7EPDCU5hc_filtered.json b/annotations_filtered/qY7EPDCU5hc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7c2be1e4cf562af6913bbfc72225d083c6f01424 --- /dev/null +++ b/annotations_filtered/qY7EPDCU5hc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.49], [11.0, 12.78], [16.0, 19.33], [24.0, 24.33], [28.0, 36.29], [42.0, 42.74], [58.0, 60.12], [66.0, 66.23], [71.0, 70.98], [83.0, 85.43], [89.0, 89.63], [97.0, 97.17], [98.0, 98.83], [100.0, 103.87], [107.0, 125.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 45.33, 0.0, 31.57, 0.0, 70.86, 0.0, 0.0, 57.97, 0.0, 0.0, 0.0, 67.63, 30.52], "audiomae_on_audioset": [null, null, [["hum", 37.47], ["throbbing", 23.05], ["heart sounds, heartbeat", 9.7]], null, [["music", 30.42], ["mains hum", 25.72], ["hum", 19.73]], null, null, null, null, null, null, null, null, null, [["music", 78.28], ["didgeridoo", 4.1], ["musical instrument", 3.04]]], "duration": [0.49, 1.78, 3.33, 0.33, 8.29, 0.74, 2.12, 0.23, -0.02, 2.43, 0.63, 0.17, 0.83, 3.87, 18.31]} \ No newline at end of file diff --git a/annotations_filtered/qYCEXS6Ws_c_filtered.json b/annotations_filtered/qYCEXS6Ws_c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..988681a5f4a9ffc6006bebc5e773c7df73697c36 --- /dev/null +++ b/annotations_filtered/qYCEXS6Ws_c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.52], [17.0, 21.71], [23.0, 32.68], [34.0, 34.77], [36.0, 36.91], [38.0, 54.41], [55.0, 55.75], [57.0, 59.75], [68.0, 70.23], [82.0, 83.84], [86.0, 97.44], [99.0, 101.38], [105.0, 105.83], [114.0, 122.64], [123.0, 124.41], [125.0, 126.1], [126.0, 132.73], [134.0, 135.84], [137.0, 137.56], [142.0, 142.23], [154.0, 154.21], [158.0, 160.05], [161.0, 172.86]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 31.57, 35.14, 0.0, 0.0, 33.87, 0.0, 66.51, 61.97, 0.0, 38.02, 46.97, 0.0, 59.51, 0.0, 0.0, 32.76, 0.0, 0.0, 0.0, 0.0, 99.94, 35.99], "audiomae_on_audioset": [null, [["hum", 9.9], ["music", 9.87], ["speech", 8.16]], [["music", 86.83], ["musical instrument", 2.4], ["guitar", 1.86]], null, null, [["music", 83.58], ["musical instrument", 2.3], ["synthesizer", 2.26]], null, null, null, null, [["music", 74.69], ["electric shaver, electric razor", 8.56], ["buzz", 3.35]], [["animal", 11.53], ["livestock, farm animals, working animals", 10.74], ["speech", 9.39]], null, null, null, null, [["music", 49.14], ["theremin", 31.55], ["foghorn", 4.01]], null, null, null, null, null, [["speech", 14.84], ["crowd", 10.73], ["music", 9.61]]], "duration": [1.52, 4.71, 9.68, 0.77, 0.91, 16.41, 0.75, 2.75, 2.23, 1.84, 11.44, 2.38, 0.83, 8.64, 1.41, 1.1, 6.73, 1.84, 0.56, 0.23, 0.21, 2.05, 11.86]} \ No newline at end of file diff --git a/annotations_filtered/qYEOmZzqX28_filtered.json b/annotations_filtered/qYEOmZzqX28_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..81906d6c6a4808fc9a874c0a109211c3b8bee947 --- /dev/null +++ b/annotations_filtered/qYEOmZzqX28_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.24], [10.0, 11.15], [15.0, 20.44], [21.0, 24.68], [29.0, 30.3], [35.0, 36.05], [54.0, 59.61], [70.0, 70.23], [105.0, 106.0], [106.0, 107.38], [136.0, 137.02], [156.0, 157.72], [161.0, 163.32], [164.0, 177.3], [178.0, 180.79], [182.0, 185.52], [188.0, 188.59], [190.0, 190.58], [196.0, 196.77], [202.0, 211.33]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 33.15, 33.24, 0.0, 0.0, 32.77, 0.0, 0.0, 0.0, 0.0, 0.0, 93.6, 30.87, 34.89, 36.78, 0.0, 0.0, 0.0, 30.63], "audiomae_on_audioset": [null, null, [["music", 62.25], ["speech", 18.6], ["sidetone", 3.3]], [["music", 48.8], ["hum", 9.63], ["speech", 5.15]], null, null, [["whack, thwack", 63.49], ["speech", 8.65], ["rumble", 3.78]], null, null, null, null, null, null, [["throbbing", 19.71], ["hum", 16.93], ["music", 14.94]], [["throbbing", 34.82], ["hum", 22.21], ["music", 17.47]], [["music", 30.61], ["hum", 23.52], ["mains hum", 8.81]], null, null, null, [["music", 36.22], ["speech", 24.2], ["buzz", 3.25]]], "duration": [1.24, 1.15, 5.44, 3.68, 1.3, 1.05, 5.61, 0.23, 1.0, 1.38, 1.02, 1.72, 2.32, 13.3, 2.79, 3.52, 0.59, 0.58, 0.77, 9.33]} \ No newline at end of file diff --git a/annotations_filtered/qYEceRHS8jM_filtered.json b/annotations_filtered/qYEceRHS8jM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e5b169ca0793e071d821b6e0d2838a6e3029254e --- /dev/null +++ b/annotations_filtered/qYEceRHS8jM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.51], [11.0, 11.06], [14.0, 14.27], [15.0, 24.24], [26.0, 26.77], [27.0, 28.24], [30.0, 30.59], [32.0, 34.59], [36.0, 38.97], [41.0, 42.3], [43.0, 54.75], [56.0, 58.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.91, 0.0, 0.0, 0.0, 99.99, 80.46, 0.0, 99.21, 99.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.51, 0.06, 0.27, 9.24, 0.77, 1.24, 0.59, 2.59, 2.97, 1.3, 11.75, 2.4]} \ No newline at end of file diff --git a/annotations_filtered/qYXoNC_LbcI_filtered.json b/annotations_filtered/qYXoNC_LbcI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..012d7e04a0128414624687256604b7d088418f9d --- /dev/null +++ b/annotations_filtered/qYXoNC_LbcI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.56], [7.0, 8.83], [12.0, 13.63], [14.0, 26.6], [29.0, 30.64], [31.0, 38.67], [41.0, 42.58], [43.0, 51.56], [53.0, 77.79], [81.0, 81.89], [87.0, 91.18], [92.0, 94.15], [95.0, 95.79], [96.0, 99.6], [100.0, 103.82], [106.0, 107.55], [110.0, 115.06], [117.0, 118.52], [119.0, 121.32], [122.0, 123.33], [125.0, 126.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, false, false, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 35.57, 0.0, 51.5, 0.0, 40.36, 35.98, 0.0, 39.35, 34.86, 0.0, 39.58, 42.06, 0.0, 54.56, 0.0, 44.78, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 69.04], ["throbbing", 7.52], ["musical instrument", 5.37]], null, null, null, [["music", 42.41], ["speech", 16.89], ["didgeridoo", 11.03]], [["music", 51.31], ["throbbing", 19.92], ["hum", 14.79]], null, [["music", 30.2], ["throbbing", 23.81], ["hum", 5.2]], [["music", 58.67], ["pulse", 3.5], ["musical instrument", 3.15]], null, [["music", 62.14], ["guitar", 6.8], ["musical instrument", 6.4]], [["speech", 22.41], ["music", 19.43], ["mains hum", 11.8]], null, null, null, [["music", 37.3], ["speech", 11.54], ["hum", 8.59]], null, null], "duration": [1.56, 1.83, 1.63, 12.6, 1.64, 7.67, 1.58, 8.56, 24.79, 0.89, 4.18, 2.15, 0.79, 3.6, 3.82, 1.55, 5.06, 1.52, 2.32, 1.33, 1.27]} \ No newline at end of file diff --git a/annotations_filtered/qYZw_tL0j9U_filtered.json b/annotations_filtered/qYZw_tL0j9U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..faa4b77489c99c916e2436d63e66439c7200c88a --- /dev/null +++ b/annotations_filtered/qYZw_tL0j9U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.13], [12.0, 13.29], [27.0, 28.17], [30.0, 38.16], [42.0, 53.33], [61.0, 67.44], [73.0, 75.44], [84.0, 84.08], [85.0, 91.34], [96.0, 104.99], [108.0, 108.57], [113.0, 114.17], [114.0, 114.2], [114.0, 122.23], [123.0, 123.48], [127.0, 138.28], [139.0, 145.69], [158.0, 166.77], [168.0, 175.73]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 35.49, 34.49, 33.36, 33.06, 0.0, 33.74, 34.13, 0.0, 0.0, 0.0, 38.3, 0.0, 39.05, 34.13, 45.62, 68.8], "audiomae_on_audioset": [null, null, null, [["sidetone", 60.91], ["music", 12.27], ["speech", 10.14]], [["music", 54.49], ["speech", 17.8], ["electronic music", 5.52]], [["music", 68.22], ["speech", 9.58], ["electronic music", 5.24]], [["music", 67.35], ["speech", 12.63], ["electronic music", 2.98]], null, [["music", 52.58], ["sidetone", 9.76], ["synthesizer", 7.31]], [["music", 33.54], ["sidetone", 25.57], ["speech", 23.15]], null, null, null, [["music", 64.81], ["house music", 5.88], ["speech", 5.34]], null, [["music", 39.42], ["moo", 11.88], ["cattle, bovinae", 9.28]], [["music", 64.61], ["rattle (instrument)", 8.71], ["musical instrument", 7.85]], [["music", 57.15], ["drum machine", 8.28], ["synthesizer", 5.12]], null], "duration": [1.13, 1.29, 1.17, 8.16, 11.33, 6.44, 2.44, 0.08, 6.34, 8.99, 0.57, 1.17, 0.2, 8.23, 0.48, 11.28, 6.69, 8.77, 7.73]} \ No newline at end of file diff --git a/annotations_filtered/qYf35nBq8Oo_filtered.json b/annotations_filtered/qYf35nBq8Oo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eee327d52ff660e062cb3ca890c6922ae612704a --- /dev/null +++ b/annotations_filtered/qYf35nBq8Oo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.17], [5.0, 5.21], [5.0, 9.91], [12.0, 12.45], [17.0, 27.06], [27.0, 32.14], [72.0, 75.74], [77.0, 77.84], [81.0, 83.47], [86.0, 88.84], [90.0, 90.32], [91.0, 91.71], [94.0, 93.73], [96.0, 96.58], [97.0, 98.22], [99.0, 104.55], [105.0, 105.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 30.31, 0.0, 30.35, 30.21, 52.74, 0.0, 85.9, 35.65, 0.0, 0.0, 0.0, 0.0, 0.0, 81.89, 0.0], "audiomae_on_audioset": [null, null, [["music", 42.67], ["brass instrument", 21.72], ["trombone", 14.52]], null, [["brass instrument", 34.75], ["trombone", 27.63], ["music", 27.22]], [["brass instrument", 29.49], ["trombone", 27.13], ["music", 24.85]], null, null, null, [["speech", 53.01], ["sidetone", 24.94], ["radio", 9.19]], null, null, null, null, null, null, null], "duration": [0.17, 0.21, 4.91, 0.45, 10.06, 5.14, 3.74, 0.84, 2.47, 2.84, 0.32, 0.71, -0.27, 0.58, 1.22, 5.55, 0.66]} \ No newline at end of file diff --git a/annotations_filtered/qYgpnWoRbXg_filtered.json b/annotations_filtered/qYgpnWoRbXg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..125da7fa8a59ec33d9dc14e95ddd5ab4f627a3be --- /dev/null +++ b/annotations_filtered/qYgpnWoRbXg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.52], [3.0, 3.37], [6.0, 6.15], [14.0, 14.71], [16.0, 25.19], [26.0, 26.43], [31.0, 35.34], [35.0, 35.38], [36.0, 87.22], [90.0, 100.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 94.95, 0.0, 48.48, 0.0, 0.0, 37.58], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 73.74], ["telephone", 3.27], ["domestic animals, pets", 2.55]], null, null, [["music", 58.64], ["synthesizer", 11.23], ["mains hum", 4.29]]], "duration": [0.52, 0.37, 0.15, 0.71, 9.19, 0.43, 4.34, 0.38, 51.22, 10.43]} \ No newline at end of file diff --git a/annotations_filtered/qZBVXYYcCjQ_filtered.json b/annotations_filtered/qZBVXYYcCjQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a812ef4385e42116f52dab4a0cf3f4ba9ab200df --- /dev/null +++ b/annotations_filtered/qZBVXYYcCjQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.86], [20.0, 20.51], [29.0, 32.8], [34.0, 35.33], [39.0, 39.6], [44.0, 44.32], [50.0, 51.54], [53.0, 75.71], [76.0, 77.5], [78.0, 86.59], [89.0, 89.9], [92.0, 92.16], [95.0, 98.0], [100.0, 101.46], [102.0, 102.96], [104.0, 105.29], [109.0, 109.88], [114.0, 115.06]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 97.73, 0.0, 0.0, 0.0, 0.0, 33.31, 0.0, 62.07, 0.0, 0.0, 51.66, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 50.21], ["cattle, bovinae", 7.07], ["cowbell", 6.91]], null, null, null, null, null, null, null, null, null, null], "duration": [1.86, 0.51, 3.8, 1.33, 0.6, 0.32, 1.54, 22.71, 1.5, 8.59, 0.9, 0.16, 3.0, 1.46, 0.96, 1.29, 0.88, 1.06]} \ No newline at end of file diff --git a/annotations_filtered/qZIIx-X5Bbc_filtered.json b/annotations_filtered/qZIIx-X5Bbc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c4cd285e15f63c9900d825a6a2b9fb7a959ff999 --- /dev/null +++ b/annotations_filtered/qZIIx-X5Bbc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.81], [20.0, 20.07], [25.0, 26.01], [39.0, 39.56], [40.0, 40.88], [42.0, 42.87], [45.0, 45.66], [50.0, 51.61], [61.0, 62.9], [64.0, 64.17], [66.0, 66.26], [69.0, 69.47], [74.0, 74.04], [75.0, 76.03], [78.0, 81.01], [82.0, 82.85], [88.0, 89.33], [91.0, 91.2], [94.0, 94.56], [96.0, 96.8], [102.0, 103.0], [105.0, 105.46], [112.0, 113.83], [116.0, 116.5], [121.0, 122.0], [123.0, 124.66], [126.0, 127.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.81, 0.07, 1.01, 0.56, 0.88, 0.87, 0.66, 1.61, 1.9, 0.17, 0.26, 0.47, 0.04, 1.03, 3.01, 0.85, 1.33, 0.2, 0.56, 0.8, 1.0, 0.46, 1.83, 0.5, 1.0, 1.66, 1.75]} \ No newline at end of file diff --git a/annotations_filtered/qZRbStnLn3c_filtered.json b/annotations_filtered/qZRbStnLn3c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..285b3d56a3f49391cfeebac6c15e112f85c731e8 --- /dev/null +++ b/annotations_filtered/qZRbStnLn3c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.02], [12.0, 12.7], [20.0, 19.7], [27.0, 26.99], [29.0, 29.69], [33.0, 34.38], [35.0, 40.37], [44.0, 46.13], [49.0, 52.07], [56.0, 63.21], [72.0, 77.46], [83.0, 107.33], [123.0, 125.32], [129.0, 129.74], [143.0, 144.54], [146.0, 147.41], [148.0, 149.4]], "keep_status": [false, false, false, false, false, false, true, true, true, true, true, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.35, 48.27, 39.37, 38.23, 36.47, 37.75, 66.39, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 21.51], ["explosion", 8.74], ["whack, thwack", 8.28]], [["insect", 15.45], ["fly, housefly", 14.35], ["mosquito", 7.66]], [["speech", 60.59], ["music", 4.64], ["vehicle", 4.42]], [["speech", 36.45], ["hum", 11.46], ["throbbing", 11.02]], [["throbbing", 13.99], ["cacophony", 10.51], ["noise", 9.8]], [["speech", 33.93], ["vehicle", 5.81], ["buzz", 5.79]], null, null, null, null, null], "duration": [1.02, 0.7, -0.3, -0.01, 0.69, 1.38, 5.37, 2.13, 3.07, 7.21, 5.46, 24.33, 2.32, 0.74, 1.54, 1.41, 1.4]} \ No newline at end of file diff --git a/annotations_filtered/qZmteh2hT9A_filtered.json b/annotations_filtered/qZmteh2hT9A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae0b47d7a803a7e3797fa354fd2d77f7ace3f3e2 --- /dev/null +++ b/annotations_filtered/qZmteh2hT9A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 10.59], [11.0, 11.01], [11.0, 14.82], [16.0, 24.22], [28.0, 31.55], [36.0, 56.37], [70.0, 75.59], [83.0, 87.2], [89.0, 92.72]], "keep_status": [false, false, true, false, true, false, false, false, false], "silence_prob": [31.76, 0.0, 33.17, 32.34, 31.71, 33.01, 32.57, 33.18, 31.97], "audiomae_on_audioset": [[["music", 59.13], ["fly, housefly", 7.54], ["didgeridoo", 7.32]], null, [["music", 45.15], ["synthesizer", 8.64], ["theremin", 6.68]], [["music", 65.49], ["didgeridoo", 7.28], ["speech", 5.32]], [["music", 43.39], ["mosquito", 13.59], ["didgeridoo", 9.94]], [["music", 76.76], ["yodeling", 6.42], ["boing", 4.23]], [["music", 91.02], ["musical instrument", 1.83], ["theremin", 0.98]], [["music", 69.48], ["didgeridoo", 23.08], ["musical instrument", 1.3]], [["music", 73.68], ["didgeridoo", 8.22], ["musical instrument", 5.21]]], "duration": [5.59, 0.01, 3.82, 8.22, 3.55, 20.37, 5.59, 4.2, 3.72]} \ No newline at end of file diff --git a/annotations_filtered/qZubhGcnsHk_filtered.json b/annotations_filtered/qZubhGcnsHk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c1d8aedd3249c573d03da4dbf55fbcbc031790d --- /dev/null +++ b/annotations_filtered/qZubhGcnsHk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 29.79], [30.0, 30.79], [31.0, 40.54], [42.0, 44.74], [45.0, 45.84], [47.0, 54.75], [56.0, 60.34], [62.0, 68.13], [70.0, 83.24], [84.0, 84.62], [87.0, 97.65], [98.0, 120.5]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 48.1, 98.73, 0.0, 99.59, 88.46, 73.21, 94.22, 0.0, 94.37, 38.33], "audiomae_on_audioset": [null, null, [["music", 33.72], ["noise", 6.06], ["whack, thwack", 5.96]], null, null, null, null, null, null, null, null, [["music", 39.24], ["brass instrument", 13.22], ["speech", 12.47]]], "duration": [1.79, 0.79, 9.54, 2.74, 0.84, 7.75, 4.34, 6.13, 13.24, 0.62, 10.65, 22.5]} \ No newline at end of file diff --git a/annotations_filtered/q_215iQ7KDs_filtered.json b/annotations_filtered/q_215iQ7KDs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..12fc758f12b229ea7d1bef2b6ff4fd8d568997e1 --- /dev/null +++ b/annotations_filtered/q_215iQ7KDs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 24.27], [48.0, 48.51], [52.0, 120.6], [121.0, 124.01], [129.0, 145.86], [146.0, 147.18], [148.0, 154.3], [165.0, 169.37], [170.0, 170.68]], "keep_status": [false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 33.86, 31.35, 0.0, 33.38, 44.04, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 74.15], ["musical instrument", 3.17], ["guitar", 1.62]], [["music", 58.61], ["sidetone", 12.33], ["electronic music", 3.99]], null, [["speech", 26.9], ["cattle, bovinae", 16.43], ["livestock, farm animals, working animals", 12.66]], [["didgeridoo", 18.78], ["moo", 18.39], ["cattle, bovinae", 17.97]], null], "duration": [0.27, 0.51, 68.6, 3.01, 16.86, 1.18, 6.3, 4.37, 0.68]} \ No newline at end of file diff --git a/annotations_filtered/q_tMagfE-nM_filtered.json b/annotations_filtered/q_tMagfE-nM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b279448d707e1ed104eaaee0c6d2cf43df2c9489 --- /dev/null +++ b/annotations_filtered/q_tMagfE-nM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.23], [4.0, 4.58], [5.0, 6.22], [10.0, 12.23], [14.0, 15.28], [19.0, 24.98], [27.0, 28.07], [29.0, 30.87], [33.0, 35.28], [36.0, 39.14], [41.0, 41.99], [44.0, 44.88], [45.0, 49.0], [51.0, 52.93], [54.0, 56.32], [60.0, 62.18], [64.0, 64.67], [68.0, 71.47], [74.0, 74.7], [77.0, 80.03], [83.0, 85.26], [87.0, 88.25], [91.0, 96.47], [100.0, 102.49], [104.0, 105.76], [108.0, 111.05], [113.0, 117.31], [120.0, 122.37], [126.0, 130.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.84, 0.0, 99.1, 0.0, 0.0, 97.11, 99.94, 0.0, 0.0, 95.09, 0.0, 82.25, 99.85, 0.0, 99.99, 0.0, 99.99, 99.71, 0.0, 83.34, 99.98, 0.0, 99.68, 92.64, 100.0, 99.93], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.23, 0.58, 1.22, 2.23, 1.28, 5.98, 1.07, 1.87, 2.28, 3.14, 0.99, 0.88, 4.0, 1.93, 2.32, 2.18, 0.67, 3.47, 0.7, 3.03, 2.26, 1.25, 5.47, 2.49, 1.76, 3.05, 4.31, 2.37, 4.03]} \ No newline at end of file diff --git a/annotations_filtered/q_u6njqBaB8_filtered.json b/annotations_filtered/q_u6njqBaB8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9cda88c354c8124bed37d5b2ce09c1e1e98087b0 --- /dev/null +++ b/annotations_filtered/q_u6njqBaB8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 27.04], [34.0, 35.36], [68.0, 68.94], [70.0, 73.58], [74.0, 74.83], [77.0, 77.85], [80.0, 81.75], [92.0, 93.46], [96.0, 96.35], [99.0, 99.33], [101.0, 102.32], [113.0, 125.71], [128.0, 128.04], [130.0, 132.44], [133.0, 134.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 52.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.68, 0.0, 46.43, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["didgeridoo", 33.67], ["hum", 10.64], ["music", 9.92]], null, [["speech", 15.2], ["music", 14.9], ["mains hum", 13.02]], null], "duration": [0.04, 1.36, 0.94, 3.58, 0.83, 0.85, 1.75, 1.46, 0.35, 0.33, 1.32, 12.71, 0.04, 2.44, 1.82]} \ No newline at end of file diff --git a/annotations_filtered/q_v3jNjwHNQ_filtered.json b/annotations_filtered/q_v3jNjwHNQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..53741cc29e8433fdb6864da3b7e7d13e8c83f844 --- /dev/null +++ b/annotations_filtered/q_v3jNjwHNQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[75.0, 93.58], [95.0, 141.86], [144.0, 166.75], [167.0, 166.82]], "keep_status": [false, false, false, false], "silence_prob": [34.06, 0.0, 31.38, 0.0], "audiomae_on_audioset": [[["music", 61.85], ["throbbing", 14.66], ["hum", 10.25]], null, [["hum", 36.27], ["music", 28.77], ["mains hum", 14.2]], null], "duration": [18.58, 46.86, 22.75, -0.18]} \ No newline at end of file diff --git a/annotations_filtered/q_wefCacDTE_filtered.json b/annotations_filtered/q_wefCacDTE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5a6ea1e191cb7499699ea9b35940e06228382dc --- /dev/null +++ b/annotations_filtered/q_wefCacDTE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 15.94], [17.0, 34.45], [37.0, 37.56], [39.0, 39.45], [47.0, 54.82]], "keep_status": [false, false, false, false, true], "silence_prob": [31.2, 32.08, 0.0, 0.0, 30.9], "audiomae_on_audioset": [[["music", 37.44], ["brass instrument", 23.61], ["trombone", 11.93]], [["music", 62.03], ["theremin", 11.26], ["didgeridoo", 5.84]], null, null, [["music", 28.57], ["theremin", 15.22], ["animal", 7.42]]], "duration": [11.94, 17.45, 0.56, 0.45, 7.82]} \ No newline at end of file diff --git a/annotations_filtered/q_y1Qe8dyCw_filtered.json b/annotations_filtered/q_y1Qe8dyCw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a5fbc64405ed22dacd2002a654177f35813b372 --- /dev/null +++ b/annotations_filtered/q_y1Qe8dyCw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 30.59], [31.0, 31.9], [34.0, 34.91], [36.0, 36.96], [39.0, 40.37]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [0.59, 0.9, 0.91, 0.96, 1.37]} \ No newline at end of file diff --git a/annotations_filtered/q_y6O1yflZI_filtered.json b/annotations_filtered/q_y6O1yflZI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c2a1df22509cc1aa2b8e6eee23cb667cf110abf9 --- /dev/null +++ b/annotations_filtered/q_y6O1yflZI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[60.0, 61.8], [89.0, 92.72], [117.0, 119.04], [120.0, 121.8], [125.0, 127.28], [128.0, 131.16], [134.0, 134.69], [135.0, 135.41], [138.0, 140.98], [142.0, 142.4], [143.0, 144.49], [148.0, 148.88], [151.0, 155.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 50.71, 98.93, 0.0, 96.42, 99.48, 0.0, 0.0, 99.96, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.8, 3.72, 2.04, 1.8, 2.28, 3.16, 0.69, 0.41, 2.98, 0.4, 1.49, 0.88, 4.33]} \ No newline at end of file diff --git a/annotations_filtered/qa2Ng4a5yk0_filtered.json b/annotations_filtered/qa2Ng4a5yk0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6664d29d352c14bbdce06304e1f792107784d20d --- /dev/null +++ b/annotations_filtered/qa2Ng4a5yk0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 43.29], [46.0, 58.83], [60.0, 68.82], [70.0, 119.99], [123.0, 122.88]], "keep_status": [true, false, false, false, false], "silence_prob": [32.16, 33.94, 32.35, 0.0, 0.0], "audiomae_on_audioset": [[["music", 31.27], ["foghorn", 21.47], ["didgeridoo", 15.59]], [["music", 52.38], ["musical instrument", 14.2], ["speech", 6.35]], [["music", 39.98], ["brass instrument", 19.79], ["trombone", 13.34]], null, null], "duration": [7.29, 12.83, 8.82, 49.99, -0.12]} \ No newline at end of file diff --git a/annotations_filtered/qaAz6YklimY_filtered.json b/annotations_filtered/qaAz6YklimY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f7d75dabe7b4b09e159fa8be95878777d137d48 --- /dev/null +++ b/annotations_filtered/qaAz6YklimY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.35], [17.0, 19.45], [20.0, 20.46], [21.0, 23.21], [25.0, 25.74], [28.0, 28.75], [30.0, 34.97]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [1.35, 2.45, 0.46, 2.21, 0.74, 0.75, 4.97]} \ No newline at end of file diff --git a/annotations_filtered/qaBlaPsuHQw_filtered.json b/annotations_filtered/qaBlaPsuHQw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d4f4fe19bee4fc63f7a757d09912816b8a254811 --- /dev/null +++ b/annotations_filtered/qaBlaPsuHQw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.71], [8.0, 8.38], [9.0, 43.39], [45.0, 62.94], [67.0, 89.63], [91.0, 90.61]], "keep_status": [false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 30.54, 31.72, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 62.91], ["skidding", 4.33], ["vehicle", 4.26]], [["vehicle", 32.71], ["car", 21.25], ["race car, auto racing", 7.7]], null], "duration": [1.71, 0.38, 34.39, 17.94, 22.63, -0.39]} \ No newline at end of file diff --git a/annotations_filtered/qaQQ3LLyKvo_filtered.json b/annotations_filtered/qaQQ3LLyKvo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a375c3b66dad45c21e2f74ee1cb64b599b3ab59e --- /dev/null +++ b/annotations_filtered/qaQQ3LLyKvo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.03], [2.0, 2.07], [2.0, 2.1], [2.0, 2.13], [2.0, 2.17], [2.0, 2.25], [2.0, 2.32], [2.0, 2.49], [3.0, 2.54], [4.0, 4.19], [5.0, 7.69], [8.0, 9.34], [10.0, 15.21], [18.0, 31.95], [33.0, 35.34], [36.0, 39.16], [40.0, 43.28], [44.0, 44.27], [45.0, 45.62], [50.0, 50.53], [52.0, 88.91], [90.0, 95.62], [96.0, 99.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.36, 0.0, 58.64, 51.55, 63.96, 59.86, 44.49, 0.0, 0.0, 0.0, 0.0, 54.9, 44.07], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 26.75], ["mains hum", 25.98], ["speech", 8.62]], null, null, null, null, null, [["hum", 27.42], ["theremin", 18.96], ["music", 12.32]]], "duration": [0.03, 0.07, 0.1, 0.13, 0.17, 0.25, 0.32, 0.49, -0.46, 0.19, 2.69, 1.34, 5.21, 13.95, 2.34, 3.16, 3.28, 0.27, 0.62, 0.53, 36.91, 5.62, 3.42]} \ No newline at end of file diff --git a/annotations_filtered/qaQUmqNJTO8_filtered.json b/annotations_filtered/qaQUmqNJTO8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..580977885020cd461840e7b64b47b1cb8974000b --- /dev/null +++ b/annotations_filtered/qaQUmqNJTO8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 16.41], [17.0, 17.86], [22.0, 27.75], [31.0, 32.9], [40.0, 40.61], [42.0, 42.06], [44.0, 44.42], [49.0, 88.97], [91.0, 92.28], [95.0, 95.71], [96.0, 99.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [89.9, 0.0, 99.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.54], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [2.41, 0.86, 5.75, 1.9, 0.61, 0.06, 0.42, 39.97, 1.28, 0.71, 3.27]} \ No newline at end of file diff --git a/annotations_filtered/qabChviGItk_filtered.json b/annotations_filtered/qabChviGItk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d4337d3b83d5b2c0980a107a6c1f25734c206cc1 --- /dev/null +++ b/annotations_filtered/qabChviGItk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 37.67], [38.0, 53.35], [55.0, 56.05], [59.0, 80.62], [82.0, 93.12], [93.0, 93.82]], "keep_status": [true, false, false, false, false, false], "silence_prob": [30.13, 30.41, 0.0, 30.54, 30.41, 0.0], "audiomae_on_audioset": [[["music", 21.15], ["car", 15.36], ["race car, auto racing", 10.77]], [["throbbing", 38.78], ["music", 31.4], ["hum", 19.37]], null, [["music", 45.8], ["hum", 14.68], ["throbbing", 11.47]], [["music", 56.49], ["smash, crash", 12.36], ["whack, thwack", 8.04]], null], "duration": [11.67, 15.35, 1.05, 21.62, 11.12, 0.82]} \ No newline at end of file diff --git a/annotations_filtered/qalHjNdHFJc_filtered.json b/annotations_filtered/qalHjNdHFJc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9243e15bfca2dfd3cdea71464ed00ff4ee6a9bb7 --- /dev/null +++ b/annotations_filtered/qalHjNdHFJc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.47], [3.0, 3.75], [6.0, 6.84], [9.0, 9.04], [32.0, 31.94], [41.0, 41.55], [43.0, 43.65], [48.0, 48.24], [52.0, 53.01], [54.0, 56.39], [58.0, 60.66], [66.0, 69.11], [77.0, 77.75], [83.0, 83.08], [88.0, 88.8], [90.0, 93.87], [94.0, 95.35], [99.0, 99.69], [100.0, 101.44], [117.0, 117.8], [119.0, 119.23], [121.0, 121.2], [126.0, 126.22], [127.0, 127.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.21, 33.11, 40.09, 0.0, 0.0, 0.0, 73.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["beatboxing", 16.56], ["music", 12.5], ["knock", 8.23]], [["sidetone", 53.29], ["speech", 26.57], ["dial tone", 9.56]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.47, 0.75, 0.84, 0.04, -0.06, 0.55, 0.65, 0.24, 1.01, 2.39, 2.66, 3.11, 0.75, 0.08, 0.8, 3.87, 1.35, 0.69, 1.44, 0.8, 0.23, 0.2, 0.22, 0.68]} \ No newline at end of file diff --git a/annotations_filtered/qb00B8U8UBw_filtered.json b/annotations_filtered/qb00B8U8UBw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b4aabdbda8a8f20ea0d8e3d7c40a3015311ca8f --- /dev/null +++ b/annotations_filtered/qb00B8U8UBw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.72], [13.0, 13.71], [15.0, 17.74], [19.0, 56.64], [61.0, 107.79], [108.0, 107.82], [108.0, 107.86], [108.0, 107.89], [108.0, 107.92], [109.0, 129.91]], "keep_status": [true, false, false, false, false, false, false, false, false, false], "silence_prob": [45.75, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.95], "audiomae_on_audioset": [[["music", 41.06], ["musical instrument", 9.48], ["cello", 6.06]], null, null, null, null, null, null, null, null, [["music", 66.26], ["didgeridoo", 3.35], ["musical instrument", 3.3]]], "duration": [4.72, 0.71, 2.74, 37.64, 46.79, -0.18, -0.14, -0.11, -0.08, 20.91]} \ No newline at end of file diff --git a/annotations_filtered/qb4e_GJzmrI_filtered.json b/annotations_filtered/qb4e_GJzmrI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2b0469ebb08ea932f2d3ab817aaf82fc87430dfc --- /dev/null +++ b/annotations_filtered/qb4e_GJzmrI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.49], [5.0, 4.68], [8.0, 7.94], [10.0, 10.81], [17.0, 16.88], [19.0, 19.85], [21.0, 22.91], [24.0, 25.79], [27.0, 28.56], [31.0, 32.26], [33.0, 34.3], [35.0, 34.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.49, -0.32, -0.06, 0.81, -0.12, 0.85, 1.91, 1.79, 1.56, 1.26, 1.3, -0.03]} \ No newline at end of file diff --git a/annotations_filtered/qbIEepu8Z4w_filtered.json b/annotations_filtered/qbIEepu8Z4w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..49b2f4ea4b2358ca18ec53d3af047d970cd27953 --- /dev/null +++ b/annotations_filtered/qbIEepu8Z4w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.87], [9.0, 12.31], [14.0, 14.35], [20.0, 20.07], [26.0, 27.26], [31.0, 32.32], [37.0, 38.31], [40.0, 40.24], [48.0, 49.59], [51.0, 52.2], [54.0, 53.92], [57.0, 57.45], [62.0, 63.54], [64.0, 65.25], [68.0, 67.88], [69.0, 69.62], [71.0, 71.61], [72.0, 73.8], [75.0, 77.04], [78.0, 78.51], [79.0, 79.89], [81.0, 81.84], [84.0, 102.22], [104.0, 104.23], [106.0, 106.86], [108.0, 108.48], [110.0, 119.72], [121.0, 122.23], [123.0, 125.66], [126.0, 129.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 98.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 43.0, 0.0, 0.0, 0.0, 100.0, 0.0, 76.53, 96.66], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 64.71], ["sidetone", 24.3], ["dial tone", 1.57]], null, null, null, null, null, null, null], "duration": [0.87, 3.31, 0.35, 0.07, 1.26, 1.32, 1.31, 0.24, 1.59, 1.2, -0.08, 0.45, 1.54, 1.25, -0.12, 0.62, 0.61, 1.8, 2.04, 0.51, 0.89, 0.84, 18.22, 0.23, 0.86, 0.48, 9.72, 1.23, 2.66, 3.96]} \ No newline at end of file diff --git a/annotations_filtered/qbYHRU551nI_filtered.json b/annotations_filtered/qbYHRU551nI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f0cc1339daf5a6e5cf55ffe1dacbd705c76b75b --- /dev/null +++ b/annotations_filtered/qbYHRU551nI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.0], [3.0, 4.89], [5.0, 18.3], [19.0, 20.85], [26.0, 26.0], [28.0, 28.54], [42.0, 42.87]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 45.24, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["whale vocalization", 31.53], ["music", 28.28], ["speech", 17.25]], null, null, null, null], "duration": [1.0, 1.89, 13.3, 1.85, 0.0, 0.54, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/qbYyYYHysqM_filtered.json b/annotations_filtered/qbYyYYHysqM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e4d004fb50020e705f44fc3a4af2fc6752288d69 --- /dev/null +++ b/annotations_filtered/qbYyYYHysqM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.28], [6.0, 8.24], [10.0, 12.78], [15.0, 17.9], [22.0, 26.25], [30.0, 30.2], [31.0, 31.31], [38.0, 45.47], [47.0, 46.67], [61.0, 60.91], [75.0, 96.65], [99.0, 99.23], [107.0, 116.56], [118.0, 119.57], [121.0, 123.03], [133.0, 134.94], [140.0, 141.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.82, 99.95, 99.62, 99.1, 98.93, 0.0, 0.0, 88.83, 0.0, 0.0, 94.66, 0.0, 98.66, 0.0, 83.88, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.28, 2.24, 2.78, 2.9, 4.25, 0.2, 0.31, 7.47, -0.33, -0.09, 21.65, 0.23, 9.56, 1.57, 2.03, 1.94, 1.17]} \ No newline at end of file diff --git a/annotations_filtered/qbdg6o8Z11I_filtered.json b/annotations_filtered/qbdg6o8Z11I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c1b9fe41081bb877706eb3dbedbe5a6330d14732 --- /dev/null +++ b/annotations_filtered/qbdg6o8Z11I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.76], [19.0, 19.6], [33.0, 33.52], [35.0, 35.9], [41.0, 51.97], [61.0, 71.34], [86.0, 86.34], [88.0, 106.51], [107.0, 107.35], [109.0, 119.2]], "keep_status": [false, false, false, false, true, true, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 34.05, 30.39, 0.0, 30.09, 0.0, 30.06], "audiomae_on_audioset": [null, null, null, null, [["speech", 40.38], ["music", 10.9], ["mains hum", 10.79]], [["music", 38.63], ["speech", 21.15], ["whack, thwack", 2.9]], null, [["music", 42.66], ["speech", 10.18], ["whack, thwack", 5.97]], null, [["music", 52.38], ["speech", 11.22], ["fly, housefly", 2.27]]], "duration": [0.76, 0.6, 0.52, 0.9, 10.97, 10.34, 0.34, 18.51, 0.35, 10.2]} \ No newline at end of file diff --git a/annotations_filtered/qcFM5Xhg8W8_filtered.json b/annotations_filtered/qcFM5Xhg8W8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da117c512d95ae5c62b5f5926e2831bf889a8ba8 --- /dev/null +++ b/annotations_filtered/qcFM5Xhg8W8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.05], [2.0, 2.57], [6.0, 5.85], [8.0, 8.23], [15.0, 15.2], [18.0, 18.25], [19.0, 19.48], [20.0, 19.58], [20.0, 20.07], [20.0, 20.82], [32.0, 32.09], [33.0, 34.32], [39.0, 39.16], [42.0, 42.31], [52.0, 52.08], [53.0, 56.47], [57.0, 57.43], [58.0, 58.23], [59.0, 62.92], [63.0, 74.6], [75.0, 76.08], [77.0, 77.8], [79.0, 80.57], [81.0, 81.92], [83.0, 83.61], [85.0, 85.55], [89.0, 89.31], [91.0, 91.25], [95.0, 97.71], [99.0, 99.99], [101.0, 101.46], [103.0, 102.86], [104.0, 104.18], [105.0, 107.76], [108.0, 126.91], [129.0, 130.08], [131.0, 131.25], [132.0, 134.03], [136.0, 137.05], [138.0, 138.48], [141.0, 141.24], [143.0, 142.62], [143.0, 143.75], [145.0, 146.18], [149.0, 149.13], [150.0, 152.07], [153.0, 173.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, true, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.6, 0.0, 0.0, 80.82, 41.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.16, 0.0, 0.0, 0.0, 0.0, 44.32, 35.42, 0.0, 0.0, 45.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.52, 31.96], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 44.29], ["speech", 18.63], ["burping, eructation", 4.24]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 39.8], ["speech", 17.79], ["musical instrument", 4.6]], [["music", 30.11], ["hum", 28.05], ["mains hum", 9.4]], null, null, [["animal", 30.35], ["grunt", 16.61], ["whale vocalization", 13.51]], null, null, null, null, null, null, null, [["screaming", 21.66], ["boing", 15.93], ["grunt", 9.26]], [["music", 23.48], ["fart", 16.85], ["whack, thwack", 5.98]]], "duration": [1.05, 0.57, -0.15, 0.23, 0.2, 0.25, 0.48, -0.42, 0.07, 0.82, 0.09, 1.32, 0.16, 0.31, 0.08, 3.47, 0.43, 0.23, 3.92, 11.6, 1.08, 0.8, 1.57, 0.92, 0.61, 0.55, 0.31, 0.25, 2.71, 0.99, 0.46, -0.14, 0.18, 2.76, 18.91, 1.08, 0.25, 2.03, 1.05, 0.48, 0.24, -0.38, 0.75, 1.18, 0.13, 2.07, 20.23]} \ No newline at end of file diff --git a/annotations_filtered/qcFVUGNUWuk_filtered.json b/annotations_filtered/qcFVUGNUWuk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c253519120895cafa71f4e7b8ec69a4fcb376dbc --- /dev/null +++ b/annotations_filtered/qcFVUGNUWuk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.98], [23.0, 24.0], [30.0, 30.23], [35.0, 74.22], [76.0, 77.06], [80.0, 80.33], [84.0, 84.65], [89.0, 89.63], [93.0, 93.01], [96.0, 96.48], [109.0, 108.78], [110.0, 110.29], [112.0, 111.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.98, 1.0, 0.23, 39.22, 1.06, 0.33, 0.65, 0.63, 0.01, 0.48, -0.22, 0.29, -0.09]} \ No newline at end of file diff --git a/annotations_filtered/qcGEIq1AEGM_filtered.json b/annotations_filtered/qcGEIq1AEGM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2be78db8dda5cb86b4b2b9860a373d5e428eefd2 --- /dev/null +++ b/annotations_filtered/qcGEIq1AEGM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[54.0, 66.88], [75.0, 74.71], [77.0, 116.11], [117.0, 117.39], [123.0, 123.63], [124.0, 136.02], [137.0, 137.93], [141.0, 147.93], [150.0, 151.01]], "keep_status": [false, false, false, false, false, true, false, true, false], "silence_prob": [28.85, 0.0, 0.0, 0.0, 0.0, 40.66, 0.0, 38.59, 0.0], "audiomae_on_audioset": [[["music", 53.47], ["speech", 10.92], ["glass", 6.08]], null, null, null, null, [["speech", 34.5], ["breaking", 20.53], ["sidetone", 9.81]], null, [["whack, thwack", 20.32], ["crushing", 18.0], ["smash, crash", 8.12]], null], "duration": [12.88, -0.29, 39.11, 0.39, 0.63, 12.02, 0.93, 6.93, 1.01]} \ No newline at end of file diff --git a/annotations_filtered/qcMHKqF91tM_filtered.json b/annotations_filtered/qcMHKqF91tM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b36ed7c25af8c7f7818592d3311cd1b8ab0cdc0 --- /dev/null +++ b/annotations_filtered/qcMHKqF91tM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.66], [3.0, 3.72], [6.0, 10.52], [12.0, 14.79], [16.0, 21.1], [22.0, 22.57], [33.0, 34.55], [36.0, 36.26], [38.0, 40.04], [43.0, 43.61], [44.0, 44.42], [47.0, 47.24], [51.0, 53.67], [59.0, 59.78], [61.0, 63.37], [66.0, 66.93], [69.0, 69.75], [72.0, 71.83], [78.0, 77.95], [80.0, 80.57], [82.0, 83.47], [86.0, 87.1], [100.0, 101.16], [102.0, 102.41], [109.0, 109.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 99.95, 99.88, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 93.76, 0.0, 99.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.66, 0.72, 4.52, 2.79, 5.1, 0.57, 1.55, 0.26, 2.04, 0.61, 0.42, 0.24, 2.67, 0.78, 2.37, 0.93, 0.75, -0.17, -0.05, 0.57, 1.47, 1.1, 1.16, 0.41, 0.31]} \ No newline at end of file diff --git a/annotations_filtered/qcVr2eztQEk_filtered.json b/annotations_filtered/qcVr2eztQEk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc60cb0dbb260eebeec668e122462f4a387d4806 --- /dev/null +++ b/annotations_filtered/qcVr2eztQEk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 25.46], [30.0, 30.92], [37.0, 49.03], [51.0, 51.7], [59.0, 59.73], [61.0, 65.75], [67.0, 67.74], [73.0, 73.95], [75.0, 85.26], [93.0, 93.34], [95.0, 95.08]], "keep_status": [true, false, true, false, false, false, false, false, true, false, false], "silence_prob": [29.19, 0.0, 29.6, 0.0, 0.0, 31.27, 0.0, 0.0, 29.8, 0.0, 0.0], "audiomae_on_audioset": [[["music", 33.9], ["theremin", 10.09], ["musical instrument", 6.58]], null, [["music", 24.01], ["mains hum", 13.08], ["buzz", 12.15]], null, null, [["music", 65.2], ["cacophony", 3.87], ["mains hum", 3.33]], null, null, [["music", 29.21], ["hum", 20.37], ["mains hum", 13.88]], null, null], "duration": [5.46, 0.92, 12.03, 0.7, 0.73, 4.75, 0.74, 0.95, 10.26, 0.34, 0.08]} \ No newline at end of file diff --git a/annotations_filtered/qcYPASs4jMQ_filtered.json b/annotations_filtered/qcYPASs4jMQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..907fe2bc31cc7db287545acf390cfe08dba466ed --- /dev/null +++ b/annotations_filtered/qcYPASs4jMQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 21.79], [24.0, 125.14], [128.0, 130.6]], "keep_status": [false, false, true], "silence_prob": [29.67, 0.0, 41.5], "audiomae_on_audioset": [[["eruption", 28.4], ["speech", 28.22], ["explosion", 21.09]], null, [["cattle, bovinae", 10.34], ["whale vocalization", 9.82], ["moo", 9.52]]], "duration": [9.79, 101.14, 2.6]} \ No newline at end of file diff --git a/annotations_filtered/qcaVM8TcZbA_filtered.json b/annotations_filtered/qcaVM8TcZbA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0eac198fc08a1828509fa65fa0b5f29192116b1 --- /dev/null +++ b/annotations_filtered/qcaVM8TcZbA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 11.89], [15.0, 15.15], [16.0, 16.98], [20.0, 21.1], [23.0, 25.49], [27.0, 29.2], [30.0, 32.98], [34.0, 34.33], [35.0, 36.12], [37.0, 38.3], [41.0, 41.72], [43.0, 45.1], [53.0, 53.22], [58.0, 61.79], [63.0, 63.68], [64.0, 65.67], [68.0, 67.78], [69.0, 70.53], [76.0, 84.47], [92.0, 92.65], [98.0, 99.01], [101.0, 116.02], [119.0, 121.68], [122.0, 124.95], [128.0, 129.54], [133.0, 133.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 90.43, 97.11, 83.7, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 47.66, 0.0, 0.0, 0.0, 0.0, 38.76, 0.0, 0.0, 29.04, 29.93, 29.39, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 32.44], ["speech", 19.25], ["singing bowl", 5.31]], null, null, null, null, [["music", 41.3], ["ambient music", 13.06], ["speech", 12.38]], null, null, [["music", 40.11], ["hum", 20.18], ["throbbing", 19.47]], [["music", 34.57], ["cattle, bovinae", 12.35], ["moo", 8.79]], [["music", 76.86], ["speech", 9.46], ["throbbing", 1.33]], null, null], "duration": [-0.11, 0.15, 0.98, 1.1, 2.49, 2.2, 2.98, 0.33, 1.12, 1.3, 0.72, 2.1, 0.22, 3.79, 0.68, 1.67, -0.22, 1.53, 8.47, 0.65, 1.01, 15.02, 2.68, 2.95, 1.54, 0.74]} \ No newline at end of file diff --git a/annotations_filtered/qckVPZkmiNU_filtered.json b/annotations_filtered/qckVPZkmiNU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fbd27954dc0e18ba87a6a5b4136adc5f1f65aeac --- /dev/null +++ b/annotations_filtered/qckVPZkmiNU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.56], [2.0, 3.0], [5.0, 6.57], [9.0, 12.88], [17.0, 17.78], [19.0, 19.47], [31.0, 30.96], [39.0, 38.87], [45.0, 45.0], [50.0, 50.55], [52.0, 52.78], [56.0, 56.32], [66.0, 66.99], [69.0, 70.36], [80.0, 80.74], [82.0, 82.05], [85.0, 85.46], [98.0, 100.55], [104.0, 103.91], [111.0, 112.23], [114.0, 119.37], [120.0, 122.4], [126.0, 127.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 80.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.77, 0.0, 0.0, 100.0, 99.94, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.56, 1.0, 1.57, 3.88, 0.78, 0.47, -0.04, -0.13, 0.0, 0.55, 0.78, 0.32, 0.99, 1.36, 0.74, 0.05, 0.46, 2.55, -0.09, 1.23, 5.37, 2.4, 1.75]} \ No newline at end of file diff --git a/annotations_filtered/qdK7QVuaSlM_filtered.json b/annotations_filtered/qdK7QVuaSlM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..191a8395ea87caef7958c25c6c44086a43265883 --- /dev/null +++ b/annotations_filtered/qdK7QVuaSlM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[48.0, 103.32], [104.0, 109.44], [110.0, 130.15], [131.0, 166.14]], "keep_status": [false, true, false, false], "silence_prob": [0.0, 29.41, 31.37, 0.0], "audiomae_on_audioset": [null, [["music", 50.02], ["smash, crash", 7.49], ["throbbing", 4.51]], [["music", 61.72], ["speech", 5.42], ["synthesizer", 4.45]], null], "duration": [55.32, 5.44, 20.15, 35.14]} \ No newline at end of file diff --git a/annotations_filtered/qdbrIrFxas0_filtered.json b/annotations_filtered/qdbrIrFxas0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..404d216dcc8a39194a78f850df3050ad14e7db83 --- /dev/null +++ b/annotations_filtered/qdbrIrFxas0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 14.67], [20.0, 20.61], [23.0, 23.7], [24.0, 34.21], [38.0, 38.31], [39.0, 52.24], [53.0, 53.64], [56.0, 68.03], [80.0, 111.21], [113.0, 118.03], [118.0, 120.14], [122.0, 126.79], [128.0, 134.84], [137.0, 148.36], [152.0, 156.68], [157.0, 158.48], [159.0, 160.44], [161.0, 161.42]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [48.61, 0.0, 0.0, 32.61, 0.0, 30.63, 0.0, 31.78, 0.0, 31.81, 31.74, 31.75, 31.16, 31.52, 29.78, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 27.66], ["speech", 18.19], ["synthesizer", 15.94]], null, null, [["music", 74.43], ["reggae", 6.77], ["swing music", 1.22]], null, [["music", 79.42], ["saxophone", 1.89], ["musical instrument", 1.55]], null, [["music", 71.49], ["reggae", 9.45], ["musical instrument", 2.17]], null, [["music", 70.97], ["speech", 6.03], ["boing", 5.05]], [["music", 61.43], ["speech", 8.85], ["musical instrument", 2.55]], [["music", 45.43], ["boing", 12.92], ["speech", 9.51]], [["music", 72.04], ["musical instrument", 2.22], ["moo", 1.86]], [["music", 88.23], ["funny music", 1.67], ["musical instrument", 1.59]], [["boing", 51.51], ["crowd", 15.66], ["cheering", 5.37]], null, null, null], "duration": [8.67, 0.61, 0.7, 10.21, 0.31, 13.24, 0.64, 12.03, 31.21, 5.03, 2.14, 4.79, 6.84, 11.36, 4.68, 1.48, 1.44, 0.42]} \ No newline at end of file diff --git a/annotations_filtered/qdq07pa6sPA_filtered.json b/annotations_filtered/qdq07pa6sPA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..455d5ba6d990c9e17881c699192526ca389eaa82 --- /dev/null +++ b/annotations_filtered/qdq07pa6sPA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.83], [8.0, 9.85], [11.0, 11.31], [12.0, 13.2], [17.0, 16.93], [21.0, 23.08], [24.0, 31.77], [46.0, 46.47], [47.0, 48.46], [52.0, 52.86], [54.0, 53.94], [55.0, 57.64], [61.0, 61.21], [66.0, 66.33], [70.0, 69.94], [70.0, 71.73], [75.0, 76.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.96, 99.99, 0.0, 0.0, 0.0, 0.0, 66.76, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.83, 1.85, 0.31, 1.2, -0.07, 2.08, 7.77, 0.47, 1.46, 0.86, -0.06, 2.64, 0.21, 0.33, -0.06, 1.73, 1.11]} \ No newline at end of file diff --git a/annotations_filtered/qdrvmgnw1YQ_filtered.json b/annotations_filtered/qdrvmgnw1YQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a876927a496bd02c8e070bbe57bd171d03193a8 --- /dev/null +++ b/annotations_filtered/qdrvmgnw1YQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 22.99], [23.0, 25.61], [26.0, 28.68], [29.0, 32.17], [34.0, 38.91], [39.0, 44.36], [44.0, 44.39], [47.0, 48.57], [50.0, 54.13], [56.0, 57.81], [59.0, 59.73], [64.0, 64.37], [67.0, 67.91]], "keep_status": [false, true, false, true, true, true, false, false, true, false, false, false, false], "silence_prob": [69.47, 35.29, 70.16, 35.8, 33.68, 30.66, 0.0, 0.0, 36.95, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 62.41], ["music", 4.09], ["coin (dropping)", 2.56]], null, [["music", 36.96], ["didgeridoo", 9.3], ["fart", 6.36]], [["music", 29.37], ["speech", 22.5], ["animal", 5.15]], [["grunt", 25.99], ["burping, eructation", 15.88], ["sound effect", 12.59]], null, null, [["speech", 50.79], ["music", 13.0], ["animal", 3.07]], null, null, null, null], "duration": [9.99, 2.61, 2.68, 3.17, 4.91, 5.36, 0.39, 1.57, 4.13, 1.81, 0.73, 0.37, 0.91]} \ No newline at end of file diff --git a/annotations_filtered/qdtCFKVtSls_filtered.json b/annotations_filtered/qdtCFKVtSls_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e3dd37845bcf93d76ab19c32fbe85fcf79093ce --- /dev/null +++ b/annotations_filtered/qdtCFKVtSls_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.31], [9.0, 10.23], [11.0, 11.89], [13.0, 13.29], [14.0, 23.53], [31.0, 33.17], [35.0, 34.94], [37.0, 36.8], [37.0, 44.49], [54.0, 54.28], [55.0, 55.43], [56.0, 56.44], [58.0, 58.67], [61.0, 61.59], [65.0, 65.8], [66.0, 66.72], [68.0, 68.3], [69.0, 69.23], [70.0, 71.07], [72.0, 74.39], [74.0, 74.49], [75.0, 77.57], [78.0, 78.29], [78.0, 78.61], [80.0, 80.06], [81.0, 85.7], [88.0, 95.08], [96.0, 97.48], [117.0, 123.4]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 80.29, 76.2, 0.0, 0.0, 44.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.09, 0.0, 45.08, 0.0, 0.0, 0.0, 66.39, 70.72, 0.0, 32.38], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 32.92], ["buzz", 8.93], ["cattle, bovinae", 8.59]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 16.81], ["mosquito", 16.51], ["fly, housefly", 12.08]], null, null, null, null, null, null, [["music", 41.23], ["brass instrument", 26.14], ["trombone", 16.4]]], "duration": [1.31, 1.23, 0.89, 0.29, 9.53, 2.17, -0.06, -0.2, 7.49, 0.28, 0.43, 0.44, 0.67, 0.59, 0.8, 0.72, 0.3, 0.23, 1.07, 2.39, 0.49, 2.57, 0.29, 0.61, 0.06, 4.7, 7.08, 1.48, 6.4]} \ No newline at end of file diff --git a/annotations_filtered/qe5s8UTNw4c_filtered.json b/annotations_filtered/qe5s8UTNw4c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3446e37400ce92b22a3081a13c3ccc152fc67f7 --- /dev/null +++ b/annotations_filtered/qe5s8UTNw4c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.49], [29.0, 32.56], [36.0, 37.49], [56.0, 57.33], [72.0, 73.94], [78.0, 78.26], [92.0, 94.39], [97.0, 99.12], [105.0, 105.22]], "keep_status": [false, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 47.74, 0.0, 0.0, 0.0, 0.0, 43.3, 58.13, 0.0], "audiomae_on_audioset": [null, [["music", 52.94], ["mantra", 5.12], ["carnatic music", 4.0]], null, null, null, null, [["music", 40.53], ["mantra", 15.69], ["chant", 5.7]], null, null], "duration": [1.49, 3.56, 1.49, 1.33, 1.94, 0.26, 2.39, 2.12, 0.22]} \ No newline at end of file diff --git a/annotations_filtered/qe8IY41zyCc_filtered.json b/annotations_filtered/qe8IY41zyCc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..64d515d0cdaa298d09475d5ad17a39aacf26f68e --- /dev/null +++ b/annotations_filtered/qe8IY41zyCc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 66.48], [67.0, 112.04], [113.0, 112.95], [113.0, 120.31]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.1], "audiomae_on_audioset": [null, null, null, [["throbbing", 43.48], ["music", 25.18], ["hum", 19.68]]], "duration": [34.48, 45.04, -0.05, 7.31]} \ No newline at end of file diff --git a/annotations_filtered/qeY1mkXqKgk_filtered.json b/annotations_filtered/qeY1mkXqKgk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..53cdc6ce96b07a1c3e81d08087e92af44b5012ee --- /dev/null +++ b/annotations_filtered/qeY1mkXqKgk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.78], [4.0, 7.43], [8.0, 26.97], [31.0, 31.77], [32.0, 48.69], [52.0, 56.15], [57.0, 57.11], [58.0, 58.56], [60.0, 60.29], [62.0, 61.84], [63.0, 64.98], [65.0, 69.15], [70.0, 73.52], [75.0, 75.81], [77.0, 77.85], [81.0, 84.06], [86.0, 86.29], [88.0, 90.02], [91.0, 91.12], [92.0, 91.96], [93.0, 93.45], [95.0, 110.57], [111.0, 119.38], [120.0, 124.51], [127.0, 130.4]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 49.68, 35.98, 0.0, 34.25, 33.46, 0.0, 0.0, 0.0, 0.0, 0.0, 33.69, 35.54, 0.0, 0.0, 33.42, 0.0, 32.99, 0.0, 0.0, 0.0, 32.83, 32.62, 33.56, 29.68], "audiomae_on_audioset": [null, [["hum", 30.13], ["music", 16.98], ["mains hum", 8.65]], [["music", 70.46], ["mains hum", 4.83], ["hum", 4.16]], null, [["music", 45.88], ["theremin", 43.06], ["ambient music", 1.76]], [["theremin", 87.64], ["music", 10.38], ["musical instrument", 0.54]], null, null, null, null, null, [["music", 66.42], ["theremin", 15.74], ["musical instrument", 3.08]], [["music", 61.9], ["theremin", 10.02], ["ambient music", 2.95]], null, null, [["music", 41.36], ["scary music", 5.05], ["theremin", 4.51]], null, [["music", 16.93], ["cello", 16.45], ["double bass", 13.27]], null, null, null, [["music", 76.32], ["theremin", 10.24], ["didgeridoo", 6.83]], [["music", 59.46], ["theremin", 21.0], ["scary music", 4.97]], [["music", 48.73], ["theremin", 28.36], ["musical instrument", 6.88]], [["theremin", 71.62], ["music", 19.79], ["musical instrument", 1.61]]], "duration": [1.78, 3.43, 18.97, 0.77, 16.69, 4.15, 0.11, 0.56, 0.29, -0.16, 1.98, 4.15, 3.52, 0.81, 0.85, 3.06, 0.29, 2.02, 0.12, -0.04, 0.45, 15.57, 8.38, 4.51, 3.4]} \ No newline at end of file diff --git a/annotations_filtered/qeZ0SIG2eJY_filtered.json b/annotations_filtered/qeZ0SIG2eJY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02a5bca97853c19e7445d70faba098b0b3e882ae --- /dev/null +++ b/annotations_filtered/qeZ0SIG2eJY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 6.66], [7.0, 8.41], [9.0, 10.84], [14.0, 14.4], [16.0, 52.74], [53.0, 59.91], [67.0, 68.71], [69.0, 69.18], [69.0, 69.89], [77.0, 80.67], [87.0, 92.33], [95.0, 95.77], [99.0, 99.72], [105.0, 113.34]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 32.71, 0.0, 0.0, 0.0, 30.79, 32.32, 0.0, 0.0, 29.74], "audiomae_on_audioset": [null, null, null, null, null, [["music", 43.34], ["hum", 15.39], ["synthesizer", 7.78]], null, null, null, [["music", 15.74], ["animal", 9.37], ["whale vocalization", 6.29]], [["music", 35.47], ["speech", 22.0], ["hum", 12.68]], null, null, [["music", 51.25], ["hum", 5.89], ["didgeridoo", 4.33]]], "duration": [-0.34, 1.41, 1.84, 0.4, 36.74, 6.91, 1.71, 0.18, 0.89, 3.67, 5.33, 0.77, 0.72, 8.34]} \ No newline at end of file diff --git a/annotations_filtered/qeaiVveZWD8_filtered.json b/annotations_filtered/qeaiVveZWD8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1c2a7d5bee9a35b0b1611f5ae818e380b9870f61 --- /dev/null +++ b/annotations_filtered/qeaiVveZWD8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[46.0, 47.93], [48.0, 48.15], [49.0, 51.83], [54.0, 89.04], [89.0, 137.1]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.28, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 43.18], ["ambient music", 21.31], ["scary music", 6.17]], null, null], "duration": [1.93, 0.15, 2.83, 35.04, 48.1]} \ No newline at end of file diff --git a/annotations_filtered/qeytg9JLx-o_filtered.json b/annotations_filtered/qeytg9JLx-o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9873fd96a49a57916e0d455e82712864da307858 --- /dev/null +++ b/annotations_filtered/qeytg9JLx-o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 60.02], [60.0, 60.54], [67.0, 67.05], [67.0, 101.88], [102.0, 129.02], [133.0, 136.19], [139.0, 139.65], [168.0, 168.12], [180.0, 180.06], [205.0, 209.34], [211.0, 212.01], [213.0, 214.69], [217.0, 217.86], [223.0, 223.47], [224.0, 225.19]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 35.76, 34.38, 0.0, 0.0, 0.0, 40.88, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 40.8], ["music", 13.76], ["didgeridoo", 9.15]], [["speech", 62.68], ["music", 13.83], ["mains hum", 3.94]], null, null, null, [["music", 22.82], ["hum", 21.1], ["mains hum", 13.73]], null, null, null, null, null], "duration": [43.02, 0.54, 0.05, 34.88, 27.02, 3.19, 0.65, 0.12, 0.06, 4.34, 1.01, 1.69, 0.86, 0.47, 1.19]} \ No newline at end of file diff --git a/annotations_filtered/qf-4TDEpycw_filtered.json b/annotations_filtered/qf-4TDEpycw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea60448901a648c0f5191f2b7f21fc5e60f8db01 --- /dev/null +++ b/annotations_filtered/qf-4TDEpycw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.35], [2.0, 2.0], [12.0, 12.56], [22.0, 23.01], [26.0, 26.89], [28.0, 28.19], [29.0, 29.89], [37.0, 37.59], [67.0, 67.66], [70.0, 74.34], [77.0, 77.41], [94.0, 94.78], [99.0, 100.25], [101.0, 104.65], [105.0, 110.35], [113.0, 127.03], [128.0, 136.24], [137.0, 137.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.4, 0.0, 0.0, 0.0, 31.97, 33.63, 34.26, 57.81, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 56.03], ["music", 13.99], ["didgeridoo", 8.09]], null, null, null, [["speech", 58.53], ["livestock, farm animals, working animals", 4.94], ["vehicle", 4.2]], [["fly, housefly", 21.23], ["speech", 17.29], ["insect", 15.68]], [["music", 21.15], ["speech", 15.93], ["breaking", 4.34]], null, null], "duration": [0.35, 0.0, 0.56, 1.01, 0.89, 0.19, 0.89, 0.59, 0.66, 4.34, 0.41, 0.78, 1.25, 3.65, 5.35, 14.03, 8.24, 0.27]} \ No newline at end of file diff --git a/annotations_filtered/qfIzHlWOiuE_filtered.json b/annotations_filtered/qfIzHlWOiuE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..03ee72b6c2efb943221200b770aad27e9421e77e --- /dev/null +++ b/annotations_filtered/qfIzHlWOiuE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.38], [6.0, 10.1], [17.0, 17.59]], "keep_status": [false, false, false], "silence_prob": [0.0, 82.79, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [0.38, 4.1, 0.59]} \ No newline at end of file diff --git a/annotations_filtered/qfq5VozCshY_filtered.json b/annotations_filtered/qfq5VozCshY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..89e0ad340e3f6ec3473a47eb8ef81fc632d7a0e4 --- /dev/null +++ b/annotations_filtered/qfq5VozCshY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.33], [2.0, 3.3], [8.0, 9.8], [14.0, 14.67], [17.0, 21.46], [37.0, 41.55], [44.0, 47.48], [55.0, 55.41], [55.0, 55.49], [71.0, 71.1], [75.0, 76.4], [84.0, 84.64], [92.0, 92.69], [100.0, 100.01], [101.0, 103.2], [105.0, 105.53], [108.0, 108.21], [109.0, 109.63], [110.0, 111.28], [112.0, 112.09], [124.0, 124.01], [125.0, 125.44], [126.0, 126.45], [130.0, 134.01], [136.0, 136.8], [156.0, 159.38], [163.0, 163.41], [169.0, 169.57], [174.0, 174.8], [180.0, 180.69], [182.0, 182.28], [185.0, 185.28], [188.0, 188.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 40.71, 44.46, 37.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.44, 0.0, 57.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["thunk", 60.04], ["music", 25.01], ["door", 3.9]], [["music", 75.07], ["speech", 6.48], ["musical instrument", 3.68]], [["music", 72.79], ["maraca", 4.61], ["musical instrument", 2.59]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.33, 1.3, 1.8, 0.67, 4.46, 4.55, 3.48, 0.41, 0.49, 0.1, 1.4, 0.64, 0.69, 0.01, 2.2, 0.53, 0.21, 0.63, 1.28, 0.09, 0.01, 0.44, 0.45, 4.01, 0.8, 3.38, 0.41, 0.57, 0.8, 0.69, 0.28, 0.28, 0.0]} \ No newline at end of file diff --git a/annotations_filtered/qfwei0pOLVs_filtered.json b/annotations_filtered/qfwei0pOLVs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9cda9dcbe6769c36acff9521fd0d5e7ecb6ab856 --- /dev/null +++ b/annotations_filtered/qfwei0pOLVs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.33], [7.0, 7.2], [8.0, 8.58], [18.0, 22.35], [24.0, 26.57], [27.0, 28.27], [33.0, 35.45], [35.0, 35.48], [35.0, 35.55], [36.0, 35.63], [36.0, 37.07], [38.0, 39.63], [42.0, 43.73], [44.0, 45.87], [46.0, 46.25], [47.0, 47.38], [47.0, 47.68], [48.0, 48.1], [48.0, 48.71], [56.0, 58.28], [60.0, 61.08], [62.0, 71.31], [72.0, 73.41], [75.0, 76.6], [78.0, 80.28], [82.0, 82.29], [84.0, 86.16], [87.0, 87.52], [88.0, 89.28], [90.0, 92.31], [93.0, 94.53], [95.0, 103.84], [105.0, 110.47], [111.0, 111.81], [113.0, 119.79], [120.0, 121.24], [122.0, 123.74], [124.0, 125.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 99.97, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 99.98, 0.0, 100.0, 100.0, 0.0, 59.96, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.33, 0.2, 0.58, 4.35, 2.57, 1.27, 2.45, 0.48, 0.55, -0.37, 1.07, 1.63, 1.73, 1.87, 0.25, 0.38, 0.68, 0.1, 0.71, 2.28, 1.08, 9.31, 1.41, 1.6, 2.28, 0.29, 2.16, 0.52, 1.28, 2.31, 1.53, 8.84, 5.47, 0.81, 6.79, 1.24, 1.74, 1.04]} \ No newline at end of file diff --git a/annotations_filtered/qgRXFJqB-9Q_filtered.json b/annotations_filtered/qgRXFJqB-9Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..91ea6b05666d6e966d5e2ab673cda2e44214d074 --- /dev/null +++ b/annotations_filtered/qgRXFJqB-9Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.8], [13.0, 24.98], [31.0, 43.71], [48.0, 81.6], [82.0, 88.35], [92.0, 92.42], [99.0, 99.39], [100.0, 123.45], [126.0, 140.56], [143.0, 147.23], [152.0, 152.39], [154.0, 156.19], [156.0, 156.25], [158.0, 161.72], [165.0, 173.08]], "keep_status": [false, false, false, false, true, false, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 28.51, 28.75, 0.0, 28.72, 0.0, 0.0, 29.35, 31.22, 30.59, 0.0, 31.15, 0.0, 29.79, 30.02], "audiomae_on_audioset": [null, [["music", 66.24], ["hum", 7.68], ["throbbing", 3.77]], [["music", 62.14], ["hum", 9.27], ["throbbing", 5.76]], null, [["music", 43.7], ["hum", 6.88], ["speech", 6.81]], null, null, [["music", 75.38], ["throbbing", 6.98], ["electronic music", 5.69]], [["speech", 27.96], ["music", 27.56], ["hum", 12.11]], [["music", 35.51], ["speech", 32.65], ["didgeridoo", 5.27]], null, [["music", 30.55], ["whale vocalization", 7.95], ["vehicle", 7.38]], null, [["music", 49.9], ["speech", 16.8], ["throbbing", 7.33]], [["music", 58.03], ["speech", 15.95], ["cacophony", 4.3]]], "duration": [0.8, 11.98, 12.71, 33.6, 6.35, 0.42, 0.39, 23.45, 14.56, 4.23, 0.39, 2.19, 0.25, 3.72, 8.08]} \ No newline at end of file diff --git a/annotations_filtered/qgm_ou3TsIs_filtered.json b/annotations_filtered/qgm_ou3TsIs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..128a61fba9426cedc2bce133a48927a713b6ff0b --- /dev/null +++ b/annotations_filtered/qgm_ou3TsIs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.6], [5.0, 5.83], [8.0, 30.96], [34.0, 47.83], [51.0, 53.59], [57.0, 57.37], [59.0, 63.44], [64.0, 65.58], [67.0, 68.74], [70.0, 71.54], [74.0, 74.8], [77.0, 77.28], [78.0, 78.88], [83.0, 91.13], [92.0, 96.77], [99.0, 99.23], [100.0, 107.42], [108.0, 111.87], [115.0, 121.46]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 76.04, 53.28, 66.88, 0.0, 42.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 54.43, 0.0, 35.47, 33.81, 34.42], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 29.01], ["didgeridoo", 9.92], ["fly, housefly", 4.29]], null, null, null, null, null, null, null, null, null, [["music", 42.17], ["clarinet", 16.95], ["musical instrument", 7.38]], [["music", 63.22], ["effects unit", 9.13], ["musical instrument", 9.12]], [["music", 45.12], ["theremin", 33.99], ["musical instrument", 4.57]]], "duration": [0.6, 0.83, 22.96, 13.83, 2.59, 0.37, 4.44, 1.58, 1.74, 1.54, 0.8, 0.28, 0.88, 8.13, 4.77, 0.23, 7.42, 3.87, 6.46]} \ No newline at end of file diff --git a/annotations_filtered/qgmcXs02URY_filtered.json b/annotations_filtered/qgmcXs02URY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7149b644fb9d03d3cc0eddee9d1af42e09552a97 --- /dev/null +++ b/annotations_filtered/qgmcXs02URY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.43], [7.0, 7.43], [10.0, 11.77], [13.0, 15.21], [22.0, 23.9], [26.0, 27.18], [29.0, 30.06], [31.0, 36.61], [39.0, 40.27], [41.0, 42.26], [43.0, 44.54], [46.0, 47.97], [49.0, 50.9], [52.0, 55.21], [56.0, 58.04], [59.0, 63.15], [65.0, 66.97], [68.0, 68.81], [71.0, 72.57], [73.0, 76.17], [77.0, 78.7], [80.0, 80.49], [83.0, 84.6], [86.0, 86.8], [87.0, 87.74], [89.0, 89.58], [92.0, 96.16], [100.0, 102.41], [104.0, 108.58], [109.0, 110.69], [112.0, 112.09], [113.0, 113.46], [115.0, 123.01], [123.0, 129.54], [130.0, 132.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 87.55, 0.0, 0.0, 0.0, 78.04, 0.0, 0.0, 0.0, 0.0, 0.0, 83.16, 84.43, 97.83, 0.0, 0.0, 0.0, 79.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.62, 99.21, 84.07, 0.0, 0.0, 0.0, 81.89, 56.93, 97.83], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.43, 0.43, 1.77, 2.21, 1.9, 1.18, 1.06, 5.61, 1.27, 1.26, 1.54, 1.97, 1.9, 3.21, 2.04, 4.15, 1.97, 0.81, 1.57, 3.17, 1.7, 0.49, 1.6, 0.8, 0.74, 0.58, 4.16, 2.41, 4.58, 1.69, 0.09, 0.46, 8.01, 6.54, 2.48]} \ No newline at end of file diff --git a/annotations_filtered/qgv_7j1_CdA_filtered.json b/annotations_filtered/qgv_7j1_CdA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba4734d7a6b04fc2e061ee44183a6f9e1e365681 --- /dev/null +++ b/annotations_filtered/qgv_7j1_CdA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.4], [9.0, 9.58], [11.0, 13.8], [16.0, 15.65], [17.0, 17.15], [20.0, 20.6], [21.0, 21.49], [23.0, 23.97], [26.0, 33.34], [35.0, 36.31], [39.0, 41.66], [46.0, 48.2], [50.0, 72.98], [79.0, 99.62], [106.0, 108.18], [110.0, 114.89], [116.0, 116.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [91.13, 0.0, 95.37, 0.0, 0.0, 0.0, 0.0, 0.0, 71.14, 0.0, 83.34, 76.04, 41.24, 42.35, 67.89, 67.89, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 67.84], ["animal", 10.66], ["horse", 2.92]], [["music", 69.14], ["synthesizer", 5.58], ["musical instrument", 5.06]], null, null, null], "duration": [2.4, 0.58, 2.8, -0.35, 0.15, 0.6, 0.49, 0.97, 7.34, 1.31, 2.66, 2.2, 22.98, 20.62, 2.18, 4.89, 0.02]} \ No newline at end of file diff --git a/annotations_filtered/qh1KCsqqHFY_filtered.json b/annotations_filtered/qh1KCsqqHFY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa43041cbdefeda9bf6003fde1873e82b5718ed0 --- /dev/null +++ b/annotations_filtered/qh1KCsqqHFY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.61], [7.0, 7.57], [8.0, 9.44], [10.0, 11.42], [15.0, 16.09], [18.0, 18.87], [20.0, 21.41], [22.0, 22.82], [26.0, 27.48], [29.0, 28.8], [29.0, 39.41], [41.0, 41.28], [42.0, 43.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.87, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 64.71], ["telephone bell ringing", 20.64], ["alarm clock", 4.85]], null, null], "duration": [2.61, 0.57, 1.44, 1.42, 1.09, 0.87, 1.41, 0.82, 1.48, -0.2, 10.41, 0.28, 1.7]} \ No newline at end of file diff --git a/annotations_filtered/qhAYzFv4HYc_filtered.json b/annotations_filtered/qhAYzFv4HYc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..614f3a1e5a6459cf2cd1d3f0e4d41e4ff15c88ca --- /dev/null +++ b/annotations_filtered/qhAYzFv4HYc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.85], [4.0, 5.48], [13.0, 15.04], [18.0, 24.09], [26.0, 30.64], [31.0, 32.31], [38.0, 37.96]], "keep_status": [false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 66.76, 34.31, 36.6, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 27.5], ["effects unit", 17.23], ["distortion", 13.48]], [["music", 23.91], ["hum", 12.32], ["speech", 5.21]], null, null], "duration": [-0.15, 1.48, 2.04, 6.09, 4.64, 1.31, -0.04]} \ No newline at end of file diff --git a/annotations_filtered/qhH634B4jGg_filtered.json b/annotations_filtered/qhH634B4jGg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..292178241501fecd2573ddc444393cc9ab866c5c --- /dev/null +++ b/annotations_filtered/qhH634B4jGg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 22.28], [25.0, 27.53], [29.0, 31.31], [34.0, 35.99], [37.0, 56.91], [58.0, 57.99], [64.0, 64.34], [66.0, 66.39], [67.0, 67.56], [72.0, 72.0], [74.0, 76.13], [78.0, 77.82], [81.0, 81.77], [83.0, 82.65], [85.0, 85.89], [91.0, 92.7], [108.0, 109.92], [112.0, 112.9], [114.0, 114.12], [115.0, 115.23], [119.0, 119.91], [124.0, 139.58]], "keep_status": [false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [54.83, 44.87, 51.6, 0.0, 38.16, 0.0, 0.0, 0.0, 0.0, 0.0, 44.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.51], "audiomae_on_audioset": [null, [["speech", 45.2], ["cattle, bovinae", 9.12], ["moo", 7.11]], null, null, [["speech", 69.65], ["sidetone", 6.74], ["breaking", 4.11]], null, null, null, null, null, [["speech", 27.81], ["moo", 15.26], ["cattle, bovinae", 8.6]], null, null, null, null, null, null, null, null, null, null, [["speech", 53.69], ["music", 30.82], ["clip-clop", 2.18]]], "duration": [2.28, 2.53, 2.31, 1.99, 19.91, -0.01, 0.34, 0.39, 0.56, 0.0, 2.13, -0.18, 0.77, -0.35, 0.89, 1.7, 1.92, 0.9, 0.12, 0.23, 0.91, 15.58]} \ No newline at end of file diff --git a/annotations_filtered/qhgkpZecrTY_filtered.json b/annotations_filtered/qhgkpZecrTY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fde4f5ac216d9cfeb4c61276110dcb919071dd2a --- /dev/null +++ b/annotations_filtered/qhgkpZecrTY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 23.03], [24.0, 27.45], [35.0, 35.83], [53.0, 58.99], [62.0, 64.23], [66.0, 67.04], [70.0, 73.48], [75.0, 80.18], [87.0, 88.53], [92.0, 96.45], [97.0, 98.51], [102.0, 105.63], [108.0, 111.62], [114.0, 119.85], [121.0, 131.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [64.75, 100.0, 0.0, 99.76, 100.0, 0.0, 100.0, 99.99, 0.0, 99.84, 0.0, 99.97, 100.0, 82.61, 89.9], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [20.03, 3.45, 0.83, 5.99, 2.23, 1.04, 3.48, 5.18, 1.53, 4.45, 1.51, 3.63, 3.62, 5.85, 10.45]} \ No newline at end of file diff --git a/annotations_filtered/qhquCQirt48_filtered.json b/annotations_filtered/qhquCQirt48_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..523dcdc5e2aa46d882cb76767a5e51f69a3d9f6f --- /dev/null +++ b/annotations_filtered/qhquCQirt48_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.45], [12.0, 13.44], [14.0, 15.03], [27.0, 28.22], [29.0, 29.93], [33.0, 33.88], [39.0, 38.97], [40.0, 40.88], [42.0, 43.07], [45.0, 45.42], [49.0, 50.06], [51.0, 51.63], [52.0, 53.03], [54.0, 53.69], [55.0, 55.93], [56.0, 56.52], [57.0, 57.62], [58.0, 59.43], [63.0, 64.4], [66.0, 66.19], [69.0, 69.84], [72.0, 73.67], [75.0, 79.07], [82.0, 83.24], [84.0, 85.36], [87.0, 87.47], [93.0, 93.8], [102.0, 103.0], [104.0, 105.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.45, 1.44, 1.03, 1.22, 0.93, 0.88, -0.03, 0.88, 1.07, 0.42, 1.06, 0.63, 1.03, -0.31, 0.93, 0.52, 0.62, 1.43, 1.4, 0.19, 0.84, 1.67, 4.07, 1.24, 1.36, 0.47, 0.8, 1.0, 1.73]} \ No newline at end of file diff --git a/annotations_filtered/qhxDQ1g964U_filtered.json b/annotations_filtered/qhxDQ1g964U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b657a93a66015f2d0940748e645fd77b88bebd0e --- /dev/null +++ b/annotations_filtered/qhxDQ1g964U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.48], [17.0, 17.93], [21.0, 22.33], [36.0, 40.12], [48.0, 47.66], [49.0, 50.45], [58.0, 59.73], [71.0, 118.35]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.67, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 55.85], ["speech", 22.44], ["synthesizer", 2.02]], null, null, null, null], "duration": [1.48, 0.93, 1.33, 4.12, -0.34, 1.45, 1.73, 47.35]} \ No newline at end of file diff --git a/annotations_filtered/qhzCkJXZVJg_filtered.json b/annotations_filtered/qhzCkJXZVJg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2045ef21fdf8e8bf4ed95a1b30c052722c2ad4c3 --- /dev/null +++ b/annotations_filtered/qhzCkJXZVJg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.75], [7.0, 9.36], [12.0, 21.15], [23.0, 23.48], [27.0, 27.14], [28.0, 56.57], [60.0, 60.18], [61.0, 73.09], [74.0, 75.29], [76.0, 79.88], [81.0, 81.03], [83.0, 88.05]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 43.33, 38.23, 0.0, 0.0, 34.28, 0.0, 30.2, 0.0, 30.72, 0.0, 31.97], "audiomae_on_audioset": [null, [["music", 37.75], ["speech", 30.72], ["hum", 4.94]], [["music", 83.01], ["throbbing", 2.08], ["hum", 1.49]], null, null, [["music", 76.52], ["speech", 12.01], ["synthesizer", 1.58]], null, [["music", 89.33], ["drum machine", 1.77], ["synthesizer", 1.48]], null, [["music", 58.09], ["carnatic music", 5.08], ["throbbing", 3.96]], null, [["music", 74.65], ["synthesizer", 4.89], ["musical instrument", 3.15]]], "duration": [1.75, 2.36, 9.15, 0.48, 0.14, 28.57, 0.18, 12.09, 1.29, 3.88, 0.03, 5.05]} \ No newline at end of file diff --git a/annotations_filtered/qiVy40O1_Lc_filtered.json b/annotations_filtered/qiVy40O1_Lc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/qiVy40O1_Lc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/qi_t-McN6Vk_filtered.json b/annotations_filtered/qi_t-McN6Vk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..06c7c9f531d4d76925f8b5b847db2dac9fc23cbf --- /dev/null +++ b/annotations_filtered/qi_t-McN6Vk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.16], [14.0, 30.05], [31.0, 31.56], [32.0, 37.62], [40.0, 40.51], [45.0, 44.95]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 30.52, 0.0, 31.38, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 44.12], ["music", 24.87], ["throbbing", 11.28]], null, [["sidetone", 34.83], ["speech", 34.11], ["music", 11.2]], null, null], "duration": [0.16, 16.05, 0.56, 5.62, 0.51, -0.05]} \ No newline at end of file diff --git a/annotations_filtered/qilGSZ9UWTc_filtered.json b/annotations_filtered/qilGSZ9UWTc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..503ef23beeb8fd028e2f8a38d54e17e2fb80a331 --- /dev/null +++ b/annotations_filtered/qilGSZ9UWTc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.48], [7.0, 7.82], [11.0, 12.99], [18.0, 22.77], [24.0, 25.27], [26.0, 43.28], [44.0, 48.15], [49.0, 61.87], [63.0, 115.92], [118.0, 132.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.96, 0.0, 99.71, 96.29, 84.8, 0.0, 97.54], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [1.48, 0.82, 1.99, 4.77, 1.27, 17.28, 4.15, 12.87, 52.92, 14.61]} \ No newline at end of file diff --git a/annotations_filtered/qj0L0g36IXU_filtered.json b/annotations_filtered/qj0L0g36IXU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe5b02242bcfd2805d0a2c6cc87ef8191716a8ad --- /dev/null +++ b/annotations_filtered/qj0L0g36IXU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.76], [5.0, 5.63], [6.0, 6.74], [9.0, 9.9], [12.0, 12.99], [13.0, 14.03], [15.0, 16.56], [32.0, 32.83], [62.0, 62.92], [70.0, 82.14], [83.0, 89.95], [91.0, 95.35], [98.0, 109.86], [111.0, 112.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.06, 54.17, 52.74, 57.72, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 68.02], ["hum", 4.77], ["music", 2.89]], null, null, null, null], "duration": [1.76, 0.63, 0.74, 0.9, 0.99, 1.03, 1.56, 0.83, 0.92, 12.14, 6.95, 4.35, 11.86, 1.53]} \ No newline at end of file diff --git a/annotations_filtered/qj3TqaXp2Mg_filtered.json b/annotations_filtered/qj3TqaXp2Mg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a76df2a2029fc305038ffeb478b0937a24e1fa35 --- /dev/null +++ b/annotations_filtered/qj3TqaXp2Mg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 11.6], [14.0, 14.89], [16.0, 16.17], [18.0, 17.66], [20.0, 20.95], [22.0, 30.35], [35.0, 44.37], [45.0, 48.24], [52.0, 56.84], [59.0, 62.18], [63.0, 63.22], [65.0, 68.91], [72.0, 83.81], [84.0, 87.02], [89.0, 90.34], [95.0, 99.35], [101.0, 101.82], [103.0, 114.34]], "keep_status": [false, false, false, false, false, true, false, false, true, true, false, true, true, true, false, false, false, true], "silence_prob": [42.74, 0.0, 0.0, 0.0, 0.0, 40.29, 41.24, 35.79, 45.14, 44.99, 0.0, 44.37, 39.05, 34.73, 0.0, 44.34, 0.0, 39.21], "audiomae_on_audioset": [[["sidetone", 44.73], ["speech", 28.85], ["whale vocalization", 10.41]], null, null, null, null, [["speech", 25.91], ["didgeridoo", 9.27], ["hum", 8.93]], [["speech", 60.35], ["hum", 9.17], ["sidetone", 6.35]], [["speech", 70.84], ["sidetone", 15.78], ["radio", 3.09]], [["hum", 17.78], ["rumble", 9.72], ["whale vocalization", 9.3]], [["speech", 29.58], ["hum", 10.43], ["rumble", 5.73]], null, [["speech", 29.75], ["noise", 12.82], ["whale vocalization", 6.49]], [["music", 35.0], ["didgeridoo", 11.09], ["hum", 7.49]], [["reverberation", 12.98], ["speech", 6.38], ["animal", 5.86]], null, [["speech", 64.5], ["sidetone", 7.05], ["music", 3.99]], null, [["mains hum", 23.8], ["hum", 16.92], ["fly, housefly", 13.43]]], "duration": [5.6, 0.89, 0.17, -0.34, 0.95, 8.35, 9.37, 3.24, 4.84, 3.18, 0.22, 3.91, 11.81, 3.02, 1.34, 4.35, 0.82, 11.34]} \ No newline at end of file diff --git a/annotations_filtered/qjFCVTpsIps_filtered.json b/annotations_filtered/qjFCVTpsIps_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a04a506439c2015561c33e5d3eb0ad285ee05268 --- /dev/null +++ b/annotations_filtered/qjFCVTpsIps_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.83], [11.0, 12.48], [14.0, 24.12], [25.0, 29.03], [30.0, 30.48], [37.0, 44.19], [44.0, 66.93], [69.0, 71.78], [74.0, 77.26], [78.0, 79.42], [81.0, 89.58], [95.0, 95.61], [96.0, 101.44], [105.0, 107.11]], "keep_status": [true, false, false, false, false, false, false, false, true, false, false, false, true, true], "silence_prob": [38.11, 0.0, 33.11, 34.08, 0.0, 32.89, 32.77, 31.62, 33.38, 0.0, 33.94, 0.0, 32.96, 34.57], "audiomae_on_audioset": [[["mechanisms", 27.44], ["gears", 14.06], ["speech", 11.36]], null, [["music", 55.23], ["fart", 8.33], ["trombone", 7.21]], [["trombone", 38.63], ["brass instrument", 22.71], ["music", 21.92]], null, [["music", 72.77], ["speech", 5.52], ["trombone", 3.45]], [["music", 59.09], ["hum", 7.17], ["speech", 7.15]], [["music", 35.87], ["sidetone", 25.13], ["speech", 13.6]], [["music", 46.4], ["speech", 15.1], ["didgeridoo", 4.45]], null, [["music", 80.39], ["drum machine", 2.49], ["musical instrument", 2.12]], null, [["music", 44.61], ["mosquito", 4.49], ["fly, housefly", 3.55]], [["music", 46.97], ["speech", 13.68], ["musical instrument", 3.46]]], "duration": [3.83, 1.48, 10.12, 4.03, 0.48, 7.19, 22.93, 2.78, 3.26, 1.42, 8.58, 0.61, 5.44, 2.11]} \ No newline at end of file diff --git a/annotations_filtered/qjJnk3MgNgc_filtered.json b/annotations_filtered/qjJnk3MgNgc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60fe87650ac0340a722f05a5e7fe3adb07386a25 --- /dev/null +++ b/annotations_filtered/qjJnk3MgNgc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.86], [10.0, 10.42], [13.0, 13.68], [21.0, 21.51], [29.0, 36.73], [39.0, 38.97], [44.0, 44.15], [47.0, 46.89], [51.0, 51.53], [55.0, 55.46], [57.0, 58.11], [66.0, 66.61], [74.0, 74.24], [75.0, 76.55], [77.0, 78.76], [79.0, 84.1], [86.0, 88.05], [93.0, 95.79], [99.0, 101.53], [104.0, 105.71], [110.0, 110.42], [111.0, 111.55], [112.0, 112.43], [113.0, 113.12], [114.0, 113.97], [119.0, 119.2], [126.0, 127.13], [129.0, 128.92], [132.0, 132.36], [134.0, 138.74], [140.0, 142.3], [143.0, 146.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.34, 51.34, 42.13, 45.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.31, 34.65, 34.42], "audiomae_on_audioset": [null, null, null, null, [["music", 58.55], ["synthesizer", 8.26], ["hum", 7.89]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 37.91], ["hum", 17.16], ["speech", 7.23]], [["music", 52.24], ["guitar", 6.77], ["plucked string instrument", 5.44]], null, null, null, null, null, null, null, null, null, null, [["music", 57.26], ["synthesizer", 5.78], ["ambient music", 5.28]], [["music", 32.46], ["speech", 31.19], ["synthesizer", 13.93]], [["music", 68.15], ["synthesizer", 7.35], ["electronic music", 6.29]]], "duration": [0.86, 0.42, 0.68, 0.51, 7.73, -0.03, 0.15, -0.11, 0.53, 0.46, 1.11, 0.61, 0.24, 1.55, 1.76, 5.1, 2.05, 2.79, 2.53, 1.71, 0.42, 0.55, 0.43, 0.12, -0.03, 0.2, 1.13, -0.08, 0.36, 4.74, 2.3, 3.16]} \ No newline at end of file diff --git a/annotations_filtered/qjUsrdzDbuY_filtered.json b/annotations_filtered/qjUsrdzDbuY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0cdee922285d16d159e5627be1429db2e690451a --- /dev/null +++ b/annotations_filtered/qjUsrdzDbuY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 20.38], [22.0, 22.94], [23.0, 23.16], [27.0, 26.79], [28.0, 28.16], [28.0, 30.03], [31.0, 30.86], [34.0, 34.11], [35.0, 35.73], [37.0, 37.35], [38.0, 39.68], [43.0, 48.25], [50.0, 50.97], [52.0, 66.66], [73.0, 73.72], [74.0, 74.68], [76.0, 76.62], [79.0, 79.88], [82.0, 82.51], [83.0, 84.35], [85.0, 86.09], [90.0, 92.21], [92.0, 94.27], [95.0, 96.23], [97.0, 98.19], [99.0, 98.93], [106.0, 107.27], [110.0, 111.43], [113.0, 114.74], [116.0, 118.66]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [49.45, 0.0, 0.0, 0.0, 0.0, 39.24, 0.0, 0.0, 0.0, 0.0, 0.0, 84.43, 0.0, 37.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.97, 43.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.62], "audiomae_on_audioset": [[["speech", 70.56], ["hum", 4.42], ["radio", 3.2]], null, null, null, null, [["speech", 47.86], ["music", 6.65], ["coin (dropping)", 3.77]], null, null, null, null, null, null, null, [["music", 45.36], ["speech", 23.51], ["sidetone", 6.59]], null, null, null, null, null, null, null, null, [["music", 37.41], ["speech", 9.69], ["singing bowl", 6.84]], null, null, null, null, null, null, [["speech", 33.27], ["music", 17.45], ["hum", 16.64]]], "duration": [9.38, 0.94, 0.16, -0.21, 0.16, 2.03, -0.14, 0.11, 0.73, 0.35, 1.68, 5.25, 0.97, 14.66, 0.72, 0.68, 0.62, 0.88, 0.51, 1.35, 1.09, 2.21, 2.27, 1.23, 1.19, -0.07, 1.27, 1.43, 1.74, 2.66]} \ No newline at end of file diff --git a/annotations_filtered/qjYP7J3oP9Q_filtered.json b/annotations_filtered/qjYP7J3oP9Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c5ba12ba3c8caf01a9e17bda9358175018c2393f --- /dev/null +++ b/annotations_filtered/qjYP7J3oP9Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.57], [13.0, 17.39], [19.0, 19.95], [22.0, 26.37], [29.0, 33.13], [34.0, 34.97], [36.0, 39.61], [42.0, 43.51], [45.0, 48.69], [51.0, 51.93], [53.0, 55.49], [57.0, 60.91], [62.0, 63.91], [66.0, 68.45], [71.0, 76.71], [78.0, 80.4], [82.0, 85.63], [87.0, 96.94], [100.0, 102.78], [105.0, 108.87], [109.0, 108.94], [110.0, 112.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 99.99, 0.0, 100.0, 100.0, 0.0, 100.0, 0.0, 100.0, 0.0, 100.0, 100.0, 0.0, 100.0, 100.0, 100.0, 100.0, 100.0, 100.0, 79.76, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.57, 4.39, 0.95, 4.37, 4.13, 0.97, 3.61, 1.51, 3.69, 0.93, 2.49, 3.91, 1.91, 2.45, 5.71, 2.4, 3.63, 9.94, 2.78, 3.87, -0.06, 2.5]} \ No newline at end of file diff --git a/annotations_filtered/qjhh_5PMBZs_filtered.json b/annotations_filtered/qjhh_5PMBZs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..505e4837de1c532b39c2de40a9c8d657c8e4664d --- /dev/null +++ b/annotations_filtered/qjhh_5PMBZs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.84], [3.0, 4.01], [5.0, 5.05], [10.0, 10.4], [12.0, 13.71], [14.0, 22.71], [23.0, 36.59]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 31.63, 34.61], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 84.21], ["telephone bell ringing", 2.91], ["telephone", 2.89]], [["speech", 58.81], ["music", 11.27], ["buzzer", 6.34]]], "duration": [1.84, 1.01, 0.05, 0.4, 1.71, 8.71, 13.59]} \ No newline at end of file diff --git a/annotations_filtered/qjqJtri_EG4_filtered.json b/annotations_filtered/qjqJtri_EG4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..62670efc11c7a046abeb55f3d614da3c1eecaf7f --- /dev/null +++ b/annotations_filtered/qjqJtri_EG4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.81], [17.0, 17.09], [28.0, 28.68], [37.0, 38.77], [43.0, 46.23], [51.0, 50.95], [53.0, 54.77], [56.0, 57.1], [58.0, 58.43], [60.0, 61.99], [73.0, 73.63], [90.0, 90.54], [93.0, 93.34], [94.0, 94.56], [95.0, 96.31], [100.0, 100.5], [109.0, 112.95], [122.0, 122.59], [124.0, 125.2], [134.0, 135.57], [137.0, 137.39], [141.0, 141.88], [151.0, 151.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [62.37, 0.0, 0.0, 0.0, 98.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 73.1], ["electronic music", 3.03], ["ambient music", 2.99]], null, null, null, null, null, null], "duration": [2.81, 0.09, 0.68, 1.77, 3.23, -0.05, 1.77, 1.1, 0.43, 1.99, 0.63, 0.54, 0.34, 0.56, 1.31, 0.5, 3.95, 0.59, 1.2, 1.57, 0.39, 0.88, 0.65]} \ No newline at end of file diff --git a/annotations_filtered/qkGDaroLl_M_filtered.json b/annotations_filtered/qkGDaroLl_M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13c73b177191e24b2e13eff9d1d73f5895039263 --- /dev/null +++ b/annotations_filtered/qkGDaroLl_M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.19], [13.0, 13.2], [35.0, 34.62], [35.0, 34.65], [35.0, 35.5], [36.0, 35.56], [47.0, 49.15], [72.0, 72.66]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.67, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 69.27], ["synthetic singing", 5.53], ["sidetone", 3.69]], null], "duration": [1.19, 0.2, -0.38, -0.35, 0.5, -0.44, 2.15, 0.66]} \ No newline at end of file diff --git a/annotations_filtered/qkHSTpTqlug_filtered.json b/annotations_filtered/qkHSTpTqlug_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a3fbc070ea1a9fde281d7bb790f0a9c19006f60 --- /dev/null +++ b/annotations_filtered/qkHSTpTqlug_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 23.52], [24.0, 24.83], [26.0, 27.35], [29.0, 33.83], [41.0, 42.28], [43.0, 45.2], [48.0, 52.17], [53.0, 55.92], [57.0, 57.72], [58.0, 60.79], [63.0, 62.61], [64.0, 65.79], [66.0, 94.39], [97.0, 102.79], [106.0, 107.37], [109.0, 111.43], [115.0, 121.36], [123.0, 124.26]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [80.64, 0.0, 0.0, 69.74, 0.0, 90.78, 51.23, 77.53, 0.0, 41.2, 0.0, 0.0, 51.5, 75.39, 0.0, 55.53, 97.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 11.88], ["thunk", 11.88], ["rumble", 7.6]], null, null, null, null, null, null, null, null], "duration": [2.52, 0.83, 1.35, 4.83, 1.28, 2.2, 4.17, 2.92, 0.72, 2.79, -0.39, 1.79, 28.39, 5.79, 1.37, 2.43, 6.36, 1.26]} \ No newline at end of file diff --git a/annotations_filtered/qkVImymH0A0_filtered.json b/annotations_filtered/qkVImymH0A0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d0557ddcdfab0d00651230a3cb40ff62a0834eb2 --- /dev/null +++ b/annotations_filtered/qkVImymH0A0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.44], [5.0, 6.72], [8.0, 8.99], [10.0, 11.03], [12.0, 13.41], [15.0, 52.29], [53.0, 53.74], [55.0, 55.44], [56.0, 58.09], [59.0, 60.78], [63.0, 63.46], [64.0, 64.52], [65.0, 69.18], [70.0, 70.77], [71.0, 77.89], [86.0, 86.14], [87.0, 87.83], [107.0, 112.65], [120.0, 121.37], [125.0, 128.53], [136.0, 136.8], [138.0, 138.6], [143.0, 145.02], [150.0, 152.59], [153.0, 153.74], [154.0, 154.41], [157.0, 157.1], [158.0, 158.8], [162.0, 163.07], [167.0, 170.8], [175.0, 178.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 99.36, 0.0, 99.56, 0.0, 0.0, 35.45, 0.0, 34.28, 0.0, 0.0, 40.97, 44.93, 0.0, 0.0, 0.0, 0.0, 0.0, 33.24, 38.06], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 70.39], ["speech", 5.65], ["sidetone", 3.94]], null, [["cattle, bovinae", 27.39], ["moo", 21.4], ["whale vocalization", 13.0]], null, null, [["speech", 20.76], ["music", 11.87], ["fly, housefly", 7.15]], [["music", 62.87], ["croak", 2.19], ["frog", 2.16]], null, null, null, null, null, [["music", 66.02], ["speech", 7.65], ["groan", 3.24]], [["music", 55.0], ["fart", 5.4], ["music of latin america", 3.34]]], "duration": [0.44, 1.72, 0.99, 1.03, 1.41, 37.29, 0.74, 0.44, 2.09, 1.78, 0.46, 0.52, 4.18, 0.77, 6.89, 0.14, 0.83, 5.65, 1.37, 3.53, 0.8, 0.6, 2.02, 2.59, 0.74, 0.41, 0.1, 0.8, 1.07, 3.8, 3.85]} \ No newline at end of file diff --git a/annotations_filtered/qkjpTwOa0GY_filtered.json b/annotations_filtered/qkjpTwOa0GY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c15f0b7a971a7bddb93920a8ea2990bde8842820 --- /dev/null +++ b/annotations_filtered/qkjpTwOa0GY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[66.0, 68.84], [71.0, 80.65], [82.0, 83.66], [86.0, 86.8], [89.0, 102.36], [102.0, 103.91], [107.0, 112.48], [114.0, 114.71], [118.0, 128.33]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [96.54, 98.19, 0.0, 0.0, 71.72, 0.0, 98.73, 0.0, 31.24], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 59.05], ["music", 20.7], ["echo", 2.47]]], "duration": [2.84, 9.65, 1.66, 0.8, 13.36, 1.91, 5.48, 0.71, 10.33]} \ No newline at end of file diff --git a/annotations_filtered/ql0DycjR8wQ_filtered.json b/annotations_filtered/ql0DycjR8wQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c1534b966793d2f1b09ee79200ac5d8844fe1090 --- /dev/null +++ b/annotations_filtered/ql0DycjR8wQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 25.02], [32.0, 32.73], [56.0, 56.61], [58.0, 58.41], [66.0, 66.19], [68.0, 71.56], [72.0, 73.82]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 90.43, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [1.02, 0.73, 0.61, 0.41, 0.19, 3.56, 1.82]} \ No newline at end of file diff --git a/annotations_filtered/ql5i_tg-wZY_filtered.json b/annotations_filtered/ql5i_tg-wZY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e25b2a639603bc8b016246968ae471a8db8cb240 --- /dev/null +++ b/annotations_filtered/ql5i_tg-wZY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.84], [3.0, 2.88], [3.0, 2.91], [3.0, 2.94], [3.0, 2.98], [3.0, 3.01], [3.0, 3.05], [3.0, 3.18], [3.0, 3.21], [12.0, 14.13], [19.0, 19.52], [21.0, 21.54], [33.0, 35.19], [36.0, 37.56], [39.0, 40.12], [48.0, 56.22], [59.0, 60.71], [66.0, 66.04], [67.0, 67.9], [71.0, 71.2], [72.0, 72.5], [75.0, 75.39], [82.0, 83.37], [85.0, 85.16], [88.0, 87.57], [89.0, 89.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.63, 0.0, 0.0, 52.39, 0.0, 0.0, 55.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.16, -0.12, -0.09, -0.06, -0.02, 0.01, 0.05, 0.18, 0.21, 2.13, 0.52, 0.54, 2.19, 1.56, 1.12, 8.22, 1.71, 0.04, 0.9, 0.2, 0.5, 0.39, 1.37, 0.16, -0.43, 0.85]} \ No newline at end of file diff --git a/annotations_filtered/qlUmBE6uGu8_filtered.json b/annotations_filtered/qlUmBE6uGu8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..85e14ca0ee4b377b2aaf7b9b296941fa3643eefb --- /dev/null +++ b/annotations_filtered/qlUmBE6uGu8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.55], [14.0, 14.18], [16.0, 15.85], [16.0, 18.52], [21.0, 21.34], [23.0, 29.96], [47.0, 50.79], [59.0, 60.22], [61.0, 62.34], [75.0, 77.72], [78.0, 80.15], [81.0, 84.59], [85.0, 85.75], [95.0, 94.73], [103.0, 104.41], [113.0, 114.35], [115.0, 118.72], [119.0, 120.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 53.16, 0.0, 33.2, 84.8, 0.0, 0.0, 63.96, 57.4, 55.11, 0.0, 0.0, 0.0, 0.0, 69.34, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 61.3], ["speech", 19.1], ["drum", 6.45]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.55, 0.18, -0.15, 2.52, 0.34, 6.96, 3.79, 1.22, 1.34, 2.72, 2.15, 3.59, 0.75, -0.27, 1.41, 1.35, 3.72, 1.11]} \ No newline at end of file diff --git a/annotations_filtered/ql_VifCJG7I_filtered.json b/annotations_filtered/ql_VifCJG7I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0edc3a814146a278f2cbc28aae515d6a7e4e6237 --- /dev/null +++ b/annotations_filtered/ql_VifCJG7I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.06], [8.0, 13.74], [17.0, 17.05], [32.0, 32.85], [34.0, 34.67], [36.0, 38.23], [40.0, 40.66], [41.0, 48.79], [49.0, 61.33]], "keep_status": [true, false, false, false, false, false, false, false, false], "silence_prob": [36.52, 38.19, 0.0, 0.0, 0.0, 56.25, 0.0, 51.55, 30.32], "audiomae_on_audioset": [[["music", 38.24], ["mains hum", 15.1], ["hum", 13.61]], [["music", 53.76], ["electronic music", 11.6], ["speech", 7.54]], null, null, null, null, null, null, [["music", 67.29], ["speech", 12.53], ["sound effect", 1.99]]], "duration": [3.06, 5.74, 0.05, 0.85, 0.67, 2.23, 0.66, 7.79, 12.33]} \ No newline at end of file diff --git a/annotations_filtered/qlfI_AppyIk_filtered.json b/annotations_filtered/qlfI_AppyIk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce3f04a5f138e2af5576853eaea4cf520b4972a5 --- /dev/null +++ b/annotations_filtered/qlfI_AppyIk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.81], [4.0, 5.49], [6.0, 6.25], [9.0, 16.5], [20.0, 24.83], [27.0, 32.9], [36.0, 39.26], [42.0, 46.18], [48.0, 53.32], [54.0, 58.85], [70.0, 73.6], [75.0, 92.5], [93.0, 95.79], [96.0, 107.18], [108.0, 117.86], [119.0, 120.53], [121.0, 123.18], [124.0, 130.55]], "keep_status": [false, false, false, false, false, true, false, true, false, true, false, true, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 99.98, 42.06, 57.56, 43.23, 81.89, 33.75, 50.71, 37.03, 37.78, 30.45, 76.2, 0.0, 64.07, 69.61], "audiomae_on_audioset": [null, null, null, null, null, [["music", 26.8], ["speech", 12.78], ["singing bowl", 12.33]], null, [["hum", 20.21], ["mains hum", 12.75], ["music", 12.04]], null, [["speech", 40.1], ["hum", 17.27], ["music", 11.73]], null, [["music", 26.94], ["hum", 10.5], ["thunk", 6.48]], [["chirp tone", 29.29], ["sine wave", 26.75], ["music", 10.34]], [["speech", 37.78], ["sonar", 13.11], ["hum", 11.8]], null, null, null, null], "duration": [1.81, 1.49, 0.25, 7.5, 4.83, 5.9, 3.26, 4.18, 5.32, 4.85, 3.6, 17.5, 2.79, 11.18, 9.86, 1.53, 2.18, 6.55]} \ No newline at end of file diff --git a/annotations_filtered/qlrpmMPkRUM_filtered.json b/annotations_filtered/qlrpmMPkRUM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/qlrpmMPkRUM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/qlwQsJOKoIo_filtered.json b/annotations_filtered/qlwQsJOKoIo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d07e8368359f6678e26196275dfcad1500ef32c2 --- /dev/null +++ b/annotations_filtered/qlwQsJOKoIo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 18.72], [19.0, 19.21], [20.0, 20.19], [21.0, 29.27], [31.0, 32.37], [36.0, 36.27], [36.0, 44.0], [44.0, 45.47], [49.0, 49.59], [54.0, 56.39], [58.0, 58.82], [62.0, 62.48], [73.0, 89.45], [90.0, 91.59], [94.0, 99.22]], "keep_status": [true, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [41.09, 0.0, 0.0, 41.42, 0.0, 0.0, 49.82, 0.0, 0.0, 42.19, 0.0, 0.0, 60.98, 0.0, 73.97], "audiomae_on_audioset": [[["beatboxing", 25.33], ["noise", 24.02], ["speech", 12.93]], null, null, [["speech", 38.15], ["noise", 15.96], ["fart", 7.49]], null, null, [["speech", 53.05], ["radio", 10.54], ["sidetone", 8.83]], null, null, [["speech", 72.91], ["electric shaver, electric razor", 5.58], ["noise", 4.32]], null, null, null, null, null], "duration": [5.72, 0.21, 0.19, 8.27, 1.37, 0.27, 8.0, 1.47, 0.59, 2.39, 0.82, 0.48, 16.45, 1.59, 5.22]} \ No newline at end of file diff --git a/annotations_filtered/qmBAF_JTwDs_filtered.json b/annotations_filtered/qmBAF_JTwDs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..33f6b1086620bbdbe71369e43fe667432b369221 --- /dev/null +++ b/annotations_filtered/qmBAF_JTwDs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.06], [14.0, 32.88], [39.0, 85.73], [88.0, 88.69]], "keep_status": [false, true, false, false], "silence_prob": [0.0, 37.75, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 47.87], ["speech", 8.32], ["buzz", 6.49]], null, null], "duration": [1.06, 18.88, 46.73, 0.69]} \ No newline at end of file diff --git a/annotations_filtered/qnFWCagTOtw_filtered.json b/annotations_filtered/qnFWCagTOtw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..175d1f3d6b6cf5973d9f9e8c2ef987f127ba5144 --- /dev/null +++ b/annotations_filtered/qnFWCagTOtw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.21], [26.0, 26.43], [45.0, 45.87], [63.0, 63.59], [64.0, 68.4], [70.0, 70.24], [72.0, 72.12], [73.0, 73.21], [73.0, 74.88], [79.0, 79.12], [80.0, 79.84], [81.0, 81.24], [82.0, 82.05], [87.0, 87.35], [88.0, 89.75], [98.0, 98.76], [113.0, 113.64], [120.0, 120.72], [121.0, 122.34], [127.0, 127.74], [128.0, 128.09], [136.0, 136.53], [137.0, 140.98], [142.0, 143.18], [144.0, 144.66], [145.0, 144.96], [148.0, 149.64], [151.0, 152.0], [161.0, 161.76], [162.0, 165.37], [166.0, 167.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 58.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.65, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.21, 0.43, 0.87, 0.59, 4.4, 0.24, 0.12, 0.21, 1.88, 0.12, -0.16, 0.24, 0.05, 0.35, 1.75, 0.76, 0.64, 0.72, 1.34, 0.74, 0.09, 0.53, 3.98, 1.18, 0.66, -0.04, 1.64, 1.0, 0.76, 3.37, 1.19]} \ No newline at end of file diff --git a/annotations_filtered/qnNr8etyi08_filtered.json b/annotations_filtered/qnNr8etyi08_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6a10964123156bcf77995ca3892aef356a51c745 --- /dev/null +++ b/annotations_filtered/qnNr8etyi08_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.5], [15.0, 16.36], [18.0, 19.35], [22.0, 23.45], [33.0, 33.94], [40.0, 43.55], [47.0, 73.97], [76.0, 86.27], [88.0, 90.1]], "keep_status": [false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 39.11, 59.51, 46.54, 44.4], "audiomae_on_audioset": [null, null, null, null, null, [["didgeridoo", 41.1], ["speech", 17.81], ["music", 14.63]], null, [["hum", 31.43], ["mains hum", 21.34], ["music", 16.09]], [["buzz", 24.8], ["music", 14.96], ["hum", 8.39]]], "duration": [1.5, 1.36, 1.35, 1.45, 0.94, 3.55, 26.97, 10.27, 2.1]} \ No newline at end of file diff --git a/annotations_filtered/qnVGIFPFry8_filtered.json b/annotations_filtered/qnVGIFPFry8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..058e2105ca06263da62e8403f9261619e11bbc34 --- /dev/null +++ b/annotations_filtered/qnVGIFPFry8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 28.17], [38.0, 38.58], [41.0, 42.16], [45.0, 50.55], [53.0, 53.64], [56.0, 57.11], [57.0, 58.46], [59.0, 60.05], [61.0, 62.77], [71.0, 71.69], [78.0, 78.39], [81.0, 81.68], [85.0, 86.91], [91.0, 91.99], [96.0, 106.35], [109.0, 110.81], [112.0, 112.97], [118.0, 119.06], [121.0, 121.98], [124.0, 131.65], [133.0, 133.91], [134.0, 134.67], [135.0, 136.73], [137.0, 138.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [37.8, 0.0, 0.0, 43.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.46, 0.0, 0.0, 0.0, 0.0, 99.36, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 54.16], ["speech", 12.67], ["electronic music", 6.12]], null, null, [["throbbing", 38.17], ["music", 29.27], ["hum", 18.73]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.17, 0.58, 1.16, 5.55, 0.64, 1.11, 1.46, 1.05, 1.77, 0.69, 0.39, 0.68, 1.91, 0.99, 10.35, 1.81, 0.97, 1.06, 0.98, 7.65, 0.91, 0.67, 1.73, 1.27]} \ No newline at end of file diff --git a/annotations_filtered/qo1cSaFhPiQ_filtered.json b/annotations_filtered/qo1cSaFhPiQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f8034e0417452d2810dadd4b24bd3851fce7e063 --- /dev/null +++ b/annotations_filtered/qo1cSaFhPiQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 25.27], [28.0, 28.8], [31.0, 41.4], [46.0, 46.3], [48.0, 47.97], [52.0, 54.33], [55.0, 55.73], [56.0, 58.24], [59.0, 59.37], [59.0, 59.49], [63.0, 63.76], [65.0, 66.16], [68.0, 69.3], [72.0, 72.3], [74.0, 73.84], [76.0, 77.62], [79.0, 82.88]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 33.97, 0.0, 0.0, 44.66, 0.0, 95.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.42], "audiomae_on_audioset": [null, null, [["fly, housefly", 64.72], ["insect", 25.26], ["mosquito", 4.51]], null, null, [["radio", 27.95], ["speech", 25.15], ["sidetone", 5.51]], null, null, null, null, null, null, null, null, null, null, [["speech", 30.2], ["explosion", 10.47], ["burst, pop", 4.22]]], "duration": [1.27, 0.8, 10.4, 0.3, -0.03, 2.33, 0.73, 2.24, 0.37, 0.49, 0.76, 1.16, 1.3, 0.3, -0.16, 1.62, 3.88]} \ No newline at end of file diff --git a/annotations_filtered/qoWjU8OAUaU_filtered.json b/annotations_filtered/qoWjU8OAUaU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0ff772000727d6baf8a9ed272d91fb207a9f2fc --- /dev/null +++ b/annotations_filtered/qoWjU8OAUaU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.57], [4.0, 4.92], [6.0, 7.82], [10.0, 13.19], [16.0, 17.12], [18.0, 18.79], [19.0, 20.7], [22.0, 22.98], [24.0, 28.07], [29.0, 30.23], [31.0, 31.67], [33.0, 34.64], [36.0, 46.97], [51.0, 63.22], [64.0, 64.62], [65.0, 73.38], [77.0, 86.36], [88.0, 95.74], [97.0, 100.2], [101.0, 104.25], [105.0, 106.3], [107.0, 108.38], [110.0, 110.47], [111.0, 112.06], [113.0, 114.81], [116.0, 117.93], [118.0, 121.59], [123.0, 124.83], [126.0, 128.8], [129.0, 129.44]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, true, false, false, true, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 39.24, 0.0, 0.0, 0.0, 0.0, 36.61, 0.0, 0.0, 0.0, 31.22, 43.18, 0.0, 35.2, 45.49, 55.46, 62.68, 48.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.43, 0.0, 81.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 58.27], ["sidetone", 11.24], ["hum", 5.78]], null, null, null, null, [["eruption", 20.89], ["hum", 17.65], ["throbbing", 9.36]], null, null, null, [["explosion", 42.96], ["burst, pop", 24.55], ["gunshot, gunfire", 7.35]], [["speech", 14.2], ["hum", 11.67], ["grunt", 6.26]], null, [["speech", 68.98], ["music", 3.57], ["outside, rural or natural", 1.78]], [["wind chime", 12.14], ["glass", 7.33], ["eruption", 6.84]], null, null, [["speech", 47.86], ["hum", 11.97], ["mains hum", 4.9]], null, null, null, null, null, null, [["speech", 46.83], ["hum", 13.33], ["throbbing", 6.07]], null, null, null], "duration": [1.57, 0.92, 1.82, 3.19, 1.12, 0.79, 1.7, 0.98, 4.07, 1.23, 0.67, 1.64, 10.97, 12.22, 0.62, 8.38, 9.36, 7.74, 3.2, 3.25, 1.3, 1.38, 0.47, 1.06, 1.81, 1.93, 3.59, 1.83, 2.8, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/qoXJJin1e7g_filtered.json b/annotations_filtered/qoXJJin1e7g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..511f1e8191aba0f3a42801a771eea6f4f80a2bb5 --- /dev/null +++ b/annotations_filtered/qoXJJin1e7g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.85], [19.0, 19.85], [28.0, 28.41], [31.0, 31.7], [34.0, 44.96], [54.0, 54.43], [59.0, 60.66], [62.0, 61.96], [63.0, 70.87], [72.0, 72.62], [74.0, 74.71], [81.0, 82.34], [89.0, 89.88], [93.0, 95.99], [101.0, 103.25], [104.0, 107.91], [109.0, 110.34], [112.0, 112.7]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 49.22, 0.0, 0.0, 0.0, 43.25, 0.0, 0.0, 0.0, 0.0, 45.49, 42.04, 40.86, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["hum", 22.93], ["rumble", 17.09], ["music", 15.84]], null, null, null, [["hum", 37.33], ["mains hum", 25.32], ["throbbing", 12.05]], null, null, null, null, [["creak", 19.65], ["vehicle", 5.96], ["fly, housefly", 5.42]], [["telephone", 80.82], ["telephone bell ringing", 13.59], ["ringtone", 1.93]], [["music", 18.99], ["hum", 8.35], ["synthesizer", 7.57]], null, null], "duration": [0.85, 0.85, 0.41, 0.7, 10.96, 0.43, 1.66, -0.04, 7.87, 0.62, 0.71, 1.34, 0.88, 2.99, 2.25, 3.91, 1.34, 0.7]} \ No newline at end of file diff --git a/annotations_filtered/qoftQY-P85o_filtered.json b/annotations_filtered/qoftQY-P85o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3bc5d245d8074d6639c89047533ac49aaa99fb0 --- /dev/null +++ b/annotations_filtered/qoftQY-P85o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 15.15], [16.0, 32.27], [34.0, 38.5], [42.0, 75.74], [77.0, 77.62], [80.0, 81.63], [84.0, 93.45]], "keep_status": [true, true, false, false, false, false, false], "silence_prob": [34.77, 30.54, 31.1, 0.0, 0.0, 0.0, 40.71], "audiomae_on_audioset": [[["music", 19.84], ["speech", 16.25], ["musical instrument", 5.45]], [["speech", 43.28], ["music", 13.71], ["buzz", 10.61]], [["music", 59.72], ["hum", 11.97], ["mains hum", 8.9]], null, null, null, [["music", 34.27], ["crow", 26.76], ["caw", 12.23]]], "duration": [3.15, 16.27, 4.5, 33.74, 0.62, 1.63, 9.45]} \ No newline at end of file diff --git a/annotations_filtered/qokWn0jfbM4_filtered.json b/annotations_filtered/qokWn0jfbM4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..82fae41675c3c5fe3a1437e3e840591070bae5a7 --- /dev/null +++ b/annotations_filtered/qokWn0jfbM4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 16.33], [25.0, 29.62], [33.0, 36.91], [41.0, 52.88], [54.0, 54.68], [56.0, 56.61], [58.0, 60.35], [71.0, 75.42], [82.0, 85.28], [88.0, 87.99], [89.0, 89.63], [92.0, 92.77], [94.0, 95.18], [99.0, 104.7], [107.0, 107.7], [122.0, 122.25], [128.0, 128.46]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.77, 99.76, 97.92, 35.57, 0.0, 0.0, 33.11, 35.23, 39.93, 0.0, 0.0, 0.0, 0.0, 43.15, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 43.8], ["speech", 21.56], ["outside, rural or natural", 3.01]], null, null, [["music", 70.95], ["synthesizer", 5.76], ["hum", 3.56]], null, null, [["music", 68.04], ["hum", 3.98], ["synthesizer", 2.88]], [["music", 60.3], ["speech", 12.62], ["scary music", 8.59]], [["music", 72.69], ["scary music", 4.75], ["musical instrument", 3.62]], null, null, null, null, [["music", 70.06], ["hum", 6.23], ["mains hum", 3.73]], null, null, null], "duration": [13.33, 4.62, 3.91, 11.88, 0.68, 0.61, 2.35, 4.42, 3.28, -0.01, 0.63, 0.77, 1.18, 5.7, 0.7, 0.25, 0.46]} \ No newline at end of file diff --git a/annotations_filtered/qopdYE3_QoU_filtered.json b/annotations_filtered/qopdYE3_QoU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a6372d9373978963e61a0a7859d53a36de6443b --- /dev/null +++ b/annotations_filtered/qopdYE3_QoU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.67], [6.0, 8.19], [20.0, 20.85], [22.0, 22.4], [26.0, 27.04], [29.0, 29.64], [31.0, 31.28], [32.0, 32.8], [42.0, 46.55], [51.0, 59.27], [64.0, 71.63], [72.0, 88.52], [89.0, 94.76], [96.0, 103.05], [104.0, 106.15], [107.0, 112.78], [113.0, 113.97]], "keep_status": [false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.94, 32.21, 94.81, 96.29, 99.84, 90.95, 99.59, 93.6, 0.0], "audiomae_on_audioset": [null, [["speech", 16.41], ["throbbing", 8.91], ["hum", 7.46]], null, null, null, null, null, null, [["music", 17.64], ["speech", 15.77], ["vehicle", 11.01]], [["music", 49.06], ["sidetone", 13.44], ["speech", 12.54]], null, null, null, null, null, null, null], "duration": [0.67, 2.19, 0.85, 0.4, 1.04, 0.64, 0.28, 0.8, 4.55, 8.27, 7.63, 16.52, 5.76, 7.05, 2.15, 5.78, 0.97]} \ No newline at end of file diff --git a/annotations_filtered/qoxMZtAmAiI_filtered.json b/annotations_filtered/qoxMZtAmAiI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb2c824a2574b29faa77b74f399c513b48cf1c1f --- /dev/null +++ b/annotations_filtered/qoxMZtAmAiI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.43], [13.0, 24.81], [28.0, 29.88], [31.0, 35.56], [41.0, 41.57], [45.0, 54.45], [58.0, 58.26], [66.0, 67.27], [72.0, 72.49], [76.0, 76.08], [78.0, 77.89], [82.0, 81.89], [83.0, 90.12], [91.0, 91.56], [94.0, 94.46], [97.0, 97.23], [101.0, 101.65]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.05, 0.0, 30.25, 0.0, 90.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 68.91], ["hum", 8.89], ["throbbing", 8.79]], null, [["music", 51.36], ["hum", 6.84], ["noise", 4.52]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.43, 11.81, 1.88, 4.56, 0.57, 9.45, 0.26, 1.27, 0.49, 0.08, -0.11, -0.11, 7.12, 0.56, 0.46, 0.23, 0.65]} \ No newline at end of file diff --git a/annotations_filtered/qp-Jr4oEFWo_filtered.json b/annotations_filtered/qp-Jr4oEFWo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c47b52f5a3220ad5b90e5e1cf00728a6be47fb0 --- /dev/null +++ b/annotations_filtered/qp-Jr4oEFWo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.4], [9.0, 9.8], [11.0, 11.91], [14.0, 16.04], [18.0, 19.01], [23.0, 23.26], [27.0, 26.81], [28.0, 28.27], [29.0, 29.67], [31.0, 33.13], [36.0, 38.37], [41.0, 45.13], [48.0, 49.08], [49.0, 50.52], [52.0, 53.15], [56.0, 56.1], [58.0, 60.03], [62.0, 64.39], [67.0, 70.12], [72.0, 72.2], [74.0, 76.11], [78.0, 78.65], [81.0, 81.5], [82.0, 83.05], [85.0, 86.66], [87.0, 90.51], [103.0, 104.14], [105.0, 106.19], [109.0, 109.49], [122.0, 122.39], [125.0, 127.72], [132.0, 132.34], [145.0, 146.65], [149.0, 151.55], [153.0, 155.16], [155.0, 157.2], [158.0, 159.11], [161.0, 161.47], [170.0, 178.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.82, 0.0, 0.0, 0.0, 0.0, 0.0, 70.58, 100.0, 98.27, 0.0, 0.0, 0.0, 0.0, 100.0, 60.32, 38.78, 0.0, 99.9, 0.0, 0.0, 0.0, 0.0, 43.98, 0.0, 0.0, 0.0, 0.0, 82.43, 0.0, 0.0, 100.0, 84.98, 36.19, 0.0, 0.0, 98.8], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 70.41], ["speech synthesizer", 3.04], ["radio", 2.44]], null, null, null, null, null, null, [["speech", 34.96], ["electric shaver, electric razor", 9.01], ["didgeridoo", 6.81]], null, null, null, null, null, null, null, null, null, [["speech", 39.92], ["sidetone", 14.98], ["frog", 7.17]], null, null, null], "duration": [1.4, 0.8, 0.91, 2.04, 1.01, 0.26, -0.19, 0.27, 0.67, 2.13, 2.37, 4.13, 1.08, 1.52, 1.15, 0.1, 2.03, 2.39, 3.12, 0.2, 2.11, 0.65, 0.5, 1.05, 1.66, 3.51, 1.14, 1.19, 0.49, 0.39, 2.72, 0.34, 1.65, 2.55, 2.16, 2.2, 1.11, 0.47, 8.7]} \ No newline at end of file diff --git a/annotations_filtered/qp-uFNB9jYo_filtered.json b/annotations_filtered/qp-uFNB9jYo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..87602b5008b36762f8281bb70181bf411e962dc4 --- /dev/null +++ b/annotations_filtered/qp-uFNB9jYo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.32], [8.0, 8.73], [10.0, 14.84], [15.0, 22.64], [23.0, 24.95], [27.0, 28.09], [29.0, 32.17], [33.0, 33.89], [34.0, 36.09], [37.0, 43.5], [45.0, 45.64], [47.0, 49.0], [50.0, 52.14], [54.0, 57.62], [58.0, 60.08], [62.0, 62.58], [65.0, 66.07], [67.0, 67.76], [70.0, 71.95], [73.0, 76.15], [77.0, 78.85], [80.0, 81.3], [85.0, 85.68], [86.0, 87.62], [88.0, 89.58], [90.0, 91.4], [94.0, 95.82], [101.0, 101.71], [104.0, 104.23], [105.0, 107.65], [109.0, 109.17], [112.0, 112.6], [113.0, 113.68], [117.0, 118.17], [123.0, 124.78], [128.0, 128.75], [130.0, 130.45], [139.0, 140.22], [143.0, 143.07], [147.0, 147.21], [148.0, 149.44], [150.0, 151.63], [154.0, 155.49], [158.0, 160.0], [163.0, 167.12], [171.0, 171.78], [173.0, 174.6], [175.0, 178.19], [181.0, 181.33], [187.0, 189.08], [190.0, 196.97], [200.0, 203.49], [205.0, 206.04], [207.0, 207.94], [211.0, 211.76], [213.0, 214.89], [218.0, 220.06], [221.0, 222.78], [223.0, 230.89]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 49.97, 94.95, 0.0, 0.0, 80.46, 0.0, 44.15, 51.6, 0.0, 74.6, 51.82, 74.92, 48.02, 0.0, 0.0, 0.0, 0.0, 62.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.3, 99.97, 0.0, 0.0, 99.9, 0.0, 95.91, 97.11, 65.67, 0.0, 0.0, 0.0, 0.0, 47.2, 0.0, 51.82], "audiomae_on_audioset": [null, null, [["whale vocalization", 67.11], ["noise", 3.57], ["music", 3.53]], null, null, null, null, null, [["speech", 25.61], ["music", 22.98], ["whale vocalization", 11.63]], null, null, null, null, null, [["mains hum", 43.45], ["hum", 32.14], ["sidetone", 8.63]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 43.35], ["music", 21.09], ["sidetone", 5.36]], null, null], "duration": [1.32, 0.73, 4.84, 7.64, 1.95, 1.09, 3.17, 0.89, 2.09, 6.5, 0.64, 2.0, 2.14, 3.62, 2.08, 0.58, 1.07, 0.76, 1.95, 3.15, 1.85, 1.3, 0.68, 1.62, 1.58, 1.4, 1.82, 0.71, 0.23, 2.65, 0.17, 0.6, 0.68, 1.17, 1.78, 0.75, 0.45, 1.22, 0.07, 0.21, 1.44, 1.63, 1.49, 2.0, 4.12, 0.78, 1.6, 3.19, 0.33, 2.08, 6.97, 3.49, 1.04, 0.94, 0.76, 1.89, 2.06, 1.78, 7.89]} \ No newline at end of file diff --git a/annotations_filtered/qpLovLQoJ6c_filtered.json b/annotations_filtered/qpLovLQoJ6c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b96d871977e6c0d6b550a433dd1d6a6816cb2c82 --- /dev/null +++ b/annotations_filtered/qpLovLQoJ6c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.7], [11.0, 27.5], [29.0, 29.61], [30.0, 30.89], [32.0, 48.14], [51.0, 52.37], [53.0, 54.46], [56.0, 58.82], [60.0, 86.81], [89.0, 90.96], [92.0, 93.33], [95.0, 98.04], [99.0, 100.23], [101.0, 101.04], [102.0, 103.05], [103.0, 103.89], [104.0, 106.62]], "keep_status": [false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 31.26, 0.0, 0.0, 37.39, 0.0, 0.0, 48.61, 36.07, 0.0, 0.0, 94.22, 0.0, 0.0, 0.0, 0.0, 34.28], "audiomae_on_audioset": [null, [["music", 57.17], ["theremin", 10.5], ["synthesizer", 6.4]], null, null, [["music", 38.74], ["radio", 3.88], ["boat, water vehicle", 2.94]], null, null, [["speech", 43.96], ["sidetone", 19.2], ["radio", 11.15]], [["music", 47.33], ["musical instrument", 11.39], ["speech", 8.15]], null, null, null, null, null, null, null, [["music", 43.83], ["foghorn", 10.09], ["theremin", 9.53]]], "duration": [1.7, 16.5, 0.61, 0.89, 16.14, 1.37, 1.46, 2.82, 26.81, 1.96, 1.33, 3.04, 1.23, 0.04, 1.05, 0.89, 2.62]} \ No newline at end of file diff --git a/annotations_filtered/qpZBUlqRoeA_filtered.json b/annotations_filtered/qpZBUlqRoeA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd63bd3600e239310c0a67df325604034a71e4ac --- /dev/null +++ b/annotations_filtered/qpZBUlqRoeA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.17], [7.0, 14.76], [16.0, 18.59], [31.0, 48.95], [50.0, 52.08], [53.0, 54.08], [55.0, 57.03], [59.0, 75.86], [78.0, 86.04], [87.0, 87.74], [89.0, 94.42], [95.0, 111.81]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.05, 100.0, 99.71, 99.96, 100.0, 0.0, 100.0, 99.97, 99.93, 0.0, 99.98, 97.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.17, 7.76, 2.59, 17.95, 2.08, 1.08, 2.03, 16.86, 8.04, 0.74, 5.42, 16.81]} \ No newline at end of file diff --git a/annotations_filtered/qpxUYzNSGn0_filtered.json b/annotations_filtered/qpxUYzNSGn0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1c811bab3e16fc2a512ac7f8aa84f8f370f5f981 --- /dev/null +++ b/annotations_filtered/qpxUYzNSGn0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 17.73], [30.0, 30.82], [31.0, 32.48], [40.0, 41.42], [44.0, 46.43], [47.0, 49.35], [52.0, 55.05], [63.0, 63.68], [65.0, 65.3], [69.0, 74.7], [76.0, 77.85], [79.0, 79.93], [81.0, 81.82], [83.0, 83.0], [83.0, 83.17], [94.0, 93.92], [120.0, 120.66], [125.0, 125.14], [128.0, 128.51], [130.0, 130.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 66.15, 74.92, 44.32, 0.0, 0.0, 66.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 53.93], ["music", 13.18], ["sidetone", 5.3]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.27, 0.82, 1.48, 1.42, 2.43, 2.35, 3.05, 0.68, 0.3, 5.7, 1.85, 0.93, 0.82, 0.0, 0.17, -0.08, 0.66, 0.14, 0.51, 0.91]} \ No newline at end of file diff --git a/annotations_filtered/qq4gK8PkKNM_filtered.json b/annotations_filtered/qq4gK8PkKNM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0550590bd7b550c8e3eb6f542174522496b54fd4 --- /dev/null +++ b/annotations_filtered/qq4gK8PkKNM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 25.19], [25.0, 26.05], [27.0, 27.5], [76.0, 77.79], [83.0, 88.6]], "keep_status": [false, false, false, false, true], "silence_prob": [43.77, 0.0, 0.0, 0.0, 40.66], "audiomae_on_audioset": [[["music", 27.85], ["cattle, bovinae", 27.06], ["moo", 23.1]], null, null, null, [["music", 35.76], ["synthesizer", 13.14], ["effects unit", 11.0]]], "duration": [9.19, 1.05, 0.5, 1.79, 5.6]} \ No newline at end of file diff --git a/annotations_filtered/qqAzmt1d8kU_filtered.json b/annotations_filtered/qqAzmt1d8kU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ff6a3a306bc7d7bd55def7035200970dca618475 --- /dev/null +++ b/annotations_filtered/qqAzmt1d8kU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 14.67]], "keep_status": [false], "silence_prob": [64.97], "audiomae_on_audioset": [null], "duration": [3.67]} \ No newline at end of file diff --git a/annotations_filtered/qqSS99m2dQ0_filtered.json b/annotations_filtered/qqSS99m2dQ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..87bfd62b27eb302a2b8386105a4e45571211bec2 --- /dev/null +++ b/annotations_filtered/qqSS99m2dQ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.8], [12.0, 13.85], [15.0, 15.15], [16.0, 17.17], [23.0, 23.89], [26.0, 25.84], [26.0, 31.6], [39.0, 39.01], [40.0, 40.15], [43.0, 44.34], [46.0, 46.11], [47.0, 48.3], [51.0, 51.21], [54.0, 53.69], [56.0, 56.76], [57.0, 57.4], [59.0, 60.88], [61.0, 61.87], [67.0, 71.71], [73.0, 76.5], [78.0, 78.58], [80.0, 80.43], [88.0, 89.18], [94.0, 94.19], [95.0, 96.89], [98.0, 98.79], [104.0, 104.65], [105.0, 105.27], [106.0, 105.9], [116.0, 116.55], [119.0, 120.23], [122.0, 125.05], [131.0, 135.48], [136.0, 137.96], [138.0, 138.91], [140.0, 140.48], [141.0, 141.76], [145.0, 144.88], [156.0, 157.35], [159.0, 159.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.07, 66.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.06, 78.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 48.34], ["fly, housefly", 7.54], ["insect", 6.69]], null, null, null, null, null, null, null, null], "duration": [0.8, 1.85, 0.15, 1.17, 0.89, -0.16, 5.6, 0.01, 0.15, 1.34, 0.11, 1.3, 0.21, -0.31, 0.76, 0.4, 1.88, 0.87, 4.71, 3.5, 0.58, 0.43, 1.18, 0.19, 1.89, 0.79, 0.65, 0.27, -0.1, 0.55, 1.23, 3.05, 4.48, 1.96, 0.91, 0.48, 0.76, -0.12, 1.35, 0.71]} \ No newline at end of file diff --git a/annotations_filtered/qqWVQuCaB6Y_filtered.json b/annotations_filtered/qqWVQuCaB6Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e6b28964fbac80a9994e8a0e929385ff952f50d0 --- /dev/null +++ b/annotations_filtered/qqWVQuCaB6Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 41.67], [42.0, 104.16], [105.0, 106.1], [107.0, 109.21], [110.0, 111.06]], "keep_status": [false, false, false, false, false], "silence_prob": [71.43, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [12.67, 62.16, 1.1, 2.21, 1.06]} \ No newline at end of file diff --git a/annotations_filtered/qqX1d64OcvI_filtered.json b/annotations_filtered/qqX1d64OcvI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0918d2c00242205b733fc23b56e0f8972f0fb5f0 --- /dev/null +++ b/annotations_filtered/qqX1d64OcvI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 14.5], [16.0, 16.02], [19.0, 64.29], [65.0, 66.02], [67.0, 67.27], [68.0, 75.27], [77.0, 79.64], [83.0, 85.67], [88.0, 88.6], [89.0, 91.56], [93.0, 94.42], [96.0, 100.43], [109.0, 108.87], [113.0, 115.91], [118.0, 119.87]], "keep_status": [true, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [30.2, 0.0, 0.0, 0.0, 0.0, 60.79, 40.55, 39.57, 0.0, 36.71, 0.0, 76.7, 0.0, 84.62, 0.0], "audiomae_on_audioset": [[["music", 30.04], ["crowd", 20.66], ["speech", 10.96]], null, null, null, null, null, [["speech", 9.35], ["bleat", 8.69], ["bee, wasp, etc.", 8.55]], [["fly, housefly", 38.75], ["insect", 17.6], ["bee, wasp, etc.", 17.01]], null, [["fly, housefly", 58.08], ["insect", 22.35], ["bee, wasp, etc.", 6.06]], null, null, null, null, null], "duration": [4.5, 0.02, 45.29, 1.02, 0.27, 7.27, 2.64, 2.67, 0.6, 2.56, 1.42, 4.43, -0.13, 2.91, 1.87]} \ No newline at end of file diff --git a/annotations_filtered/qqZPej42OkE_filtered.json b/annotations_filtered/qqZPej42OkE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..657824bbfcc91533c223a6ff37d0b482840edd82 --- /dev/null +++ b/annotations_filtered/qqZPej42OkE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.1], [3.0, 12.01], [13.0, 16.44], [18.0, 20.48], [23.0, 30.28], [31.0, 32.29], [33.0, 37.18]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 89.36, 99.8, 66.27, 72.46, 0.0, 87.92], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [0.1, 9.01, 3.44, 2.48, 7.28, 1.29, 4.18]} \ No newline at end of file diff --git a/annotations_filtered/qqaFGM-AyNA_filtered.json b/annotations_filtered/qqaFGM-AyNA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e14f2356d897fbd56cb71a7fe4fa32f1d9ad70a9 --- /dev/null +++ b/annotations_filtered/qqaFGM-AyNA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[43.0, 49.94], [52.0, 83.22], [85.0, 95.17], [99.0, 101.53]], "keep_status": [true, false, true, true], "silence_prob": [32.05, 0.0, 31.04, 30.44], "audiomae_on_audioset": [[["music", 43.77], ["synthesizer", 17.32], ["echo", 7.17]], null, [["music", 34.9], ["effects unit", 18.74], ["distortion", 10.72]], [["echo", 26.99], ["music", 19.07], ["synthesizer", 17.0]]], "duration": [6.94, 31.22, 10.17, 2.53]} \ No newline at end of file diff --git a/annotations_filtered/qqhQ9jN3gj4_filtered.json b/annotations_filtered/qqhQ9jN3gj4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..20a612ee5a46897ccd8d5f73310106f1d44a41c8 --- /dev/null +++ b/annotations_filtered/qqhQ9jN3gj4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.1], [7.0, 7.47], [9.0, 9.39], [12.0, 12.9], [14.0, 14.98], [16.0, 17.32], [18.0, 19.08], [22.0, 22.22], [24.0, 24.68], [26.0, 27.06], [28.0, 28.09], [29.0, 29.22], [30.0, 31.48], [33.0, 33.2], [34.0, 34.57], [36.0, 38.31], [39.0, 39.61], [40.0, 43.43], [47.0, 47.19], [63.0, 63.34], [66.0, 66.01], [67.0, 67.47], [69.0, 69.69], [71.0, 73.11], [78.0, 78.85], [79.0, 79.68], [83.0, 82.7], [83.0, 83.96], [84.0, 86.86], [88.0, 93.26], [95.0, 95.71], [96.0, 97.34], [99.0, 99.55], [104.0, 104.62], [106.0, 107.47], [109.0, 109.73], [110.0, 110.78], [117.0, 120.95], [122.0, 122.88], [124.0, 124.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [63.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 99.87, 0.0, 0.0, 0.0, 0.0, 0.0, 61.87, 0.0, 0.0, 0.0, 0.0, 60.51, 41.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.07, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 70.06], ["radio", 9.91], ["telephone", 6.38]], null, null, null, null, null, null, null, null, null, null], "duration": [2.1, 0.47, 0.39, 0.9, 0.98, 1.32, 1.08, 0.22, 0.68, 1.06, 0.09, 0.22, 1.48, 0.2, 0.57, 2.31, 0.61, 3.43, 0.19, 0.34, 0.01, 0.47, 0.69, 2.11, 0.85, 0.68, -0.3, 0.96, 2.86, 5.26, 0.71, 1.34, 0.55, 0.62, 1.47, 0.73, 0.78, 3.95, 0.88, 0.73]} \ No newline at end of file diff --git a/annotations_filtered/qqhyIIZt87A_filtered.json b/annotations_filtered/qqhyIIZt87A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dab733a0405cba33bff9909a22d47ce3cce8630f --- /dev/null +++ b/annotations_filtered/qqhyIIZt87A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.1], [8.0, 8.61], [17.0, 16.66], [46.0, 47.24], [49.0, 50.43], [52.0, 52.22], [54.0, 54.62], [57.0, 59.27], [62.0, 66.95], [71.0, 72.23], [75.0, 76.92], [78.0, 82.97], [85.0, 86.93], [87.0, 88.2], [89.0, 91.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.8, 99.73, 0.0, 0.0, 43.58, 0.0, 0.0, 56.86], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 61.21], ["drum", 7.12], ["bass drum", 4.62]], null, null, null], "duration": [0.1, 0.61, -0.34, 1.24, 1.43, 0.22, 0.62, 2.27, 4.95, 1.23, 1.92, 4.97, 1.93, 1.2, 2.17]} \ No newline at end of file diff --git a/annotations_filtered/qr7oBpkkxIQ_filtered.json b/annotations_filtered/qr7oBpkkxIQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b444e0b01ba00067960880f1e92f194812c2d6e4 --- /dev/null +++ b/annotations_filtered/qr7oBpkkxIQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.87], [9.0, 105.78], [107.0, 107.37], [108.0, 109.26], [110.0, 111.16]], "keep_status": [true, false, false, false, false], "silence_prob": [34.94, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 25.44], ["throbbing", 23.46], ["music", 18.48]], null, null, null, null], "duration": [4.87, 96.78, 0.37, 1.26, 1.16]} \ No newline at end of file diff --git a/annotations_filtered/qrCkASenz7I_filtered.json b/annotations_filtered/qrCkASenz7I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a097083d9858a870f4e5d12829ffe95575f04a54 --- /dev/null +++ b/annotations_filtered/qrCkASenz7I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.11], [10.0, 10.74], [16.0, 16.56], [22.0, 23.41], [29.0, 29.37], [30.0, 30.87], [39.0, 39.58], [40.0, 40.49], [43.0, 43.16], [44.0, 44.24], [45.0, 45.52], [48.0, 51.92], [56.0, 57.54], [60.0, 60.81], [62.0, 62.55], [63.0, 66.55], [74.0, 76.06], [83.0, 84.6], [90.0, 90.54], [93.0, 93.41], [95.0, 97.5], [98.0, 99.66], [101.0, 101.83], [104.0, 104.67], [107.0, 108.45], [110.0, 111.96], [115.0, 117.42], [118.0, 120.41], [123.0, 124.48], [126.0, 129.54], [132.0, 132.0], [134.0, 135.28], [136.0, 136.8], [138.0, 138.38], [140.0, 140.54], [147.0, 148.2], [151.0, 152.83], [154.0, 155.33], [158.0, 158.4], [160.0, 160.79], [163.0, 163.38], [165.0, 168.08], [170.0, 173.2], [174.0, 175.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.66, 0.0, 0.0, 0.0, 55.96, 64.75, 0.0, 0.0, 0.0, 78.04, 0.0, 0.0, 0.0, 0.0, 0.0, 99.56, 88.64, 0.0, 54.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.17, 39.66, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 39.29], ["hum", 11.72], ["electronic music", 9.13]], null], "duration": [1.11, 0.74, 0.56, 1.41, 0.37, 0.87, 0.58, 0.49, 0.16, 0.24, 0.52, 3.92, 1.54, 0.81, 0.55, 3.55, 2.06, 1.6, 0.54, 0.41, 2.5, 1.66, 0.83, 0.67, 1.45, 1.96, 2.42, 2.41, 1.48, 3.54, 0.0, 1.28, 0.8, 0.38, 0.54, 1.2, 1.83, 1.33, 0.4, 0.79, 0.38, 3.08, 3.2, 1.02]} \ No newline at end of file diff --git a/annotations_filtered/qrIt5BPvCv8_filtered.json b/annotations_filtered/qrIt5BPvCv8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..57ea0b7a10ebfa5c27b003f147ef1838138c004b --- /dev/null +++ b/annotations_filtered/qrIt5BPvCv8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.75], [11.0, 14.25], [47.0, 47.92], [50.0, 50.58], [54.0, 54.99], [56.0, 70.95], [75.0, 76.65], [79.0, 82.85], [84.0, 84.97], [86.0, 87.08], [88.0, 89.26], [90.0, 90.68], [92.0, 94.41], [96.0, 96.4], [97.0, 97.9], [101.0, 100.99], [104.0, 106.95], [108.0, 108.41], [110.0, 111.28], [113.0, 114.13], [115.0, 116.06], [117.0, 117.37], [119.0, 120.68], [122.0, 122.66], [123.0, 124.21], [127.0, 126.77], [129.0, 129.25]], "keep_status": [true, false, false, false, false, true, false, true, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.95, 38.51, 0.0, 0.0, 0.0, 31.07, 0.0, 43.23, 0.0, 0.0, 0.0, 0.0, 49.5, 0.0, 0.0, 0.0, 44.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["noise", 47.79], ["music", 14.96], ["musical instrument", 5.22]], [["speech", 42.47], ["music", 23.66], ["didgeridoo", 5.49]], null, null, null, [["speech", 36.26], ["hum", 10.47], ["vehicle", 6.32]], null, [["music", 21.47], ["hum", 11.86], ["throbbing", 7.18]], null, null, null, null, [["sidetone", 20.0], ["hum", 18.4], ["speech", 11.42]], null, null, null, [["speech", 30.58], ["music", 4.69], ["hum", 3.44]], null, null, null, null, null, null, null, null, null, null], "duration": [3.75, 3.25, 0.92, 0.58, 0.99, 14.95, 1.65, 3.85, 0.97, 1.08, 1.26, 0.68, 2.41, 0.4, 0.9, -0.01, 2.95, 0.41, 1.28, 1.13, 1.06, 0.37, 1.68, 0.66, 1.21, -0.23, 0.25]} \ No newline at end of file diff --git a/annotations_filtered/qrONj6Srq7M_filtered.json b/annotations_filtered/qrONj6Srq7M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ccb6734f721a39152e31da1ec11b920e3062777 --- /dev/null +++ b/annotations_filtered/qrONj6Srq7M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.46], [3.0, 4.97], [6.0, 12.53], [15.0, 14.66], [16.0, 16.92], [18.0, 19.74], [22.0, 22.89], [23.0, 25.44], [27.0, 28.0], [35.0, 37.17], [37.0, 39.83], [42.0, 44.07], [46.0, 47.93], [51.0, 53.47], [54.0, 54.41], [57.0, 57.15], [58.0, 58.82], [61.0, 62.26], [63.0, 65.62], [66.0, 68.13], [75.0, 75.81], [77.0, 77.65], [79.0, 79.03], [82.0, 84.67], [87.0, 88.33], [89.0, 92.72], [97.0, 99.67], [100.0, 100.77], [104.0, 107.35], [109.0, 110.83], [114.0, 118.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 64.52, 0.0, 0.0, 0.0, 0.0, 96.29, 0.0, 99.44, 99.68, 74.92, 0.0, 68.67, 0.0, 0.0, 0.0, 0.0, 99.92, 99.93, 0.0, 0.0, 0.0, 99.95, 0.0, 98.19, 99.8, 0.0, 98.01, 0.0, 99.59], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.46, 1.97, 6.53, -0.34, 0.92, 1.74, 0.89, 2.44, 1.0, 2.17, 2.83, 2.07, 1.93, 2.47, 0.41, 0.15, 0.82, 1.26, 2.62, 2.13, 0.81, 0.65, 0.03, 2.67, 1.33, 3.72, 2.67, 0.77, 3.35, 1.83, 4.59]} \ No newline at end of file diff --git a/annotations_filtered/qrTBSBYpzg0_filtered.json b/annotations_filtered/qrTBSBYpzg0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f84c3f84f3238e9bfbad7e1c198ea587f08093eb --- /dev/null +++ b/annotations_filtered/qrTBSBYpzg0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.8], [3.0, 8.63], [12.0, 12.9], [14.0, 14.22], [15.0, 15.18], [19.0, 20.55], [23.0, 27.13], [28.0, 28.54], [29.0, 29.59], [32.0, 32.97], [35.0, 35.46], [37.0, 38.57], [40.0, 40.61], [41.0, 42.96], [45.0, 45.17], [49.0, 51.83], [53.0, 53.33], [56.0, 58.85], [62.0, 82.75]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 31.19, 0.0, 0.0, 0.0, 0.0, 64.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.92, 0.0, 39.37, 29.93], "audiomae_on_audioset": [null, [["music", 25.38], ["effects unit", 14.43], ["synthesizer", 10.14]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 44.36], ["brass instrument", 8.99], ["theremin", 8.55]], [["music", 65.95], ["theremin", 14.3], ["musical instrument", 3.81]]], "duration": [0.8, 5.63, 0.9, 0.22, 0.18, 1.55, 4.13, 0.54, 0.59, 0.97, 0.46, 1.57, 0.61, 1.96, 0.17, 2.83, 0.33, 2.85, 20.75]} \ No newline at end of file diff --git a/annotations_filtered/qru3WdOfj8s_filtered.json b/annotations_filtered/qru3WdOfj8s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5bce3fc22bd7a8cf5a03e0e88e850a60e137d57c --- /dev/null +++ b/annotations_filtered/qru3WdOfj8s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.64], [8.0, 9.59], [20.0, 27.97], [29.0, 30.42], [32.0, 32.44], [35.0, 42.21], [49.0, 51.8], [58.0, 58.85], [61.0, 62.34], [65.0, 66.14], [68.0, 68.18], [70.0, 71.14], [75.0, 75.47], [81.0, 81.24], [83.0, 83.71], [88.0, 87.67]], "keep_status": [true, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [47.08, 0.0, 41.91, 0.0, 0.0, 35.24, 53.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 53.69], ["speech", 10.76], ["sidetone", 4.1]], null, [["speech", 31.06], ["fly, housefly", 25.63], ["insect", 11.68]], null, null, [["speech", 24.27], ["hum", 20.94], ["music", 15.99]], null, null, null, null, null, null, null, null, null, null], "duration": [2.64, 1.59, 7.97, 1.42, 0.44, 7.21, 2.8, 0.85, 1.34, 1.14, 0.18, 1.14, 0.47, 0.24, 0.71, -0.33]} \ No newline at end of file diff --git a/annotations_filtered/qs0J2F3ErMc_filtered.json b/annotations_filtered/qs0J2F3ErMc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d4ead68c901b0871c241b5d0fee3fa329cfd76e --- /dev/null +++ b/annotations_filtered/qs0J2F3ErMc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.64], [14.0, 15.96], [19.0, 23.75], [25.0, 25.96], [34.0, 36.0], [37.0, 37.61], [43.0, 45.17], [46.0, 45.99], [48.0, 50.72], [52.0, 52.68], [54.0, 54.89], [59.0, 59.31], [73.0, 77.08], [83.0, 83.57], [90.0, 92.03], [101.0, 102.84], [107.0, 112.45], [115.0, 115.08], [124.0, 129.05], [131.0, 131.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 99.21, 0.0, 98.86, 0.0, 92.8, 0.0, 92.97, 0.0, 0.0, 0.0, 88.1, 0.0, 54.5, 0.0, 87.74, 0.0, 39.93, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 25.2], ["throbbing", 23.47], ["hum", 21.13]], null], "duration": [1.64, 1.96, 4.75, 0.96, 2.0, 0.61, 2.17, -0.01, 2.72, 0.68, 0.89, 0.31, 4.08, 0.57, 2.03, 1.84, 5.45, 0.08, 5.05, 0.01]} \ No newline at end of file diff --git a/annotations_filtered/qs1QcRTOMEg_filtered.json b/annotations_filtered/qs1QcRTOMEg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c70bc7f62858fd2cdc25f1ee04aa8aebb09c38ae --- /dev/null +++ b/annotations_filtered/qs1QcRTOMEg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[66.0, 91.99], [93.0, 111.37]], "keep_status": [true, false], "silence_prob": [30.59, 30.27], "audiomae_on_audioset": [[["music", 30.69], ["buzz", 19.42], ["speech", 7.33]], [["music", 64.02], ["smash, crash", 8.86], ["breaking", 7.25]]], "duration": [25.99, 18.37]} \ No newline at end of file diff --git a/annotations_filtered/qsdgNxuhPgc_filtered.json b/annotations_filtered/qsdgNxuhPgc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..04be882499e4a618532838817e1466e0495d779c --- /dev/null +++ b/annotations_filtered/qsdgNxuhPgc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.48], [5.0, 5.04], [5.0, 6.61], [11.0, 16.8], [19.0, 44.71], [46.0, 47.65], [51.0, 52.25], [53.0, 54.73], [56.0, 60.12], [61.0, 63.98], [66.0, 66.97], [68.0, 70.31], [75.0, 84.57], [85.0, 86.19], [88.0, 96.47], [101.0, 102.64], [104.0, 126.99], [129.0, 130.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 93.91, 97.0, 0.0, 0.0, 0.0, 99.98, 99.87, 0.0, 98.93, 77.36, 0.0, 99.26, 0.0, 99.97, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.48, 0.04, 1.61, 5.8, 25.71, 1.65, 1.25, 1.73, 4.12, 2.98, 0.97, 2.31, 9.57, 1.19, 8.47, 1.64, 22.99, 1.38]} \ No newline at end of file diff --git a/annotations_filtered/qsyYw2x1-js_filtered.json b/annotations_filtered/qsyYw2x1-js_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f094cc09f4caf8f0378daf11d89a473108a5a23b --- /dev/null +++ b/annotations_filtered/qsyYw2x1-js_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.02], [5.0, 16.44], [21.0, 26.99], [27.0, 32.54], [34.0, 47.09], [48.0, 82.07], [83.0, 131.45], [132.0, 134.79], [136.0, 147.56], [150.0, 149.54], [151.0, 174.92], [178.0, 178.68]], "keep_status": [true, true, true, true, true, false, false, true, false, false, false, false], "silence_prob": [38.68, 29.57, 29.48, 30.7, 31.58, 0.0, 0.0, 40.99, 29.56, 0.0, 65.79, 0.0], "audiomae_on_audioset": [[["hum", 37.13], ["speech", 18.19], ["music", 11.82]], [["music", 45.9], ["hum", 10.64], ["didgeridoo", 7.17]], [["whack, thwack", 19.16], ["speech", 18.4], ["music", 12.77]], [["speech", 33.01], ["groan", 12.44], ["music", 5.45]], [["music", 19.32], ["speech", 16.57], ["breaking", 7.96]], null, null, [["music", 20.85], ["cello", 15.87], ["foghorn", 10.74]], [["speech", 50.32], ["music", 32.98], ["roar", 1.81]], null, null, null], "duration": [3.02, 11.44, 5.99, 5.54, 13.09, 34.07, 48.45, 2.79, 11.56, -0.46, 23.92, 0.68]} \ No newline at end of file diff --git a/annotations_filtered/qtKtxLmxl24_filtered.json b/annotations_filtered/qtKtxLmxl24_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..428425ff81bbd95f9d2acb684201ba6be22ad4a6 --- /dev/null +++ b/annotations_filtered/qtKtxLmxl24_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 15.47], [17.0, 19.62], [29.0, 29.25], [40.0, 41.25], [44.0, 45.91], [53.0, 53.18], [54.0, 54.8], [94.0, 95.22], [109.0, 114.94], [117.0, 117.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [36.74, 38.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.54, 0.0], "audiomae_on_audioset": [[["music", 65.85], ["throbbing", 3.29], ["musical instrument", 3.08]], [["music", 55.98], ["musical instrument", 9.75], ["guitar", 9.44]], null, null, null, null, null, null, [["hum", 34.36], ["throbbing", 34.15], ["mains hum", 6.06]], null], "duration": [8.47, 2.62, 0.25, 1.25, 1.91, 0.18, 0.8, 1.22, 5.94, 0.53]} \ No newline at end of file diff --git a/annotations_filtered/qu4v5hB1dKk_filtered.json b/annotations_filtered/qu4v5hB1dKk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..362bd5ec916cece150d1856e3cdede2d6dceacb5 --- /dev/null +++ b/annotations_filtered/qu4v5hB1dKk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [16.0, 16.31], [17.0, 17.42], [18.0, 19.94], [24.0, 24.44], [30.0, 30.03], [31.0, 31.46], [35.0, 34.52], [38.0, 41.99], [43.0, 44.09], [50.0, 51.07], [67.0, 67.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.17, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 65.66], ["carnatic music", 6.03], ["middle eastern music", 2.52]], null, null, null], "duration": [0.5, 0.31, 0.42, 1.94, 0.44, 0.03, 0.46, -0.48, 3.99, 1.09, 1.07, 0.19]} \ No newline at end of file diff --git a/annotations_filtered/qu68Gym5PvE_filtered.json b/annotations_filtered/qu68Gym5PvE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f5eaeb7526ed8eb629711920369f1580626ae9c --- /dev/null +++ b/annotations_filtered/qu68Gym5PvE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 42.06], [49.0, 55.71], [62.0, 65.03], [66.0, 97.34], [98.0, 114.42], [115.0, 116.61], [117.0, 117.19], [120.0, 120.75], [122.0, 126.93], [130.0, 130.6]], "keep_status": [false, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 32.31, 31.66, 0.0, 30.39, 0.0, 0.0, 0.0, 49.18, 0.0], "audiomae_on_audioset": [null, [["music", 51.39], ["throbbing", 11.53], ["didgeridoo", 8.03]], [["music", 55.48], ["theremin", 6.8], ["timpani", 5.0]], null, [["music", 40.82], ["speech", 20.7], ["hum", 9.32]], null, null, null, [["fart", 38.31], ["noise", 5.89], ["throbbing", 5.02]], null], "duration": [32.06, 6.71, 3.03, 31.34, 16.42, 1.61, 0.19, 0.75, 4.93, 0.6]} \ No newline at end of file diff --git a/annotations_filtered/quEBzmchcwc_filtered.json b/annotations_filtered/quEBzmchcwc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa34606a55e468b885910e432c57a31bbd0c0774 --- /dev/null +++ b/annotations_filtered/quEBzmchcwc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 29.64], [30.0, 34.82], [39.0, 41.2], [45.0, 46.7], [49.0, 48.93], [50.0, 50.67], [52.0, 54.21], [57.0, 59.41], [62.0, 63.07], [64.0, 65.48], [67.0, 69.99], [74.0, 74.58], [77.0, 85.21], [86.0, 90.1], [91.0, 107.55], [111.0, 116.36], [121.0, 123.35], [127.0, 127.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 99.99, 0.0, 0.0, 0.0, 99.84, 99.95, 0.0, 0.0, 99.98, 0.0, 99.97, 99.44, 99.4, 99.98, 91.3, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.64, 4.82, 2.2, 1.7, -0.07, 0.67, 2.21, 2.41, 1.07, 1.48, 2.99, 0.58, 8.21, 4.1, 16.55, 5.36, 2.35, 0.58]} \ No newline at end of file diff --git a/annotations_filtered/quJX9XLQe78_filtered.json b/annotations_filtered/quJX9XLQe78_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d44bb6d3ba09ca3f820edb4f4565054916bdc5f2 --- /dev/null +++ b/annotations_filtered/quJX9XLQe78_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.39], [18.0, 19.35], [20.0, 21.68], [23.0, 23.75], [24.0, 25.81], [27.0, 29.19], [30.0, 30.81], [33.0, 34.8], [37.0, 37.66], [38.0, 45.77], [50.0, 52.42], [53.0, 54.63], [57.0, 57.89], [59.0, 60.84], [63.0, 63.86], [64.0, 66.48], [69.0, 69.38], [70.0, 70.65], [73.0, 76.28], [77.0, 77.14], [80.0, 81.23], [83.0, 83.52], [85.0, 88.96], [90.0, 91.71], [92.0, 95.25], [96.0, 97.14], [98.0, 98.9], [111.0, 111.69], [116.0, 118.25], [120.0, 121.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 86.45, 0.0, 0.0, 0.0, 71.72, 95.37, 0.0, 0.0, 0.0, 0.0, 62.17, 0.0, 0.0, 69.07, 0.0, 0.0, 0.0, 94.07, 0.0, 44.9, 0.0, 0.0, 0.0, 38.31, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sine wave", 67.04], ["tuning fork", 17.31], ["speech", 7.14]], null, null, null, [["sidetone", 30.23], ["music", 12.97], ["whale vocalization", 5.58]], null], "duration": [0.39, 1.35, 1.68, 0.75, 1.81, 2.19, 0.81, 1.8, 0.66, 7.77, 2.42, 1.63, 0.89, 1.84, 0.86, 2.48, 0.38, 0.65, 3.28, 0.14, 1.23, 0.52, 3.96, 1.71, 3.25, 1.14, 0.9, 0.69, 2.25, 1.32]} \ No newline at end of file diff --git a/annotations_filtered/qv4BPYX4B8U_filtered.json b/annotations_filtered/qv4BPYX4B8U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b372bc90fe24c2df6920c4140042daaf58551e3f --- /dev/null +++ b/annotations_filtered/qv4BPYX4B8U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.24], [6.0, 6.45], [7.0, 9.91], [12.0, 12.31], [14.0, 14.23], [16.0, 17.17], [19.0, 18.59], [19.0, 19.75], [22.0, 22.49], [23.0, 24.44], [29.0, 31.92], [33.0, 33.42], [38.0, 38.23], [39.0, 39.41], [40.0, 40.22], [43.0, 44.42], [50.0, 51.22], [53.0, 54.35], [56.0, 55.97], [57.0, 57.72], [63.0, 64.54], [67.0, 67.64], [68.0, 69.75], [70.0, 72.3], [74.0, 77.4], [79.0, 78.61], [91.0, 92.08], [96.0, 105.95], [107.0, 108.01], [109.0, 114.44], [115.0, 117.1], [119.0, 119.33], [122.0, 134.16], [135.0, 139.46], [140.0, 141.35], [146.0, 145.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 62.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.53, 61.77, 0.0, 0.0, 87.37, 0.0, 85.9, 64.63, 0.0, 58.89, 53.47, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.24, 0.45, 2.91, 0.31, 0.23, 1.17, -0.41, 0.75, 0.49, 1.44, 2.92, 0.42, 0.23, 0.41, 0.22, 1.42, 1.22, 1.35, -0.03, 0.72, 1.54, 0.64, 1.75, 2.3, 3.4, -0.39, 1.08, 9.95, 1.01, 5.44, 2.1, 0.33, 12.16, 4.46, 1.35, -0.01]} \ No newline at end of file diff --git a/annotations_filtered/qvFBGYjAXW8_filtered.json b/annotations_filtered/qvFBGYjAXW8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..14683103c7e6224b313088ac5deabfbc5b0d1788 --- /dev/null +++ b/annotations_filtered/qvFBGYjAXW8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.79], [20.0, 20.44], [21.0, 21.0], [22.0, 22.25], [27.0, 30.75], [50.0, 51.29], [56.0, 57.74], [60.0, 61.11], [62.0, 64.57], [65.0, 66.83], [68.0, 70.97], [73.0, 74.28], [78.0, 78.21], [79.0, 81.6], [82.0, 86.7], [88.0, 89.43], [90.0, 99.98], [103.0, 110.37], [112.0, 112.9], [118.0, 121.69], [141.0, 152.51], [156.0, 155.85]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false, false, false, true, false, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 39.47, 0.0, 0.0, 0.0, 49.64, 0.0, 48.27, 0.0, 0.0, 63.85, 30.9, 0.0, 30.87, 30.73, 0.0, 32.42, 30.47, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 67.0], ["speech", 11.22], ["drum machine", 2.85]], null, null, null, [["music", 30.88], ["speech", 29.25], ["musical instrument", 6.1]], null, [["music", 33.81], ["guitar", 12.96], ["speech", 11.38]], null, null, null, [["music", 52.38], ["speech", 12.15], ["drum", 4.84]], null, [["music", 38.35], ["groan", 12.07], ["whack, thwack", 10.06]], [["music", 34.69], ["speech", 29.1], ["sidetone", 7.38]], null, [["music", 59.51], ["musical instrument", 5.6], ["guitar", 2.71]], [["music", 71.72], ["speech", 5.47], ["musical instrument", 1.92]], null], "duration": [1.79, 0.44, 0.0, 0.25, 3.75, 1.29, 1.74, 1.11, 2.57, 1.83, 2.97, 1.28, 0.21, 2.6, 4.7, 1.43, 9.98, 7.37, 0.9, 3.69, 11.51, -0.15]} \ No newline at end of file diff --git a/annotations_filtered/qvFduxMK7zo_filtered.json b/annotations_filtered/qvFduxMK7zo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d593cf832eb893eede535398d98e7fcc9ff66ec --- /dev/null +++ b/annotations_filtered/qvFduxMK7zo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.56], [9.0, 8.68], [10.0, 10.03], [12.0, 11.58], [14.0, 13.71], [17.0, 17.63], [24.0, 25.2], [27.0, 27.6], [35.0, 34.92], [37.0, 48.27], [52.0, 52.15], [55.0, 55.51], [58.0, 58.73], [63.0, 63.21], [66.0, 79.37], [80.0, 80.43], [81.0, 82.14]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.02, 0.0, 0.0, 0.0, 0.0, 32.31, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 36.06], ["speech", 17.82], ["mains hum", 11.72]], null, null, null, null, [["music", 29.9], ["synthesizer", 11.36], ["theremin", 10.98]], null, null], "duration": [0.56, -0.32, 0.03, -0.42, -0.29, 0.63, 1.2, 0.6, -0.08, 11.27, 0.15, 0.51, 0.73, 0.21, 13.37, 0.43, 1.14]} \ No newline at end of file diff --git a/annotations_filtered/qv_DJYvELTQ_filtered.json b/annotations_filtered/qv_DJYvELTQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70b16399f661c36df8f840473427a17efc95f8bf --- /dev/null +++ b/annotations_filtered/qv_DJYvELTQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 19.97], [21.0, 21.76], [26.0, 26.77], [29.0, 30.01], [35.0, 39.8], [41.0, 42.62], [43.0, 45.71], [47.0, 47.85], [48.0, 51.31], [52.0, 58.21], [60.0, 60.61], [62.0, 63.07], [66.0, 69.8], [71.0, 73.31], [74.0, 74.63], [76.0, 77.45], [83.0, 84.23], [86.0, 87.91], [91.0, 92.21], [96.0, 98.37], [102.0, 112.41], [115.0, 116.41], [119.0, 119.87], [121.0, 121.88], [130.0, 132.48], [133.0, 137.19], [137.0, 137.52], [138.0, 144.98], [147.0, 160.89], [165.0, 167.9], [168.0, 170.18], [172.0, 174.65]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, true, true, true], "silence_prob": [33.56, 0.0, 0.0, 0.0, 66.76, 0.0, 36.61, 0.0, 68.8, 39.8, 0.0, 0.0, 41.52, 36.42, 0.0, 0.0, 0.0, 0.0, 0.0, 62.47, 40.48, 0.0, 0.0, 0.0, 53.65, 29.99, 0.0, 29.41, 36.98, 40.38, 41.18, 30.03], "audiomae_on_audioset": [[["hum", 59.61], ["mains hum", 30.69], ["throbbing", 6.75]], null, null, null, null, null, [["hum", 21.3], ["whale vocalization", 17.31], ["cattle, bovinae", 11.52]], null, null, [["speech", 75.62], ["sidetone", 7.96], ["radio", 2.77]], null, null, [["stomach rumble", 45.24], ["speech", 17.37], ["whale vocalization", 7.16]], [["sidetone", 69.1], ["hum", 9.0], ["music", 5.58]], null, null, null, null, null, null, [["hum", 41.62], ["speech", 25.15], ["mains hum", 7.49]], null, null, null, null, [["speech", 32.58], ["bee, wasp, etc.", 9.01], ["fly, housefly", 7.14]], null, [["speech", 43.04], ["animal", 9.46], ["outside, rural or natural", 5.1]], [["hum", 41.38], ["throbbing", 29.67], ["music", 6.03]], [["speech", 31.53], ["gong", 11.36], ["hum", 8.96]], [["speech", 36.86], ["hum", 20.67], ["whale vocalization", 8.56]], [["speech", 64.04], ["outside, rural or natural", 3.24], ["rumble", 2.01]]], "duration": [7.97, 0.76, 0.77, 1.01, 4.8, 1.62, 2.71, 0.85, 3.31, 6.21, 0.61, 1.07, 3.8, 2.31, 0.63, 1.45, 1.23, 1.91, 1.21, 2.37, 10.41, 1.41, 0.87, 0.88, 2.48, 4.19, 0.52, 6.98, 13.89, 2.9, 2.18, 2.65]} \ No newline at end of file diff --git a/annotations_filtered/qvo_HDqOKww_filtered.json b/annotations_filtered/qvo_HDqOKww_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..747ff67b60a0b75ce278aea2bbe88cd55a49c60d --- /dev/null +++ b/annotations_filtered/qvo_HDqOKww_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.24], [9.0, 10.39], [17.0, 17.34], [23.0, 23.6], [28.0, 32.29], [35.0, 37.4], [38.0, 37.96], [39.0, 39.39], [41.0, 43.01], [43.0, 48.59], [50.0, 54.3], [56.0, 56.81], [59.0, 58.83], [64.0, 65.06], [66.0, 68.4], [70.0, 73.5], [75.0, 77.04], [77.0, 78.41], [81.0, 82.17], [91.0, 91.61], [108.0, 108.94], [112.0, 114.1], [120.0, 121.04], [122.0, 123.52], [131.0, 133.02], [135.0, 138.67]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 44.18, 83.16, 0.0, 0.0, 99.97, 83.34, 96.04, 0.0, 0.0, 0.0, 87.0, 64.63, 67.13, 0.0, 0.0, 0.0, 0.0, 50.06, 0.0, 0.0, 56.86, 63.21], "audiomae_on_audioset": [null, null, null, null, [["speech", 59.48], ["sidetone", 5.02], ["music", 3.83]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.24, 1.39, 0.34, 0.6, 4.29, 2.4, -0.04, 0.39, 2.01, 5.59, 4.3, 0.81, -0.17, 1.06, 2.4, 3.5, 2.04, 1.41, 1.17, 0.61, 0.94, 2.1, 1.04, 1.52, 2.02, 3.67]} \ No newline at end of file diff --git a/annotations_filtered/qvvcVzNqXVg_filtered.json b/annotations_filtered/qvvcVzNqXVg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41e68efb62a36ca80d35b4887087d928722a7499 --- /dev/null +++ b/annotations_filtered/qvvcVzNqXVg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.49], [32.0, 35.6], [37.0, 37.62], [52.0, 52.14], [53.0, 54.04], [76.0, 76.33], [88.0, 90.91], [92.0, 92.18], [97.0, 98.58], [100.0, 100.77], [101.0, 103.0], [107.0, 109.44], [110.0, 110.57], [119.0, 120.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 33.06, 0.0, 0.0, 0.0, 0.0, 72.31, 0.0, 0.0, 0.0, 53.16, 34.57, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 72.92], ["boing", 4.02], ["snicker", 3.92]], null, null, null, null, null, null, null, null, null, [["music", 57.44], ["synthesizer", 3.97], ["musical instrument", 3.64]], null, null], "duration": [0.49, 3.6, 0.62, 0.14, 1.04, 0.33, 2.91, 0.18, 1.58, 0.77, 2.0, 2.44, 0.57, 1.92]} \ No newline at end of file diff --git a/annotations_filtered/qvwHppI95K0_filtered.json b/annotations_filtered/qvwHppI95K0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..61a661b1615436021ee661b6b17236f71ac36ebc --- /dev/null +++ b/annotations_filtered/qvwHppI95K0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.69], [14.0, 14.67], [17.0, 17.63], [18.0, 19.7], [21.0, 22.08], [23.0, 23.28], [24.0, 24.38], [25.0, 26.22], [33.0, 33.39], [34.0, 34.47], [38.0, 38.69], [40.0, 41.03], [48.0, 48.22], [53.0, 53.74], [55.0, 55.02], [64.0, 63.83], [65.0, 65.79], [67.0, 68.69], [70.0, 70.56], [72.0, 86.71], [92.0, 92.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.63, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 50.09], ["hum", 5.1], ["throbbing", 4.85]], null], "duration": [0.69, 0.67, 0.63, 1.7, 1.08, 0.28, 0.38, 1.22, 0.39, 0.47, 0.69, 1.03, 0.22, 0.74, 0.02, -0.17, 0.79, 1.69, 0.56, 14.71, 0.38]} \ No newline at end of file diff --git a/annotations_filtered/qw0kuEG7NR8_filtered.json b/annotations_filtered/qw0kuEG7NR8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..54f69cf3c3b940e94c7d6c8f3539d3c018f9576e --- /dev/null +++ b/annotations_filtered/qw0kuEG7NR8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.93], [17.0, 17.81], [23.0, 23.4], [24.0, 24.65], [26.0, 26.01], [27.0, 28.24], [30.0, 30.64], [32.0, 32.7], [35.0, 36.9], [38.0, 38.8], [40.0, 44.98], [46.0, 47.33], [48.0, 55.71], [57.0, 60.32], [62.0, 63.42], [64.0, 68.12], [70.0, 71.05], [72.0, 75.05], [76.0, 78.14], [79.0, 80.94], [82.0, 83.71], [89.0, 90.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.93, 0.0, 50.71, 79.41, 0.0, 70.44, 0.0, 65.2, 58.98, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["crushing", 36.59], ["sidetone", 11.63], ["sine wave", 8.66]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.93, 0.81, 0.4, 0.65, 0.01, 1.24, 0.64, 0.7, 1.9, 0.8, 4.98, 1.33, 7.71, 3.32, 1.42, 4.12, 1.05, 3.05, 2.14, 1.94, 1.71, 1.14]} \ No newline at end of file diff --git a/annotations_filtered/qwMmxh3r8YM_filtered.json b/annotations_filtered/qwMmxh3r8YM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c6b12b7bb191764f9dec7c1cb039dff3cec557b2 --- /dev/null +++ b/annotations_filtered/qwMmxh3r8YM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.65], [5.0, 8.82], [12.0, 41.5], [44.0, 47.7], [50.0, 54.73], [57.0, 58.45], [61.0, 62.31], [65.0, 80.32], [85.0, 87.78], [90.0, 91.45], [94.0, 95.77], [97.0, 107.16], [111.0, 111.48], [118.0, 121.71]], "keep_status": [false, false, false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 93.13, 39.46, 49.68, 40.16, 0.0, 0.0, 56.48, 100.0, 0.0, 0.0, 99.99, 0.0, 100.0], "audiomae_on_audioset": [null, null, [["music", 48.17], ["theremin", 32.31], ["synthesizer", 4.2]], [["music", 50.05], ["theremin", 5.31], ["hum", 4.68]], [["music", 57.43], ["mains hum", 6.23], ["hum", 6.22]], null, null, null, null, null, null, null, null, null], "duration": [-0.35, 3.82, 29.5, 3.7, 4.73, 1.45, 1.31, 15.32, 2.78, 1.45, 1.77, 10.16, 0.48, 3.71]} \ No newline at end of file diff --git a/annotations_filtered/qwUgyrgP9H4_filtered.json b/annotations_filtered/qwUgyrgP9H4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a69fc6ba34d62d2abc673d080e33ae045717ec6b --- /dev/null +++ b/annotations_filtered/qwUgyrgP9H4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.39], [10.0, 10.03], [33.0, 34.08], [44.0, 45.25], [46.0, 46.94], [47.0, 48.78], [50.0, 51.75], [55.0, 55.46], [64.0, 64.22], [66.0, 66.82], [69.0, 69.72], [73.0, 73.36], [87.0, 88.01], [89.0, 89.5], [90.0, 89.97], [100.0, 100.53], [101.0, 101.66], [102.0, 103.08], [105.0, 107.33], [124.0, 123.94], [130.0, 132.73], [143.0, 143.07], [145.0, 144.9], [145.0, 145.37], [146.0, 146.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.83, 0.0, 94.81, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.39, 0.03, 1.08, 1.25, 0.94, 1.78, 1.75, 0.46, 0.22, 0.82, 0.72, 0.36, 1.01, 0.5, -0.03, 0.53, 0.66, 1.08, 2.33, -0.06, 2.73, 0.07, -0.1, 0.37, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/qwwLKFCR4K0_filtered.json b/annotations_filtered/qwwLKFCR4K0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..53ceac545e0e1a5c711887a802b257c09ae6c905 --- /dev/null +++ b/annotations_filtered/qwwLKFCR4K0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 27.09]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [1.09]} \ No newline at end of file diff --git a/annotations_filtered/qxFHPIFGFmk_filtered.json b/annotations_filtered/qxFHPIFGFmk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9486fe496ee0139ff45fc2c7a670ffb6cf141b7 --- /dev/null +++ b/annotations_filtered/qxFHPIFGFmk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.43], [10.0, 10.5], [11.0, 11.84], [16.0, 16.39], [17.0, 20.55], [22.0, 23.4], [24.0, 36.98], [38.0, 39.65], [43.0, 79.12], [84.0, 91.79], [93.0, 94.85], [95.0, 96.43], [99.0, 98.85], [107.0, 107.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 54.76, 0.0, 33.82, 0.0, 0.0, 61.87, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["fart", 49.66], ["mosquito", 10.84], ["speech", 10.56]], null, null, null, null, null, null, null], "duration": [0.43, 0.5, 0.84, 0.39, 3.55, 1.4, 12.98, 1.65, 36.12, 7.79, 1.85, 1.43, -0.15, 0.67]} \ No newline at end of file diff --git a/annotations_filtered/qyLJCNyRov0_filtered.json b/annotations_filtered/qyLJCNyRov0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e8fb2a63566ff457202c07571bc9ae88c125d756 --- /dev/null +++ b/annotations_filtered/qyLJCNyRov0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.47], [22.0, 23.8], [26.0, 25.91], [28.0, 31.19], [36.0, 39.41], [43.0, 47.68], [52.0, 53.13], [61.0, 60.96], [62.0, 66.75], [75.0, 76.6], [80.0, 82.46]], "keep_status": [false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 50.16, 40.84, 34.32, 0.0, 0.0, 30.07, 0.0, 45.88], "audiomae_on_audioset": [null, null, null, null, [["music", 57.04], ["musical instrument", 7.59], ["guitar", 1.99]], [["music", 57.04], ["speech", 19.02], ["musical instrument", 3.0]], null, null, [["music", 35.23], ["speech", 34.14], ["explosion", 5.86]], null, [["speech", 16.13], ["fart", 15.82], ["music", 7.04]]], "duration": [0.47, 1.8, -0.09, 3.19, 3.41, 4.68, 1.13, -0.04, 4.75, 1.6, 2.46]} \ No newline at end of file diff --git a/annotations_filtered/qyMVXU7qMGw_filtered.json b/annotations_filtered/qyMVXU7qMGw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45c3615db47396686849f44492aaf971172e7bcf --- /dev/null +++ b/annotations_filtered/qyMVXU7qMGw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.57], [6.0, 8.16], [9.0, 16.82], [18.0, 19.99], [27.0, 28.93], [29.0, 33.03], [43.0, 43.95], [44.0, 55.9], [56.0, 60.64], [62.0, 65.13], [65.0, 67.51], [74.0, 89.04], [89.0, 89.07], [90.0, 91.67], [92.0, 95.84], [97.0, 97.04], [97.0, 98.36], [100.0, 108.11], [110.0, 119.82], [121.0, 125.74], [126.0, 132.16], [133.0, 134.55], [138.0, 142.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 79.94, 46.47, 0.0, 0.0, 87.74, 0.0, 96.04, 46.61, 75.39, 80.64, 45.59, 0.0, 0.0, 44.66, 0.0, 0.0, 53.53, 55.11, 42.81, 81.0, 0.0, 57.89], "audiomae_on_audioset": [null, null, [["hum", 56.45], ["mains hum", 24.17], ["throbbing", 7.56]], null, null, null, null, null, [["speech", 67.05], ["hum", 5.46], ["echo", 3.94]], null, null, [["music", 49.62], ["hum", 7.93], ["effects unit", 5.99]], null, null, [["hum", 22.38], ["music", 21.69], ["throbbing", 14.57]], null, null, null, null, [["music", 62.66], ["speech", 5.96], ["guitar", 4.2]], null, null, null], "duration": [0.57, 2.16, 7.82, 1.99, 1.93, 4.03, 0.95, 11.9, 4.64, 3.13, 2.51, 15.04, 0.07, 1.67, 3.84, 0.04, 1.36, 8.11, 9.82, 4.74, 6.16, 1.55, 4.32]} \ No newline at end of file diff --git a/annotations_filtered/qyXpj-yVjVg_filtered.json b/annotations_filtered/qyXpj-yVjVg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..78a1e6018baf2142831163b0640a1bc6518851e4 --- /dev/null +++ b/annotations_filtered/qyXpj-yVjVg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 20.98], [21.0, 27.57], [28.0, 31.48], [32.0, 36.78], [38.0, 39.41], [40.0, 41.89], [47.0, 49.06], [51.0, 51.09], [54.0, 55.8], [57.0, 58.89], [61.0, 60.62], [64.0, 68.91], [70.0, 72.42], [76.0, 77.3], [79.0, 80.86], [82.0, 82.26], [84.0, 85.77], [87.0, 87.44], [88.0, 88.86], [90.0, 90.21], [92.0, 92.64], [93.0, 93.75], [96.0, 97.09], [101.0, 106.81], [108.0, 109.11], [111.0, 112.16], [113.0, 112.95], [113.0, 114.24], [115.0, 116.36], [117.0, 118.67], [120.0, 120.85], [123.0, 123.58], [124.0, 124.88], [127.0, 127.45], [129.0, 129.05], [130.0, 131.31], [133.0, 133.79], [134.0, 134.96], [136.0, 136.61], [138.0, 138.3], [141.0, 142.82]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [42.62, 51.82, 77.53, 88.83, 0.0, 0.0, 81.53, 0.0, 0.0, 0.0, 0.0, 46.61, 58.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 47.4], ["speech", 12.35], ["door", 3.9]], null, null, null, null, null, null, null, null, null, null, [["music", 30.33], ["didgeridoo", 14.43], ["mains hum", 12.81]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.98, 6.57, 3.48, 4.78, 1.41, 1.89, 2.06, 0.09, 1.8, 1.89, -0.38, 4.91, 2.42, 1.3, 1.86, 0.26, 1.77, 0.44, 0.86, 0.21, 0.64, 0.75, 1.09, 5.81, 1.11, 1.16, -0.05, 1.24, 1.36, 1.67, 0.85, 0.58, 0.88, 0.45, 0.05, 1.31, 0.79, 0.96, 0.61, 0.3, 1.82]} \ No newline at end of file diff --git a/annotations_filtered/qyZXW5Md1HM_filtered.json b/annotations_filtered/qyZXW5Md1HM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8bbe14f204df4538ff2ec3aa8910a949f1732a8c --- /dev/null +++ b/annotations_filtered/qyZXW5Md1HM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 26.55], [27.0, 28.75], [31.0, 38.62], [50.0, 49.72], [50.0, 53.33], [58.0, 57.94], [64.0, 79.46], [80.0, 94.53], [98.0, 113.53], [115.0, 144.07]], "keep_status": [true, false, false, false, true, false, false, true, false, false], "silence_prob": [30.57, 0.0, 32.53, 0.0, 31.59, 0.0, 31.48, 46.4, 62.07, 36.86], "audiomae_on_audioset": [[["music", 29.42], ["grunt", 12.8], ["speech", 11.34]], null, [["music", 67.53], ["plop", 16.94], ["bass guitar", 2.01]], null, [["speech", 30.63], ["music", 13.24], ["cattle, bovinae", 12.34]], null, [["music", 85.83], ["plop", 1.82], ["bass guitar", 1.11]], [["speech", 14.72], ["hoot", 7.95], ["whimper", 6.41]], null, [["dial tone", 49.58], ["busy signal", 17.26], ["music", 10.29]]], "duration": [3.55, 1.75, 7.62, -0.28, 3.33, -0.06, 15.46, 14.53, 15.53, 29.07]} \ No newline at end of file diff --git a/annotations_filtered/qy_ZclSCUwA_filtered.json b/annotations_filtered/qy_ZclSCUwA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..30a4fb779010697ea2903bc85b18f8f7ed11bcf2 --- /dev/null +++ b/annotations_filtered/qy_ZclSCUwA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.07], [18.0, 21.95], [26.0, 26.37], [28.0, 41.13], [41.0, 42.28], [46.0, 46.95], [48.0, 59.39], [61.0, 68.81], [69.0, 74.82], [81.0, 81.26], [85.0, 89.51], [90.0, 98.51], [102.0, 118.89], [125.0, 127.9], [136.0, 144.27], [145.0, 149.82], [152.0, 152.79], [156.0, 157.25], [160.0, 162.43], [167.0, 170.75], [176.0, 184.38], [186.0, 190.38], [194.0, 196.7]], "keep_status": [false, false, false, true, false, false, true, false, true, false, true, false, false, false, true, true, false, false, true, true, true, false, false], "silence_prob": [0.0, 31.0, 0.0, 30.35, 0.0, 0.0, 31.01, 31.16, 31.55, 0.0, 31.84, 31.31, 32.88, 39.54, 40.29, 36.3, 0.0, 0.0, 32.06, 31.75, 29.83, 32.43, 38.49], "audiomae_on_audioset": [null, [["fart", 54.85], ["fly, housefly", 17.27], ["insect", 9.35]], null, [["music", 38.69], ["speech", 19.89], ["sidetone", 9.22]], null, null, [["music", 44.44], ["speech", 18.58], ["musical instrument", 2.55]], [["music", 42.37], ["speech", 27.1], ["foghorn", 4.48]], [["speech", 53.0], ["music", 5.05], ["moo", 2.49]], null, [["music", 50.38], ["trombone", 5.55], ["speech", 5.52]], [["speech", 77.8], ["sidetone", 2.17], ["explosion", 2.09]], [["speech", 71.02], ["hubbub, speech noise, speech babble", 3.5], ["explosion", 2.27]], [["speech", 49.14], ["radio", 15.38], ["aircraft", 9.74]], [["speech", 19.91], ["music", 17.41], ["gurgling", 5.12]], [["music", 26.96], ["speech", 16.33], ["livestock, farm animals, working animals", 7.98]], null, null, [["music", 18.29], ["hum", 6.27], ["didgeridoo", 5.85]], [["speech", 34.14], ["music", 10.29], ["crowd", 8.24]], [["theremin", 33.59], ["music", 19.29], ["synthesizer", 4.26]], [["theremin", 88.3], ["music", 8.43], ["musical instrument", 1.18]], [["music", 55.79], ["hum", 9.18], ["noise", 5.7]]], "duration": [1.07, 3.95, 0.37, 13.13, 1.28, 0.95, 11.39, 7.81, 5.82, 0.26, 4.51, 8.51, 16.89, 2.9, 8.27, 4.82, 0.79, 1.25, 2.43, 3.75, 8.38, 4.38, 2.7]} \ No newline at end of file diff --git a/annotations_filtered/qyj1tT-vqSQ_filtered.json b/annotations_filtered/qyj1tT-vqSQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f2f14f3c530e400ed0395c25802d06fab62435a9 --- /dev/null +++ b/annotations_filtered/qyj1tT-vqSQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.46], [9.0, 9.34], [10.0, 13.44], [15.0, 14.94], [15.0, 16.16], [17.0, 17.05], [18.0, 23.57], [24.0, 24.98], [25.0, 29.37], [30.0, 56.78], [58.0, 62.67]], "keep_status": [false, false, true, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 35.4, 0.0, 0.0, 0.0, 49.31, 0.0, 44.66, 68.15, 66.27], "audiomae_on_audioset": [null, null, [["livestock, farm animals, working animals", 26.23], ["cattle, bovinae", 9.99], ["cowbell", 7.83]], null, null, null, [["coin (dropping)", 22.27], ["speech", 14.44], ["crushing", 10.86]], null, [["music", 23.02], ["speech", 19.01], ["didgeridoo", 4.18]], null, null], "duration": [0.46, 0.34, 3.44, -0.06, 1.16, 0.05, 5.57, 0.98, 4.37, 26.78, 4.67]} \ No newline at end of file diff --git a/annotations_filtered/qyvR5lglbTE_filtered.json b/annotations_filtered/qyvR5lglbTE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7289cad99be09eb2dd88121764ae56cf906e3aa1 --- /dev/null +++ b/annotations_filtered/qyvR5lglbTE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.76], [3.0, 3.64], [4.0, 5.85], [7.0, 9.05], [10.0, 23.97], [25.0, 25.78], [26.0, 35.67], [36.0, 54.36]], "keep_status": [false, false, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 49.36, 28.43, 0.0, 29.09, 28.91], "audiomae_on_audioset": [null, null, null, [["music", 59.81], ["throbbing", 5.3], ["synthesizer", 3.89]], [["vehicle", 43.56], ["speech", 15.69], ["car", 15.03]], null, [["speech", 56.86], ["hum", 12.94], ["music", 10.87]], [["speech", 23.82], ["music", 18.31], ["mains hum", 10.52]]], "duration": [0.76, 0.64, 1.85, 2.05, 13.97, 0.78, 9.67, 18.36]} \ No newline at end of file diff --git a/annotations_filtered/qz0rKdYiqDQ_filtered.json b/annotations_filtered/qz0rKdYiqDQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8a59b85d764758d2aa7e38b9c363284f58c89e4e --- /dev/null +++ b/annotations_filtered/qz0rKdYiqDQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.19], [10.0, 14.4], [16.0, 17.07], [21.0, 21.76], [24.0, 29.46], [30.0, 32.61], [34.0, 36.69], [40.0, 42.28], [56.0, 58.14], [61.0, 60.86], [62.0, 64.1], [65.0, 68.27], [70.0, 70.07], [71.0, 71.46], [75.0, 77.21], [78.0, 81.84], [83.0, 89.73], [91.0, 92.23], [93.0, 94.24], [95.0, 96.97], [98.0, 98.46], [100.0, 107.86], [109.0, 112.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false, true, false], "silence_prob": [64.86, 63.74, 0.0, 0.0, 37.59, 36.07, 38.87, 41.48, 41.44, 0.0, 44.9, 56.25, 0.0, 0.0, 37.13, 42.79, 39.69, 0.0, 0.0, 0.0, 0.0, 40.19, 62.17], "audiomae_on_audioset": [null, null, null, null, [["music", 34.54], ["singing bowl", 30.99], ["speech", 8.9]], [["music", 35.99], ["speech", 27.23], ["theremin", 8.13]], [["music", 59.78], ["singing bowl", 14.14], ["crow", 2.72]], [["music", 70.42], ["theremin", 4.58], ["singing bowl", 3.0]], [["music", 47.03], ["theremin", 18.59], ["singing bowl", 6.94]], null, [["music", 58.36], ["singing bowl", 10.65], ["musical instrument", 3.49]], null, null, null, [["cattle, bovinae", 22.46], ["moo", 20.79], ["music", 15.24]], [["music", 21.25], ["moo", 4.43], ["cattle, bovinae", 4.33]], [["music", 32.5], ["speech", 16.02], ["knock", 9.04]], null, null, null, null, [["music", 32.8], ["noise", 8.78], ["breaking", 6.73]], null], "duration": [2.19, 4.4, 1.07, 0.76, 5.46, 2.61, 2.69, 2.28, 2.14, -0.14, 2.1, 3.27, 0.07, 0.46, 2.21, 3.84, 6.73, 1.23, 1.24, 1.97, 0.46, 7.86, 3.4]} \ No newline at end of file diff --git a/annotations_filtered/qzQdwPNUcME_filtered.json b/annotations_filtered/qzQdwPNUcME_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9f9ce998f314abdcb314f14189ef6fbe11f4fb6 --- /dev/null +++ b/annotations_filtered/qzQdwPNUcME_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 13.24], [16.0, 17.24], [18.0, 18.44], [34.0, 37.25], [38.0, 38.25], [40.0, 50.31], [51.0, 53.4], [53.0, 54.94], [56.0, 57.42], [81.0, 81.58], [82.0, 82.75], [83.0, 83.52], [85.0, 85.68], [87.0, 86.66], [87.0, 88.65], [89.0, 90.12], [91.0, 94.04], [98.0, 99.2], [104.0, 104.68], [134.0, 134.94], [149.0, 150.42], [151.0, 153.2], [156.0, 156.83], [158.0, 162.77], [164.0, 166.04]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [47.9, 0.0, 0.0, 31.98, 0.0, 74.76, 53.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.46, 0.0, 0.0, 0.0, 0.0, 29.23, 0.0, 27.91, 64.29], "audiomae_on_audioset": [[["fart", 75.97], ["noise", 5.7], ["speech", 5.22]], null, null, [["moo", 23.12], ["speech", 20.34], ["cattle, bovinae", 20.09]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 68.28], ["didgeridoo", 12.6], ["musical instrument", 2.95]], null, [["speech", 39.2], ["screaming", 10.7], ["explosion", 5.85]], null], "duration": [7.24, 1.24, 0.44, 3.25, 0.25, 10.31, 2.4, 1.94, 1.42, 0.58, 0.75, 0.52, 0.68, -0.34, 1.65, 1.12, 3.04, 1.2, 0.68, 0.94, 1.42, 2.2, 0.83, 4.77, 2.04]} \ No newline at end of file diff --git a/annotations_filtered/qzZegCkbJAw_filtered.json b/annotations_filtered/qzZegCkbJAw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..afa1d109b00cb60673b7fd84dfb58b28d7b8c732 --- /dev/null +++ b/annotations_filtered/qzZegCkbJAw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.26], [11.0, 11.31], [13.0, 13.44], [16.0, 17.24], [20.0, 20.78], [24.0, 31.36], [39.0, 43.78], [45.0, 46.21], [48.0, 62.51], [67.0, 73.85], [76.0, 92.26], [95.0, 101.83], [103.0, 103.62], [108.0, 109.58], [117.0, 116.68], [119.0, 120.85], [123.0, 125.05]], "keep_status": [false, false, false, false, false, true, false, false, true, true, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 27.97, 28.1, 0.0, 28.17, 28.43, 28.24, 28.12, 0.0, 0.0, 0.0, 0.0, 28.01], "audiomae_on_audioset": [null, null, null, null, null, [["music", 27.25], ["hum", 16.38], ["rumble", 6.41]], [["clang", 78.87], ["ding", 8.11], ["sound effect", 1.35]], null, [["music", 51.57], ["speech", 13.54], ["hum", 3.81]], [["mains hum", 15.82], ["hum", 14.63], ["rumble", 12.31]], [["music", 19.75], ["mains hum", 16.08], ["hum", 10.22]], [["music", 74.38], ["grunt", 7.94], ["sound effect", 3.31]], null, null, null, null, [["livestock, farm animals, working animals", 15.02], ["cattle, bovinae", 13.32], ["moo", 11.87]]], "duration": [0.26, 0.31, 0.44, 1.24, 0.78, 7.36, 4.78, 1.21, 14.51, 6.85, 16.26, 6.83, 0.62, 1.58, -0.32, 1.85, 2.05]} \ No newline at end of file diff --git a/annotations_filtered/qzayNPEmoK0_filtered.json b/annotations_filtered/qzayNPEmoK0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af02662252a85fd21b55647c18ab4054584fb91f --- /dev/null +++ b/annotations_filtered/qzayNPEmoK0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.04], [6.0, 7.18], [10.0, 14.28], [17.0, 17.34], [18.0, 19.97], [21.0, 21.71], [31.0, 31.02], [34.0, 33.96], [36.0, 38.72], [43.0, 51.0], [53.0, 60.72], [71.0, 72.08], [73.0, 74.9], [79.0, 80.47], [82.0, 84.4]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 78.04, 0.0, 0.0, 0.0, 0.0, 0.0, 84.98, 38.66, 37.85, 0.0, 0.0, 0.0, 50.02], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 34.25], ["speech", 13.19], ["hum", 12.39]], [["music", 30.64], ["speech", 11.82], ["thunk", 9.87]], null, null, null, null], "duration": [1.04, 1.18, 4.28, 0.34, 1.97, 0.71, 0.02, -0.04, 2.72, 8.0, 7.72, 1.08, 1.9, 1.47, 2.4]} \ No newline at end of file diff --git a/annotations_filtered/r-IE6wNNbAI_filtered.json b/annotations_filtered/r-IE6wNNbAI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c5b3eef65f108ab4bfaf462efb7520529345f1ee --- /dev/null +++ b/annotations_filtered/r-IE6wNNbAI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.43], [4.0, 5.86], [9.0, 10.49], [11.0, 10.93], [24.0, 24.56], [42.0, 47.68], [49.0, 50.75], [52.0, 54.01], [61.0, 60.91], [64.0, 72.03], [73.0, 75.66], [85.0, 105.49], [106.0, 106.61], [108.0, 119.53], [121.0, 122.62], [124.0, 136.93], [138.0, 140.34], [142.0, 154.62]], "keep_status": [false, false, false, false, false, true, false, false, false, true, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 35.66, 0.0, 37.67, 0.0, 31.79, 33.31, 35.22, 0.0, 31.71, 0.0, 33.06, 37.46, 30.36], "audiomae_on_audioset": [null, null, null, null, null, [["music", 20.35], ["speech", 17.84], ["didgeridoo", 13.13]], null, [["music", 79.07], ["musical instrument", 2.48], ["throbbing", 1.94]], null, [["music", 40.14], ["moo", 9.52], ["cattle, bovinae", 8.01]], [["music", 35.19], ["speech", 8.9], ["carnatic music", 4.34]], [["music", 84.39], ["reggae", 1.01], ["funny music", 0.84]], null, [["music", 41.49], ["buzz", 28.27], ["breaking", 9.09]], null, [["music", 62.76], ["speech", 16.05], ["boing", 2.68]], [["music", 68.05], ["speech", 4.58], ["electronic music", 2.4]], [["music", 49.29], ["hum", 13.3], ["throbbing", 6.96]]], "duration": [0.43, 1.86, 1.49, -0.07, 0.56, 5.68, 1.75, 2.01, -0.09, 8.03, 2.66, 20.49, 0.61, 11.53, 1.62, 12.93, 2.34, 12.62]} \ No newline at end of file diff --git a/annotations_filtered/r-ddXOrPiZ0_filtered.json b/annotations_filtered/r-ddXOrPiZ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e71b7a82a54c6991b5c57e78031413a9ad7a83c8 --- /dev/null +++ b/annotations_filtered/r-ddXOrPiZ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 19.14], [21.0, 22.76], [24.0, 27.48], [28.0, 32.05], [32.0, 64.05], [64.0, 67.95], [69.0, 81.65], [83.0, 125.27]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 100.0, 100.0, 0.0, 87.37, 98.44, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [4.14, 1.76, 3.48, 4.05, 32.05, 3.95, 12.65, 42.27]} \ No newline at end of file diff --git a/annotations_filtered/r-xcvVWqny0_filtered.json b/annotations_filtered/r-xcvVWqny0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb3aaed0d2fb308566e0166945d513fe4901a8dc --- /dev/null +++ b/annotations_filtered/r-xcvVWqny0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.32], [12.0, 12.23], [18.0, 17.83], [21.0, 21.69], [23.0, 23.89], [25.0, 25.62], [36.0, 40.96], [42.0, 42.62], [47.0, 50.55], [59.0, 59.76], [61.0, 66.31], [80.0, 80.72], [81.0, 89.83], [90.0, 92.62], [98.0, 108.97], [110.0, 112.02], [114.0, 121.51], [122.0, 125.96], [127.0, 131.3], [132.0, 136.76], [138.0, 138.54], [141.0, 144.91], [149.0, 149.94], [151.0, 151.56], [152.0, 152.41], [158.0, 158.95], [161.0, 162.87], [166.0, 166.78], [175.0, 176.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [59.42, 0.0, 0.0, 0.0, 0.0, 0.0, 72.01, 0.0, 91.3, 0.0, 48.02, 0.0, 94.81, 46.09, 94.52, 96.54, 87.19, 81.71, 93.29, 97.11, 0.0, 98.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 26.95], ["hum", 19.0], ["mains hum", 8.13]], null, null, [["speech", 38.9], ["music", 7.05], ["single-lens reflex camera", 2.48]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.32, 0.23, -0.17, 0.69, 0.89, 0.62, 4.96, 0.62, 3.55, 0.76, 5.31, 0.72, 8.83, 2.62, 10.97, 2.02, 7.51, 3.96, 4.3, 4.76, 0.54, 3.91, 0.94, 0.56, 0.41, 0.95, 1.87, 0.78, 1.08]} \ No newline at end of file diff --git a/annotations_filtered/r-zlkOg6_Zw_filtered.json b/annotations_filtered/r-zlkOg6_Zw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/r-zlkOg6_Zw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/r0-vDDcDUMo_filtered.json b/annotations_filtered/r0-vDDcDUMo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6e8dbc70a6fb52cb79e4c6edf41b386255786062 --- /dev/null +++ b/annotations_filtered/r0-vDDcDUMo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.13], [3.0, 9.56], [10.0, 10.88], [11.0, 21.61], [22.0, 23.99], [25.0, 34.99], [36.0, 44.22], [47.0, 49.82], [50.0, 51.12], [55.0, 65.26], [67.0, 66.77], [68.0, 68.08], [73.0, 76.06], [88.0, 92.48], [94.0, 106.34], [108.0, 111.1]], "keep_status": [false, false, false, false, false, false, true, true, false, true, false, false, true, true, false, false], "silence_prob": [0.0, 53.47, 0.0, 58.64, 0.0, 44.49, 45.43, 32.42, 0.0, 32.78, 0.0, 0.0, 36.67, 49.45, 56.25, 90.08], "audiomae_on_audioset": [null, null, null, null, null, [["sidetone", 69.36], ["hum", 5.83], ["speech", 5.48]], [["speech", 28.68], ["mains hum", 9.27], ["hum", 8.72]], [["speech", 31.57], ["music", 29.74], ["musical instrument", 4.99]], null, [["music", 35.02], ["speech", 18.91], ["hum", 9.39]], null, null, [["speech", 42.29], ["music", 14.44], ["didgeridoo", 6.08]], [["music", 19.55], ["hum", 11.99], ["mains hum", 11.43]], null, null], "duration": [0.13, 6.56, 0.88, 10.61, 1.99, 9.99, 8.22, 2.82, 1.12, 10.26, -0.23, 0.08, 3.06, 4.48, 12.34, 3.1]} \ No newline at end of file diff --git a/annotations_filtered/r0Iq2_euH44_filtered.json b/annotations_filtered/r0Iq2_euH44_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..292700d2e97656455bf4adb66e8af04ad533f40e --- /dev/null +++ b/annotations_filtered/r0Iq2_euH44_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.94], [17.0, 17.09], [17.0, 17.12], [17.0, 19.21], [21.0, 41.96], [46.0, 46.75], [50.0, 51.83], [62.0, 63.44], [88.0, 88.03], [98.0, 99.72]], "keep_status": [true, false, false, true, false, false, false, false, false, false], "silence_prob": [49.04, 0.0, 0.0, 38.55, 34.88, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["yodeling", 13.3], ["music", 12.14], ["singing", 10.18]], null, null, [["music", 43.36], ["carnatic music", 7.13], ["middle eastern music", 6.09]], [["music", 77.86], ["musical instrument", 3.09], ["didgeridoo", 1.48]], null, null, null, null, null], "duration": [4.94, 0.09, 0.12, 2.21, 20.96, 0.75, 1.83, 1.44, 0.03, 1.72]} \ No newline at end of file diff --git a/annotations_filtered/r0N4KlcTSUQ_filtered.json b/annotations_filtered/r0N4KlcTSUQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..648ef56d3fc43e0a5724f56e5719f22d5a4df7a4 --- /dev/null +++ b/annotations_filtered/r0N4KlcTSUQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.59], [12.0, 12.24], [15.0, 16.29], [20.0, 19.99], [23.0, 23.65], [26.0, 27.63], [29.0, 28.88], [33.0, 35.09], [37.0, 37.3], [38.0, 39.6], [40.0, 40.93], [41.0, 42.23], [47.0, 48.42], [50.0, 50.38], [51.0, 51.7], [52.0, 52.54], [55.0, 55.85], [57.0, 57.82], [62.0, 62.77], [63.0, 64.03], [65.0, 66.14], [71.0, 74.02], [77.0, 78.92], [80.0, 80.55], [82.0, 82.81], [83.0, 84.28], [87.0, 88.26], [91.0, 93.02], [95.0, 97.26], [98.0, 98.25], [99.0, 101.73], [103.0, 103.06], [104.0, 104.67], [105.0, 105.83], [107.0, 107.67], [112.0, 117.39], [118.0, 118.69], [119.0, 120.01], [124.0, 124.14], [125.0, 125.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.34, 0.0, 0.0, 0.0, 0.0, 0.0, 73.97, 95.37, 0.0, 72.31, 0.0, 0.0, 0.0, 0.0, 98.19, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.59, 0.24, 1.29, -0.01, 0.65, 1.63, -0.12, 2.09, 0.3, 1.6, 0.93, 1.23, 1.42, 0.38, 0.7, 0.54, 0.85, 0.82, 0.77, 1.03, 1.14, 3.02, 1.92, 0.55, 0.81, 1.28, 1.26, 2.02, 2.26, 0.25, 2.73, 0.06, 0.67, 0.83, 0.67, 5.39, 0.69, 1.01, 0.14, 0.74]} \ No newline at end of file diff --git a/annotations_filtered/r0cRrtcU5X0_filtered.json b/annotations_filtered/r0cRrtcU5X0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a387d8b97195a8a2f735c17333fe12e4574d3b0b --- /dev/null +++ b/annotations_filtered/r0cRrtcU5X0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.89], [4.0, 4.19], [7.0, 6.89], [8.0, 8.68], [14.0, 13.98], [18.0, 19.04], [24.0, 24.26], [27.0, 31.16], [38.0, 39.11], [42.0, 42.06], [43.0, 46.01], [47.0, 48.19], [50.0, 52.19], [57.0, 58.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.07, 0.0, 0.0, 80.11, 0.0, 87.37, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.89, 0.19, -0.11, 0.68, -0.02, 1.04, 0.26, 4.16, 1.11, 0.06, 3.01, 1.19, 2.19, 1.58]} \ No newline at end of file diff --git a/annotations_filtered/r0eg-ieT77g_filtered.json b/annotations_filtered/r0eg-ieT77g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fd9cf3e2864417ad1775d4eaf87ce140deee02d2 --- /dev/null +++ b/annotations_filtered/r0eg-ieT77g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 11.91], [12.0, 15.62], [18.0, 22.0], [25.0, 26.4], [29.0, 35.92], [39.0, 42.72], [43.0, 46.77], [54.0, 55.38], [57.0, 60.2], [61.0, 68.17], [72.0, 71.85], [74.0, 74.66], [75.0, 83.44], [85.0, 86.53], [91.0, 96.43], [100.0, 111.27], [115.0, 135.24], [140.0, 140.86], [143.0, 144.24], [148.0, 155.34], [156.0, 161.67], [166.0, 166.06]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.05, 32.45, 31.45, 0.0, 33.91, 64.86, 36.15, 0.0, 38.75, 31.39, 0.0, 0.0, 31.13, 0.0, 31.09, 31.37, 30.38, 0.0, 0.0, 32.52, 31.25, 0.0], "audiomae_on_audioset": [[["music", 60.12], ["hum", 6.73], ["throbbing", 3.75]], [["music", 50.72], ["electronic music", 6.42], ["noise", 5.48]], [["music", 32.17], ["speech", 28.13], ["throbbing", 4.23]], null, [["music", 63.13], ["throbbing", 8.8], ["didgeridoo", 5.85]], null, [["music", 50.1], ["boing", 32.52], ["didgeridoo", 1.94]], null, [["music", 54.09], ["theremin", 22.01], ["noise", 5.21]], [["music", 85.3], ["throbbing", 3.44], ["boing", 1.71]], null, null, [["music", 58.12], ["speech", 13.35], ["sidetone", 10.57]], null, [["music", 38.52], ["hum", 17.3], ["throbbing", 15.14]], [["music", 89.05], ["electronic music", 1.4], ["throbbing", 0.89]], [["music", 63.91], ["throbbing", 8.86], ["hum", 6.64]], null, null, [["music", 61.28], ["electronic music", 10.1], ["synthesizer", 5.39]], [["sidetone", 45.35], ["music", 21.03], ["hum", 10.12]], null], "duration": [8.91, 3.62, 4.0, 1.4, 6.92, 3.72, 3.77, 1.38, 3.2, 7.17, -0.15, 0.66, 8.44, 1.53, 5.43, 11.27, 20.24, 0.86, 1.24, 7.34, 5.67, 0.06]} \ No newline at end of file diff --git a/annotations_filtered/r0ladY1kwco_filtered.json b/annotations_filtered/r0ladY1kwco_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ffeb76d7778c0a6fe3dbf4c4b8d9bc65f67f4331 --- /dev/null +++ b/annotations_filtered/r0ladY1kwco_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[57.0, 122.84]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [65.84]} \ No newline at end of file diff --git a/annotations_filtered/r12JlwSBvVQ_filtered.json b/annotations_filtered/r12JlwSBvVQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a079be838732742d5119d1132f45b07503653b42 --- /dev/null +++ b/annotations_filtered/r12JlwSBvVQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.04], [14.0, 16.68], [34.0, 42.38], [53.0, 53.74], [66.0, 68.45], [75.0, 76.27], [77.0, 80.77], [82.0, 82.93], [84.0, 85.28], [98.0, 98.63], [101.0, 102.41], [112.0, 121.58], [126.0, 126.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 68.54, 62.37, 0.0, 82.79, 0.0, 50.06, 0.0, 0.0, 0.0, 0.0, 44.43, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 71.65], ["applause", 7.29], ["male speech, man speaking", 1.36]], null], "duration": [1.04, 2.68, 8.38, 0.74, 2.45, 1.27, 3.77, 0.93, 1.28, 0.63, 1.41, 9.58, 0.06]} \ No newline at end of file diff --git a/annotations_filtered/r1N-Xby5AnA_filtered.json b/annotations_filtered/r1N-Xby5AnA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..57057f5bec4528181dfdbeb6ef82de3f716a4d3b --- /dev/null +++ b/annotations_filtered/r1N-Xby5AnA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.02], [8.0, 8.48], [11.0, 20.11], [21.0, 21.12], [23.0, 23.31], [25.0, 27.16], [29.0, 48.61], [50.0, 50.79], [52.0, 53.76], [55.0, 69.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 53.53, 0.0, 0.0, 92.8, 34.61, 0.0, 0.0, 33.16], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 74.79], ["throbbing", 2.97], ["synthesizer", 2.14]], null, null, [["music", 63.41], ["speech", 9.89], ["throbbing", 2.77]]], "duration": [0.02, 0.48, 9.11, 0.12, 0.31, 2.16, 19.61, 0.79, 1.76, 14.15]} \ No newline at end of file diff --git a/annotations_filtered/r1NUy3Rq8n4_filtered.json b/annotations_filtered/r1NUy3Rq8n4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7af9bd37bedf85f4caa919d974fcb1935f4c96c8 --- /dev/null +++ b/annotations_filtered/r1NUy3Rq8n4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.65], [21.0, 22.28], [23.0, 23.36], [41.0, 42.2], [51.0, 52.68], [54.0, 54.87], [55.0, 56.88], [59.0, 60.84], [71.0, 73.55], [74.0, 75.25], [78.0, 83.32], [86.0, 89.04], [93.0, 97.83], [99.0, 100.53]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.46, 0.0, 32.85, 33.08, 35.04, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 21.34], ["throbbing", 14.72], ["hum", 9.6]], null, [["music", 38.95], ["speech", 20.84], ["electronic music", 4.11]], [["music", 49.14], ["sidetone", 10.45], ["electronic music", 4.07]], [["music", 60.84], ["speech", 7.71], ["sidetone", 3.9]], null], "duration": [0.65, 1.28, 0.36, 1.2, 1.68, 0.87, 1.88, 1.84, 2.55, 1.25, 5.32, 3.04, 4.83, 1.53]} \ No newline at end of file diff --git a/annotations_filtered/r1S-yBBZsDI_filtered.json b/annotations_filtered/r1S-yBBZsDI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..75ec54183c2f6d7b146f90256e1c0fd5efd8fdaa --- /dev/null +++ b/annotations_filtered/r1S-yBBZsDI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.99], [13.0, 12.93], [14.0, 15.18], [18.0, 18.98], [25.0, 27.21], [29.0, 29.08], [30.0, 30.15], [31.0, 31.89], [33.0, 33.61], [34.0, 35.07], [36.0, 37.64], [41.0, 42.09], [44.0, 44.78], [46.0, 46.25], [47.0, 47.04], [53.0, 52.81], [61.0, 62.56], [66.0, 67.76], [68.0, 69.75], [87.0, 87.89]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 45.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 27.38], ["hum", 22.12], ["throbbing", 10.96]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.99, -0.07, 1.18, 0.98, 2.21, 0.08, 0.15, 0.89, 0.61, 1.07, 1.64, 1.09, 0.78, 0.25, 0.04, -0.19, 1.56, 1.76, 1.75, 0.89]} \ No newline at end of file diff --git a/annotations_filtered/r1fp_NVGr6Q_filtered.json b/annotations_filtered/r1fp_NVGr6Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db08ec20d1ee7637006e0f7514cdd6105e4f17a0 --- /dev/null +++ b/annotations_filtered/r1fp_NVGr6Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 38.72], [47.0, 47.55], [52.0, 52.71], [77.0, 90.85], [92.0, 102.0], [107.0, 108.18]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 40.73, 42.17, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 83.29], ["singing", 4.18], ["music of bollywood", 1.12]], [["music", 74.78], ["singing", 2.86], ["harmonica", 2.77]], null], "duration": [0.72, 0.55, 0.71, 13.85, 10.0, 1.18]} \ No newline at end of file diff --git a/annotations_filtered/r1gBq45CkgI_filtered.json b/annotations_filtered/r1gBq45CkgI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1209d821fc33d753e2072ad89a28f0b2223e2e82 --- /dev/null +++ b/annotations_filtered/r1gBq45CkgI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.73], [6.0, 7.08], [7.0, 9.0], [14.0, 14.07], [15.0, 15.35], [17.0, 17.09], [19.0, 18.96], [20.0, 20.87], [23.0, 22.96], [26.0, 29.24], [31.0, 36.19], [42.0, 41.84], [45.0, 56.79], [62.0, 62.7], [65.0, 71.83], [75.0, 78.43], [80.0, 82.75], [86.0, 103.52], [110.0, 111.97], [113.0, 113.36], [114.0, 115.59], [124.0, 125.63], [126.0, 126.81], [130.0, 131.23], [133.0, 133.44]], "keep_status": [false, false, true, false, false, false, false, false, false, true, false, false, true, false, true, true, true, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 39.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.52, 30.23, 0.0, 29.06, 0.0, 28.64, 28.47, 28.66, 42.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["cattle, bovinae", 15.5], ["speech", 13.57], ["livestock, farm animals, working animals", 12.91]], null, null, null, null, null, null, [["boing", 21.94], ["speech", 21.76], ["croak", 9.41]], [["vehicle", 35.5], ["skidding", 29.92], ["car", 10.2]], null, [["music", 24.65], ["buzz", 21.39], ["hum", 21.38]], null, [["speech", 31.07], ["buzz", 12.96], ["hum", 9.93]], [["music", 18.08], ["smash, crash", 13.78], ["explosion", 11.87]], [["explosion", 30.63], ["burst, pop", 11.01], ["eruption", 8.09]], [["hum", 36.99], ["rumble", 9.77], ["mains hum", 6.72]], null, null, null, null, null, null, null], "duration": [0.73, 1.08, 2.0, 0.07, 0.35, 0.09, -0.04, 0.87, -0.04, 3.24, 5.19, -0.16, 11.79, 0.7, 6.83, 3.43, 2.75, 17.52, 1.97, 0.36, 1.59, 1.63, 0.81, 1.23, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/r1jgKSXPL84_filtered.json b/annotations_filtered/r1jgKSXPL84_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e7d54ac01d20316c146e9f2e3b820f78586457d0 --- /dev/null +++ b/annotations_filtered/r1jgKSXPL84_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 25.95], [31.0, 35.78], [37.0, 37.98], [41.0, 41.94], [45.0, 46.58], [48.0, 48.17], [49.0, 49.27], [52.0, 52.47], [54.0, 62.06], [64.0, 68.55], [70.0, 70.93], [71.0, 89.72], [90.0, 91.74], [94.0, 94.34], [96.0, 96.74], [99.0, 100.58], [105.0, 107.27], [108.0, 108.72], [110.0, 111.32], [114.0, 114.2], [115.0, 123.03]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [39.96, 38.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.59, 99.91, 0.0, 89.19, 0.0, 0.0, 0.0, 0.0, 99.52, 0.0, 0.0, 0.0, 95.91], "audiomae_on_audioset": [[["music", 54.77], ["throbbing", 7.95], ["musical instrument", 5.03]], [["speech", 24.84], ["music", 24.47], ["wind instrument, woodwind instrument", 7.29]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.95, 4.78, 0.98, 0.94, 1.58, 0.17, 0.27, 0.47, 8.06, 4.55, 0.93, 18.72, 1.74, 0.34, 0.74, 1.58, 2.27, 0.72, 1.32, 0.2, 8.03]} \ No newline at end of file diff --git a/annotations_filtered/r1mN6K60148_filtered.json b/annotations_filtered/r1mN6K60148_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b552be4370f7f2b45569c34f4669dbf28d00350 --- /dev/null +++ b/annotations_filtered/r1mN6K60148_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 20.7], [23.0, 24.21], [25.0, 25.34], [26.0, 28.26], [29.0, 29.42], [30.0, 38.77], [39.0, 40.47], [52.0, 52.86], [54.0, 55.8], [56.0, 56.39], [56.0, 56.42], [56.0, 58.35], [59.0, 59.93], [61.0, 61.21], [62.0, 77.43], [78.0, 82.83], [83.0, 84.65], [85.0, 90.14], [91.0, 92.85], [104.0, 111.86], [125.0, 125.22], [126.0, 127.4], [132.0, 132.14], [135.0, 140.04], [141.0, 142.62], [145.0, 148.51], [160.0, 160.14], [166.0, 167.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [97.33, 0.0, 0.0, 97.83, 0.0, 95.37, 0.0, 0.0, 0.0, 0.0, 0.0, 80.46, 0.0, 0.0, 72.9, 63.1, 0.0, 92.64, 0.0, 36.09, 0.0, 0.0, 0.0, 97.54, 0.0, 87.19, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["telephone dialing, dtmf", 18.26], ["music", 16.8], ["dial tone", 14.91]], null, null, null, null, null, null, null, null], "duration": [14.7, 1.21, 0.34, 2.26, 0.42, 8.77, 1.47, 0.86, 1.8, 0.39, 0.42, 2.35, 0.93, 0.21, 15.43, 4.83, 1.65, 5.14, 1.85, 7.86, 0.22, 1.4, 0.14, 5.04, 1.62, 3.51, 0.14, 1.93]} \ No newline at end of file diff --git a/annotations_filtered/r1scNthC8NI_filtered.json b/annotations_filtered/r1scNthC8NI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a8ea0e4bda79a26107a9e5b3518bd47de99de2d8 --- /dev/null +++ b/annotations_filtered/r1scNthC8NI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 8.8], [9.0, 10.94], [11.0, 22.59], [28.0, 28.51], [30.0, 31.29], [33.0, 33.62], [35.0, 35.04], [35.0, 35.72], [38.0, 46.94], [48.0, 53.42], [54.0, 54.75], [57.0, 59.17], [60.0, 77.23], [78.0, 86.81], [91.0, 92.04], [94.0, 94.19], [100.0, 100.41], [105.0, 106.0], [110.0, 110.35], [114.0, 114.2], [116.0, 116.67], [125.0, 126.13], [133.0, 133.14], [141.0, 141.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 42.84, 0.0, 0.0, 0.0, 0.0, 0.0, 37.35, 53.28, 0.0, 64.75, 46.19, 83.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 71.52], ["speech", 17.65], ["musical instrument", 2.3]], null, null, null, null, null, [["music", 43.39], ["speech", 25.09], ["didgeridoo", 12.65]], null, null, null, [["music", 76.64], ["speech", 7.46], ["musical instrument", 2.74]], null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.2, 1.94, 11.59, 0.51, 1.29, 0.62, 0.04, 0.72, 8.94, 5.42, 0.75, 2.17, 17.23, 8.81, 1.04, 0.19, 0.41, 1.0, 0.35, 0.2, 0.67, 1.13, 0.14, 0.56]} \ No newline at end of file diff --git a/annotations_filtered/r29P93wUiMg_filtered.json b/annotations_filtered/r29P93wUiMg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..800b7b45c3a611e1f6cf9d490f35d0a20522b984 --- /dev/null +++ b/annotations_filtered/r29P93wUiMg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[98.0, 112.8], [118.0, 131.21]], "keep_status": [false, false], "silence_prob": [29.65, 29.91], "audiomae_on_audioset": [[["music", 29.07], ["throbbing", 28.26], ["hum", 16.06]], [["music", 30.73], ["throbbing", 29.76], ["hum", 15.25]]], "duration": [14.8, 13.21]} \ No newline at end of file diff --git a/annotations_filtered/r2GpJzIdoYQ_filtered.json b/annotations_filtered/r2GpJzIdoYQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba69a45351ab056373ddd5f56b5a4a64e60bf9c3 --- /dev/null +++ b/annotations_filtered/r2GpJzIdoYQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.62], [9.0, 9.51], [10.0, 12.6], [15.0, 16.46], [17.0, 19.41], [21.0, 28.9], [29.0, 30.47], [31.0, 31.8], [37.0, 38.01], [39.0, 39.85], [43.0, 44.12], [47.0, 50.53], [52.0, 59.73], [61.0, 91.96], [96.0, 96.77], [99.0, 100.13], [102.0, 104.09], [105.0, 105.66], [106.0, 108.24], [109.0, 138.3], [139.0, 148.2], [149.0, 150.36], [151.0, 151.68], [154.0, 154.85], [157.0, 159.06], [160.0, 161.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 56.03, 0.0, 82.43, 95.23, 0.0, 0.0, 0.0, 0.0, 0.0, 96.04, 96.66, 0.0, 0.0, 0.0, 98.51, 0.0, 88.46, 33.41, 41.98, 0.0, 0.0, 0.0, 59.24, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 54.83], ["ambient music", 10.8], ["hum", 4.91]], [["music", 73.08], ["musical instrument", 3.29], ["hum", 2.51]], null, null, null, null, null], "duration": [1.62, 0.51, 2.6, 1.46, 2.41, 7.9, 1.47, 0.8, 1.01, 0.85, 1.12, 3.53, 7.73, 30.96, 0.77, 1.13, 2.09, 0.66, 2.24, 29.3, 9.2, 1.36, 0.68, 0.85, 2.06, 1.15]} \ No newline at end of file diff --git a/annotations_filtered/r2NHTRgH3G0_filtered.json b/annotations_filtered/r2NHTRgH3G0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b2ea23a513c7b3907312a8996e7cdeb4e0c01306 --- /dev/null +++ b/annotations_filtered/r2NHTRgH3G0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.77], [12.0, 12.68], [14.0, 15.72], [17.0, 23.33], [29.0, 32.83], [43.0, 44.79], [69.0, 68.81], [71.0, 71.63]], "keep_status": [true, false, false, true, true, false, false, false], "silence_prob": [30.08, 0.0, 0.0, 43.58, 40.5, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 47.71], ["synthesizer", 11.03], ["didgeridoo", 8.96]], null, null, [["hum", 29.26], ["electric shaver, electric razor", 16.94], ["mains hum", 10.87]], [["speech", 45.04], ["music", 8.41], ["hum", 6.42]], null, null, null], "duration": [4.77, 0.68, 1.72, 6.33, 3.83, 1.79, -0.19, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/r2RzBizjKT0_filtered.json b/annotations_filtered/r2RzBizjKT0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..67a5ba5b950a320971d5dfb170756953693fd1b6 --- /dev/null +++ b/annotations_filtered/r2RzBizjKT0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.8], [7.0, 8.45], [10.0, 10.96], [12.0, 15.38], [16.0, 28.05], [29.0, 38.75], [48.0, 49.89], [51.0, 52.91], [54.0, 57.1], [59.0, 72.77], [75.0, 82.92], [84.0, 85.11], [86.0, 86.34], [89.0, 90.12], [94.0, 104.97], [105.0, 114.27], [115.0, 122.15], [122.0, 122.32], [122.0, 125.39], [127.0, 127.18], [129.0, 128.87], [131.0, 132.04], [135.0, 137.34], [141.0, 141.81], [149.0, 149.47], [150.0, 151.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 93.6, 59.51, 69.47, 0.0, 0.0, 61.37, 60.89, 67.89, 0.0, 0.0, 0.0, 51.44, 38.42, 76.04, 0.0, 43.74, 0.0, 0.0, 0.0, 67.38, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 36.25], ["cattle, bovinae", 32.45], ["moo", 13.65]], null, null, [["speech", 54.19], ["fly, housefly", 4.86], ["hum", 3.71]], null, null, null, null, null, null, null], "duration": [1.8, 1.45, 0.96, 3.38, 12.05, 9.75, 1.89, 1.91, 3.1, 13.77, 7.92, 1.11, 0.34, 1.12, 10.97, 9.27, 7.15, 0.32, 3.39, 0.18, -0.13, 1.04, 2.34, 0.81, 0.47, 1.34]} \ No newline at end of file diff --git a/annotations_filtered/r2fHzai5ih4_filtered.json b/annotations_filtered/r2fHzai5ih4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6896e5455c31f5f9f42e9910504e0ec813587dd2 --- /dev/null +++ b/annotations_filtered/r2fHzai5ih4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.94], [16.0, 16.65], [21.0, 21.41], [32.0, 32.04], [45.0, 45.91], [72.0, 72.82], [73.0, 75.52], [76.0, 75.84], [80.0, 81.41], [85.0, 85.36], [99.0, 100.43], [104.0, 104.73], [105.0, 106.57], [111.0, 113.59], [115.0, 117.09], [118.0, 120.02]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.75, 34.67, 60.51], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 32.03], ["music", 15.68], ["pulse", 7.91]], null, null, null, null, null, null, null, [["music", 34.27], ["theremin", 6.29], ["whale vocalization", 5.1]], null], "duration": [0.94, 0.65, 0.41, 0.04, 0.91, 0.82, 2.52, -0.16, 1.41, 0.36, 1.43, 0.73, 1.57, 2.59, 2.09, 2.02]} \ No newline at end of file diff --git a/annotations_filtered/r2ucpHgHo1g_filtered.json b/annotations_filtered/r2ucpHgHo1g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f7b06e66a7725ebb466308cbd35880c7f2b8399c --- /dev/null +++ b/annotations_filtered/r2ucpHgHo1g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[42.0, 50.23], [53.0, 70.24], [73.0, 73.26], [74.0, 74.28], [75.0, 94.73], [96.0, 101.22], [103.0, 102.93], [104.0, 107.13], [108.0, 113.21]], "keep_status": [false, true, false, false, true, false, false, true, false], "silence_prob": [31.26, 39.24, 0.0, 0.0, 32.97, 39.78, 0.0, 37.81, 43.53], "audiomae_on_audioset": [[["music", 67.11], ["speech", 5.63], ["hum", 3.41]], [["music", 37.22], ["hum", 12.38], ["fly, housefly", 5.86]], null, null, [["music", 35.47], ["sound effect", 4.83], ["didgeridoo", 4.43]], [["didgeridoo", 55.63], ["music", 16.42], ["hum", 7.55]], null, [["music", 26.33], ["fly, housefly", 6.67], ["mains hum", 4.58]], [["hum", 51.52], ["mains hum", 30.46], ["throbbing", 7.97]]], "duration": [8.23, 17.24, 0.26, 0.28, 19.73, 5.22, -0.07, 3.13, 5.21]} \ No newline at end of file diff --git a/annotations_filtered/r2x4QueC2As_filtered.json b/annotations_filtered/r2x4QueC2As_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/r2x4QueC2As_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/r2xpAXMPRHc_filtered.json b/annotations_filtered/r2xpAXMPRHc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..083a758f72b81d479bc6717812c44b959afd4836 --- /dev/null +++ b/annotations_filtered/r2xpAXMPRHc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 61.72], [62.0, 62.92], [64.0, 70.07], [72.0, 77.28], [79.0, 84.5]], "keep_status": [true, false, false, false, false], "silence_prob": [35.75, 0.0, 97.73, 98.99, 99.59], "audiomae_on_audioset": [[["music", 44.21], ["gasp", 16.58], ["throbbing", 2.11]], null, null, null, null], "duration": [20.72, 0.92, 6.07, 5.28, 5.5]} \ No newline at end of file diff --git a/annotations_filtered/r38fEGep2yU_filtered.json b/annotations_filtered/r38fEGep2yU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..83f4743c93f0ff3e3626c275e05c0c85abd3df47 --- /dev/null +++ b/annotations_filtered/r38fEGep2yU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.07], [20.0, 20.66], [25.0, 25.68], [27.0, 26.99], [32.0, 33.27], [54.0, 54.28], [82.0, 84.06], [85.0, 85.73], [87.0, 92.23], [93.0, 95.99], [97.0, 101.04], [106.0, 107.43]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.89, 0.0, 31.84, 71.43, 71.72, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 18.17], ["singing bowl", 16.42], ["sine wave", 11.8]], null, null, null], "duration": [0.07, 0.66, 0.68, -0.01, 1.27, 0.28, 2.06, 0.73, 5.23, 2.99, 4.04, 1.43]} \ No newline at end of file diff --git a/annotations_filtered/r3BS4jKjRkc_filtered.json b/annotations_filtered/r3BS4jKjRkc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b85c01ce188b3ec749b2c3ead2f12a7db7b7ad1b --- /dev/null +++ b/annotations_filtered/r3BS4jKjRkc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.89], [20.0, 23.9], [24.0, 29.29], [30.0, 34.1], [35.0, 44.76], [47.0, 54.24], [55.0, 55.68], [58.0, 60.67], [64.0, 67.83], [71.0, 89.68], [91.0, 95.1], [96.0, 105.11], [114.0, 115.18], [119.0, 129.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 76.2, 88.28, 97.83, 95.09, 88.28, 0.0, 53.84, 83.88, 57.25, 92.64, 87.37, 0.0, 85.17], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.89, 3.9, 5.29, 4.1, 9.76, 7.24, 0.68, 2.67, 3.83, 18.68, 4.1, 9.11, 1.18, 10.05]} \ No newline at end of file diff --git a/annotations_filtered/r3L0e0izKG4_filtered.json b/annotations_filtered/r3L0e0izKG4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b70276e20a52f0599147ac5761ef745474e9e29f --- /dev/null +++ b/annotations_filtered/r3L0e0izKG4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 55.86], [58.0, 70.53], [73.0, 85.31], [87.0, 87.91], [91.0, 92.57], [97.0, 97.9], [101.0, 117.91], [123.0, 122.94], [125.0, 127.31], [128.0, 132.54], [137.0, 138.35], [139.0, 139.56], [142.0, 142.55], [144.0, 143.95], [146.0, 147.21], [147.0, 148.56], [153.0, 154.31], [155.0, 155.73], [156.0, 166.63], [168.0, 179.61], [182.0, 184.62], [185.0, 185.75], [187.0, 253.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 97.11, 96.66, 0.0, 0.0, 0.0, 100.0, 0.0, 65.2, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.0, 99.85, 97.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [52.86, 12.53, 12.31, 0.91, 1.57, 0.9, 16.91, -0.06, 2.31, 4.54, 1.35, 0.56, 0.55, -0.05, 1.21, 1.56, 1.31, 0.73, 10.63, 11.61, 2.62, 0.75, 66.84]} \ No newline at end of file diff --git a/annotations_filtered/r3Owzt1HZkY_filtered.json b/annotations_filtered/r3Owzt1HZkY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5f5b4231d21036bf501a457a91d391fbe50c7304 --- /dev/null +++ b/annotations_filtered/r3Owzt1HZkY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 13.98], [15.0, 28.98], [30.0, 32.73], [33.0, 35.56], [37.0, 62.53], [69.0, 70.12], [73.0, 72.99], [74.0, 81.7], [84.0, 89.58], [95.0, 116.01], [124.0, 126.5], [128.0, 129.39], [130.0, 131.04]], "keep_status": [false, false, false, true, false, false, false, false, false, false, true, false, false], "silence_prob": [46.47, 55.53, 57.01, 46.54, 43.35, 0.0, 0.0, 70.58, 97.64, 37.5, 47.08, 0.0, 0.0], "audiomae_on_audioset": [[["music", 67.22], ["foghorn", 3.95], ["musical instrument", 3.39]], null, null, [["music", 40.56], ["singing bowl", 9.6], ["speech", 8.58]], [["music", 69.37], ["squish", 3.95], ["keys jangling", 3.79]], null, null, null, null, [["speech", 63.46], ["vehicle", 13.15], ["helicopter", 3.89]], [["livestock, farm animals, working animals", 23.62], ["music", 18.46], ["didgeridoo", 8.94]], null, null], "duration": [3.98, 13.98, 2.73, 2.56, 25.53, 1.12, -0.01, 7.7, 5.58, 21.01, 2.5, 1.39, 1.04]} \ No newline at end of file diff --git a/annotations_filtered/r3_IvtMPIi4_filtered.json b/annotations_filtered/r3_IvtMPIi4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c841cca1789528a7fb0be25fe6f60d418de8346 --- /dev/null +++ b/annotations_filtered/r3_IvtMPIi4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.16], [8.0, 10.57], [11.0, 16.95], [17.0, 35.46], [37.0, 43.97], [44.0, 44.78], [48.0, 49.37], [56.0, 58.77], [60.0, 61.32], [66.0, 66.29], [72.0, 72.72], [75.0, 76.72], [77.0, 79.35], [82.0, 83.1], [92.0, 93.38], [95.0, 96.33], [98.0, 99.54], [100.0, 107.91], [110.0, 118.76], [119.0, 121.51], [122.0, 122.62], [123.0, 123.6], [124.0, 129.3], [131.0, 131.52], [133.0, 138.94], [142.0, 152.79], [156.0, 155.68], [158.0, 158.67], [162.0, 164.07], [165.0, 165.43], [166.0, 182.14], [184.0, 185.43], [186.0, 189.73]], "keep_status": [false, true, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, true, true, false, false, false, false, true, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 30.92, 30.87, 30.47, 39.99, 0.0, 0.0, 40.02, 0.0, 0.0, 0.0, 0.0, 34.94, 0.0, 0.0, 0.0, 0.0, 38.86, 42.42, 36.94, 0.0, 0.0, 57.17, 0.0, 43.96, 47.74, 0.0, 0.0, 58.47, 0.0, 38.75, 0.0, 32.84], "audiomae_on_audioset": [null, [["music", 53.8], ["speech", 9.08], ["rattle (instrument)", 6.36]], [["music", 45.7], ["speech", 32.87], ["boing", 3.63]], [["music", 49.51], ["speech", 14.01], ["theremin", 10.49]], [["hum", 47.36], ["mains hum", 34.23], ["music", 4.06]], null, null, [["hum", 18.43], ["mains hum", 14.36], ["noise", 11.36]], null, null, null, null, [["speech", 32.15], ["music", 10.05], ["whale vocalization", 8.07]], null, null, null, null, [["speech", 51.62], ["music", 31.72], ["synthesizer", 2.49]], [["hum", 18.44], ["speech", 17.17], ["mains hum", 15.59]], [["speech", 29.25], ["sidetone", 28.94], ["hum", 5.31]], null, null, null, null, [["mains hum", 30.98], ["music", 22.38], ["hum", 15.01]], [["theremin", 58.98], ["music", 17.82], ["hum", 2.39]], null, null, null, null, [["music", 64.1], ["theremin", 8.88], ["hum", 5.44]], null, [["music", 33.22], ["owl", 9.92], ["hum", 8.07]]], "duration": [0.16, 2.57, 5.95, 18.46, 6.97, 0.78, 1.37, 2.77, 1.32, 0.29, 0.72, 1.72, 2.35, 1.1, 1.38, 1.33, 1.54, 7.91, 8.76, 2.51, 0.62, 0.6, 5.3, 0.52, 5.94, 10.79, -0.32, 0.67, 2.07, 0.43, 16.14, 1.43, 3.73]} \ No newline at end of file diff --git a/annotations_filtered/r3eNr-xxA7s_filtered.json b/annotations_filtered/r3eNr-xxA7s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b77b4ac8e43a800af707c66014d78e93aab1acfa --- /dev/null +++ b/annotations_filtered/r3eNr-xxA7s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 41.55], [44.0, 50.94], [53.0, 55.05], [61.0, 61.86], [62.0, 78.33], [83.0, 108.63], [110.0, 129.07], [130.0, 130.81]], "keep_status": [false, true, false, false, true, false, false, false], "silence_prob": [0.0, 35.18, 46.19, 0.0, 39.15, 38.46, 36.59, 0.0], "audiomae_on_audioset": [null, [["insect", 30.26], ["fly, housefly", 27.69], ["mosquito", 4.61]], [["music", 41.8], ["boing", 33.77], ["sidetone", 6.33]], null, [["music", 50.01], ["musical instrument", 10.69], ["noise", 7.16]], [["music", 83.91], ["neigh, whinny", 2.27], ["musical instrument", 1.89]], [["music", 72.68], ["speech", 4.64], ["musical instrument", 3.43]], null], "duration": [31.55, 6.94, 2.05, 0.86, 16.33, 25.63, 19.07, 0.81]} \ No newline at end of file diff --git a/annotations_filtered/r3fnCEjvPCQ_filtered.json b/annotations_filtered/r3fnCEjvPCQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ea6402ae029739151cd472e579f80c3f04cb240 --- /dev/null +++ b/annotations_filtered/r3fnCEjvPCQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.74], [8.0, 10.74], [11.0, 13.73], [14.0, 15.7], [16.0, 29.39]], "keep_status": [true, true, true, false, true], "silence_prob": [34.16, 36.55, 34.74, 0.0, 31.18], "audiomae_on_audioset": [[["music", 20.69], ["hum", 19.68], ["mains hum", 12.93]], [["music", 28.29], ["hum", 12.49], ["speech", 6.9]], [["moo", 19.99], ["cattle, bovinae", 17.23], ["livestock, farm animals, working animals", 12.26]], null, [["hum", 20.61], ["throbbing", 12.85], ["buzz", 10.8]]], "duration": [2.74, 2.74, 2.73, 1.7, 13.39]} \ No newline at end of file diff --git a/annotations_filtered/r421zjv-hoE_filtered.json b/annotations_filtered/r421zjv-hoE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2fa3b6b361623f13220f1ecf15995cdc4e48e256 --- /dev/null +++ b/annotations_filtered/r421zjv-hoE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.93], [13.0, 14.74], [18.0, 19.35], [20.0, 20.98], [21.0, 30.82], [31.0, 32.53], [33.0, 50.95], [54.0, 67.49], [70.0, 72.32], [75.0, 79.1], [82.0, 96.4], [99.0, 101.01], [103.0, 108.4], [114.0, 118.5]], "keep_status": [true, false, false, false, true, false, true, false, true, true, true, false, true, false], "silence_prob": [32.06, 0.0, 0.0, 0.0, 31.08, 0.0, 30.06, 30.17, 29.64, 30.16, 30.13, 30.67, 31.24, 31.08], "audiomae_on_audioset": [[["hum", 31.28], ["music", 21.67], ["mains hum", 16.36]], null, null, null, [["music", 52.28], ["throbbing", 7.05], ["hum", 5.81]], null, [["music", 14.6], ["vehicle", 12.59], ["throbbing", 7.94]], [["speech", 44.35], ["music", 33.5], ["musical instrument", 2.21]], [["music", 62.17], ["cacophony", 2.91], ["electronic music", 2.45]], [["throbbing", 14.13], ["hum", 13.35], ["speech", 9.16]], [["speech", 32.78], ["music", 23.27], ["vehicle", 9.12]], [["speech", 51.94], ["music", 11.24], ["hum", 6.89]], [["hum", 14.01], ["music", 11.64], ["animal", 11.6]], [["speech", 53.64], ["music", 23.35], ["vehicle", 3.2]]], "duration": [5.93, 1.74, 1.35, 0.98, 9.82, 1.53, 17.95, 13.49, 2.32, 4.1, 14.4, 2.01, 5.4, 4.5]} \ No newline at end of file diff --git a/annotations_filtered/r4IBPd7-LlQ_filtered.json b/annotations_filtered/r4IBPd7-LlQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..57aa000f081e7c4a85c468c632c568be697a964e --- /dev/null +++ b/annotations_filtered/r4IBPd7-LlQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.42], [7.0, 26.92], [30.0, 40.81], [44.0, 47.16], [48.0, 50.75], [51.0, 59.17]], "keep_status": [false, true, false, false, false, false], "silence_prob": [0.0, 29.56, 30.14, 32.46, 34.02, 30.6], "audiomae_on_audioset": [null, [["music", 54.62], ["vehicle", 8.6], ["car", 5.75]], [["music", 52.34], ["speech", 25.14], ["hum", 3.93]], [["music", 68.49], ["throbbing", 9.94], ["synthesizer", 4.08]], [["music", 41.06], ["throbbing", 27.64], ["hum", 7.85]], [["music", 70.28], ["speech", 16.45], ["throbbing", 3.38]]], "duration": [0.42, 19.92, 10.81, 3.16, 2.75, 8.17]} \ No newline at end of file diff --git a/annotations_filtered/r4K7eNzseCI_filtered.json b/annotations_filtered/r4K7eNzseCI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..604c7471af4eb5f02570227517df02e41173ae26 --- /dev/null +++ b/annotations_filtered/r4K7eNzseCI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.72], [10.0, 9.71], [12.0, 13.39], [22.0, 22.0], [25.0, 27.11], [33.0, 34.05], [35.0, 36.17], [37.0, 37.56], [53.0, 53.64], [54.0, 55.24], [57.0, 56.91], [57.0, 63.48], [66.0, 68.62], [69.0, 71.31], [72.0, 73.94], [75.0, 75.98], [78.0, 78.7], [80.0, 81.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 96.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.07, 97.43, 90.6, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.72, -0.29, 1.39, 0.0, 2.11, 1.05, 1.17, 0.56, 0.64, 1.24, -0.09, 6.48, 2.62, 2.31, 1.94, 0.98, 0.7, 1.75]} \ No newline at end of file diff --git a/annotations_filtered/r4SF22qFxbE_filtered.json b/annotations_filtered/r4SF22qFxbE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8122a63dda61ecb06c999732810e4769574fb3b7 --- /dev/null +++ b/annotations_filtered/r4SF22qFxbE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.12], [12.0, 24.11], [27.0, 26.82], [29.0, 30.13], [32.0, 77.7], [79.0, 94.17], [97.0, 105.56], [106.0, 106.91], [119.0, 119.5]], "keep_status": [false, true, false, false, false, true, true, false, false], "silence_prob": [0.0, 33.91, 0.0, 0.0, 0.0, 47.39, 34.3, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 30.39], ["explosion", 25.83], ["burst, pop", 7.11]], null, null, null, [["burst, pop", 17.04], ["explosion", 16.66], ["gunshot, gunfire", 14.42]], [["burst, pop", 25.23], ["explosion", 23.94], ["gunshot, gunfire", 13.54]], null, null], "duration": [0.12, 12.11, -0.18, 1.13, 45.7, 15.17, 8.56, 0.91, 0.5]} \ No newline at end of file diff --git a/annotations_filtered/r4mQmoD72tc_filtered.json b/annotations_filtered/r4mQmoD72tc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..35f5bdfc08f16867fc3b70ca0060c455f38453b5 --- /dev/null +++ b/annotations_filtered/r4mQmoD72tc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 22.79], [25.0, 29.4], [31.0, 36.04], [38.0, 49.5], [54.0, 55.41], [61.0, 86.39], [95.0, 104.45], [107.0, 124.68]], "keep_status": [false, true, false, false, false, false, false, false], "silence_prob": [0.0, 31.67, 31.88, 31.98, 0.0, 30.95, 31.47, 31.38], "audiomae_on_audioset": [null, [["music", 43.32], ["sidetone", 8.55], ["speech", 7.09]], [["music", 72.79], ["speech", 5.46], ["electronic music", 3.15]], [["music", 81.14], ["didgeridoo", 2.66], ["musical instrument", 1.85]], null, [["music", 81.8], ["throbbing", 3.01], ["didgeridoo", 2.99]], [["music", 76.73], ["electronic music", 7.01], ["techno", 3.28]], [["music", 61.63], ["electronic music", 6.62], ["throbbing", 6.59]]], "duration": [1.79, 4.4, 5.04, 11.5, 1.41, 25.39, 9.45, 17.68]} \ No newline at end of file diff --git a/annotations_filtered/r4vQbzdjQW8_filtered.json b/annotations_filtered/r4vQbzdjQW8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a80438398481eb22c179edba7c3437652af0e5f --- /dev/null +++ b/annotations_filtered/r4vQbzdjQW8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 17.19], [19.0, 23.8], [25.0, 40.17], [41.0, 41.89], [43.0, 44.79], [46.0, 47.6], [48.0, 91.96], [94.0, 96.89], [98.0, 116.75], [118.0, 118.77], [120.0, 122.64], [123.0, 125.02], [127.0, 127.95], [129.0, 131.31], [135.0, 141.32], [142.0, 146.69]], "keep_status": [true, false, true, false, false, false, false, true, true, false, true, true, false, true, true, false], "silence_prob": [37.02, 36.23, 34.38, 0.0, 0.0, 0.0, 0.0, 39.72, 36.25, 0.0, 38.75, 38.5, 0.0, 41.58, 36.1, 37.65], "audiomae_on_audioset": [[["sidetone", 33.17], ["hum", 15.53], ["speech", 12.41]], [["whale vocalization", 55.09], ["grunt", 12.46], ["music", 6.0]], [["whale vocalization", 21.47], ["roaring cats (lions, tigers)", 14.64], ["roar", 13.44]], null, null, null, null, [["music", 40.5], ["whale vocalization", 10.1], ["foghorn", 4.34]], [["grunt", 25.49], ["speech", 9.17], ["music", 7.73]], null, [["whale vocalization", 18.04], ["music", 15.74], ["hum", 12.86]], [["whale vocalization", 16.99], ["throbbing", 10.96], ["music", 7.27]], null, [["rumble", 29.51], ["car", 5.69], ["crackle", 5.25]], [["rumble", 24.26], ["whale vocalization", 13.68], ["hum", 11.18]], [["rumble", 68.9], ["hum", 7.39], ["throbbing", 4.65]]], "duration": [14.19, 4.8, 15.17, 0.89, 1.79, 1.6, 43.96, 2.89, 18.75, 0.77, 2.64, 2.02, 0.95, 2.31, 6.32, 4.69]} \ No newline at end of file diff --git a/annotations_filtered/r5ilcq9hUZI_filtered.json b/annotations_filtered/r5ilcq9hUZI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f57ebea22616bdf1bce5ea32ced9fba3b4bcb26f --- /dev/null +++ b/annotations_filtered/r5ilcq9hUZI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.1], [7.0, 8.26], [20.0, 23.75], [25.0, 25.83], [28.0, 30.18], [33.0, 33.51], [37.0, 38.08], [41.0, 52.34], [55.0, 56.46], [60.0, 60.3], [61.0, 61.59], [62.0, 63.04], [65.0, 66.41], [67.0, 67.31], [69.0, 69.9], [75.0, 76.64], [79.0, 80.59], [81.0, 84.54], [92.0, 93.58], [96.0, 97.21], [108.0, 109.27], [113.0, 114.47], [115.0, 117.93], [127.0, 132.73], [133.0, 135.5], [137.0, 143.43], [144.0, 145.71], [149.0, 150.9], [153.0, 153.54], [155.0, 162.11], [163.0, 166.7], [167.0, 170.16], [170.0, 174.24], [175.0, 176.64], [178.0, 182.09], [187.0, 188.72], [189.0, 194.31], [195.0, 196.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 76.37, 0.0, 99.82, 0.0, 0.0, 91.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 0.0, 0.0, 0.0, 0.0, 44.07, 28.91, 52.74, 99.98, 0.0, 0.0, 0.0, 72.46, 99.85, 87.74, 43.85, 0.0, 90.25, 0.0, 45.52, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 32.31], ["sine wave", 29.07], ["chirp tone", 6.82]], [["crack", 27.78], ["breaking", 11.01], ["animal", 7.31]], null, null, null, null, null, null, null, null, [["speech", 52.24], ["singing bowl", 12.96], ["tuning fork", 10.4]], null, null, null, [["hum", 41.39], ["speech", 31.81], ["throbbing", 8.62]], null], "duration": [1.1, 1.26, 3.75, 0.83, 2.18, 0.51, 1.08, 11.34, 1.46, 0.3, 0.59, 1.04, 1.41, 0.31, 0.9, 1.64, 1.59, 3.54, 1.58, 1.21, 1.27, 1.47, 2.93, 5.73, 2.5, 6.43, 1.71, 1.9, 0.54, 7.11, 3.7, 3.16, 4.24, 1.64, 4.09, 1.72, 5.31, 1.16]} \ No newline at end of file diff --git a/annotations_filtered/r5zhPLNGAOE_filtered.json b/annotations_filtered/r5zhPLNGAOE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1bbda6f4a6e608eaa1f1e2eba8345ee0ab29a676 --- /dev/null +++ b/annotations_filtered/r5zhPLNGAOE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.38], [6.0, 7.5], [10.0, 11.45], [19.0, 19.06], [20.0, 20.75], [22.0, 22.77], [24.0, 38.52], [41.0, 71.58], [74.0, 87.93], [91.0, 92.06], [99.0, 99.49], [100.0, 102.96], [105.0, 108.43], [111.0, 121.32], [124.0, 124.93], [127.0, 127.72], [130.0, 138.08], [141.0, 141.24], [144.0, 144.04], [146.0, 149.86], [153.0, 155.16], [159.0, 160.08], [163.0, 164.83], [166.0, 167.34], [170.0, 172.29], [175.0, 176.4], [177.0, 180.74], [181.0, 182.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.63, 0.0, 32.26, 0.0, 0.0, 44.46, 39.22, 95.09, 0.0, 0.0, 83.52, 0.0, 0.0, 96.04, 97.64, 0.0, 0.0, 0.0, 81.89, 0.0, 67.51, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 62.09], ["throbbing", 5.02], ["hum", 4.48]], null, [["whale vocalization", 38.56], ["speech", 35.85], ["music", 6.47]], null, null, [["throbbing", 34.94], ["hum", 31.35], ["music", 13.77]], [["hum", 38.67], ["music", 19.03], ["mains hum", 16.82]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.38, 1.5, 1.45, 0.06, 0.75, 0.77, 14.52, 30.58, 13.93, 1.06, 0.49, 2.96, 3.43, 10.32, 0.93, 0.72, 8.08, 0.24, 0.04, 3.86, 2.16, 1.08, 1.83, 1.34, 2.29, 1.4, 3.74, 1.6]} \ No newline at end of file diff --git a/annotations_filtered/r67faKKQyO4_filtered.json b/annotations_filtered/r67faKKQyO4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..542dfbfb59fc45e658263de089c3e0e6cffa2742 --- /dev/null +++ b/annotations_filtered/r67faKKQyO4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.56], [5.0, 6.94], [9.0, 11.33], [15.0, 20.53], [28.0, 29.32], [36.0, 45.94], [47.0, 49.55], [52.0, 60.27], [65.0, 64.89], [69.0, 70.09], [74.0, 80.49], [81.0, 96.13], [98.0, 100.84], [106.0, 113.46], [114.0, 114.39], [120.0, 143.33], [148.0, 152.34], [153.0, 158.73], [164.0, 172.44], [173.0, 173.69], [174.0, 174.46], [178.0, 181.38]], "keep_status": [false, false, true, true, false, false, true, true, false, false, true, true, true, false, false, false, false, true, true, false, false, true], "silence_prob": [0.0, 0.0, 32.48, 33.12, 0.0, 33.67, 41.78, 36.06, 0.0, 0.0, 35.08, 34.34, 33.14, 35.94, 0.0, 32.89, 34.66, 31.93, 30.97, 0.0, 0.0, 30.34], "audiomae_on_audioset": [null, null, [["mosquito", 30.83], ["moo", 14.33], ["boing", 10.3]], [["music", 25.98], ["whack, thwack", 21.18], ["fly, housefly", 8.89]], null, [["livestock, farm animals, working animals", 37.7], ["cattle, bovinae", 26.34], ["ding", 12.99]], [["cattle, bovinae", 18.73], ["livestock, farm animals, working animals", 17.84], ["moo", 14.15]], [["music", 38.8], ["boing", 12.05], ["speech", 5.47]], null, null, [["music", 26.93], ["fly, housefly", 19.04], ["breaking", 8.96]], [["hum", 36.82], ["mains hum", 15.69], ["fly, housefly", 10.01]], [["music", 47.47], ["boing", 7.97], ["speech", 3.98]], [["music", 63.02], ["boing", 9.4], ["whip", 7.51]], null, [["speech", 61.0], ["music", 14.19], ["fart", 7.92]], [["mosquito", 61.99], ["fly, housefly", 17.43], ["insect", 3.26]], [["music", 36.64], ["speech", 11.6], ["throbbing", 8.68]], [["music", 35.32], ["noise", 12.68], ["synthesizer", 10.51]], null, null, [["music", 14.6], ["crowd", 10.52], ["whale vocalization", 8.65]]], "duration": [0.56, 1.94, 2.33, 5.53, 1.32, 9.94, 2.55, 8.27, -0.11, 1.09, 6.49, 15.13, 2.84, 7.46, 0.39, 23.33, 4.34, 5.73, 8.44, 0.69, 0.46, 3.38]} \ No newline at end of file diff --git a/annotations_filtered/r6dLxmPng8o_filtered.json b/annotations_filtered/r6dLxmPng8o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..514195d46526ee0ccd1f733ff23f11ea643dd008 --- /dev/null +++ b/annotations_filtered/r6dLxmPng8o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 28.75], [29.0, 34.06], [36.0, 37.52], [38.0, 38.87], [40.0, 41.44], [43.0, 43.73], [45.0, 46.21], [48.0, 48.68], [50.0, 51.43], [54.0, 55.31], [57.0, 57.54], [61.0, 61.59], [62.0, 63.19], [65.0, 65.53], [68.0, 69.23], [71.0, 73.25], [75.0, 75.96], [77.0, 77.36], [79.0, 80.42], [81.0, 82.51], [87.0, 88.05], [89.0, 89.68], [91.0, 91.3], [93.0, 93.09], [96.0, 96.13], [97.0, 97.82], [100.0, 101.09], [102.0, 103.0], [103.0, 104.65], [106.0, 106.51], [108.0, 108.45], [110.0, 110.73], [113.0, 130.86]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [54.5, 37.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.41, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.65], "audiomae_on_audioset": [null, [["speech", 46.86], ["eruption", 9.03], ["boat, water vehicle", 7.27]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 15.03], ["speech", 11.21], ["eruption", 6.58]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["explosion", 52.77], ["burst, pop", 9.14], ["eruption", 6.67]]], "duration": [2.75, 5.06, 1.52, 0.87, 1.44, 0.73, 1.21, 0.68, 1.43, 1.31, 0.54, 0.59, 1.19, 0.53, 1.23, 2.25, 0.96, 0.36, 1.42, 1.51, 1.05, 0.68, 0.3, 0.09, 0.13, 0.82, 1.09, 1.0, 1.65, 0.51, 0.45, 0.73, 17.86]} \ No newline at end of file diff --git a/annotations_filtered/r6fpS6P16NI_filtered.json b/annotations_filtered/r6fpS6P16NI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a315cd58fd0fd8b16dcb3c33c90e2d2bfbb4b5a --- /dev/null +++ b/annotations_filtered/r6fpS6P16NI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.05], [7.0, 7.94], [8.0, 8.7], [9.0, 9.49], [14.0, 14.22], [21.0, 29.2], [30.0, 30.43], [31.0, 32.97], [33.0, 34.01], [42.0, 44.66], [47.0, 49.0], [59.0, 58.83], [59.0, 59.27], [81.0, 84.65], [103.0, 107.18], [110.0, 110.59], [115.0, 115.43], [117.0, 119.62], [124.0, 126.25], [126.0, 127.84], [128.0, 129.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 36.03, 0.0, 0.0, 0.0, 35.29, 52.33, 0.0, 0.0, 35.33, 32.8, 0.0, 0.0, 32.43, 30.78, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["fart", 38.33], ["speech", 32.13], ["radio", 7.57]], null, null, null, [["boing", 47.23], ["grunt", 31.07], ["speech", 10.88]], null, null, null, [["speech", 45.53], ["radio", 8.09], ["sidetone", 6.27]], [["speech", 69.1], ["animal", 4.75], ["sheep", 4.59]], null, null, [["speech", 27.36], ["frog", 25.58], ["screaming", 6.86]], [["speech", 20.44], ["goose", 12.44], ["duck", 11.33]], null, null], "duration": [1.05, 0.94, 0.7, 0.49, 0.22, 8.2, 0.43, 1.97, 1.01, 2.66, 2.0, -0.17, 0.27, 3.65, 4.18, 0.59, 0.43, 2.62, 2.25, 1.84, 1.36]} \ No newline at end of file diff --git a/annotations_filtered/r74QbwaIWFc_filtered.json b/annotations_filtered/r74QbwaIWFc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/r74QbwaIWFc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/r763LgcxCyM_filtered.json b/annotations_filtered/r763LgcxCyM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97e37a3d4d5ed3b6cc7e3badce58846c48ea73ff --- /dev/null +++ b/annotations_filtered/r763LgcxCyM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.94], [6.0, 7.6], [8.0, 13.32], [14.0, 14.74], [15.0, 15.75], [17.0, 17.17], [19.0, 19.63], [20.0, 20.26], [24.0, 47.04], [48.0, 48.9], [50.0, 53.97], [56.0, 57.72], [58.0, 58.7], [63.0, 64.57], [67.0, 67.63], [70.0, 70.88], [73.0, 73.11], [74.0, 75.22], [77.0, 77.57], [81.0, 81.73], [85.0, 85.14], [86.0, 86.07], [87.0, 87.79], [90.0, 90.85], [97.0, 98.1], [105.0, 105.7], [107.0, 107.55], [109.0, 109.61], [111.0, 111.38], [114.0, 114.12], [115.0, 115.77], [116.0, 118.88], [121.0, 123.77], [127.0, 128.58]], "keep_status": [false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 38.97, 0.0, 0.0, 0.0, 0.0, 0.0, 35.8, 0.0, 32.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.6, 69.2, 0.0], "audiomae_on_audioset": [null, null, [["stomach rumble", 9.54], ["creak", 7.45], ["fart", 6.94]], null, null, null, null, null, [["mains hum", 31.65], ["hum", 19.66], ["speech", 16.78]], null, [["speech", 35.54], ["radio", 32.6], ["didgeridoo", 11.34]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.94, 1.6, 5.32, 0.74, 0.75, 0.17, 0.63, 0.26, 23.04, 0.9, 3.97, 1.72, 0.7, 1.57, 0.63, 0.88, 0.11, 1.22, 0.57, 0.73, 0.14, 0.07, 0.79, 0.85, 1.1, 0.7, 0.55, 0.61, 0.38, 0.12, 0.77, 2.88, 2.77, 1.58]} \ No newline at end of file diff --git a/annotations_filtered/r76peMNNiyw_filtered.json b/annotations_filtered/r76peMNNiyw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2bef6d53952800c293deb7e75343ca992665c46a --- /dev/null +++ b/annotations_filtered/r76peMNNiyw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.56], [19.0, 22.05], [23.0, 24.14], [26.0, 26.11], [28.0, 29.52], [31.0, 32.51]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 55.31, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.56, 3.05, 1.14, 0.11, 1.52, 1.51]} \ No newline at end of file diff --git a/annotations_filtered/r7J-Qx2InoU_filtered.json b/annotations_filtered/r7J-Qx2InoU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e93d2b8302f32b9db029fadd402f295276f8a34 --- /dev/null +++ b/annotations_filtered/r7J-Qx2InoU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.38], [4.0, 5.68], [8.0, 20.19], [21.0, 21.24], [22.0, 22.45], [23.0, 24.14], [25.0, 29.89], [31.0, 35.02], [35.0, 39.09], [40.0, 80.08], [81.0, 88.94], [90.0, 101.33], [103.0, 104.68], [107.0, 109.66], [111.0, 112.06], [113.0, 119.84], [121.0, 121.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 90.43, 54.43, 42.33, 0.0, 39.5, 35.64, 0.0, 50.61, 0.0, 36.72, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 46.96], ["radio", 15.16], ["sidetone", 12.67]], null, [["music", 49.47], ["speech", 27.12], ["whale vocalization", 11.72]], [["music", 74.35], ["effects unit", 2.83], ["theremin", 1.98]], null, null, null, [["music", 44.87], ["speech", 29.22], ["electronic music", 4.92]], null], "duration": [1.38, 1.68, 12.19, 0.24, 0.45, 1.14, 4.89, 4.02, 4.09, 40.08, 7.94, 11.33, 1.68, 2.66, 1.06, 6.84, 0.2]} \ No newline at end of file diff --git a/annotations_filtered/r7aXjBDUk8w_filtered.json b/annotations_filtered/r7aXjBDUk8w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..642171687e5673c8708344d7738c2b48407f404e --- /dev/null +++ b/annotations_filtered/r7aXjBDUk8w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 14.74], [15.0, 15.72], [18.0, 20.22], [22.0, 22.52], [28.0, 32.17], [42.0, 41.88], [49.0, 50.99], [51.0, 51.48], [56.0, 66.07], [68.0, 68.47], [71.0, 74.33], [75.0, 75.46], [76.0, 80.49], [82.0, 91.0], [91.0, 106.78]], "keep_status": [false, false, true, false, true, false, false, false, false, false, true, false, true, true, false], "silence_prob": [64.75, 0.0, 42.35, 0.0, 42.58, 0.0, 0.0, 0.0, 37.01, 0.0, 35.24, 0.0, 35.94, 35.11, 32.06], "audiomae_on_audioset": [null, null, [["sidetone", 16.02], ["fly, housefly", 13.64], ["speech", 10.45]], null, [["music", 43.98], ["hum", 11.83], ["throbbing", 8.89]], null, null, null, [["music", 65.5], ["brass instrument", 5.16], ["musical instrument", 4.95]], null, [["music", 54.16], ["hum", 9.91], ["theremin", 4.9]], null, [["music", 41.57], ["speech", 16.93], ["fly, housefly", 8.44]], [["music", 40.03], ["buzz", 15.82], ["trombone", 10.65]], [["music", 61.88], ["music of latin america", 6.45], ["flamenco", 3.85]]], "duration": [2.74, 0.72, 2.22, 0.52, 4.17, -0.12, 1.99, 0.48, 10.07, 0.47, 3.33, 0.46, 4.49, 9.0, 15.78]} \ No newline at end of file diff --git a/annotations_filtered/r7k9mkm0TKU_filtered.json b/annotations_filtered/r7k9mkm0TKU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5f75e8bf522fa85a99be8d285c35ec7c30d88e73 --- /dev/null +++ b/annotations_filtered/r7k9mkm0TKU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.2], [7.0, 7.2], [13.0, 14.17], [15.0, 16.61], [21.0, 21.46], [25.0, 26.49], [31.0, 37.42], [39.0, 40.58], [46.0, 89.43], [91.0, 92.3], [97.0, 106.49], [115.0, 115.01], [119.0, 119.94]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.34, 0.0, 0.0, 0.0, 31.69, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 60.61], ["musical instrument", 4.05], ["synthesizer", 3.29]], null, null, null, [["music", 69.38], ["speech", 6.84], ["electronic music", 2.17]], null, null], "duration": [0.2, 0.2, 1.17, 1.61, 0.46, 1.49, 6.42, 1.58, 43.43, 1.3, 9.49, 0.01, 0.94]} \ No newline at end of file diff --git a/annotations_filtered/r8-BFx3xFJ4_filtered.json b/annotations_filtered/r8-BFx3xFJ4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4cbf1b059b55f889653980218abdfd413a7bf047 --- /dev/null +++ b/annotations_filtered/r8-BFx3xFJ4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[52.0, 64.67], [65.0, 65.64], [67.0, 67.24], [68.0, 69.5], [75.0, 75.69], [77.0, 81.45], [83.0, 91.45], [98.0, 98.39], [100.0, 100.35], [101.0, 114.1], [115.0, 116.87], [139.0, 147.46], [148.0, 148.22], [159.0, 159.95], [162.0, 162.43], [164.0, 165.96], [171.0, 172.81], [174.0, 174.68], [176.0, 175.86], [176.0, 181.94]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [30.42, 0.0, 0.0, 0.0, 0.0, 31.39, 32.13, 0.0, 0.0, 30.55, 0.0, 32.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.72], "audiomae_on_audioset": [[["music", 49.7], ["throbbing", 15.88], ["speech", 8.49]], null, null, null, null, [["music", 57.54], ["speech", 9.65], ["hum", 6.25]], [["music", 32.0], ["throbbing", 31.16], ["hum", 13.2]], null, null, [["music", 56.09], ["speech", 10.35], ["hum", 3.53]], null, [["hum", 26.89], ["music", 25.87], ["throbbing", 16.63]], null, null, null, null, null, null, null, null], "duration": [12.67, 0.64, 0.24, 1.5, 0.69, 4.45, 8.45, 0.39, 0.35, 13.1, 1.87, 8.46, 0.22, 0.95, 0.43, 1.96, 1.81, 0.68, -0.14, 5.94]} \ No newline at end of file diff --git a/annotations_filtered/r86n2JRUyRc_filtered.json b/annotations_filtered/r86n2JRUyRc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..760b0f81a9c7739e78c5fc54741372ae10186bda --- /dev/null +++ b/annotations_filtered/r86n2JRUyRc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.83], [14.0, 13.91], [29.0, 29.98], [32.0, 42.97], [45.0, 88.25], [91.0, 97.02], [99.0, 99.49], [102.0, 112.62], [121.0, 121.58], [128.0, 128.66], [150.0, 149.96], [156.0, 159.11], [159.0, 159.26], [159.0, 159.33], [159.0, 159.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 33.09, 0.0, 34.41, 0.0, 30.58, 0.0, 0.0, 0.0, 34.71, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 56.61], ["throbbing", 15.86], ["hum", 5.28]], null, [["music", 46.31], ["throbbing", 12.48], ["speech", 11.9]], null, [["music", 39.24], ["smash, crash", 20.44], ["speech", 13.55]], null, null, null, [["speech", 56.99], ["whip", 7.59], ["hubbub, speech noise, speech babble", 4.11]], null, null, null], "duration": [0.83, -0.09, 0.98, 10.97, 43.25, 6.02, 0.49, 10.62, 0.58, 0.66, -0.04, 3.11, 0.26, 0.33, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/r8swYmKUGJ0_filtered.json b/annotations_filtered/r8swYmKUGJ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5623240b61b849eeb0c5f66814bba5a30395a09f --- /dev/null +++ b/annotations_filtered/r8swYmKUGJ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.2], [40.0, 40.68], [49.0, 49.17], [53.0, 53.16], [55.0, 55.71], [58.0, 57.74], [65.0, 65.84]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [0.2, 0.68, 0.17, 0.16, 0.71, -0.26, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/r8uOQupi1iQ_filtered.json b/annotations_filtered/r8uOQupi1iQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..37fc61bcaca6be8a010867cc3db34ed1dd71c1e2 --- /dev/null +++ b/annotations_filtered/r8uOQupi1iQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 15.42], [18.0, 20.09], [21.0, 22.94], [25.0, 25.52], [26.0, 30.7], [36.0, 36.1], [37.0, 38.4], [47.0, 47.34], [50.0, 50.3], [52.0, 52.44], [55.0, 55.43], [58.0, 61.52], [66.0, 66.95], [68.0, 68.54], [70.0, 72.06], [74.0, 79.76], [83.0, 84.96], [88.0, 88.84], [92.0, 94.47], [96.0, 96.72], [99.0, 101.41], [106.0, 106.44], [106.0, 106.66], [107.0, 106.69], [107.0, 109.31]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, true, false, false, true, true, false, false, false, false, false, false, false, false, true], "silence_prob": [29.69, 33.57, 0.0, 0.0, 29.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.73, 0.0, 0.0, 41.32, 34.54, 0.0, 0.0, 52.68, 0.0, 77.87, 0.0, 0.0, 0.0, 34.97], "audiomae_on_audioset": [[["speech", 51.49], ["music", 25.98], ["whack, thwack", 1.67]], [["music", 41.87], ["hum", 18.67], ["throbbing", 16.07]], null, null, [["speech", 42.2], ["music", 13.93], ["whack, thwack", 9.32]], null, null, null, null, null, null, [["music", 22.23], ["speech", 20.28], ["crushing", 11.22]], null, null, [["cattle, bovinae", 26.83], ["moo", 14.8], ["livestock, farm animals, working animals", 11.85]], [["music", 14.51], ["insect", 12.0], ["fly, housefly", 10.26]], null, null, null, null, null, null, null, null, [["sound effect", 17.1], ["music", 12.2], ["whack, thwack", 9.88]]], "duration": [6.42, 2.09, 1.94, 0.52, 4.7, 0.1, 1.4, 0.34, 0.3, 0.44, 0.43, 3.52, 0.95, 0.54, 2.06, 5.76, 1.96, 0.84, 2.47, 0.72, 2.41, 0.44, 0.66, -0.31, 2.31]} \ No newline at end of file diff --git a/annotations_filtered/r9aUxfTTLfk_filtered.json b/annotations_filtered/r9aUxfTTLfk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3f6502f1b61d1c96e42f5ec6f636f5d7e951add8 --- /dev/null +++ b/annotations_filtered/r9aUxfTTLfk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.04], [29.0, 30.0], [31.0, 34.11], [34.0, 38.79], [50.0, 50.72], [51.0, 52.46], [55.0, 55.0], [55.0, 56.22], [57.0, 60.99], [62.0, 89.09], [89.0, 91.44], [92.0, 92.21], [97.0, 97.92], [99.0, 101.36], [105.0, 106.24], [108.0, 108.65], [111.0, 115.8], [118.0, 121.19], [123.0, 127.18]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 95.23, 83.7, 0.0, 0.0, 0.0, 0.0, 41.5, 37.65, 74.92, 0.0, 0.0, 50.36, 0.0, 0.0, 70.86, 41.85, 97.92], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 31.7], ["music", 15.7], ["mains hum", 14.59]], [["music", 38.22], ["speech", 9.22], ["trombone", 7.33]], null, null, null, null, null, null, null, [["music", 44.98], ["hum", 8.66], ["mains hum", 6.77]], null], "duration": [1.04, 1.0, 3.11, 4.79, 0.72, 1.46, 0.0, 1.22, 3.99, 27.09, 2.44, 0.21, 0.92, 2.36, 1.24, 0.65, 4.8, 3.19, 4.18]} \ No newline at end of file diff --git a/annotations_filtered/r9ae_frgcpU_filtered.json b/annotations_filtered/r9ae_frgcpU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0240edc9a2a95beef6db4af0e87994eba0938040 --- /dev/null +++ b/annotations_filtered/r9ae_frgcpU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.05], [8.0, 19.45], [22.0, 58.11], [59.0, 63.31], [64.0, 66.41], [69.0, 72.71], [73.0, 74.01], [76.0, 77.5], [78.0, 78.49], [81.0, 81.24], [82.0, 82.17], [82.0, 82.8], [85.0, 87.76], [89.0, 89.56], [91.0, 90.88], [92.0, 103.22], [105.0, 108.85], [113.0, 114.61], [116.0, 117.81], [120.0, 120.82], [122.0, 123.15], [127.0, 128.06], [129.0, 130.98], [133.0, 137.29], [138.0, 138.86], [142.0, 148.49], [149.0, 150.25], [152.0, 153.3], [156.0, 157.11], [161.0, 167.56]], "keep_status": [true, true, false, true, false, false, false, false, false, false, false, false, true, false, false, true, true, false, false, false, false, false, false, true, false, true, false, false, false, true], "silence_prob": [31.76, 29.63, 0.0, 48.82, 77.7, 94.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.05, 0.0, 0.0, 30.39, 36.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.41, 0.0, 38.68, 0.0, 0.0, 0.0, 44.07], "audiomae_on_audioset": [[["vehicle", 19.13], ["car", 4.31], ["outside, urban or manmade", 4.15]], [["buzz", 15.15], ["music", 10.3], ["noise", 8.7]], null, [["music", 36.25], ["hum", 13.53], ["whale vocalization", 7.59]], null, null, null, null, null, null, null, null, [["speech", 51.18], ["hum", 13.09], ["sonar", 4.42]], null, null, [["whack, thwack", 30.39], ["clang", 16.73], ["ding", 12.45]], [["hum", 17.04], ["throbbing", 15.99], ["music", 10.49]], null, null, null, null, null, null, [["music", 53.03], ["speech", 5.05], ["musical instrument", 4.87]], null, [["hum", 28.21], ["mains hum", 13.81], ["bee, wasp, etc.", 11.84]], null, null, null, [["music", 35.69], ["speech", 25.11], ["didgeridoo", 8.3]]], "duration": [2.05, 11.45, 36.11, 4.31, 2.41, 3.71, 1.01, 1.5, 0.49, 0.24, 0.17, 0.8, 2.76, 0.56, -0.12, 11.22, 3.85, 1.61, 1.81, 0.82, 1.15, 1.06, 1.98, 4.29, 0.86, 6.49, 1.25, 1.3, 1.11, 6.56]} \ No newline at end of file diff --git a/annotations_filtered/r9bfL4Jz-M8_filtered.json b/annotations_filtered/r9bfL4Jz-M8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..999ab980456deb18aa67002cffdacef03251ebed --- /dev/null +++ b/annotations_filtered/r9bfL4Jz-M8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.17], [9.0, 9.53], [15.0, 15.45], [28.0, 28.38], [30.0, 30.47], [31.0, 31.28], [33.0, 33.3], [34.0, 34.2], [35.0, 36.37], [37.0, 38.26], [60.0, 60.25], [62.0, 63.12], [64.0, 64.07], [66.0, 72.94], [73.0, 72.99], [74.0, 73.79], [74.0, 82.85], [84.0, 84.79], [86.0, 90.39], [92.0, 92.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.43, 0.0, 0.0, 30.47, 0.0, 70.44, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 49.98], ["speech", 20.5], ["musical instrument", 3.49]], null, null, [["music", 55.29], ["speech", 21.19], ["throbbing", 5.58]], null, null, null], "duration": [1.17, 0.53, 0.45, 0.38, 0.47, 0.28, 0.3, 0.2, 1.37, 1.26, 0.25, 1.12, 0.07, 6.94, -0.01, -0.21, 8.85, 0.79, 4.39, 0.16]} \ No newline at end of file diff --git a/annotations_filtered/r9mcNXIJFbY_filtered.json b/annotations_filtered/r9mcNXIJFbY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c00d460b47b2e010346cba50410a4326c42312e --- /dev/null +++ b/annotations_filtered/r9mcNXIJFbY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.9], [13.0, 14.67], [16.0, 16.09], [16.0, 18.76], [20.0, 21.68], [22.0, 24.27], [27.0, 31.19], [32.0, 33.71], [36.0, 37.99], [41.0, 45.66], [48.0, 55.8], [57.0, 58.8], [60.0, 69.08], [71.0, 73.26], [77.0, 79.59], [87.0, 88.52], [93.0, 96.6], [98.0, 100.18], [102.0, 103.67], [106.0, 110.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 100.0, 0.0, 0.0, 89.01, 77.2, 0.0, 100.0, 100.0, 99.92, 0.0, 100.0, 100.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.9, 1.67, 0.09, 2.76, 1.68, 2.27, 4.19, 1.71, 1.99, 4.66, 7.8, 1.8, 9.08, 2.26, 2.59, 1.52, 3.6, 2.18, 1.67, 4.98]} \ No newline at end of file diff --git a/annotations_filtered/r9nG9RByMRI_filtered.json b/annotations_filtered/r9nG9RByMRI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cae012cc9ef90bde73aafed04a6601d540b962fa --- /dev/null +++ b/annotations_filtered/r9nG9RByMRI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.91], [7.0, 7.53], [9.0, 9.68], [11.0, 10.77], [12.0, 12.11], [18.0, 19.57], [22.0, 22.71], [26.0, 27.55], [29.0, 29.59], [32.0, 33.13], [34.0, 34.92], [40.0, 41.12], [49.0, 48.98], [49.0, 49.33], [50.0, 49.67], [61.0, 62.04], [66.0, 66.95], [70.0, 72.6], [77.0, 87.27], [89.0, 96.75], [100.0, 101.26], [106.0, 106.24], [107.0, 109.24], [127.0, 130.76], [133.0, 133.27], [153.0, 160.96], [162.0, 162.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.87, 36.72, 39.74, 0.0, 0.0, 33.76, 30.92, 0.0, 30.2, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 24.86], ["mosquito", 12.78], ["insect", 8.07]], [["hum", 46.44], ["mains hum", 38.59], ["noise", 4.93]], [["hum", 31.52], ["mains hum", 30.59], ["fly, housefly", 8.59]], null, null, [["radio", 44.22], ["speech", 23.26], ["music", 9.07]], [["frog", 30.04], ["speech", 22.7], ["sound effect", 3.33]], null, [["music", 71.54], ["musical instrument", 8.18], ["guitar", 5.74]], null], "duration": [1.91, 0.53, 0.68, -0.23, 0.11, 1.57, 0.71, 1.55, 0.59, 1.13, 0.92, 1.12, -0.02, 0.33, -0.33, 1.04, 0.95, 2.6, 10.27, 7.75, 1.26, 0.24, 2.24, 3.76, 0.27, 7.96, 0.43]} \ No newline at end of file diff --git a/annotations_filtered/r9twTtXkQNA_filtered.json b/annotations_filtered/r9twTtXkQNA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..879b0303c53c36b9dbe8807f50edb268c43cb7f2 --- /dev/null +++ b/annotations_filtered/r9twTtXkQNA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.22], [19.0, 20.26], [22.0, 23.06], [23.0, 23.09], [25.0, 26.99], [27.0, 27.95], [30.0, 35.23], [43.0, 43.88], [45.0, 47.21], [49.0, 49.89], [58.0, 58.21], [60.0, 61.08], [62.0, 62.94], [72.0, 81.3], [82.0, 82.71], [85.0, 87.98], [88.0, 88.89], [89.0, 89.73], [92.0, 96.42], [98.0, 98.25], [100.0, 100.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.47, 0.0, 83.52, 0.0, 0.0, 0.0, 0.0, 38.98, 0.0, 37.92, 0.0, 0.0, 56.7, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 42.79], ["music", 28.56], ["fart", 4.71]], null, null, null, null, null, null, [["speech", 74.62], ["crushing", 2.94], ["wood", 2.54]], null, [["breaking", 41.93], ["thunk", 9.74], ["fly, housefly", 8.3]], null, null, null, null, null], "duration": [1.22, 1.26, 1.06, 0.09, 1.99, 0.95, 5.23, 0.88, 2.21, 0.89, 0.21, 1.08, 0.94, 9.3, 0.71, 2.98, 0.89, 0.73, 4.42, 0.25, 0.74]} \ No newline at end of file diff --git a/annotations_filtered/rA69NDoXRhI_filtered.json b/annotations_filtered/rA69NDoXRhI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..344807f9d78727251d18de60dc4bc6ac77b4de5c --- /dev/null +++ b/annotations_filtered/rA69NDoXRhI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 14.39], [19.0, 20.07], [22.0, 45.2], [49.0, 49.99], [52.0, 53.45], [55.0, 55.48], [56.0, 57.15], [59.0, 60.18], [65.0, 66.02], [67.0, 67.63], [77.0, 78.56], [79.0, 79.44], [82.0, 82.68], [93.0, 94.42], [96.0, 96.48], [103.0, 107.86], [109.0, 110.25], [115.0, 115.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [47.98, 0.0, 50.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.66, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 48.2], ["singing bowl", 20.54], ["music", 10.68]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.39, 1.07, 23.2, 0.99, 1.45, 0.48, 1.15, 1.18, 1.02, 0.63, 1.56, 0.44, 0.68, 1.42, 0.48, 4.86, 1.25, 0.77]} \ No newline at end of file diff --git a/annotations_filtered/rA6AZeHyw8Q_filtered.json b/annotations_filtered/rA6AZeHyw8Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e6fd39a06d7e72d1cd2f521c375af5755fc52909 --- /dev/null +++ b/annotations_filtered/rA6AZeHyw8Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 13.39], [17.0, 25.79], [28.0, 39.04], [41.0, 63.91], [65.0, 65.87], [67.0, 67.86], [69.0, 70.06], [70.0, 73.25], [73.0, 73.3], [74.0, 74.33], [77.0, 84.33], [86.0, 85.73], [86.0, 102.41], [104.0, 131.55], [133.0, 132.68], [133.0, 132.8], [133.0, 155.11], [157.0, 167.98], [170.0, 170.95], [172.0, 173.33]], "keep_status": [true, false, true, true, false, false, false, true, false, false, true, false, true, true, false, false, false, false, false, false], "silence_prob": [42.06, 44.32, 40.95, 46.29, 0.0, 0.0, 0.0, 40.19, 0.0, 0.0, 46.75, 0.0, 49.97, 46.26, 0.0, 0.0, 48.19, 65.09, 0.0, 0.0], "audiomae_on_audioset": [[["music", 56.95], ["didgeridoo", 4.28], ["electronic music", 3.48]], [["music", 65.27], ["musical instrument", 5.42], ["synthesizer", 2.26]], [["music", 62.24], ["electronic music", 4.2], ["speech", 3.51]], [["music", 31.9], ["sidetone", 8.75], ["cattle, bovinae", 8.37]], null, null, null, [["pigeon, dove", 21.4], ["speech", 21.32], ["bird", 19.06]], null, null, [["speech", 33.81], ["horse", 11.23], ["whale vocalization", 8.36]], null, [["speech", 41.06], ["hum", 6.8], ["fly, housefly", 6.12]], [["speech", 50.24], ["hum", 6.77], ["explosion", 5.07]], null, null, [["hum", 39.57], ["throbbing", 28.94], ["mains hum", 6.27]], null, null, null], "duration": [9.39, 8.79, 11.04, 22.91, 0.87, 0.86, 1.06, 3.25, 0.3, 0.33, 7.33, -0.27, 16.41, 27.55, -0.32, -0.2, 22.11, 10.98, 0.95, 1.33]} \ No newline at end of file diff --git a/annotations_filtered/rAEv7dJC5Iw_filtered.json b/annotations_filtered/rAEv7dJC5Iw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9a581eea7c3cdd43c9ac85decff68a434342d23c --- /dev/null +++ b/annotations_filtered/rAEv7dJC5Iw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 27.28], [28.0, 29.78], [30.0, 30.54], [38.0, 38.57], [39.0, 40.26], [41.0, 41.71], [43.0, 43.44], [45.0, 45.79], [46.0, 51.8], [54.0, 64.71], [66.0, 66.14], [76.0, 82.7], [83.0, 84.48], [85.0, 87.94], [99.0, 99.57], [100.0, 100.58], [102.0, 103.45], [108.0, 108.62], [111.0, 112.13], [119.0, 122.52], [124.0, 125.58], [127.0, 130.4]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [31.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.25, 31.3, 0.0, 32.23, 0.0, 35.74, 0.0, 0.0, 0.0, 0.0, 0.0, 31.95, 0.0, 36.94], "audiomae_on_audioset": [[["music", 78.8], ["throbbing", 5.66], ["didgeridoo", 1.66]], null, null, null, null, null, null, null, [["music", 63.32], ["didgeridoo", 7.98], ["sampler", 2.2]], [["music", 58.04], ["throbbing", 6.93], ["speech", 4.05]], null, [["music", 42.65], ["throbbing", 34.43], ["hum", 7.46]], null, [["throbbing", 31.69], ["music", 24.97], ["hum", 21.21]], null, null, null, null, null, [["speech", 61.91], ["whack, thwack", 3.27], ["thunk", 3.16]], null, [["speech", 39.09], ["fart", 13.18], ["hum", 5.91]]], "duration": [13.28, 1.78, 0.54, 0.57, 1.26, 0.71, 0.44, 0.79, 5.8, 10.71, 0.14, 6.7, 1.48, 2.94, 0.57, 0.58, 1.45, 0.62, 1.13, 3.52, 1.58, 3.4]} \ No newline at end of file diff --git a/annotations_filtered/rAKR-BBQY2M_filtered.json b/annotations_filtered/rAKR-BBQY2M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b9e343e91cd4873d63aaaf774ecc3a758ea4f42f --- /dev/null +++ b/annotations_filtered/rAKR-BBQY2M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.1], [17.0, 18.27], [23.0, 23.8], [36.0, 36.46], [40.0, 41.91], [47.0, 47.53], [52.0, 52.54], [53.0, 54.68], [55.0, 55.97], [62.0, 70.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.69], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 51.07], ["thunk", 15.16], ["music", 13.79]]], "duration": [0.1, 1.27, 0.8, 0.46, 1.91, 0.53, 0.54, 1.68, 0.97, 8.75]} \ No newline at end of file diff --git a/annotations_filtered/rARKAStGRy8_filtered.json b/annotations_filtered/rARKAStGRy8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e51767c80792895d18fc266f192877a597a5fa57 --- /dev/null +++ b/annotations_filtered/rARKAStGRy8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.51], [15.0, 15.4], [23.0, 23.26], [46.0, 46.2], [50.0, 54.43], [64.0, 64.32], [72.0, 72.74]], "keep_status": [false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 49.59, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 49.56], ["hum", 9.62], ["music", 7.97]], null, null], "duration": [0.51, 0.4, 0.26, 0.2, 4.43, 0.32, 0.74]} \ No newline at end of file diff --git a/annotations_filtered/rAULcuSAZeo_filtered.json b/annotations_filtered/rAULcuSAZeo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9424e49b489d84f22a90f4b4aa85cc74f8bff8ef --- /dev/null +++ b/annotations_filtered/rAULcuSAZeo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.58], [2.0, 69.58]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [0.58, 67.58]} \ No newline at end of file diff --git a/annotations_filtered/rAdvJOAGEmc_filtered.json b/annotations_filtered/rAdvJOAGEmc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..82104a080f474743bae36282099f0a530f540bc4 --- /dev/null +++ b/annotations_filtered/rAdvJOAGEmc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.97], [5.0, 12.88], [14.0, 14.79], [16.0, 17.24], [19.0, 28.27], [32.0, 32.63], [34.0, 36.14], [42.0, 44.76], [49.0, 53.43], [55.0, 55.76], [56.0, 57.69], [58.0, 59.26], [60.0, 61.15], [63.0, 62.94], [71.0, 74.95], [80.0, 83.64], [91.0, 92.94], [101.0, 117.42], [122.0, 122.25], [122.0, 128.12], [133.0, 133.39], [134.0, 134.38], [135.0, 135.28], [141.0, 145.34], [146.0, 149.47]], "keep_status": [false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 37.39, 0.0, 0.0, 38.31, 0.0, 35.65, 35.02, 34.94, 0.0, 0.0, 0.0, 0.0, 0.0, 34.39, 34.55, 0.0, 34.39, 0.0, 48.48, 0.0, 0.0, 0.0, 51.71, 68.67], "audiomae_on_audioset": [null, [["music", 13.73], ["beatboxing", 7.01], ["animal", 6.29]], null, null, [["music", 52.92], ["beatboxing", 7.94], ["didgeridoo", 6.77]], null, [["music", 61.25], ["guitar", 7.76], ["musical instrument", 5.97]], [["music", 70.82], ["musical instrument", 3.12], ["guitar", 2.2]], [["music", 77.87], ["swing music", 2.13], ["musical instrument", 1.75]], null, null, null, null, null, [["music", 69.86], ["swing music", 4.25], ["musical instrument", 2.39]], [["music", 65.48], ["swing music", 4.86], ["musical instrument", 2.86]], null, [["music", 41.59], ["boing", 26.76], ["speech", 9.32]], null, [["animal", 33.42], ["speech", 14.96], ["outside, rural or natural", 4.75]], null, null, null, null, null], "duration": [0.97, 7.88, 0.79, 1.24, 9.27, 0.63, 2.14, 2.76, 4.43, 0.76, 1.69, 1.26, 1.15, -0.06, 3.95, 3.64, 1.94, 16.42, 0.25, 6.12, 0.39, 0.38, 0.28, 4.34, 3.47]} \ No newline at end of file diff --git a/annotations_filtered/rBZQHST6BQQ_filtered.json b/annotations_filtered/rBZQHST6BQQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d17de0055141f997c75aa453f000889ec7acb8d8 --- /dev/null +++ b/annotations_filtered/rBZQHST6BQQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.38], [5.0, 5.56], [9.0, 10.0], [11.0, 12.46], [14.0, 15.87], [18.0, 18.39], [25.0, 24.65], [27.0, 29.25], [31.0, 31.11], [32.0, 36.32], [38.0, 38.92], [44.0, 45.01], [47.0, 47.71], [51.0, 56.2], [59.0, 63.58], [65.0, 69.84], [74.0, 76.0], [76.0, 76.06], [78.0, 91.69], [95.0, 111.1], [113.0, 113.34], [115.0, 115.92], [117.0, 117.53], [119.0, 119.79], [121.0, 126.59]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.72, 0.0, 40.38, 0.0, 0.0, 0.0, 39.22, 62.27, 53.72, 54.9, 0.0, 41.81, 41.98, 0.0, 0.0, 0.0, 0.0, 47.12], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 29.35], ["livestock, farm animals, working animals", 17.86], ["cattle, bovinae", 10.66]], null, null, null, [["music", 73.73], ["speech", 2.64], ["didgeridoo", 2.63]], null, null, null, null, [["music", 78.82], ["musical instrument", 2.65], ["synthesizer", 2.12]], [["music", 83.66], ["musical instrument", 1.87], ["singing", 1.69]], null, null, null, null, [["music", 75.27], ["musical instrument", 5.63], ["guitar", 3.07]]], "duration": [0.38, 0.56, 1.0, 1.46, 1.87, 0.39, -0.35, 2.25, 0.11, 4.32, 0.92, 1.01, 0.71, 5.2, 4.58, 4.84, 2.0, 0.06, 13.69, 16.1, 0.34, 0.92, 0.53, 0.79, 5.59]} \ No newline at end of file diff --git a/annotations_filtered/rBtzudk40pE_filtered.json b/annotations_filtered/rBtzudk40pE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..77693cd3629f6cedcff77489fa96c63bc9e6afd1 --- /dev/null +++ b/annotations_filtered/rBtzudk40pE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 12.11], [13.0, 19.43], [21.0, 37.12], [43.0, 43.92], [45.0, 46.72], [47.0, 53.15]], "keep_status": [true, false, false, false, false, false], "silence_prob": [41.4, 42.62, 32.75, 0.0, 0.0, 32.23], "audiomae_on_audioset": [[["music", 45.64], ["foghorn", 13.12], ["theremin", 6.41]], [["music", 60.8], ["synthesizer", 8.06], ["ambient music", 4.73]], [["music", 68.36], ["musical instrument", 5.22], ["theremin", 3.73]], null, null, [["music", 74.88], ["musical instrument", 3.81], ["synthesizer", 3.57]]], "duration": [7.11, 6.43, 16.12, 0.92, 1.72, 6.15]} \ No newline at end of file diff --git a/annotations_filtered/rC9LfNF_CW8_filtered.json b/annotations_filtered/rC9LfNF_CW8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..afc4a4489583023699e21c029636fbd5bd45f7e4 --- /dev/null +++ b/annotations_filtered/rC9LfNF_CW8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.55], [5.0, 6.84], [8.0, 8.31], [10.0, 9.95], [11.0, 11.4], [15.0, 15.55], [20.0, 23.6], [25.0, 25.86], [27.0, 27.9], [30.0, 31.02], [33.0, 33.61], [34.0, 34.8], [47.0, 47.01], [49.0, 54.68], [64.0, 72.45], [74.0, 77.48], [82.0, 90.75], [93.0, 94.63], [96.0, 99.3], [102.0, 102.07], [105.0, 112.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.49, 30.23, 30.02, 30.22, 0.0, 30.12, 0.0, 29.63], "audiomae_on_audioset": [null, null, null, null, null, null, [["hum", 42.81], ["mains hum", 16.64], ["throbbing", 13.72]], null, null, null, null, null, null, [["hum", 47.88], ["mains hum", 38.75], ["throbbing", 6.93]], [["music", 75.02], ["skateboard", 3.27], ["ice cream truck, ice cream van", 2.8]], [["music", 57.47], ["hum", 10.96], ["throbbing", 7.55]], [["music", 67.22], ["speech", 4.54], ["hum", 4.18]], null, [["music", 45.6], ["tubular bells", 8.6], ["percussion", 8.0]], null, [["music", 49.51], ["speech", 19.1], ["single-lens reflex camera", 3.07]]], "duration": [-0.45, 1.84, 0.31, -0.05, 0.4, 0.55, 3.6, 0.86, 0.9, 1.02, 0.61, 0.8, 0.01, 5.68, 8.45, 3.48, 8.75, 1.63, 3.3, 0.07, 7.73]} \ No newline at end of file diff --git a/annotations_filtered/rC9MhZGgJy4_filtered.json b/annotations_filtered/rC9MhZGgJy4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ff01691bc67e15cd0823126b2ffb065ed06d4881 --- /dev/null +++ b/annotations_filtered/rC9MhZGgJy4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.97], [7.0, 8.58], [10.0, 10.93], [16.0, 16.09], [22.0, 22.74], [23.0, 28.16], [29.0, 30.08], [39.0, 40.44], [42.0, 43.09], [44.0, 45.89], [46.0, 53.96], [59.0, 59.17], [62.0, 62.33], [66.0, 68.49], [70.0, 70.43], [71.0, 72.33], [80.0, 80.89], [82.0, 83.25], [87.0, 88.8], [90.0, 90.64], [91.0, 93.14], [106.0, 107.59], [109.0, 109.41], [111.0, 112.55], [114.0, 113.86], [116.0, 116.78], [118.0, 119.04], [123.0, 123.63], [126.0, 126.42], [128.0, 128.48], [134.0, 135.03], [136.0, 139.24], [142.0, 143.02], [147.0, 147.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 58.72, 0.0, 0.0, 0.0, 0.0, 41.66, 0.0, 0.0, 53.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.48, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 36.4], ["music", 13.89], ["thunk", 9.3]], null, null, null, null, null, null, null, null, null, [["fly, housefly", 19.24], ["music", 14.16], ["insect", 7.34]], null, null, null, null, null, null, null, null, null, null, [["singing bowl", 24.82], ["gong", 10.72], ["hum", 8.56]], null, null], "duration": [0.97, 1.58, 0.93, 0.09, 0.74, 5.16, 1.08, 1.44, 1.09, 1.89, 7.96, 0.17, 0.33, 2.49, 0.43, 1.33, 0.89, 1.25, 1.8, 0.64, 2.14, 1.59, 0.41, 1.55, -0.14, 0.78, 1.04, 0.63, 0.42, 0.48, 1.03, 3.24, 1.02, 0.66]} \ No newline at end of file diff --git a/annotations_filtered/rCCCJ2tXF7A_filtered.json b/annotations_filtered/rCCCJ2tXF7A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8d2900dd6129f9e6027a9c15893d31a60a332c08 --- /dev/null +++ b/annotations_filtered/rCCCJ2tXF7A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 36.21], [38.0, 42.58], [48.0, 68.44], [73.0, 78.78], [81.0, 83.57], [84.0, 84.69], [87.0, 103.13], [104.0, 105.0], [106.0, 107.03], [110.0, 125.91], [127.0, 131.14]], "keep_status": [true, true, false, false, false, false, true, false, false, false, false], "silence_prob": [29.9, 30.2, 29.85, 30.48, 50.66, 0.0, 30.06, 0.0, 0.0, 29.45, 29.95], "audiomae_on_audioset": [[["music", 25.1], ["moo", 12.45], ["cattle, bovinae", 11.76]], [["music", 30.76], ["speech", 22.45], ["throbbing", 11.7]], [["music", 34.59], ["hum", 26.08], ["throbbing", 12.46]], [["throbbing", 38.7], ["music", 36.44], ["hum", 8.94]], null, null, [["music", 27.19], ["livestock, farm animals, working animals", 18.52], ["speech", 15.79]], null, null, [["music", 60.03], ["throbbing", 5.96], ["vehicle", 4.76]], [["throbbing", 30.69], ["hum", 29.3], ["music", 17.11]]], "duration": [2.21, 4.58, 20.44, 5.78, 2.57, 0.69, 16.13, 1.0, 1.03, 15.91, 4.14]} \ No newline at end of file diff --git a/annotations_filtered/rCEbhr55ISU_filtered.json b/annotations_filtered/rCEbhr55ISU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a7b888c71b68b8bcf5dc553bb082c328a98dfded --- /dev/null +++ b/annotations_filtered/rCEbhr55ISU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.29], [5.0, 4.92], [6.0, 7.47], [8.0, 9.73], [11.0, 13.78], [14.0, 14.59], [17.0, 23.5], [26.0, 26.77], [28.0, 27.9], [29.0, 30.82], [31.0, 31.58], [32.0, 33.1], [36.0, 37.79], [51.0, 51.21], [54.0, 55.58], [63.0, 63.75], [67.0, 67.63], [69.0, 70.51], [73.0, 73.74], [77.0, 77.38], [86.0, 86.56], [94.0, 95.12], [97.0, 98.27], [104.0, 104.65], [105.0, 107.91], [111.0, 117.78], [118.0, 125.63], [126.0, 127.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 51.39, 0.0, 34.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.53, 44.2, 52.92, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 56.86], ["sidetone", 8.61], ["music", 8.18]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 50.12], ["speech", 7.95], ["hum", 5.27]], null, null], "duration": [0.29, -0.08, 1.47, 1.73, 2.78, 0.59, 6.5, 0.77, -0.1, 1.82, 0.58, 1.1, 1.79, 0.21, 1.58, 0.75, 0.63, 1.51, 0.74, 0.38, 0.56, 1.12, 1.27, 0.65, 2.91, 6.78, 7.63, 1.57]} \ No newline at end of file diff --git a/annotations_filtered/rCHGzxSBn-c_filtered.json b/annotations_filtered/rCHGzxSBn-c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..85f8ac8f54a80d7341aa647f8eead25b59ec10bf --- /dev/null +++ b/annotations_filtered/rCHGzxSBn-c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.45], [11.0, 12.78], [21.0, 21.47], [22.0, 23.57], [24.0, 26.7], [27.0, 29.47], [30.0, 31.11], [36.0, 37.35], [39.0, 39.83], [42.0, 42.92], [51.0, 51.17], [54.0, 55.78], [56.0, 56.94], [58.0, 58.99], [61.0, 62.06], [65.0, 66.04], [88.0, 89.43], [91.0, 92.35], [93.0, 94.19], [95.0, 98.2], [99.0, 100.23], [103.0, 103.35], [104.0, 110.74], [112.0, 112.11], [114.0, 116.83], [117.0, 118.35], [119.0, 119.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 95.37, 82.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.77, 0.0, 0.0, 98.36, 0.0, 81.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.45, 1.78, 0.47, 1.57, 2.7, 2.47, 1.11, 1.35, 0.83, 0.92, 0.17, 1.78, 0.94, 0.99, 1.06, 1.04, 1.43, 1.35, 1.19, 3.2, 1.23, 0.35, 6.74, 0.11, 2.83, 1.35, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/rCUNazDU2mg_filtered.json b/annotations_filtered/rCUNazDU2mg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9450c54c611b322bb95584f67928152b8c43aa09 --- /dev/null +++ b/annotations_filtered/rCUNazDU2mg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 29.24], [30.0, 79.42], [80.0, 97.98], [98.0, 98.04], [101.0, 104.99], [106.0, 110.59], [111.0, 112.14], [115.0, 180.37], [181.0, 181.94]], "keep_status": [false, false, false, false, false, true, false, false, false], "silence_prob": [30.17, 0.0, 30.06, 0.0, 32.94, 37.17, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 73.56], ["smash, crash", 6.17], ["breaking", 4.28]], null, [["music", 71.16], ["hum", 3.73], ["sound effect", 2.87]], null, [["whale vocalization", 44.81], ["sidetone", 21.37], ["music", 5.61]], [["hum", 31.91], ["music", 20.01], ["throbbing", 13.68]], null, null, null], "duration": [26.24, 49.42, 17.98, 0.04, 3.99, 4.59, 1.14, 65.37, 0.94]} \ No newline at end of file diff --git a/annotations_filtered/rChS9MeLW-w_filtered.json b/annotations_filtered/rChS9MeLW-w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e98cded9aff4b0cd5d48db2f7a7ea722c5c99a0 --- /dev/null +++ b/annotations_filtered/rChS9MeLW-w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 48.57], [55.0, 59.39], [64.0, 69.09], [70.0, 71.49], [75.0, 80.6], [82.0, 83.17], [84.0, 85.85], [87.0, 87.4], [88.0, 90.56], [94.0, 94.14], [98.0, 98.52], [102.0, 102.98], [105.0, 105.02], [106.0, 115.08], [116.0, 119.11]], "keep_status": [false, true, true, false, true, false, false, false, true, false, false, false, false, false, true], "silence_prob": [37.74, 45.21, 48.87, 0.0, 42.88, 0.0, 0.0, 0.0, 37.05, 0.0, 0.0, 0.0, 0.0, 36.72, 41.48], "audiomae_on_audioset": [[["music", 71.24], ["ambient music", 7.74], ["musical instrument", 2.19]], [["gong", 24.03], ["music", 18.99], ["singing bowl", 18.44]], [["hum", 18.52], ["gong", 17.57], ["music", 16.89]], null, [["music", 36.4], ["throbbing", 7.87], ["synthesizer", 5.18]], null, null, null, [["music", 31.27], ["speech", 18.76], ["mains hum", 7.47]], null, null, null, null, [["music", 37.13], ["theremin", 18.84], ["didgeridoo", 14.7]], [["music", 50.72], ["didgeridoo", 14.7], ["singing bowl", 3.44]]], "duration": [23.57, 4.39, 5.09, 1.49, 5.6, 1.17, 1.85, 0.4, 2.56, 0.14, 0.52, 0.98, 0.02, 9.08, 3.11]} \ No newline at end of file diff --git a/annotations_filtered/rClviS6MMvk_filtered.json b/annotations_filtered/rClviS6MMvk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bfaab59126905d1c7b26205462c9a0778f842e88 --- /dev/null +++ b/annotations_filtered/rClviS6MMvk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.02], [13.0, 13.44], [16.0, 15.89], [17.0, 18.22], [21.0, 21.42], [22.0, 25.93], [27.0, 27.51], [29.0, 29.94], [30.0, 31.72], [34.0, 34.3], [35.0, 35.48], [38.0, 38.48], [40.0, 40.66], [41.0, 41.54], [49.0, 49.57], [58.0, 59.68], [63.0, 69.5], [71.0, 71.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.07, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.02, 0.44, -0.11, 1.22, 0.42, 3.93, 0.51, 0.94, 1.72, 0.3, 0.48, 0.48, 0.66, 0.54, 0.57, 1.68, 6.5, 0.86]} \ No newline at end of file diff --git a/annotations_filtered/rCn7orvs0Ws_filtered.json b/annotations_filtered/rCn7orvs0Ws_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6b358aa06090bad40723066f8c0eb23fc009a08 --- /dev/null +++ b/annotations_filtered/rCn7orvs0Ws_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[51.0, 59.76], [61.0, 62.82], [64.0, 65.5], [66.0, 67.14], [68.0, 73.75], [79.0, 79.08], [80.0, 81.24], [82.0, 83.62], [93.0, 92.8], [93.0, 96.13], [97.0, 97.87], [102.0, 105.88], [107.0, 106.81], [113.0, 114.98], [116.0, 117.51], [118.0, 125.37], [130.0, 129.98], [138.0, 137.71], [146.0, 147.38], [150.0, 157.52], [160.0, 160.76], [163.0, 163.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [98.93, 0.0, 0.0, 0.0, 90.25, 0.0, 0.0, 0.0, 0.0, 95.51, 0.0, 66.27, 0.0, 0.0, 0.0, 42.04, 0.0, 0.0, 0.0, 74.44, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fart", 22.11], ["grunt", 14.74], ["speech", 9.91]], null, null, null, null, null, null], "duration": [8.76, 1.82, 1.5, 1.14, 5.75, 0.08, 1.24, 1.62, -0.2, 3.13, 0.87, 3.88, -0.19, 1.98, 1.51, 7.37, -0.02, -0.29, 1.38, 7.52, 0.76, 0.92]} \ No newline at end of file diff --git a/annotations_filtered/rD3kI-nioGA_filtered.json b/annotations_filtered/rD3kI-nioGA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..684c86ee8e03b804ec3e86b58409852087db5eb2 --- /dev/null +++ b/annotations_filtered/rD3kI-nioGA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.9], [4.0, 4.77], [6.0, 10.4], [13.0, 13.05], [16.0, 23.4], [27.0, 28.56], [32.0, 31.95], [39.0, 50.18], [51.0, 60.34], [61.0, 61.57], [63.0, 63.34]], "keep_status": [false, false, true, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 36.07, 0.0, 35.8, 0.0, 0.0, 35.11, 44.55, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 48.21], ["speech", 13.31], ["musical instrument", 3.03]], null, [["speech", 40.44], ["music", 31.85], ["musical instrument", 2.03]], null, null, [["music", 38.7], ["speech", 19.15], ["didgeridoo", 16.06]], [["livestock, farm animals, working animals", 29.45], ["cattle, bovinae", 13.31], ["moo", 9.02]], null, null], "duration": [0.9, 0.77, 4.4, 0.05, 7.4, 1.56, -0.05, 11.18, 9.34, 0.57, 0.34]} \ No newline at end of file diff --git a/annotations_filtered/rDGRAHBojWE_filtered.json b/annotations_filtered/rDGRAHBojWE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ceab773f0600c7112c87b9f6a0a3dd79c5a80408 --- /dev/null +++ b/annotations_filtered/rDGRAHBojWE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.62], [7.0, 7.3], [8.0, 9.24], [11.0, 12.8], [18.0, 23.25], [24.0, 26.99], [30.0, 30.74], [31.0, 35.28], [40.0, 41.0], [42.0, 42.21], [43.0, 43.12], [45.0, 46.01], [47.0, 46.9], [48.0, 62.95], [65.0, 65.7], [67.0, 70.07], [70.0, 75.41], [79.0, 79.84], [81.0, 82.27], [84.0, 83.84], [85.0, 87.02], [89.0, 89.85], [91.0, 112.24], [114.0, 117.24], [120.0, 127.4]], "keep_status": [false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 37.63, 44.87, 0.0, 38.52, 0.0, 0.0, 0.0, 0.0, 0.0, 33.11, 0.0, 37.59, 35.07, 0.0, 0.0, 0.0, 57.48, 0.0, 32.39, 32.29, 32.1], "audiomae_on_audioset": [null, null, null, null, [["speech", 31.28], ["music", 26.06], ["sidetone", 18.52]], [["music", 28.24], ["speech", 17.49], ["throbbing", 14.33]], null, [["music", 47.79], ["speech", 15.06], ["boing", 5.38]], null, null, null, null, null, [["music", 63.3], ["speech", 9.04], ["musical instrument", 7.5]], null, [["fart", 23.95], ["music", 20.51], ["speech", 9.37]], [["music", 26.72], ["speech", 19.39], ["bow-wow", 10.04]], null, null, null, null, null, [["music", 72.56], ["funk", 5.95], ["swing music", 5.82]], [["music", 77.64], ["electronic music", 2.29], ["synthesizer", 2.02]], [["music", 73.81], ["funk", 7.28], ["didgeridoo", 2.73]]], "duration": [1.62, 0.3, 1.24, 1.8, 5.25, 2.99, 0.74, 4.28, 1.0, 0.21, 0.12, 1.01, -0.1, 14.95, 0.7, 3.07, 5.41, 0.84, 1.27, -0.16, 2.02, 0.85, 21.24, 3.24, 7.4]} \ No newline at end of file diff --git a/annotations_filtered/rDIF3XhXTT8_filtered.json b/annotations_filtered/rDIF3XhXTT8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a782054ee73997ccd9aa1a484e5ee3df4d26d140 --- /dev/null +++ b/annotations_filtered/rDIF3XhXTT8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 45.94], [49.0, 91.76], [93.0, 109.29], [115.0, 125.02], [128.0, 150.18], [151.0, 151.82], [153.0, 155.92], [156.0, 170.97], [172.0, 175.59], [176.0, 177.8], [180.0, 190.83]], "keep_status": [false, false, false, true, true, false, false, true, true, false, false], "silence_prob": [33.19, 0.0, 33.69, 31.68, 41.95, 0.0, 94.52, 31.8, 49.54, 0.0, 32.81], "audiomae_on_audioset": [[["music", 68.2], ["theremin", 12.87], ["buzz", 1.27]], null, [["music", 67.58], ["didgeridoo", 6.32], ["theremin", 5.44]], [["music", 53.28], ["hum", 4.0], ["musical instrument", 3.54]], [["music", 24.72], ["hum", 8.86], ["synthesizer", 7.7]], null, null, [["music", 53.79], ["sidetone", 10.92], ["synthesizer", 3.56]], [["music", 34.71], ["wind instrument, woodwind instrument", 18.22], ["clarinet", 5.52]], null, [["music", 60.41], ["theremin", 9.88], ["explosion", 7.72]]], "duration": [16.94, 42.76, 16.29, 10.02, 22.18, 0.82, 2.92, 14.97, 3.59, 1.8, 10.83]} \ No newline at end of file diff --git a/annotations_filtered/rDTZ6A5zsYc_filtered.json b/annotations_filtered/rDTZ6A5zsYc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a882679f9827f48e794d9442a8ff2b00bc30bdd --- /dev/null +++ b/annotations_filtered/rDTZ6A5zsYc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.73], [28.0, 37.08], [38.0, 39.09], [48.0, 59.19], [73.0, 114.22], [116.0, 145.4]], "keep_status": [false, true, false, false, false, false], "silence_prob": [0.0, 38.84, 0.0, 55.89, 0.0, 34.4], "audiomae_on_audioset": [null, [["music", 31.66], ["speech", 23.87], ["thunk", 4.36]], null, null, null, [["music", 75.73], ["country", 5.09], ["bluegrass", 1.57]]], "duration": [0.73, 9.08, 1.09, 11.19, 41.22, 29.4]} \ No newline at end of file diff --git a/annotations_filtered/rDXBM22wbrg_filtered.json b/annotations_filtered/rDXBM22wbrg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..91e6b51cbcc634a87589c2a32ba160714276a9c5 --- /dev/null +++ b/annotations_filtered/rDXBM22wbrg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 17.95], [19.0, 19.08], [23.0, 23.82], [28.0, 30.2], [32.0, 46.11], [47.0, 49.65], [51.0, 51.21], [52.0, 52.89], [54.0, 54.41], [55.0, 67.47], [68.0, 74.43], [75.0, 80.23], [83.0, 84.37], [86.0, 87.35], [88.0, 88.87], [90.0, 91.15], [97.0, 103.33], [109.0, 111.23], [115.0, 117.07], [127.0, 127.74]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false], "silence_prob": [31.71, 0.0, 0.0, 31.53, 36.64, 99.73, 0.0, 0.0, 0.0, 59.86, 35.58, 45.78, 0.0, 0.0, 0.0, 0.0, 31.89, 91.13, 37.35, 0.0], "audiomae_on_audioset": [[["whack, thwack", 31.06], ["speech", 12.28], ["thunk", 5.24]], null, null, [["music", 60.73], ["speech", 13.84], ["musical instrument", 3.27]], [["music", 68.46], ["synthesizer", 12.2], ["sampler", 2.47]], null, null, null, null, null, [["sidetone", 46.53], ["music", 29.68], ["speech", 12.15]], [["music", 35.85], ["speech", 28.21], ["brass instrument", 3.44]], null, null, null, null, [["music", 63.44], ["musical instrument", 4.1], ["swing music", 3.84]], null, [["speech", 40.57], ["music", 9.32], ["bee, wasp, etc.", 2.19]], null], "duration": [7.95, 0.08, 0.82, 2.2, 14.11, 2.65, 0.21, 0.89, 0.41, 12.47, 6.43, 5.23, 1.37, 1.35, 0.87, 1.15, 6.33, 2.23, 2.07, 0.74]} \ No newline at end of file diff --git a/annotations_filtered/rDbMqG0EObM_filtered.json b/annotations_filtered/rDbMqG0EObM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..abfc2eeb5b67f0f15d9104cc011543efec47519b --- /dev/null +++ b/annotations_filtered/rDbMqG0EObM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 30.23], [31.0, 31.26], [32.0, 32.24], [33.0, 34.18], [35.0, 37.0], [38.0, 40.49], [41.0, 47.01], [47.0, 48.05], [49.0, 49.1], [50.0, 61.2], [63.0, 63.81], [65.0, 65.8], [70.0, 69.99], [71.0, 77.75], [79.0, 79.81], [85.0, 91.56], [92.0, 91.81]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, true, false], "silence_prob": [91.64, 0.0, 0.0, 0.0, 99.84, 99.99, 50.71, 0.0, 0.0, 36.36, 0.0, 0.0, 0.0, 33.61, 0.0, 37.07, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["fly, housefly", 16.79], ["cattle, bovinae", 13.65], ["speech", 12.87]], null, null, null, [["animal", 12.93], ["wild animals", 12.61], ["livestock, farm animals, working animals", 9.06]], null, [["music", 42.89], ["hum", 16.68], ["whale vocalization", 7.92]], null], "duration": [20.23, 0.26, 0.24, 1.18, 2.0, 2.49, 6.01, 1.05, 0.1, 11.2, 0.81, 0.8, -0.01, 6.75, 0.81, 6.56, -0.19]} \ No newline at end of file diff --git a/annotations_filtered/rDnazOBaF1U_filtered.json b/annotations_filtered/rDnazOBaF1U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7182d79c1d2f5b969faaf7ffae9a9c6e1c8002a2 --- /dev/null +++ b/annotations_filtered/rDnazOBaF1U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.96], [5.0, 5.21], [5.0, 6.3], [8.0, 7.77], [10.0, 13.17], [14.0, 14.32], [17.0, 18.98], [20.0, 22.08], [24.0, 24.75], [27.0, 27.23], [31.0, 32.41], [38.0, 37.94], [40.0, 40.9], [41.0, 46.18], [47.0, 49.1], [50.0, 53.64], [55.0, 55.86], [57.0, 59.04], [59.0, 67.12], [68.0, 73.23], [75.0, 78.76], [85.0, 88.35], [89.0, 89.82], [91.0, 92.5], [95.0, 96.2], [98.0, 98.05], [102.0, 103.87], [105.0, 106.14], [108.0, 109.48], [113.0, 115.57], [116.0, 117.27], [119.0, 120.61], [121.0, 122.86], [127.0, 128.53], [129.0, 131.43], [134.0, 137.47], [143.0, 147.45], [148.0, 150.52], [151.0, 152.93], [154.0, 154.16]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, true, false, false, false, false, true, true, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 85.54, 0.0, 0.0, 45.98, 0.0, 0.0, 0.0, 0.0, 0.0, 41.78, 82.79, 92.64, 0.0, 82.97, 60.89, 51.44, 48.48, 47.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.94, 0.0, 0.0, 0.0, 0.0, 37.35, 38.56, 32.09, 35.7, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 43.58], ["sidetone", 12.41], ["sine wave", 7.18]], null, null, null, null, null, [["sidetone", 46.76], ["speech", 13.55], ["sine wave", 11.27]], null, null, null, null, null, null, [["music", 24.63], ["mains hum", 13.42], ["hum", 12.68]], [["music", 31.85], ["marimba, xylophone", 13.48], ["glockenspiel", 6.88]], null, null, null, null, null, null, null, [["music", 51.59], ["musical instrument", 9.07], ["mains hum", 4.97]], null, null, null, null, [["music", 45.44], ["guitar", 6.3], ["musical instrument", 6.04]], [["music", 58.41], ["hum", 4.2], ["synthesizer", 3.7]], [["music", 52.53], ["didgeridoo", 12.12], ["mains hum", 6.79]], [["music", 55.48], ["synthesizer", 8.55], ["musical instrument", 4.14]], null, null], "duration": [1.96, 0.21, 1.3, -0.23, 3.17, 0.32, 1.98, 2.08, 0.75, 0.23, 1.41, -0.06, 0.9, 5.18, 2.1, 3.64, 0.86, 2.04, 8.12, 5.23, 3.76, 3.35, 0.82, 1.5, 1.2, 0.05, 1.87, 1.14, 1.48, 2.57, 1.27, 1.61, 1.86, 1.53, 2.43, 3.47, 4.45, 2.52, 1.93, 0.16]} \ No newline at end of file diff --git a/annotations_filtered/rEAbZTpV47E_filtered.json b/annotations_filtered/rEAbZTpV47E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa8b665a8b9f9d82ed115b2f476945f1a51ac23f --- /dev/null +++ b/annotations_filtered/rEAbZTpV47E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.36], [15.0, 17.76], [24.0, 25.27], [26.0, 27.24], [30.0, 30.86], [43.0, 43.8], [45.0, 45.18], [47.0, 47.66], [49.0, 50.5], [51.0, 51.49], [52.0, 53.28], [57.0, 57.55], [59.0, 59.34], [61.0, 63.83], [66.0, 68.57], [72.0, 72.52], [75.0, 75.63], [76.0, 76.62], [77.0, 78.24], [81.0, 81.24], [84.0, 84.79], [91.0, 93.46], [94.0, 95.17], [97.0, 98.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.71, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.36, 2.76, 1.27, 1.24, 0.86, 0.8, 0.18, 0.66, 1.5, 0.49, 1.28, 0.55, 0.34, 2.83, 2.57, 0.52, 0.63, 0.62, 1.24, 0.24, 0.79, 2.46, 1.17, 1.46]} \ No newline at end of file diff --git a/annotations_filtered/rETUKp1A-xo_filtered.json b/annotations_filtered/rETUKp1A-xo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd4fa051d4f12c04dcea0817b7a3efd5ffbcbd00 --- /dev/null +++ b/annotations_filtered/rETUKp1A-xo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 34.23], [37.0, 38.11], [39.0, 39.92], [42.0, 47.01], [48.0, 66.45], [69.0, 73.57], [75.0, 75.52], [78.0, 78.75], [87.0, 88.35], [90.0, 89.99], [93.0, 99.05], [100.0, 100.23], [101.0, 101.95], [107.0, 122.57], [124.0, 124.66], [132.0, 133.37], [134.0, 137.32], [143.0, 143.95], [151.0, 158.89]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [38.17, 0.0, 0.0, 34.62, 33.26, 87.74, 0.0, 0.0, 0.0, 0.0, 48.1, 0.0, 0.0, 36.04, 0.0, 0.0, 38.78, 0.0, 30.96], "audiomae_on_audioset": [[["electric shaver, electric razor", 29.91], ["animal", 7.72], ["inside, small room", 7.35]], null, null, [["music", 68.3], ["speech", 11.03], ["boing", 5.76]], [["electric shaver, electric razor", 32.62], ["buzz", 28.47], ["music", 15.47]], null, null, null, null, null, [["speech", 86.87], ["telephone", 3.3], ["noise", 1.56]], null, null, [["speech", 71.78], ["music", 9.09], ["boing", 4.72]], null, null, [["music", 57.37], ["musical instrument", 4.48], ["foghorn", 4.06]], null, [["music", 19.83], ["livestock, farm animals, working animals", 17.33], ["speech", 15.64]]], "duration": [17.23, 1.11, 0.92, 5.01, 18.45, 4.57, 0.52, 0.75, 1.35, -0.01, 6.05, 0.23, 0.95, 15.57, 0.66, 1.37, 3.32, 0.95, 7.89]} \ No newline at end of file diff --git a/annotations_filtered/rEWaqUVac3M_filtered.json b/annotations_filtered/rEWaqUVac3M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1814aab027e88d5a0d34c26620245b80033d4cf5 --- /dev/null +++ b/annotations_filtered/rEWaqUVac3M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.2], [17.0, 17.73], [19.0, 20.78], [25.0, 26.18], [29.0, 29.79], [31.0, 31.02], [32.0, 33.27], [40.0, 40.71], [50.0, 50.48], [63.0, 62.88], [67.0, 67.76], [74.0, 75.54], [77.0, 77.57], [84.0, 85.55], [87.0, 87.96], [89.0, 89.46], [91.0, 91.2], [95.0, 95.55], [103.0, 103.71], [105.0, 110.98], [112.0, 116.8], [118.0, 118.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.91, 30.49, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 37.62], ["theremin", 15.77], ["musical instrument", 4.16]], [["music", 39.17], ["theremin", 26.03], ["synthesizer", 6.22]], null], "duration": [0.2, 0.73, 1.78, 1.18, 0.79, 0.02, 1.27, 0.71, 0.48, -0.12, 0.76, 1.54, 0.57, 1.55, 0.96, 0.46, 0.2, 0.55, 0.71, 5.98, 4.8, 0.61]} \ No newline at end of file diff --git a/annotations_filtered/rFHh8MTXs5M_filtered.json b/annotations_filtered/rFHh8MTXs5M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..91eeafb63b2283a1c4d9b1b4d47b4465fdba81c4 --- /dev/null +++ b/annotations_filtered/rFHh8MTXs5M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.94], [9.0, 9.39], [14.0, 13.91], [16.0, 16.41], [17.0, 17.66], [28.0, 28.56], [38.0, 38.35], [40.0, 41.45], [42.0, 42.8], [43.0, 43.8], [45.0, 45.1], [50.0, 51.19], [52.0, 52.51], [55.0, 55.0], [58.0, 58.18], [63.0, 62.78], [63.0, 63.91], [65.0, 65.33], [66.0, 69.99], [111.0, 114.54], [116.0, 116.11], [118.0, 117.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.19, 99.99, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.06, 0.39, -0.09, 0.41, 0.66, 0.56, 0.35, 1.45, 0.8, 0.8, 0.1, 1.19, 0.51, 0.0, 0.18, -0.22, 0.91, 0.33, 3.99, 3.54, 0.11, -0.41]} \ No newline at end of file diff --git a/annotations_filtered/rFbe4I4SXGg_filtered.json b/annotations_filtered/rFbe4I4SXGg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca3d9c31783504c9a4c041ffc7c3842721cdf360 --- /dev/null +++ b/annotations_filtered/rFbe4I4SXGg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.48], [9.0, 8.8], [13.0, 14.12], [17.0, 18.22], [26.0, 27.18], [30.0, 30.43], [32.0, 33.18], [34.0, 35.23], [36.0, 37.2], [38.0, 38.85], [42.0, 42.69], [48.0, 47.93], [52.0, 54.06], [61.0, 62.31], [69.0, 69.45], [69.0, 69.52], [70.0, 71.46], [72.0, 82.93], [83.0, 86.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 53.72, 64.18], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.48, -0.2, 1.12, 1.22, 1.18, 0.43, 1.18, 1.23, 1.2, 0.85, 0.69, -0.07, 2.06, 1.31, 0.45, 0.52, 1.46, 10.93, 3.12]} \ No newline at end of file diff --git a/annotations_filtered/rFuhmG2wUXw_filtered.json b/annotations_filtered/rFuhmG2wUXw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95458728179b66957b40a6378274465e5341aac0 --- /dev/null +++ b/annotations_filtered/rFuhmG2wUXw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.38], [17.0, 17.59], [18.0, 31.43], [32.0, 42.94], [44.0, 66.23], [70.0, 103.94], [105.0, 107.86]], "keep_status": [false, false, false, true, true, false, true], "silence_prob": [0.0, 0.0, 36.72, 32.2, 33.16, 0.0, 37.96], "audiomae_on_audioset": [null, null, [["speech", 61.07], ["vehicle", 5.86], ["livestock, farm animals, working animals", 4.98]], [["vehicle", 26.15], ["buzz", 14.45], ["speech", 6.21]], [["vehicle", 21.28], ["insect", 12.65], ["fly, housefly", 8.72]], null, [["music", 20.61], ["theremin", 14.85], ["synthesizer", 8.26]]], "duration": [1.38, 0.59, 13.43, 10.94, 22.23, 33.94, 2.86]} \ No newline at end of file diff --git a/annotations_filtered/rFvaTVV7yO4_filtered.json b/annotations_filtered/rFvaTVV7yO4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..71b9800d08507655432facacb8184a114445a2e9 --- /dev/null +++ b/annotations_filtered/rFvaTVV7yO4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 28.17], [39.0, 39.39], [46.0, 45.89], [50.0, 50.38], [53.0, 53.43], [57.0, 59.31], [64.0, 64.42], [65.0, 69.5], [88.0, 88.38], [95.0, 105.24], [132.0, 133.1], [136.0, 136.07], [144.0, 144.49], [145.0, 145.02], [147.0, 148.56], [149.0, 150.06], [157.0, 165.64], [166.0, 166.14], [166.0, 170.28]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [30.86, 0.0, 0.0, 0.0, 0.0, 29.84, 0.0, 31.71, 0.0, 30.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.16, 0.0, 31.02], "audiomae_on_audioset": [[["music", 69.46], ["theremin", 13.63], ["carnatic music", 3.76]], null, null, null, null, [["music", 44.71], ["crowd", 10.63], ["speech", 4.64]], null, [["music", 44.79], ["speech", 24.56], ["boing", 6.26]], null, [["music", 61.81], ["speech", 5.09], ["boing", 4.11]], null, null, null, null, null, null, [["music", 53.03], ["boing", 13.76], ["speech", 6.04]], null, [["speech", 37.32], ["music", 7.53], ["fart", 4.84]]], "duration": [5.17, 0.39, -0.11, 0.38, 0.43, 2.31, 0.42, 4.5, 0.38, 10.24, 1.1, 0.07, 0.49, 0.02, 1.56, 1.06, 8.64, 0.14, 4.28]} \ No newline at end of file diff --git a/annotations_filtered/rFy2252ierA_filtered.json b/annotations_filtered/rFy2252ierA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5046ec6f9afe30d311dd2b89dc3f2f8531123dc4 --- /dev/null +++ b/annotations_filtered/rFy2252ierA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.05], [6.0, 7.89], [9.0, 10.13], [11.0, 11.67], [14.0, 16.63], [19.0, 21.34], [22.0, 22.79], [26.0, 25.59], [28.0, 28.32], [30.0, 30.54], [31.0, 32.58], [34.0, 34.1], [34.0, 36.41], [41.0, 40.95], [42.0, 42.89], [45.0, 45.72], [46.0, 47.02], [48.0, 48.83], [50.0, 50.36], [52.0, 52.08], [59.0, 59.56], [61.0, 60.89], [63.0, 64.0], [64.0, 64.5], [65.0, 64.56], [65.0, 65.72], [68.0, 69.33], [69.0, 69.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 97.92, 98.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.05, 1.89, 1.13, 0.67, 2.63, 2.34, 0.79, -0.41, 0.32, 0.54, 1.58, 0.1, 2.41, -0.05, 0.89, 0.72, 1.02, 0.83, 0.36, 0.08, 0.56, -0.11, 1.0, 0.5, -0.44, 0.72, 1.33, 0.5]} \ No newline at end of file diff --git a/annotations_filtered/rGAjkzbV8zw_filtered.json b/annotations_filtered/rGAjkzbV8zw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b272a94794693dc09d36d6451ff222f9b9c0f56 --- /dev/null +++ b/annotations_filtered/rGAjkzbV8zw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.69], [5.0, 6.54], [7.0, 7.79], [9.0, 9.78], [11.0, 11.8], [14.0, 14.44], [18.0, 18.82], [20.0, 22.49], [23.0, 23.77], [26.0, 28.61], [30.0, 30.16], [30.0, 32.63], [33.0, 33.29], [34.0, 34.03], [35.0, 35.55], [38.0, 39.51], [40.0, 41.3], [43.0, 44.12], [46.0, 46.72], [47.0, 52.76], [54.0, 54.68], [55.0, 55.75], [58.0, 59.14], [64.0, 64.17], [64.0, 65.37], [66.0, 66.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.17, 0.0, 100.0, 0.0, 62.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 47.56], ["hum", 12.29], ["mains hum", 5.72]], null, null, null, null, null, null], "duration": [0.69, 1.54, 0.79, 0.78, 0.8, 0.44, 0.82, 2.49, 0.77, 2.61, 0.16, 2.63, 0.29, 0.03, 0.55, 1.51, 1.3, 1.12, 0.72, 5.76, 0.68, 0.75, 1.14, 0.17, 1.37, 0.61]} \ No newline at end of file diff --git a/annotations_filtered/rGR6aO4JsH0_filtered.json b/annotations_filtered/rGR6aO4JsH0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af257b42ee334408ede5bb1fa8c0a722c83d4b50 --- /dev/null +++ b/annotations_filtered/rGR6aO4JsH0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[43.0, 49.87], [52.0, 58.83], [60.0, 63.21], [64.0, 65.79], [68.0, 69.01], [69.0, 117.68]], "keep_status": [false, false, false, false, false, false], "silence_prob": [30.77, 35.44, 38.16, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 46.6], ["throbbing", 28.55], ["hum", 10.14]], [["music", 79.7], ["musical instrument", 5.58], ["didgeridoo", 3.52]], [["music", 56.43], ["speech", 8.46], ["synthesizer", 7.34]], null, null, null], "duration": [6.87, 6.83, 3.21, 1.79, 1.01, 48.68]} \ No newline at end of file diff --git a/annotations_filtered/rGS4bE0G3yY_filtered.json b/annotations_filtered/rGS4bE0G3yY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..26567aff07e24842f826aebf843909b72445e2f6 --- /dev/null +++ b/annotations_filtered/rGS4bE0G3yY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 14.91], [26.0, 26.06], [28.0, 27.78], [29.0, 29.86], [31.0, 30.99], [39.0, 39.99], [40.0, 41.66], [42.0, 44.25], [45.0, 45.71], [48.0, 48.63], [51.0, 51.51], [53.0, 54.01], [56.0, 58.16], [68.0, 71.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.99, 0.0, 0.0, 0.0, 0.0, 33.78, 97.83], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 41.81], ["speech", 24.39], ["livestock, farm animals, working animals", 4.76]], null], "duration": [-0.09, 0.06, -0.22, 0.86, -0.01, 0.99, 1.66, 2.25, 0.71, 0.63, 0.51, 1.01, 2.16, 3.93]} \ No newline at end of file diff --git a/annotations_filtered/rGnXd_krGA0_filtered.json b/annotations_filtered/rGnXd_krGA0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/rGnXd_krGA0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/rGtJbW9sRbo_filtered.json b/annotations_filtered/rGtJbW9sRbo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e0beb3a1058e25a8f122aa5307ef4672c4af2d57 --- /dev/null +++ b/annotations_filtered/rGtJbW9sRbo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.37], [7.0, 7.5], [13.0, 15.84], [16.0, 21.76], [22.0, 22.4], [23.0, 24.88], [26.0, 26.99], [27.0, 29.71], [30.0, 31.06], [36.0, 37.2], [47.0, 48.66], [50.0, 50.14], [53.0, 53.65], [57.0, 57.16], [58.0, 58.56], [65.0, 65.99], [67.0, 67.64], [69.0, 71.05], [74.0, 74.85], [76.0, 76.01], [80.0, 80.0], [88.0, 90.22], [94.0, 94.31], [100.0, 100.38], [101.0, 101.92], [105.0, 105.16], [109.0, 109.02], [110.0, 123.7], [124.0, 129.88]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 48.39, 51.82, 0.0, 0.0, 0.0, 53.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.47, 0.0, 0.0, 0.0, 94.66, 0.0, 0.0, 0.0, 0.0, 0.0, 36.65, 50.21], "audiomae_on_audioset": [null, null, [["speech", 47.91], ["animal", 7.73], ["wild animals", 7.4]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 37.13], ["fly, housefly", 18.84], ["insect", 7.6]], null], "duration": [1.37, 0.5, 2.84, 5.76, 0.4, 1.88, 0.99, 2.71, 1.06, 1.2, 1.66, 0.14, 0.65, 0.16, 0.56, 0.99, 0.64, 2.05, 0.85, 0.01, 0.0, 2.22, 0.31, 0.38, 0.92, 0.16, 0.02, 13.7, 5.88]} \ No newline at end of file diff --git a/annotations_filtered/rGvIBT10JDU_filtered.json b/annotations_filtered/rGvIBT10JDU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..315e0c91f01cc0fe1640d82e01472f728adba3f3 --- /dev/null +++ b/annotations_filtered/rGvIBT10JDU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.46], [5.0, 6.99], [8.0, 8.45], [10.0, 9.96], [11.0, 11.57], [13.0, 14.27], [15.0, 15.87], [17.0, 18.49], [19.0, 25.19], [26.0, 28.32], [31.0, 31.21], [35.0, 36.04], [39.0, 40.53], [43.0, 46.33], [49.0, 49.27], [50.0, 53.23], [55.0, 56.37], [57.0, 74.34], [75.0, 78.02], [79.0, 81.14], [83.0, 88.99], [93.0, 93.73], [95.0, 95.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.6, 38.37, 0.0, 0.0, 0.0, 38.55, 0.0, 79.24, 0.0, 94.95, 62.37, 99.99, 36.9, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 54.65], ["thunk", 10.58], ["fly, housefly", 5.77]], null, null, null, [["speech", 12.38], ["hands", 8.18], ["arrow", 8.1]], null, null, null, null, null, null, [["speech", 55.02], ["music", 15.15], ["inside, small room", 3.87]], null, null], "duration": [0.46, 1.99, 0.45, -0.04, 0.57, 1.27, 0.87, 1.49, 6.19, 2.32, 0.21, 1.04, 1.53, 3.33, 0.27, 3.23, 1.37, 17.34, 3.02, 2.14, 5.99, 0.73, 0.99]} \ No newline at end of file diff --git a/annotations_filtered/rHIIMIBMvng_filtered.json b/annotations_filtered/rHIIMIBMvng_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5fc5568a0ec2b6dd70b2e096ee0961c015521530 --- /dev/null +++ b/annotations_filtered/rHIIMIBMvng_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.4], [12.0, 16.19], [17.0, 26.05], [27.0, 30.15], [32.0, 35.21], [37.0, 74.11]], "keep_status": [true, true, true, true, false, false], "silence_prob": [31.93, 31.59, 29.31, 32.13, 30.89, 0.0], "audiomae_on_audioset": [[["hum", 27.63], ["music", 14.01], ["sine wave", 9.67]], [["hum", 26.56], ["mains hum", 12.46], ["throbbing", 12.3]], [["hum", 22.92], ["music", 19.77], ["static", 14.41]], [["music", 46.98], ["hum", 10.69], ["ambient music", 8.58]], [["music", 64.93], ["ambient music", 8.33], ["synthesizer", 6.05]], null], "duration": [3.4, 4.19, 9.05, 3.15, 3.21, 37.11]} \ No newline at end of file diff --git a/annotations_filtered/rHvCQEr_ETk_filtered.json b/annotations_filtered/rHvCQEr_ETk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2404e372ede619415e93f53919feba6e0accc822 --- /dev/null +++ b/annotations_filtered/rHvCQEr_ETk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.45], [15.0, 20.71], [22.0, 23.57], [24.0, 24.71], [27.0, 27.75], [28.0, 29.17], [32.0, 35.28], [36.0, 45.64], [53.0, 83.17], [83.0, 83.44], [83.0, 102.59], [104.0, 118.27], [122.0, 123.26], [125.0, 129.95], [130.0, 132.6], [139.0, 141.29], [143.0, 145.71], [147.0, 147.36], [149.0, 149.94], [152.0, 152.79], [153.0, 154.25], [155.0, 156.0], [157.0, 157.64], [159.0, 165.01]], "keep_status": [false, false, false, false, false, false, false, true, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 54.36, 0.0, 0.0, 0.0, 0.0, 65.32, 32.3, 0.0, 0.0, 30.34, 31.98, 0.0, 88.83, 43.77, 85.17, 36.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 35.96], ["groan", 20.1], ["fart", 6.92]], null, null, [["music", 38.34], ["speech", 22.46], ["groan", 7.65]], [["music", 66.95], ["grunt", 8.39], ["musical instrument", 2.59]], null, null, [["speech", 42.75], ["sidetone", 17.39], ["music", 4.73]], null, [["music", 56.56], ["didgeridoo", 10.73], ["foghorn", 3.01]], null, null, null, null, null, null, [["music", 56.02], ["electronic music", 8.64], ["sonar", 4.08]]], "duration": [1.45, 5.71, 1.57, 0.71, 0.75, 1.17, 3.28, 9.64, 30.17, 0.44, 19.59, 14.27, 1.26, 4.95, 2.6, 2.29, 2.71, 0.36, 0.94, 0.79, 1.25, 1.0, 0.64, 6.01]} \ No newline at end of file diff --git a/annotations_filtered/rHwc3Jc9rD8_filtered.json b/annotations_filtered/rHwc3Jc9rD8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c89ae43f0b8501420a6d0ba24e7f221908def3c3 --- /dev/null +++ b/annotations_filtered/rHwc3Jc9rD8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.28], [11.0, 45.12], [46.0, 46.67], [50.0, 52.52], [57.0, 66.38], [71.0, 71.34], [82.0, 82.16], [86.0, 115.55]], "keep_status": [false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 34.42, 30.23, 0.0, 0.0, 30.43], "audiomae_on_audioset": [null, null, null, [["music", 43.11], ["throbbing", 5.11], ["musical instrument", 3.86]], [["music", 84.48], ["ice cream truck, ice cream van", 4.4], ["echo", 1.68]], null, null, [["music", 36.23], ["speech", 33.94], ["ice cream truck, ice cream van", 13.13]]], "duration": [0.28, 34.12, 0.67, 2.52, 9.38, 0.34, 0.16, 29.55]} \ No newline at end of file diff --git a/annotations_filtered/rITjAbXej3o_filtered.json b/annotations_filtered/rITjAbXej3o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9efc9f268a195813ff089ff273197dd8c894d039 --- /dev/null +++ b/annotations_filtered/rITjAbXej3o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 23.5], [35.0, 59.83], [65.0, 67.09], [69.0, 69.77], [72.0, 73.01], [76.0, 75.96], [78.0, 80.81], [82.0, 82.76], [89.0, 89.14], [90.0, 91.76], [97.0, 101.12], [105.0, 105.29], [110.0, 114.03], [116.0, 116.78], [119.0, 120.63], [122.0, 126.52], [130.0, 130.49], [136.0, 137.34], [140.0, 143.06]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 32.06, 59.15, 0.0, 0.0, 0.0, 52.68, 0.0, 0.0, 0.0, 81.53, 0.0, 34.28, 0.0, 0.0, 34.61, 0.0, 0.0, 93.76], "audiomae_on_audioset": [null, [["hum", 23.28], ["music", 15.41], ["rumble", 7.03]], null, null, null, null, null, null, null, null, null, null, [["explosion", 9.88], ["livestock, farm animals, working animals", 9.17], ["rumble", 8.01]], null, null, [["hum", 34.93], ["speech", 17.62], ["throbbing", 15.89]], null, null, null], "duration": [1.5, 24.83, 2.09, 0.77, 1.01, -0.04, 2.81, 0.76, 0.14, 1.76, 4.12, 0.29, 4.03, 0.78, 1.63, 4.52, 0.49, 1.34, 3.06]} \ No newline at end of file diff --git a/annotations_filtered/rIr6rEndy0A_filtered.json b/annotations_filtered/rIr6rEndy0A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..20cb6f179e37184a33c897b3d0bd2c8d72d8817d --- /dev/null +++ b/annotations_filtered/rIr6rEndy0A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.81], [3.0, 3.45], [4.0, 5.07], [8.0, 9.26], [14.0, 14.22], [15.0, 15.84], [17.0, 18.1], [26.0, 26.92], [30.0, 30.21], [32.0, 32.05], [36.0, 38.87], [51.0, 50.7], [52.0, 55.93], [57.0, 59.05], [59.0, 61.32], [62.0, 62.92], [64.0, 64.64], [66.0, 67.61], [69.0, 70.02], [70.0, 72.27], [74.0, 78.71], [79.0, 84.05], [85.0, 86.88], [88.0, 101.36], [104.0, 105.81], [108.0, 110.73], [113.0, 115.35], [118.0, 121.46], [126.0, 129.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.05, 0.0, 30.9, 39.46, 31.58, 0.0, 0.0, 0.0, 0.0, 41.36, 35.51, 34.77, 0.0, 87.55, 0.0, 100.0, 99.96, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 46.57], ["radio", 44.5], ["telephone", 2.24]], null, [["livestock, farm animals, working animals", 22.61], ["moo", 11.98], ["speech", 10.1]], [["hum", 13.65], ["speech", 7.29], ["dishes, pots, and pans", 5.87]], [["speech", 59.79], ["music", 19.25], ["speech synthesizer", 2.94]], null, null, null, null, [["speech", 18.98], ["whale vocalization", 13.18], ["tick", 8.11]], [["speech", 68.8], ["chirp tone", 4.53], ["whale vocalization", 3.59]], [["speech", 88.23], ["noise", 1.93], ["music", 1.11]], null, null, null, null, null, null, null], "duration": [0.81, 0.45, 1.07, 1.26, 0.22, 0.84, 1.1, 0.92, 0.21, 0.05, 2.87, -0.3, 3.93, 2.05, 2.32, 0.92, 0.64, 1.61, 1.02, 2.27, 4.71, 5.05, 1.88, 13.36, 1.81, 2.73, 2.35, 3.46, 3.78]} \ No newline at end of file diff --git a/annotations_filtered/rJCltwaUrXI_filtered.json b/annotations_filtered/rJCltwaUrXI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..47a54522ea0df94a6db6a8ea9e5a75abb9b6dce8 --- /dev/null +++ b/annotations_filtered/rJCltwaUrXI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 15.69], [18.0, 19.23], [26.0, 28.46], [37.0, 37.39], [42.0, 42.87], [43.0, 43.5], [44.0, 44.39], [45.0, 45.74], [64.0, 69.2], [70.0, 72.57], [74.0, 76.0], [80.0, 80.28], [83.0, 84.35], [86.0, 94.22], [96.0, 98.17], [105.0, 105.43], [106.0, 107.45], [110.0, 110.0], [114.0, 117.78], [123.0, 124.46], [137.0, 137.83], [140.0, 141.02]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 32.81, 0.0, 0.0, 0.0, 0.0, 0.0, 33.67, 32.76, 32.84, 0.0, 0.0, 38.7, 34.52, 0.0, 0.0, 0.0, 43.03, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["sidetone", 42.98], ["music", 24.27], ["speech", 10.27]], null, null, null, null, null, [["speech", 60.75], ["rumble", 5.67], ["hum", 3.9]], [["music", 41.71], ["whale vocalization", 10.12], ["noise", 8.53]], [["hum", 15.98], ["music", 15.4], ["speech", 12.22]], null, null, [["hum", 51.65], ["mains hum", 17.93], ["throbbing", 15.23]], [["music", 30.35], ["speech", 17.17], ["mains hum", 10.84]], null, null, null, [["music", 48.76], ["musical instrument", 8.36], ["hum", 5.87]], null, null, null], "duration": [-0.31, 1.23, 2.46, 0.39, 0.87, 0.5, 0.39, 0.74, 5.2, 2.57, 2.0, 0.28, 1.35, 8.22, 2.17, 0.43, 1.45, 0.0, 3.78, 1.46, 0.83, 1.02]} \ No newline at end of file diff --git a/annotations_filtered/rJGOCtlPzUs_filtered.json b/annotations_filtered/rJGOCtlPzUs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ce5f705a21f8e8c55aaaae12df02661e3442986 --- /dev/null +++ b/annotations_filtered/rJGOCtlPzUs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.09], [11.0, 11.74], [14.0, 20.8], [21.0, 21.74], [25.0, 24.78], [27.0, 27.58], [28.0, 28.71], [30.0, 31.72], [35.0, 35.4], [36.0, 37.07], [42.0, 43.92], [46.0, 47.28], [49.0, 63.12], [66.0, 68.34], [71.0, 72.05], [72.0, 74.36], [75.0, 76.05], [77.0, 76.86], [77.0, 78.9], [80.0, 82.58], [86.0, 86.34], [90.0, 90.96], [95.0, 95.3], [97.0, 97.28], [99.0, 99.33], [106.0, 109.34], [110.0, 113.24], [114.0, 116.5], [118.0, 125.63], [127.0, 128.56], [130.0, 130.84], [132.0, 132.65], [134.0, 135.03], [136.0, 140.49]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 46.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.48, 71.87, 0.0, 54.56, 0.0, 0.0, 0.0, 56.93, 0.0, 0.0, 0.0, 0.0, 0.0, 69.88, 62.68, 59.59, 54.83, 0.0, 0.0, 0.0, 0.0, 56.33], "audiomae_on_audioset": [null, null, [["mains hum", 34.19], ["hum", 16.25], ["speech", 16.11]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.09, 0.74, 6.8, 0.74, -0.22, 0.58, 0.71, 1.72, 0.4, 1.07, 1.92, 1.28, 14.12, 2.34, 1.05, 2.36, 1.05, -0.14, 1.9, 2.58, 0.34, 0.96, 0.3, 0.28, 0.33, 3.34, 3.24, 2.5, 7.63, 1.56, 0.84, 0.65, 1.03, 4.49]} \ No newline at end of file diff --git a/annotations_filtered/rJSnxSjZIcA_filtered.json b/annotations_filtered/rJSnxSjZIcA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/rJSnxSjZIcA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/rJWLdQ9vylA_filtered.json b/annotations_filtered/rJWLdQ9vylA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0487d96e4a4a75b2d440125ca3b895331cabe555 --- /dev/null +++ b/annotations_filtered/rJWLdQ9vylA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.66], [4.0, 4.16], [5.0, 5.09], [8.0, 9.68], [13.0, 12.72], [13.0, 14.39], [15.0, 15.97], [17.0, 18.06], [19.0, 19.43], [21.0, 27.21], [28.0, 28.39], [31.0, 31.58], [36.0, 36.48], [37.0, 37.88], [43.0, 43.55], [47.0, 47.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["mains hum", 49.61], ["hum", 35.27], ["throbbing", 7.61]], null, null, null, null, null, null], "duration": [0.66, 0.16, 0.09, 1.68, -0.28, 1.39, 0.97, 1.06, 0.43, 6.21, 0.39, 0.58, 0.48, 0.88, 0.55, 0.09]} \ No newline at end of file diff --git a/annotations_filtered/rKHW39mShF4_filtered.json b/annotations_filtered/rKHW39mShF4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b48b011cee7edfcc88b9a9f88e38a3b3f077367c --- /dev/null +++ b/annotations_filtered/rKHW39mShF4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.91], [5.0, 6.79], [9.0, 9.53], [10.0, 13.47], [15.0, 16.5], [17.0, 17.91], [18.0, 32.05], [34.0, 34.53], [36.0, 36.95], [38.0, 38.4], [43.0, 60.96], [62.0, 62.41], [63.0, 64.42], [65.0, 66.7], [68.0, 68.5], [71.0, 75.39], [76.0, 77.08], [81.0, 128.38], [129.0, 130.35]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.43, 0.0, 0.0, 30.51, 0.0, 0.0, 0.0, 29.89, 0.0, 0.0, 0.0, 0.0, 29.56, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 24.2], ["music", 20.16], ["throbbing", 8.41]], null, null, [["speech", 48.49], ["music", 23.1], ["sidetone", 8.17]], null, null, null, [["speech", 68.81], ["music", 12.07], ["buzz", 1.99]], null, null, null, null, [["music", 25.94], ["hum", 16.35], ["throbbing", 11.38]], null, null, null], "duration": [-0.09, 1.79, 0.53, 3.47, 1.5, 0.91, 14.05, 0.53, 0.95, 0.4, 17.96, 0.41, 1.42, 1.7, 0.5, 4.39, 1.08, 47.38, 1.35]} \ No newline at end of file diff --git a/annotations_filtered/rKUEBIPe5F8_filtered.json b/annotations_filtered/rKUEBIPe5F8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f92b21c2e1aa3e9e79932a18b66b12d25abe44ed --- /dev/null +++ b/annotations_filtered/rKUEBIPe5F8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.45], [11.0, 13.17], [16.0, 17.14], [18.0, 23.4], [25.0, 79.34], [86.0, 103.79], [106.0, 145.15], [147.0, 147.11], [149.0, 154.74], [160.0, 161.27], [170.0, 177.45]], "keep_status": [false, false, false, false, false, true, false, false, true, false, true], "silence_prob": [0.0, 73.82, 0.0, 79.59, 0.0, 36.61, 0.0, 0.0, 30.47, 0.0, 29.88], "audiomae_on_audioset": [null, null, null, null, null, [["music", 38.44], ["speech", 16.64], ["electronic music", 9.03]], null, null, [["music", 53.72], ["sound effect", 6.91], ["hum", 4.99]], null, [["music", 37.83], ["hum", 20.64], ["didgeridoo", 9.67]]], "duration": [0.45, 2.17, 1.14, 5.4, 54.34, 17.79, 39.15, 0.11, 5.74, 1.27, 7.45]} \ No newline at end of file diff --git a/annotations_filtered/rKV-U-HcGVk_filtered.json b/annotations_filtered/rKV-U-HcGVk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..44e9daa75ba0b3e55333ab95a5af1f9ad5feb0a6 --- /dev/null +++ b/annotations_filtered/rKV-U-HcGVk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 31.38], [33.0, 42.18], [53.0, 54.08], [56.0, 56.44], [65.0, 65.87], [74.0, 74.02], [79.0, 81.78], [85.0, 86.34], [88.0, 88.03], [96.0, 98.69], [99.0, 100.97], [109.0, 111.45], [113.0, 113.27], [116.0, 119.4], [121.0, 122.62], [123.0, 127.6], [128.0, 129.25], [132.0, 131.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [91.81, 82.61, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 93.6, 0.0, 100.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [14.38, 9.18, 1.08, 0.44, 0.87, 0.02, 2.78, 1.34, 0.03, 2.69, 1.97, 2.45, 0.27, 3.4, 1.62, 4.6, 1.25, -0.1]} \ No newline at end of file diff --git a/annotations_filtered/rKfOjJJ1ql4_filtered.json b/annotations_filtered/rKfOjJJ1ql4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9decbcd5c0810d4aa4bfd9a88bb29c5a9a972a4b --- /dev/null +++ b/annotations_filtered/rKfOjJJ1ql4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 41.2], [45.0, 76.42], [77.0, 77.52], [78.0, 78.68], [79.0, 80.82], [81.0, 81.5], [82.0, 82.0], [82.0, 82.58], [83.0, 95.54], [96.0, 104.95], [106.0, 116.31], [117.0, 117.04], [118.0, 123.08], [123.0, 124.24], [124.0, 124.5], [126.0, 126.47], [127.0, 127.55], [128.0, 128.61], [129.0, 130.06]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.55, 32.02, 36.91, 0.0, 44.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 55.16], ["whale vocalization", 11.79], ["gurgling", 3.44]], [["music", 23.68], ["percussion", 8.93], ["drum", 6.7]], [["music", 69.06], ["boing", 5.16], ["musical instrument", 2.43]], null, [["music", 51.22], ["whale vocalization", 7.35], ["synthesizer", 3.29]], null, null, null, null, null, null], "duration": [39.2, 31.42, 0.52, 0.68, 1.82, 0.5, 0.0, 0.58, 12.54, 8.95, 10.31, 0.04, 5.08, 1.24, 0.5, 0.47, 0.55, 0.61, 1.06]} \ No newline at end of file diff --git a/annotations_filtered/rKh4muRk_s0_filtered.json b/annotations_filtered/rKh4muRk_s0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7f26670503b0718be8c0a538169bd6ef217f4cd --- /dev/null +++ b/annotations_filtered/rKh4muRk_s0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.15], [10.0, 11.69], [13.0, 13.98], [16.0, 20.04], [22.0, 23.73], [25.0, 45.96], [48.0, 56.62], [59.0, 59.53], [61.0, 81.72], [91.0, 98.59], [99.0, 100.18], [101.0, 101.51], [103.0, 111.0], [113.0, 116.53], [122.0, 126.3], [128.0, 128.75], [130.0, 130.81], [133.0, 137.83], [139.0, 139.53], [150.0, 155.16], [163.0, 164.57], [169.0, 192.6], [194.0, 204.89], [208.0, 209.07], [209.0, 219.47]], "keep_status": [false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, true], "silence_prob": [98.1, 0.0, 0.0, 80.11, 0.0, 28.75, 28.99, 0.0, 28.47, 28.54, 0.0, 0.0, 28.32, 28.27, 28.45, 0.0, 0.0, 28.17, 0.0, 28.45, 0.0, 28.49, 28.38, 0.0, 29.06], "audiomae_on_audioset": [null, null, null, null, null, [["music", 69.92], ["synthesizer", 6.24], ["throbbing", 4.88]], [["speech", 32.95], ["vehicle", 8.5], ["music", 6.42]], null, [["speech", 33.16], ["vehicle", 14.31], ["electric shaver, electric razor", 13.6]], [["music", 68.57], ["throbbing", 10.74], ["electronic music", 10.46]], null, null, [["throbbing", 31.03], ["music", 24.47], ["hum", 17.33]], [["music", 71.46], ["cacophony", 8.5], ["musical instrument", 3.9]], [["speech", 68.38], ["vehicle", 10.39], ["music", 6.27]], null, null, [["speech", 55.03], ["music", 20.79], ["electronic music", 2.54]], null, [["speech", 63.97], ["music", 24.63], ["vehicle", 2.08]], null, [["speech", 19.42], ["burst, pop", 7.83], ["music", 7.05]], [["speech", 31.06], ["music", 24.77], ["outside, rural or natural", 3.37]], null, [["music", 58.3], ["musical instrument", 6.33], ["bowed string instrument", 4.53]]], "duration": [3.15, 1.69, 0.98, 4.04, 1.73, 20.96, 8.62, 0.53, 20.72, 7.59, 1.18, 0.51, 8.0, 3.53, 4.3, 0.75, 0.81, 4.83, 0.53, 5.16, 1.57, 23.6, 10.89, 1.07, 10.47]} \ No newline at end of file diff --git a/annotations_filtered/rKwnRWbuCx4_filtered.json b/annotations_filtered/rKwnRWbuCx4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe12023117ca82ccccca17a41e1f69b5f8f07a7b --- /dev/null +++ b/annotations_filtered/rKwnRWbuCx4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.43], [9.0, 11.87], [14.0, 17.88], [19.0, 28.04], [34.0, 34.72], [36.0, 48.3], [58.0, 58.9], [61.0, 61.53], [64.0, 65.15], [68.0, 68.74], [75.0, 75.98], [89.0, 96.9], [101.0, 101.49], [102.0, 103.47], [106.0, 107.4], [109.0, 111.48], [113.0, 114.39], [117.0, 125.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 45.75, 43.3, 38.83, 0.0, 40.43, 0.0, 0.0, 0.0, 0.0, 0.0, 41.95, 0.0, 0.0, 0.0, 99.4, 0.0, 99.16], "audiomae_on_audioset": [null, [["music", 54.8], ["speech", 12.28], ["sitar", 3.11]], [["music", 77.52], ["theremin", 3.26], ["musical instrument", 2.77]], [["music", 69.44], ["speech", 10.56], ["cattle, bovinae", 2.19]], null, [["music", 64.5], ["theremin", 7.26], ["cello", 4.53]], null, null, null, null, null, [["music", 71.58], ["boing", 3.68], ["speech", 2.05]], null, null, null, null, null, null], "duration": [1.43, 2.87, 3.88, 9.04, 0.72, 12.3, 0.9, 0.53, 1.15, 0.74, 0.98, 7.9, 0.49, 1.47, 1.4, 2.48, 1.39, 8.78]} \ No newline at end of file diff --git a/annotations_filtered/rL1VrbSK0IA_filtered.json b/annotations_filtered/rL1VrbSK0IA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5457ccf6b2fe7e502af8189a6cb17171ee0d6417 --- /dev/null +++ b/annotations_filtered/rL1VrbSK0IA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 15.52], [16.0, 20.31], [22.0, 25.76], [26.0, 31.24], [32.0, 36.32], [37.0, 41.88], [42.0, 45.45], [48.0, 49.05], [53.0, 52.78], [54.0, 55.14], [56.0, 69.89], [74.0, 75.66], [76.0, 78.06], [80.0, 81.5], [82.0, 90.44], [92.0, 104.53], [107.0, 113.53], [115.0, 115.7], [117.0, 119.84]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [56.03, 41.16, 43.93, 83.16, 54.04, 66.27, 79.41, 0.0, 0.0, 0.0, 61.08, 0.0, 59.15, 0.0, 66.63, 29.96, 52.8, 0.0, 53.65], "audiomae_on_audioset": [null, [["music", 24.99], ["hum", 14.21], ["singing bowl", 12.19]], [["speech", 35.58], ["music", 21.77], ["singing bowl", 11.47]], null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 64.7], ["throbbing", 20.5], ["mains hum", 12.22]], null, null, null], "duration": [4.52, 4.31, 3.76, 5.24, 4.32, 4.88, 3.45, 1.05, -0.22, 1.14, 13.89, 1.66, 2.06, 1.5, 8.44, 12.53, 6.53, 0.7, 2.84]} \ No newline at end of file diff --git a/annotations_filtered/rLVwKpyUwWI_filtered.json b/annotations_filtered/rLVwKpyUwWI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..85a7bfa102a94f26c976f77eb827e43437cd6289 --- /dev/null +++ b/annotations_filtered/rLVwKpyUwWI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.43], [14.0, 14.49], [30.0, 31.14], [35.0, 35.04], [35.0, 35.21], [41.0, 42.2], [45.0, 47.48], [60.0, 62.72], [65.0, 66.5], [70.0, 73.62], [88.0, 91.84], [129.0, 140.16]], "keep_status": [false, false, false, false, false, false, true, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.54, 34.93, 0.0, 34.38, 34.04, 32.23], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 52.62], ["boing", 5.38], ["throbbing", 3.3]], [["music", 49.72], ["drum machine", 5.6], ["funk", 4.09]], null, [["music", 73.48], ["musical instrument", 2.3], ["guitar", 1.15]], [["music", 59.47], ["singing", 5.68], ["funk", 2.67]], [["music", 57.75], ["speech", 14.22], ["throbbing", 9.26]]], "duration": [0.43, 0.49, 1.14, 0.04, 0.21, 1.2, 2.48, 2.72, 1.5, 3.62, 3.84, 11.16]} \ No newline at end of file diff --git a/annotations_filtered/rLZ5aVNxV84_filtered.json b/annotations_filtered/rLZ5aVNxV84_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a060ee831ddf0662e6442e248c068dd35163c105 --- /dev/null +++ b/annotations_filtered/rLZ5aVNxV84_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.31], [9.0, 10.79], [15.0, 15.57], [20.0, 21.46], [30.0, 31.94], [36.0, 35.95], [44.0, 48.39], [52.0, 52.3], [76.0, 77.13], [91.0, 91.1], [96.0, 115.77], [116.0, 116.82], [118.0, 123.47], [126.0, 128.19], [131.0, 131.85], [136.0, 135.68], [145.0, 145.02], [147.0, 147.07], [148.0, 148.09], [150.0, 150.42]], "keep_status": [false, false, false, false, false, false, true, false, false, false, true, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.53, 0.0, 0.0, 0.0, 29.96, 0.0, 32.11, 34.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["groan", 25.06], ["whack, thwack", 23.85], ["screaming", 6.53]], null, null, null, [["livestock, farm animals, working animals", 22.22], ["cattle, bovinae", 12.61], ["groan", 11.4]], null, [["whale vocalization", 76.05], ["animal", 2.35], ["mosquito", 2.35]], [["speech", 30.63], ["fly, housefly", 7.27], ["fart", 5.94]], null, null, null, null, null, null], "duration": [0.31, 1.79, 0.57, 1.46, 1.94, -0.05, 4.39, 0.3, 1.13, 0.1, 19.77, 0.82, 5.47, 2.19, 0.85, -0.32, 0.02, 0.07, 0.09, 0.42]} \ No newline at end of file diff --git a/annotations_filtered/rLcAQVgMTSY_filtered.json b/annotations_filtered/rLcAQVgMTSY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1ed305a2c045920a7df437414cdd9d1e98a3786b --- /dev/null +++ b/annotations_filtered/rLcAQVgMTSY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 12.7], [16.0, 31.72], [34.0, 36.85], [39.0, 38.89], [40.0, 44.95], [46.0, 46.21], [47.0, 49.35], [53.0, 53.23], [58.0, 58.14], [61.0, 61.25], [62.0, 62.95], [65.0, 65.87], [68.0, 69.03], [81.0, 83.34], [89.0, 90.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [85.9, 54.36, 88.28, 0.0, 72.31, 0.0, 58.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.3, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.7, 15.72, 2.85, -0.11, 4.95, 0.21, 2.35, 0.23, 0.14, 0.25, 0.95, 0.87, 1.03, 2.34, 1.29]} \ No newline at end of file diff --git a/annotations_filtered/rLtmIBRWQVQ_filtered.json b/annotations_filtered/rLtmIBRWQVQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d535305ca435d0a11b63bcb7ca8dde39290b38c --- /dev/null +++ b/annotations_filtered/rLtmIBRWQVQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 31.01], [32.0, 52.41], [58.0, 58.58], [62.0, 62.11], [66.0, 66.56], [68.0, 68.07], [71.0, 71.66], [84.0, 83.73], [85.0, 85.62], [89.0, 90.71], [97.0, 97.66], [99.0, 99.87], [112.0, 111.62], [116.0, 116.56], [118.0, 119.5], [124.0, 124.92], [126.0, 126.47], [135.0, 135.3], [138.0, 138.03], [141.0, 141.07], [143.0, 143.48], [147.0, 146.84], [148.0, 149.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 34.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 58.13], ["brass instrument", 15.16], ["trombone", 6.34]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.01, 20.41, 0.58, 0.11, 0.56, 0.07, 0.66, -0.27, 0.62, 1.71, 0.66, 0.87, -0.38, 0.56, 1.5, 0.92, 0.47, 0.3, 0.03, 0.07, 0.48, -0.16, 1.52]} \ No newline at end of file diff --git a/annotations_filtered/rM5Bg89j9qo_filtered.json b/annotations_filtered/rM5Bg89j9qo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b604c4697d3c451ade33f0b014a1c32609ef0607 --- /dev/null +++ b/annotations_filtered/rM5Bg89j9qo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[70.0, 74.44]], "keep_status": [true], "silence_prob": [31.29], "audiomae_on_audioset": [[["speech", 50.56], ["rumble", 8.8], ["mains hum", 5.94]]], "duration": [4.44]} \ No newline at end of file diff --git a/annotations_filtered/rMS4ESFlfDk_filtered.json b/annotations_filtered/rMS4ESFlfDk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..77858f10084dcf51453f34eefffe29a728c15a32 --- /dev/null +++ b/annotations_filtered/rMS4ESFlfDk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 23.36], [25.0, 24.98], [29.0, 33.18], [35.0, 48.2], [49.0, 49.22], [52.0, 61.28], [66.0, 68.05], [69.0, 69.92], [76.0, 76.55], [80.0, 80.23], [87.0, 87.2], [92.0, 95.52], [98.0, 113.29]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 99.87, 91.3, 0.0, 31.92, 42.48, 0.0, 0.0, 0.0, 0.0, 83.52, 32.01], "audiomae_on_audioset": [null, null, null, null, null, [["explosion", 16.79], ["livestock, farm animals, working animals", 14.59], ["cattle, bovinae", 14.29]], [["beatboxing", 53.53], ["vocal music", 34.42], ["speech", 1.62]], null, null, null, null, null, [["speech", 42.43], ["snicker", 12.62], ["laughter", 8.6]]], "duration": [0.36, -0.02, 4.18, 13.2, 0.22, 9.28, 2.05, 0.92, 0.55, 0.23, 0.2, 3.52, 15.29]} \ No newline at end of file diff --git a/annotations_filtered/rMWZUV287WA_filtered.json b/annotations_filtered/rMWZUV287WA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9e954b83f9bca10a1352c67eb832e348f738588d --- /dev/null +++ b/annotations_filtered/rMWZUV287WA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 26.2], [29.0, 28.76], [29.0, 37.27], [38.0, 39.16], [42.0, 43.19], [54.0, 54.5], [60.0, 62.75], [63.0, 63.24], [63.0, 63.42], [63.0, 72.5], [77.0, 83.19], [85.0, 94.17], [95.0, 94.73], [95.0, 98.39], [99.0, 99.94], [101.0, 103.28], [105.0, 105.04], [105.0, 105.12], [105.0, 112.23], [117.0, 117.91]], "keep_status": [true, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [38.64, 0.0, 56.18, 0.0, 0.0, 0.0, 32.09, 0.0, 0.0, 30.72, 32.98, 35.64, 0.0, 80.46, 0.0, 90.6, 0.0, 0.0, 43.79, 0.0], "audiomae_on_audioset": [[["hum", 15.54], ["electric shaver, electric razor", 12.07], ["buzz", 11.81]], null, null, null, null, null, [["music", 39.02], ["speech", 22.48], ["splash, splatter", 4.85]], null, null, [["speech", 44.98], ["music", 34.96], ["guitar", 3.01]], [["music", 48.09], ["guitar", 6.34], ["plucked string instrument", 4.74]], [["music", 61.19], ["rowboat, canoe, kayak", 10.48], ["whale vocalization", 4.98]], null, null, null, null, null, null, [["speech", 52.04], ["splash, splatter", 14.69], ["whale vocalization", 11.77]], null], "duration": [11.2, -0.24, 8.27, 1.16, 1.19, 0.5, 2.75, 0.24, 0.42, 9.5, 6.19, 9.17, -0.27, 3.39, 0.94, 2.28, 0.04, 0.12, 7.23, 0.91]} \ No newline at end of file diff --git a/annotations_filtered/rMczYrlPwaw_filtered.json b/annotations_filtered/rMczYrlPwaw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..100d01ddb953decd64f8ad28f839be30bd197aab --- /dev/null +++ b/annotations_filtered/rMczYrlPwaw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.8], [20.0, 21.51], [24.0, 24.26], [26.0, 26.49], [27.0, 27.82], [30.0, 30.3], [32.0, 32.54], [34.0, 34.33], [35.0, 37.1], [39.0, 40.44], [45.0, 44.93], [52.0, 57.25], [58.0, 59.8], [61.0, 63.21], [65.0, 66.75], [68.0, 68.84], [71.0, 72.52], [74.0, 75.51], [78.0, 82.38], [84.0, 84.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.97, 0.0, 0.0, 95.23, 0.0, 82.97, 0.0, 0.0, 0.0, 0.0, 96.89, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.8, 1.51, 0.26, 0.49, 0.82, 0.3, 0.54, 0.33, 2.1, 1.44, -0.07, 5.25, 1.8, 2.21, 1.75, 0.84, 1.52, 1.51, 4.38, 0.54]} \ No newline at end of file diff --git a/annotations_filtered/rMdZw9aBmnY_filtered.json b/annotations_filtered/rMdZw9aBmnY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8876e6159657b0b3dd3910350b78a10832cc9c02 --- /dev/null +++ b/annotations_filtered/rMdZw9aBmnY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.9], [3.0, 5.14], [11.0, 11.94], [16.0, 18.03], [19.0, 20.36], [23.0, 23.6], [29.0, 30.16], [35.0, 35.19], [37.0, 38.6], [44.0, 44.56], [47.0, 47.44], [50.0, 52.39], [55.0, 55.65], [58.0, 58.97], [60.0, 60.62], [62.0, 62.33], [66.0, 67.8], [69.0, 69.97], [72.0, 72.82], [77.0, 77.01], [79.0, 79.2], [80.0, 80.94], [85.0, 85.67], [95.0, 95.22], [97.0, 98.61], [100.0, 100.36], [102.0, 103.59], [108.0, 109.22], [112.0, 112.97], [115.0, 115.15], [116.0, 115.89], [119.0, 120.04], [124.0, 125.34], [127.0, 128.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 99.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.1, 2.14, 0.94, 2.03, 1.36, 0.6, 1.16, 0.19, 1.6, 0.56, 0.44, 2.39, 0.65, 0.97, 0.62, 0.33, 1.8, 0.97, 0.82, 0.01, 0.2, 0.94, 0.67, 0.22, 1.61, 0.36, 1.59, 1.22, 0.97, 0.15, -0.11, 1.04, 1.34, 1.75]} \ No newline at end of file diff --git a/annotations_filtered/rMz7JBRbmNo_filtered.json b/annotations_filtered/rMz7JBRbmNo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..efc640696c765b75ab9cf8c7acb30a6eddc5d12e --- /dev/null +++ b/annotations_filtered/rMz7JBRbmNo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.42], [8.0, 16.82], [17.0, 16.85], [17.0, 16.88], [17.0, 16.92], [17.0, 16.95], [20.0, 25.93], [28.0, 30.67], [31.0, 32.09], [34.0, 33.62], [39.0, 39.51], [40.0, 41.77], [43.0, 43.6], [51.0, 51.7], [54.0, 54.33], [62.0, 62.16], [68.0, 69.28], [85.0, 84.7], [86.0, 86.71], [88.0, 88.86], [97.0, 96.99], [98.0, 98.24], [101.0, 100.85], [127.0, 126.79], [136.0, 138.21], [139.0, 139.67], [140.0, 140.44], [146.0, 145.72], [149.0, 149.23], [154.0, 168.59], [169.0, 169.52], [189.0, 204.09], [205.0, 205.17], [208.0, 209.53], [214.0, 216.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.59, 0.0, 0.0, 0.0, 0.0, 98.19, 93.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.81, 0.0, 0.0, 0.0, 0.0, 98.73, 0.0, 56.03, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.42, 8.82, -0.15, -0.12, -0.08, -0.05, 5.93, 2.67, 1.09, -0.38, 0.51, 1.77, 0.6, 0.7, 0.33, 0.16, 1.28, -0.3, 0.71, 0.86, -0.01, 0.24, -0.15, -0.21, 2.21, 0.67, 0.44, -0.28, 0.23, 14.59, 0.52, 15.09, 0.17, 1.53, 2.04]} \ No newline at end of file diff --git a/annotations_filtered/rNP5uIQxAfY_filtered.json b/annotations_filtered/rNP5uIQxAfY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c2ec852c919a09305105f78018390a67f55d633 --- /dev/null +++ b/annotations_filtered/rNP5uIQxAfY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.29], [13.0, 14.27], [20.0, 20.21], [23.0, 30.2], [33.0, 32.98], [34.0, 34.82], [36.0, 36.49], [38.0, 38.91], [42.0, 42.33], [45.0, 46.28], [47.0, 48.69], [51.0, 50.6], [52.0, 54.51], [55.0, 61.47], [63.0, 63.14], [65.0, 65.62], [67.0, 76.86], [78.0, 96.94], [99.0, 100.85], [103.0, 109.02], [110.0, 110.56], [117.0, 117.34], [118.0, 121.68], [127.0, 127.67], [129.0, 129.56], [136.0, 136.43], [138.0, 142.23], [144.0, 145.08], [148.0, 148.15], [149.0, 149.84]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 47.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 95.37, 0.0, 0.0, 95.64, 83.16, 0.0, 96.89, 0.0, 0.0, 95.64, 0.0, 0.0, 0.0, 99.92, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 18.39], ["glass", 8.26], ["musical instrument", 4.76]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.29, 1.27, 0.21, 7.2, -0.02, 0.82, 0.49, 0.91, 0.33, 1.28, 1.69, -0.4, 2.51, 6.47, 0.14, 0.62, 9.86, 18.94, 1.85, 6.02, 0.56, 0.34, 3.68, 0.67, 0.56, 0.43, 4.23, 1.08, 0.15, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/rNPcxSp5a2o_filtered.json b/annotations_filtered/rNPcxSp5a2o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5914fac945a3610406f7e110938475a72e6a52b1 --- /dev/null +++ b/annotations_filtered/rNPcxSp5a2o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 17.61], [19.0, 27.04], [28.0, 33.54], [35.0, 96.65], [99.0, 100.5], [101.0, 103.11], [112.0, 115.42], [117.0, 135.11], [135.0, 135.68], [136.0, 137.74], [139.0, 140.14]], "keep_status": [true, true, false, false, false, false, true, true, false, false, false], "silence_prob": [46.9, 37.99, 89.72, 0.0, 0.0, 63.74, 38.64, 32.7, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 51.7], ["hum", 10.4], ["throbbing", 7.08]], [["speech", 47.89], ["music", 7.21], ["vehicle", 4.81]], null, null, null, null, [["speech", 34.5], ["music", 23.22], ["thunk", 5.3]], [["throbbing", 32.83], ["hum", 17.75], ["music", 13.27]], null, null, null], "duration": [15.61, 8.04, 5.54, 61.65, 1.5, 2.11, 3.42, 18.11, 0.68, 1.74, 1.14]} \ No newline at end of file diff --git a/annotations_filtered/rNmmNleiY_4_filtered.json b/annotations_filtered/rNmmNleiY_4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4ad944fbaf17d2d9c21374cacd93a55a2565743d --- /dev/null +++ b/annotations_filtered/rNmmNleiY_4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.72], [4.0, 4.65], [8.0, 8.18], [17.0, 16.87], [18.0, 18.69], [23.0, 22.87], [28.0, 28.09], [32.0, 32.71], [50.0, 49.89], [53.0, 53.33], [57.0, 56.84], [61.0, 61.65], [64.0, 64.64], [66.0, 66.95], [69.0, 69.92], [75.0, 75.86], [76.0, 76.98], [77.0, 82.29], [97.0, 96.99], [105.0, 104.75], [125.0, 126.05], [132.0, 132.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [63.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.17, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 58.91], ["drum machine", 10.45], ["synthesizer", 8.24]], null, null, null, null], "duration": [2.72, 0.65, 0.18, -0.13, 0.69, -0.13, 0.09, 0.71, -0.11, 0.33, -0.16, 0.65, 0.64, 0.95, 0.92, 0.86, 0.98, 5.29, -0.01, -0.25, 1.05, 0.24]} \ No newline at end of file diff --git a/annotations_filtered/rNoHdt36C7o_filtered.json b/annotations_filtered/rNoHdt36C7o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..79998fa375ac53cd8153e670f2eec4f20847789d --- /dev/null +++ b/annotations_filtered/rNoHdt36C7o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.3], [12.0, 13.29], [14.0, 14.57], [17.0, 17.41], [20.0, 20.12], [22.0, 25.39], [27.0, 29.44], [31.0, 31.35], [32.0, 33.69], [36.0, 37.91], [41.0, 41.67], [47.0, 53.49], [54.0, 55.38], [56.0, 56.91], [58.0, 58.77], [60.0, 62.29], [65.0, 64.84], [69.0, 71.95], [73.0, 74.56], [76.0, 80.0], [81.0, 82.39], [83.0, 86.05]], "keep_status": [false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, true, false, true, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 31.17, 30.83, 0.0, 0.0, 0.0, 0.0, 30.95, 0.0, 0.0, 0.0, 30.93, 0.0, 30.74, 0.0, 30.85, 0.0, 30.95], "audiomae_on_audioset": [null, null, null, null, null, [["music", 43.59], ["hum", 9.5], ["electronic music", 8.6]], [["frog", 11.47], ["throbbing", 11.05], ["didgeridoo", 10.83]], null, null, null, null, [["hum", 43.05], ["throbbing", 29.53], ["mains hum", 7.48]], null, null, null, [["chirp tone", 29.19], ["sine wave", 14.08], ["hum", 10.51]], null, [["hum", 22.44], ["music", 19.68], ["mains hum", 14.21]], null, [["hum", 37.84], ["mains hum", 15.17], ["sine wave", 7.73]], null, [["music", 28.45], ["chirp tone", 21.23], ["hum", 11.99]]], "duration": [0.3, 1.29, 0.57, 0.41, 0.12, 3.39, 2.44, 0.35, 1.69, 1.91, 0.67, 6.49, 1.38, 0.91, 0.77, 2.29, -0.16, 2.95, 1.56, 4.0, 1.39, 3.05]} \ No newline at end of file diff --git a/annotations_filtered/rNxqb6KMtkg_filtered.json b/annotations_filtered/rNxqb6KMtkg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..779527c2bd6fff35a75dd8b344e2d3645a5c8582 --- /dev/null +++ b/annotations_filtered/rNxqb6KMtkg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.68], [16.0, 16.23], [18.0, 19.53], [21.0, 21.54], [29.0, 32.39], [35.0, 37.1], [39.0, 40.14], [44.0, 44.93], [46.0, 47.02], [49.0, 49.49], [50.0, 50.65], [53.0, 54.43], [57.0, 57.08], [59.0, 64.18], [65.0, 73.14], [76.0, 78.63]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [40.73, 0.0, 0.0, 0.0, 98.1, 96.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.72, 30.77, 95.78], "audiomae_on_audioset": [[["speech", 29.41], ["siren", 14.59], ["emergency vehicle", 5.95]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 60.71], ["music", 7.12], ["hum", 4.92]], null], "duration": [2.68, 0.23, 1.53, 0.54, 3.39, 2.1, 1.14, 0.93, 1.02, 0.49, 0.65, 1.43, 0.08, 5.18, 8.14, 2.63]} \ No newline at end of file diff --git a/annotations_filtered/rOaNhtHWULw_filtered.json b/annotations_filtered/rOaNhtHWULw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7940c6c880c02d22540f07524b88131a741c99fb --- /dev/null +++ b/annotations_filtered/rOaNhtHWULw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.87], [20.0, 21.84], [23.0, 29.3], [30.0, 37.88], [41.0, 64.74], [67.0, 67.66], [68.0, 71.52], [78.0, 78.48], [79.0, 94.29], [95.0, 105.53], [107.0, 109.61]], "keep_status": [false, false, false, false, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 37.27, 85.72, 49.5, 0.0, 82.97, 0.0, 45.3, 88.64, 94.81], "audiomae_on_audioset": [null, null, [["music", 48.18], ["noise", 26.54], ["didgeridoo", 2.17]], null, [["speech", 22.48], ["music", 16.83], ["burping, eructation", 4.4]], null, null, null, [["mosquito", 17.82], ["fly, housefly", 17.64], ["music", 15.52]], null, null], "duration": [1.87, 1.84, 6.3, 7.88, 23.74, 0.66, 3.52, 0.48, 15.29, 10.53, 2.61]} \ No newline at end of file diff --git a/annotations_filtered/rOoBvxdO0Ac_filtered.json b/annotations_filtered/rOoBvxdO0Ac_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0afbd461752f25e895dfab1ef32833e378747aea --- /dev/null +++ b/annotations_filtered/rOoBvxdO0Ac_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.9], [9.0, 11.85], [13.0, 16.23], [17.0, 17.76], [19.0, 20.09], [23.0, 25.51], [29.0, 30.69], [35.0, 38.48], [43.0, 43.83], [44.0, 44.59], [47.0, 48.46], [51.0, 63.1], [66.0, 66.04], [69.0, 71.29], [73.0, 73.89], [75.0, 75.83], [76.0, 77.21], [79.0, 78.8], [81.0, 80.79], [83.0, 85.65], [86.0, 86.26], [93.0, 93.31], [95.0, 96.35], [97.0, 97.87], [100.0, 100.33], [101.0, 104.18], [110.0, 110.56], [112.0, 112.36], [114.0, 114.27], [116.0, 117.63], [118.0, 119.52], [124.0, 129.12], [139.0, 141.66], [144.0, 146.08], [150.0, 153.33], [156.0, 155.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 63.53, 57.48, 0.0, 0.0, 92.97, 0.0, 54.17, 0.0, 0.0, 0.0, 34.82, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.97, 0.0, 0.0, 0.0, 0.0, 0.0, 31.35, 30.5, 65.09, 78.55, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 64.06], ["trombone", 7.64], ["brass instrument", 6.96]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 38.58], ["didgeridoo", 13.3], ["groan", 7.76]], [["music", 42.19], ["synthesizer", 10.96], ["speech", 8.55]], null, null, null], "duration": [1.9, 2.85, 3.23, 0.76, 1.09, 2.51, 1.69, 3.48, 0.83, 0.59, 1.46, 12.1, 0.04, 2.29, 0.89, 0.83, 1.21, -0.2, -0.21, 2.65, 0.26, 0.31, 1.35, 0.87, 0.33, 3.18, 0.56, 0.36, 0.27, 1.63, 1.52, 5.12, 2.66, 2.08, 3.33, -0.02]} \ No newline at end of file diff --git a/annotations_filtered/rOzJnj3UmNE_filtered.json b/annotations_filtered/rOzJnj3UmNE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ee60b9db5a9fab3fa26b27599c9956ea7c2343e --- /dev/null +++ b/annotations_filtered/rOzJnj3UmNE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 12.11], [15.0, 32.9], [37.0, 37.5], [38.0, 39.68], [40.0, 41.17], [41.0, 42.26], [43.0, 50.85], [54.0, 53.6], [54.0, 54.97], [57.0, 57.97], [58.0, 58.31], [59.0, 60.07], [62.0, 73.16], [74.0, 84.35], [86.0, 116.97], [118.0, 130.27], [131.0, 143.04], [143.0, 143.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.73, 68.67, 0.0, 0.0, 0.0, 0.0, 62.17, 0.0, 0.0, 0.0, 0.0, 0.0, 36.38, 39.38, 0.0, 42.39, 31.63, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 32.83], ["hum", 22.05], ["mains hum", 21.43]], [["hum", 33.66], ["music", 23.25], ["throbbing", 18.96]], null, [["music", 47.3], ["hum", 14.8], ["rumble", 10.47]], [["music", 45.64], ["hum", 18.37], ["throbbing", 10.78]], null], "duration": [5.11, 17.9, 0.5, 1.68, 1.17, 1.26, 7.85, -0.4, 0.97, 0.97, 0.31, 1.07, 11.16, 10.35, 30.97, 12.27, 12.04, 0.5]} \ No newline at end of file diff --git a/annotations_filtered/rP0QURktz3Y_filtered.json b/annotations_filtered/rP0QURktz3Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..346c04b13c21c9c306bbed447953a16fe56e1666 --- /dev/null +++ b/annotations_filtered/rP0QURktz3Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.61], [7.0, 12.95], [16.0, 22.06], [24.0, 26.5], [28.0, 32.83], [35.0, 41.79], [42.0, 44.64]], "keep_status": [false, true, true, true, false, true, true], "silence_prob": [41.2, 36.44, 39.83, 32.62, 37.99, 37.82, 33.63], "audiomae_on_audioset": [[["mains hum", 37.52], ["hum", 32.02], ["throbbing", 6.23]], [["speech", 30.53], ["mains hum", 17.58], ["music", 10.9]], [["speech", 31.13], ["mains hum", 14.0], ["hum", 12.23]], [["speech", 41.82], ["hum", 17.96], ["mains hum", 7.46]], [["speech", 56.95], ["hum", 9.84], ["throbbing", 4.71]], [["mains hum", 23.96], ["hum", 23.3], ["didgeridoo", 17.01]], [["music", 15.6], ["speech", 14.55], ["theremin", 11.37]]], "duration": [2.61, 5.95, 6.06, 2.5, 4.83, 6.79, 2.64]} \ No newline at end of file diff --git a/annotations_filtered/rPh94cOW-MI_filtered.json b/annotations_filtered/rPh94cOW-MI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..78a1fe56022ba362d0fdbec56e18d5b199e3a4c8 --- /dev/null +++ b/annotations_filtered/rPh94cOW-MI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.4], [12.0, 14.17], [19.0, 25.1], [30.0, 34.96], [38.0, 39.34], [44.0, 45.55], [50.0, 50.8], [52.0, 52.79], [54.0, 55.12], [59.0, 60.59], [63.0, 63.53], [65.0, 67.68], [71.0, 71.49], [77.0, 78.54], [80.0, 81.5], [84.0, 84.08], [85.0, 87.4], [90.0, 90.71], [95.0, 96.4], [97.0, 99.15], [101.0, 102.3], [105.0, 111.57], [114.0, 113.85], [115.0, 115.69], [117.0, 118.71], [120.0, 120.21], [123.0, 122.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 44.43, 43.2, 38.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.18, 0.0, 0.0, 0.0, 0.0, 43.33, 0.0, 0.0, 51.28, 0.0, 51.28, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 50.63], ["theremin", 17.78], ["effects unit", 5.56]], [["music", 74.08], ["fart", 3.16], ["grunt", 1.89]], [["music", 55.46], ["synthesizer", 10.61], ["didgeridoo", 8.11]], null, null, null, null, null, null, null, [["music", 51.69], ["theremin", 18.01], ["effects unit", 5.26]], null, null, null, null, [["music", 29.26], ["theremin", 7.64], ["mosquito", 6.24]], null, null, null, null, null, null, null, null, null, null], "duration": [0.4, 2.17, 6.1, 4.96, 1.34, 1.55, 0.8, 0.79, 1.12, 1.59, 0.53, 2.68, 0.49, 1.54, 1.5, 0.08, 2.4, 0.71, 1.4, 2.15, 1.3, 6.57, -0.15, 0.69, 1.71, 0.21, -0.14]} \ No newline at end of file diff --git a/annotations_filtered/rPuW7T25Yuw_filtered.json b/annotations_filtered/rPuW7T25Yuw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9a097e21a41e1780e734bad97a07dd2b2f95142d --- /dev/null +++ b/annotations_filtered/rPuW7T25Yuw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.62], [8.0, 9.73], [11.0, 15.84], [19.0, 19.52], [23.0, 23.41], [24.0, 26.42], [27.0, 28.44], [32.0, 34.08], [34.0, 34.5], [35.0, 34.62], [35.0, 36.73], [39.0, 39.56], [41.0, 42.65], [45.0, 47.56], [49.0, 56.02], [58.0, 58.83], [61.0, 62.38], [65.0, 68.77], [69.0, 69.38], [70.0, 70.44], [70.0, 70.51], [71.0, 76.87], [86.0, 85.67], [89.0, 93.11], [96.0, 95.89], [98.0, 109.26], [112.0, 114.88], [116.0, 123.8]], "keep_status": [true, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [42.39, 0.0, 42.19, 0.0, 0.0, 36.22, 0.0, 36.7, 0.0, 0.0, 0.0, 0.0, 0.0, 45.4, 42.39, 0.0, 0.0, 37.28, 0.0, 0.0, 0.0, 35.85, 0.0, 36.69, 0.0, 43.71, 51.82, 50.16], "audiomae_on_audioset": [[["music", 47.33], ["didgeridoo", 8.1], ["speech", 4.92]], null, [["music", 31.19], ["speech", 29.57], ["didgeridoo", 5.33]], null, null, [["music", 76.73], ["speech", 5.78], ["throbbing", 2.53]], null, [["music", 28.38], ["hum", 10.97], ["mains hum", 8.41]], null, null, null, null, null, [["music", 78.95], ["musical instrument", 2.85], ["electronic music", 0.88]], [["music", 63.89], ["didgeridoo", 7.34], ["speech", 3.56]], null, null, [["music", 80.56], ["didgeridoo", 2.37], ["musical instrument", 1.71]], null, null, null, [["music", 54.84], ["didgeridoo", 10.03], ["speech", 9.8]], null, [["music", 55.13], ["hum", 11.1], ["mains hum", 8.9]], null, [["music", 63.26], ["theremin", 14.32], ["didgeridoo", 9.4]], null, null], "duration": [2.62, 1.73, 4.84, 0.52, 0.41, 2.42, 1.44, 2.08, 0.5, -0.38, 1.73, 0.56, 1.65, 2.56, 7.02, 0.83, 1.38, 3.77, 0.38, 0.44, 0.51, 5.87, -0.33, 4.11, -0.11, 11.26, 2.88, 7.8]} \ No newline at end of file diff --git a/annotations_filtered/rQ3Qokn9t_w_filtered.json b/annotations_filtered/rQ3Qokn9t_w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4600af2e89eb6b9cf159de7168cce4a5ba22bf00 --- /dev/null +++ b/annotations_filtered/rQ3Qokn9t_w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.6], [10.0, 23.99], [25.0, 59.9], [60.0, 61.48], [63.0, 102.61], [110.0, 113.14], [115.0, 122.01], [122.0, 122.59], [126.0, 127.99], [129.0, 129.73], [132.0, 131.94]], "keep_status": [false, false, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 41.87, 0.0, 0.0, 0.0, 30.58, 29.37, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 29.32], ["mains hum", 26.33], ["throbbing", 15.31]], null, null, null, [["speech", 53.03], ["beatboxing", 6.94], ["music", 5.28]], [["speech", 27.85], ["fly, housefly", 11.94], ["insect", 8.58]], null, null, null, null], "duration": [1.6, 13.99, 34.9, 1.48, 39.61, 3.14, 7.01, 0.59, 1.99, 0.73, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/rQ7oKh5K7K4_filtered.json b/annotations_filtered/rQ7oKh5K7K4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18ef5f41bc1ac941af3572944f4676b70e6bffd1 --- /dev/null +++ b/annotations_filtered/rQ7oKh5K7K4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.49], [6.0, 13.07], [13.0, 15.23], [17.0, 23.89], [26.0, 35.33], [42.0, 42.5], [44.0, 48.19], [48.0, 54.03]], "keep_status": [false, false, false, false, false, false, true, false], "silence_prob": [0.0, 34.06, 34.58, 31.82, 30.92, 0.0, 32.44, 31.16], "audiomae_on_audioset": [null, [["music", 45.66], ["didgeridoo", 15.01], ["speech", 11.44]], [["music", 72.1], ["throbbing", 6.27], ["musical instrument", 3.57]], [["music", 39.33], ["throbbing", 37.01], ["hum", 11.72]], [["music", 53.24], ["speech", 11.98], ["telephone", 10.27]], null, [["speech", 19.7], ["music", 14.94], ["throbbing", 14.11]], [["music", 62.53], ["speech", 12.96], ["throbbing", 9.73]]], "duration": [0.49, 7.07, 2.23, 6.89, 9.33, 0.5, 4.19, 6.03]} \ No newline at end of file diff --git a/annotations_filtered/rQABiLDqdVc_filtered.json b/annotations_filtered/rQABiLDqdVc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b762d6d160c4d8679bb6874a9828ffaaa0de1de2 --- /dev/null +++ b/annotations_filtered/rQABiLDqdVc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.84], [20.0, 21.0], [24.0, 34.47], [41.0, 52.14], [58.0, 67.54], [68.0, 85.14], [86.0, 115.99]], "keep_status": [false, false, true, false, true, true, false], "silence_prob": [0.0, 0.0, 29.66, 29.7, 29.89, 30.45, 30.5], "audiomae_on_audioset": [null, null, [["speech", 42.08], ["music", 16.79], ["eruption", 7.56]], [["speech", 45.97], ["explosion", 18.81], ["music", 14.06]], [["throbbing", 22.87], ["hum", 19.85], ["music", 13.4]], [["fart", 16.5], ["music", 14.5], ["speech", 14.24]], [["throbbing", 30.07], ["speech", 23.38], ["hum", 20.99]]], "duration": [0.84, 1.0, 10.47, 11.14, 9.54, 17.14, 29.99]} \ No newline at end of file diff --git a/annotations_filtered/rQOBwQbssgo_filtered.json b/annotations_filtered/rQOBwQbssgo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e6170ec17d8a3c55fca8983c83be962e0f6351d --- /dev/null +++ b/annotations_filtered/rQOBwQbssgo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.94], [7.0, 7.45], [15.0, 14.96], [17.0, 19.94], [24.0, 24.85], [32.0, 32.41], [35.0, 35.13], [35.0, 36.09], [40.0, 40.49], [41.0, 41.45], [48.0, 49.18], [51.0, 53.5], [60.0, 60.79], [62.0, 62.92], [75.0, 83.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 56.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.1, 0.0, 0.0, 43.56], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sine wave", 34.84], ["cough", 14.91], ["burping, eructation", 10.33]]], "duration": [0.94, 0.45, -0.04, 2.94, 0.85, 0.41, 0.13, 1.09, 0.49, 0.45, 1.18, 2.5, 0.79, 0.92, 8.19]} \ No newline at end of file diff --git a/annotations_filtered/rQP1duR2tf4_filtered.json b/annotations_filtered/rQP1duR2tf4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7fdae975024d131aa174e76ab2ba8814b1d5abf6 --- /dev/null +++ b/annotations_filtered/rQP1duR2tf4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 32.68], [35.0, 35.95], [42.0, 42.43], [43.0, 44.66], [49.0, 50.31], [51.0, 59.93], [61.0, 61.48], [62.0, 66.56], [68.0, 69.67], [72.0, 74.95], [77.0, 81.58], [83.0, 83.61], [84.0, 84.94], [86.0, 86.04], [88.0, 90.53], [92.0, 92.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 35.51, 0.0, 94.66, 0.0, 94.66, 99.05, 0.0, 0.0, 0.0, 85.9, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 88.94], ["electric shaver, electric razor", 1.37], ["male speech, man speaking", 1.28]], null, null, null, null, null, null, null, null, null, null], "duration": [1.68, 0.95, 0.43, 1.66, 1.31, 8.93, 0.48, 4.56, 1.67, 2.95, 4.58, 0.61, 0.94, 0.04, 2.53, 0.8]} \ No newline at end of file diff --git a/annotations_filtered/rQWpTKfljVg_filtered.json b/annotations_filtered/rQWpTKfljVg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3b9b2023d6f7802874fe906fbed7bc8ec5a5a4c --- /dev/null +++ b/annotations_filtered/rQWpTKfljVg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.73], [7.0, 7.6], [9.0, 8.82], [9.0, 13.93], [15.0, 15.74], [17.0, 18.08], [19.0, 20.04], [21.0, 21.71], [25.0, 32.97], [35.0, 36.48], [40.0, 40.85], [46.0, 49.38], [51.0, 64.35], [68.0, 72.77], [74.0, 75.71], [76.0, 77.14], [80.0, 80.32], [81.0, 81.67], [86.0, 87.0], [90.0, 92.97], [95.0, 98.69], [100.0, 101.44], [102.0, 102.24], [104.0, 105.12], [106.0, 107.3], [108.0, 108.5], [113.0, 113.8], [121.0, 121.73], [123.0, 124.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 88.64, 0.0, 0.0, 0.0, 0.0, 93.45, 0.0, 0.0, 97.64, 75.72, 91.98, 0.0, 0.0, 0.0, 0.0, 0.0, 98.19, 99.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.73, 0.6, -0.18, 4.93, 0.74, 1.08, 1.04, 0.71, 7.97, 1.48, 0.85, 3.38, 13.35, 4.77, 1.71, 1.14, 0.32, 0.67, 1.0, 2.97, 3.69, 1.44, 0.24, 1.12, 1.3, 0.5, 0.8, 0.73, 1.07]} \ No newline at end of file diff --git a/annotations_filtered/rQbj9uvYL8I_filtered.json b/annotations_filtered/rQbj9uvYL8I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8a75665ffd90eaee79aa56ad6c616a80f00ee53c --- /dev/null +++ b/annotations_filtered/rQbj9uvYL8I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.37], [11.0, 11.06], [12.0, 12.99], [21.0, 21.98], [24.0, 24.02], [46.0, 50.21], [50.0, 50.28], [50.0, 50.31], [53.0, 88.69]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 33.61, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 40.22], ["speech", 21.09], ["didgeridoo", 12.64]], null, null, null], "duration": [0.37, 0.06, 0.99, 0.98, 0.02, 4.21, 0.28, 0.31, 35.69]} \ No newline at end of file diff --git a/annotations_filtered/rRLP7r6OuYE_filtered.json b/annotations_filtered/rRLP7r6OuYE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..99870b685425d949e0c1694509378e9b17441c08 --- /dev/null +++ b/annotations_filtered/rRLP7r6OuYE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.06], [4.0, 6.62], [9.0, 11.47], [14.0, 14.86], [17.0, 18.05], [19.0, 20.06], [21.0, 22.0], [23.0, 23.85], [25.0, 31.62], [33.0, 36.0], [36.0, 38.55], [40.0, 43.51], [44.0, 45.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 94.81, 57.01, 0.0, 0.0, 0.0, 0.0, 0.0, 69.2, 74.76, 47.5, 81.17, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 43.83], ["hum", 8.29], ["busy signal", 7.79]], null, null], "duration": [1.06, 2.62, 2.47, 0.86, 1.05, 1.06, 1.0, 0.85, 6.62, 3.0, 2.55, 3.51, 1.4]} \ No newline at end of file diff --git a/annotations_filtered/rRUVmTXpPyg_filtered.json b/annotations_filtered/rRUVmTXpPyg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3d432fcb5ce89854be2bcb3135fc00d57fca9ef --- /dev/null +++ b/annotations_filtered/rRUVmTXpPyg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.91], [7.0, 8.09], [11.0, 11.42], [14.0, 14.61], [17.0, 20.56], [23.0, 24.21], [25.0, 26.57], [31.0, 31.31], [34.0, 35.5], [37.0, 37.49], [38.0, 40.49], [47.0, 47.16], [52.0, 53.0], [63.0, 67.64], [83.0, 83.54], [85.0, 87.3], [92.0, 98.29], [99.0, 101.95], [102.0, 111.79], [114.0, 114.49], [115.0, 127.57], [130.0, 130.1], [138.0, 151.41], [154.0, 158.19], [161.0, 161.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, true, false, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 71.57, 0.0, 0.0, 0.0, 0.0, 0.0, 33.31, 0.0, 0.0, 30.35, 0.0, 31.22, 30.21, 29.96, 30.55, 0.0, 29.9, 0.0, 29.16, 32.87, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["mosquito", 35.46], ["fly, housefly", 26.34], ["insect", 10.65]], null, null, [["livestock, farm animals, working animals", 32.76], ["cowbell", 15.75], ["music", 11.84]], null, [["music", 44.74], ["brass instrument", 8.65], ["musical instrument", 8.52]], [["music", 49.94], ["didgeridoo", 11.48], ["musical instrument", 6.43]], [["foghorn", 16.93], ["speech", 8.41], ["mosquito", 8.38]], [["fly, housefly", 48.4], ["insect", 19.9], ["buzz", 11.7]], null, [["fly, housefly", 28.05], ["insect", 10.84], ["music", 10.59]], null, [["music", 40.5], ["speech", 10.84], ["race car, auto racing", 7.8]], [["hum", 41.94], ["music", 17.3], ["mains hum", 14.34]], null], "duration": [1.91, 1.09, 0.42, 0.61, 3.56, 1.21, 1.57, 0.31, 1.5, 0.49, 2.49, 0.16, 1.0, 4.64, 0.54, 2.3, 6.29, 2.95, 9.79, 0.49, 12.57, 0.1, 13.41, 4.19, 0.6]} \ No newline at end of file diff --git a/annotations_filtered/rRUuycF5FTU_filtered.json b/annotations_filtered/rRUuycF5FTU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b25166ede339a89f091a0aa50c53d49c5518ad7 --- /dev/null +++ b/annotations_filtered/rRUuycF5FTU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.6], [13.0, 21.17], [22.0, 23.58], [25.0, 31.26], [32.0, 45.5], [49.0, 50.58], [53.0, 63.27], [64.0, 67.88], [69.0, 69.55], [74.0, 86.86], [91.0, 91.89], [93.0, 94.34], [96.0, 95.57], [96.0, 102.3], [103.0, 104.43], [106.0, 107.0], [108.0, 115.69], [117.0, 118.83]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [46.05, 81.53, 0.0, 85.17, 98.8, 0.0, 99.71, 88.28, 0.0, 79.76, 0.0, 0.0, 0.0, 72.46, 0.0, 0.0, 83.52, 0.0], "audiomae_on_audioset": [[["speech", 24.06], ["animal", 10.93], ["crow", 7.43]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.6, 8.17, 1.58, 6.26, 13.5, 1.58, 10.27, 3.88, 0.55, 12.86, 0.89, 1.34, -0.43, 6.3, 1.43, 1.0, 7.69, 1.83]} \ No newline at end of file diff --git a/annotations_filtered/rRaHWuWTtG8_filtered.json b/annotations_filtered/rRaHWuWTtG8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..93d5ad0f15b009c30db1a19cbfaca469400138c7 --- /dev/null +++ b/annotations_filtered/rRaHWuWTtG8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.15], [26.0, 26.62], [30.0, 34.82], [36.0, 57.1], [59.0, 59.04], [59.0, 59.1], [60.0, 65.89], [67.0, 69.43], [71.0, 72.84], [78.0, 78.6], [79.0, 79.35], [80.0, 80.38], [81.0, 81.11], [82.0, 82.65], [90.0, 90.71], [92.0, 93.24], [94.0, 94.76], [99.0, 100.35], [101.0, 110.78], [112.0, 118.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [34.48, 0.0, 78.89, 76.04, 0.0, 0.0, 76.86, 87.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.09, 92.48], "audiomae_on_audioset": [[["breaking", 36.48], ["sidetone", 26.56], ["speech", 16.92]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.15, 0.62, 4.82, 21.1, 0.04, 0.1, 5.89, 2.43, 1.84, 0.6, 0.35, 0.38, 0.11, 0.65, 0.71, 1.24, 0.76, 1.35, 9.78, 6.98]} \ No newline at end of file diff --git a/annotations_filtered/rRlfzy7Rxdo_filtered.json b/annotations_filtered/rRlfzy7Rxdo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4b8b507bb5c4713b147283630251fbaa3e842086 --- /dev/null +++ b/annotations_filtered/rRlfzy7Rxdo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[140.0, 142.62], [143.0, 145.12], [146.0, 147.97], [149.0, 151.09], [152.0, 167.81], [172.0, 172.69]], "keep_status": [true, true, false, false, true, false], "silence_prob": [38.87, 37.77, 0.0, 36.72, 29.14, 0.0], "audiomae_on_audioset": [[["hum", 27.31], ["music", 24.71], ["mains hum", 7.04]], [["hum", 32.2], ["throbbing", 19.1], ["music", 15.72]], null, [["hum", 32.06], ["music", 23.56], ["throbbing", 17.79]], [["hum", 40.4], ["mains hum", 15.39], ["throbbing", 10.77]], null], "duration": [2.62, 2.12, 1.97, 2.09, 15.81, 0.69]} \ No newline at end of file diff --git a/annotations_filtered/rRuulhJ2ARQ_filtered.json b/annotations_filtered/rRuulhJ2ARQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3746baec07aed264cf84a4fedddae0e5c8156e0b --- /dev/null +++ b/annotations_filtered/rRuulhJ2ARQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 16.43], [17.0, 17.32], [18.0, 68.57], [69.0, 112.99], [114.0, 142.77], [143.0, 143.46], [144.0, 145.35], [146.0, 147.16], [150.0, 171.76]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [57.89, 0.0, 0.0, 0.0, 72.6, 0.0, 0.0, 0.0, 34.29], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 66.86], ["scary music", 8.57], ["ambient music", 7.34]]], "duration": [3.43, 0.32, 50.57, 43.99, 28.77, 0.46, 1.35, 1.16, 21.76]} \ No newline at end of file diff --git a/annotations_filtered/rS-P78D5US4_filtered.json b/annotations_filtered/rS-P78D5US4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a7715d7ba2ab217f0f2570a96784fdfda1fda714 --- /dev/null +++ b/annotations_filtered/rS-P78D5US4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.96], [45.0, 45.76], [48.0, 47.58], [48.0, 47.73], [68.0, 68.05], [78.0, 78.73], [126.0, 126.6], [129.0, 130.23], [137.0, 137.15]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [57.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [3.96, 0.76, -0.42, -0.27, 0.05, 0.73, 0.6, 1.23, 0.15]} \ No newline at end of file diff --git a/annotations_filtered/rS3VUoThFBw_filtered.json b/annotations_filtered/rS3VUoThFBw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e8b78e90ccec4cbc60b16b363c8baaabe56b1ccb --- /dev/null +++ b/annotations_filtered/rS3VUoThFBw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 28.8], [34.0, 41.05], [41.0, 53.42], [54.0, 55.27], [56.0, 58.55], [61.0, 72.67], [76.0, 122.55], [123.0, 125.83], [127.0, 127.79]], "keep_status": [false, false, false, false, true, false, false, false, false], "silence_prob": [38.43, 45.05, 45.33, 0.0, 49.18, 44.34, 0.0, 89.9, 0.0], "audiomae_on_audioset": [[["speech", 42.84], ["music", 28.49], ["sidetone", 9.54]], [["music", 67.5], ["musical instrument", 7.45], ["speech", 6.82]], [["music", 45.7], ["whale vocalization", 19.59], ["synthesizer", 4.8]], null, [["music", 37.19], ["speech", 12.66], ["boing", 7.02]], [["music", 43.39], ["speech", 23.3], ["theremin", 6.04]], null, null, null], "duration": [8.8, 7.05, 12.42, 1.27, 2.55, 11.67, 46.55, 2.83, 0.79]} \ No newline at end of file diff --git a/annotations_filtered/rSB9VJcwQsc_filtered.json b/annotations_filtered/rSB9VJcwQsc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/rSB9VJcwQsc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/rSCm0viS2mM_filtered.json b/annotations_filtered/rSCm0viS2mM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b6261543329fceb81e72398d5632d71e0891b0de --- /dev/null +++ b/annotations_filtered/rSCm0viS2mM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.97], [22.0, 23.11], [30.0, 30.16], [45.0, 50.68], [55.0, 58.95], [63.0, 63.85], [69.0, 69.53], [73.0, 73.84], [75.0, 78.27], [79.0, 80.2], [82.0, 85.53], [87.0, 88.99], [96.0, 100.9], [107.0, 110.37], [114.0, 115.65], [118.0, 118.52], [121.0, 121.56], [122.0, 123.09], [136.0, 138.4], [139.0, 142.21], [143.0, 145.1], [151.0, 152.17], [166.0, 166.26], [175.0, 176.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 34.39, 33.77, 0.0, 0.0, 0.0, 68.28, 0.0, 44.87, 0.0, 48.65, 36.53, 0.0, 0.0, 0.0, 0.0, 46.9, 61.47, 68.54, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 72.02], ["throbbing", 4.5], ["hum", 2.81]], [["music", 82.16], ["singing", 2.55], ["musical instrument", 0.89]], null, null, null, null, null, [["music", 30.27], ["quack", 20.63], ["duck", 17.29]], null, [["speech", 52.46], ["hum", 14.03], ["music", 5.95]], [["music", 26.85], ["hum", 20.28], ["speech", 9.73]], null, null, null, null, [["music", 45.69], ["throbbing", 20.87], ["hum", 6.86]], null, null, null, null, null], "duration": [0.97, 1.11, 0.16, 5.68, 3.95, 0.85, 0.53, 0.84, 3.27, 1.2, 3.53, 1.99, 4.9, 3.37, 1.65, 0.52, 0.56, 1.09, 2.4, 3.21, 2.1, 1.17, 0.26, 1.55]} \ No newline at end of file diff --git a/annotations_filtered/rSPj_G2yVz4_filtered.json b/annotations_filtered/rSPj_G2yVz4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..638800df5785f5f765071afaf5561d76d940bcab --- /dev/null +++ b/annotations_filtered/rSPj_G2yVz4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.96], [4.0, 4.5], [9.0, 10.93], [12.0, 13.22], [15.0, 15.3], [16.0, 17.69], [20.0, 20.12], [22.0, 22.08], [24.0, 24.61], [27.0, 27.21], [30.0, 30.99], [34.0, 34.97], [36.0, 36.59], [39.0, 39.77], [41.0, 41.12], [44.0, 44.14], [47.0, 48.3], [49.0, 49.87], [51.0, 51.44], [54.0, 57.28], [59.0, 58.95], [60.0, 60.17], [61.0, 61.64], [64.0, 64.56], [67.0, 68.4], [69.0, 70.14], [73.0, 73.11], [75.0, 75.24], [76.0, 76.89], [78.0, 83.3], [85.0, 86.73], [88.0, 89.02], [90.0, 90.75], [92.0, 93.07], [94.0, 97.04], [98.0, 101.97], [102.0, 103.55], [104.0, 105.02], [107.0, 107.89], [113.0, 113.97], [115.0, 115.69], [117.0, 118.03], [121.0, 122.74], [124.0, 125.39], [127.0, 128.88], [131.0, 131.77], [135.0, 135.87], [138.0, 138.92], [140.0, 143.11], [144.0, 144.54], [147.0, 147.78], [149.0, 148.74], [150.0, 150.28], [154.0, 154.75], [155.0, 156.32], [158.0, 158.04], [159.0, 159.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.78, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.04, 0.5, 1.93, 1.22, 0.3, 1.69, 0.12, 0.08, 0.61, 0.21, 0.99, 0.97, 0.59, 0.77, 0.12, 0.14, 1.3, 0.87, 0.44, 3.28, -0.05, 0.17, 0.64, 0.56, 1.4, 1.14, 0.11, 0.24, 0.89, 5.3, 1.73, 1.02, 0.75, 1.07, 3.04, 3.97, 1.55, 1.02, 0.89, 0.97, 0.69, 1.03, 1.74, 1.39, 1.88, 0.77, 0.87, 0.92, 3.11, 0.54, 0.78, -0.26, 0.28, 0.75, 1.32, 0.04, 0.56]} \ No newline at end of file diff --git a/annotations_filtered/rSWBuZws30g_filtered.json b/annotations_filtered/rSWBuZws30g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..19dc16792e290661075b72a4a6e0cc528d02a7d9 --- /dev/null +++ b/annotations_filtered/rSWBuZws30g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [6.0, 7.15], [15.0, 14.81], [17.0, 17.05], [18.0, 18.87], [21.0, 22.03], [24.0, 24.11], [26.0, 27.77], [46.0, 46.89], [53.0, 54.92], [56.0, 57.06], [60.0, 61.72], [63.0, 63.66], [65.0, 66.75], [68.0, 69.58], [72.0, 73.13], [74.0, 74.92], [80.0, 82.93], [84.0, 85.56], [91.0, 96.3], [97.0, 98.74], [102.0, 103.77], [106.0, 107.11], [108.0, 108.95], [111.0, 111.67], [116.0, 118.64], [121.0, 121.2], [123.0, 122.94], [124.0, 124.44], [125.0, 127.14], [129.0, 130.17], [133.0, 134.77], [135.0, 143.51], [145.0, 146.13], [148.0, 147.66], [149.0, 149.71], [151.0, 153.13], [154.0, 160.32], [162.0, 162.9], [164.0, 164.4], [166.0, 167.17], [169.0, 172.83], [174.0, 174.68], [176.0, 176.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.42, 0.0, 38.12, 0.0, 0.0, 0.0, 0.0, 0.0, 40.26, 0.0, 0.0, 0.0, 41.5, 0.0, 0.0, 41.78, 0.0, 0.0, 0.0, 50.56, 39.01, 0.0, 0.0, 0.0, 33.94, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.7], ["speech", 5.51], ["theremin", 3.96]], null, null, null, null, null, [["music", 58.5], ["animal", 6.69], ["theremin", 5.91]], null, null, null, [["music", 33.65], ["speech", 18.38], ["musical instrument", 8.62]], null, null, [["music", 38.72], ["theremin", 11.79], ["speech", 8.5]], null, null, null, null, [["foghorn", 19.74], ["music", 16.18], ["didgeridoo", 13.53]], null, null, null, [["music", 65.29], ["musical instrument", 8.62], ["theremin", 7.76]], null, null], "duration": [0.5, 1.15, -0.19, 0.05, 0.87, 1.03, 0.11, 1.77, 0.89, 1.92, 1.06, 1.72, 0.66, 1.75, 1.58, 1.13, 0.92, 2.93, 1.56, 5.3, 1.74, 1.77, 1.11, 0.95, 0.67, 2.64, 0.2, -0.06, 0.44, 2.14, 1.17, 1.77, 8.51, 1.13, -0.34, 0.71, 2.13, 6.32, 0.9, 0.4, 1.17, 3.83, 0.68, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/rS_HIFTV7wM_filtered.json b/annotations_filtered/rS_HIFTV7wM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cebf2a776bedcfefe6bce3944a64d83de7819952 --- /dev/null +++ b/annotations_filtered/rS_HIFTV7wM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 52.12], [54.0, 67.86]], "keep_status": [true, true], "silence_prob": [29.76, 29.45], "audiomae_on_audioset": [[["fly, housefly", 43.13], ["mains hum", 6.4], ["bee, wasp, etc.", 6.35]], [["hum", 16.19], ["noise", 15.63], ["mains hum", 8.28]]], "duration": [24.12, 13.86]} \ No newline at end of file diff --git a/annotations_filtered/rTBkVOYzVZA_filtered.json b/annotations_filtered/rTBkVOYzVZA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3a669dff9284ab1d8c0ae0dfee7846312d5de8bf --- /dev/null +++ b/annotations_filtered/rTBkVOYzVZA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 15.89], [23.0, 23.52], [24.0, 29.86], [35.0, 42.4], [48.0, 58.41], [65.0, 76.28], [81.0, 82.31], [83.0, 83.42], [88.0, 94.09], [97.0, 103.1], [107.0, 110.27], [117.0, 118.56], [120.0, 129.76]], "keep_status": [true, false, false, true, true, false, false, false, true, true, true, false, true], "silence_prob": [29.68, 0.0, 29.47, 29.25, 29.81, 28.73, 0.0, 0.0, 28.78, 30.09, 28.9, 0.0, 30.21], "audiomae_on_audioset": [[["music", 40.28], ["speech", 25.65], ["electric shaver, electric razor", 2.06]], null, [["speech", 61.43], ["vehicle", 9.7], ["music", 6.0]], [["music", 56.94], ["speech", 7.64], ["electronic music", 2.54]], [["speech", 40.06], ["livestock, farm animals, working animals", 9.5], ["music", 8.05]], [["music", 48.85], ["speech", 23.12], ["buzz", 10.22]], null, null, [["music", 37.72], ["speech", 16.86], ["foghorn", 4.26]], [["hum", 29.23], ["mains hum", 24.89], ["throbbing", 11.22]], [["speech", 32.17], ["music", 15.71], ["vehicle", 9.98]], null, [["speech", 54.44], ["music", 6.46], ["boat, water vehicle", 4.97]]], "duration": [5.89, 0.52, 5.86, 7.4, 10.41, 11.28, 1.31, 0.42, 6.09, 6.1, 3.27, 1.56, 9.76]} \ No newline at end of file diff --git a/annotations_filtered/rTCpK6ONu9M_filtered.json b/annotations_filtered/rTCpK6ONu9M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..968f8b9197467d4dc711554c7f24dbbfd5a23650 --- /dev/null +++ b/annotations_filtered/rTCpK6ONu9M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 18.45], [31.0, 30.99], [32.0, 33.32], [49.0, 48.84], [59.0, 60.15], [65.0, 65.52], [66.0, 67.71], [72.0, 72.72], [74.0, 73.7], [75.0, 79.47], [79.0, 79.51], [80.0, 79.93], [83.0, 90.36], [95.0, 98.42], [104.0, 103.82], [110.0, 110.32], [117.0, 120.5], [122.0, 123.33]], "keep_status": [true, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, true, false], "silence_prob": [43.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.8, 0.0, 0.0, 30.9, 54.56, 0.0, 0.0, 45.88, 0.0], "audiomae_on_audioset": [[["cattle, bovinae", 27.33], ["speech", 17.12], ["livestock, farm animals, working animals", 14.88]], null, null, null, null, null, null, null, null, [["mosquito", 30.34], ["fly, housefly", 21.88], ["music", 10.23]], null, null, [["speech", 14.05], ["moo", 13.67], ["cattle, bovinae", 13.56]], null, null, null, [["speech", 49.88], ["music", 16.22], ["musical instrument", 2.98]], null], "duration": [3.45, -0.01, 1.32, -0.16, 1.15, 0.52, 1.71, 0.72, -0.3, 4.47, 0.51, -0.07, 7.36, 3.42, -0.18, 0.32, 3.5, 1.33]} \ No newline at end of file diff --git a/annotations_filtered/rTlfnymyrrQ_filtered.json b/annotations_filtered/rTlfnymyrrQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..963be3be9925a55590379819d6e3df69fb1f0b92 --- /dev/null +++ b/annotations_filtered/rTlfnymyrrQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 6.64], [10.0, 27.77], [33.0, 33.35], [35.0, 34.97], [35.0, 36.21], [37.0, 37.91], [38.0, 38.7], [41.0, 42.92], [49.0, 49.06], [51.0, 52.86], [61.0, 68.62], [72.0, 77.85], [82.0, 84.47], [88.0, 93.61], [94.0, 95.15], [96.0, 96.42], [97.0, 97.31], [99.0, 99.03], [100.0, 99.96], [101.0, 101.63], [104.0, 104.75], [106.0, 122.17], [139.0, 140.29], [140.0, 140.34], [141.0, 151.55], [155.0, 157.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [30.09, 30.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.52, 29.98, 31.64, 34.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.02, 0.0, 0.0, 41.62, 84.25], "audiomae_on_audioset": [[["mains hum", 28.62], ["hum", 21.47], ["music", 21.45]], [["music", 73.97], ["electronic music", 3.08], ["explosion", 2.38]], null, null, null, null, null, null, null, null, [["hum", 39.06], ["music", 15.03], ["throbbing", 14.79]], [["music", 22.37], ["speech", 10.72], ["cattle, bovinae", 10.43]], [["hum", 24.78], ["mains hum", 19.47], ["music", 16.94]], [["speech", 56.36], ["music", 13.62], ["throbbing", 11.3]], null, null, null, null, null, null, null, [["speech", 66.56], ["eruption", 5.34], ["explosion", 5.19]], null, null, [["speech", 43.12], ["gunshot, gunfire", 10.78], ["hum", 8.4]], null], "duration": [5.64, 17.77, 0.35, -0.03, 1.21, 0.91, 0.7, 1.92, 0.06, 1.86, 7.62, 5.85, 2.47, 5.61, 1.15, 0.42, 0.31, 0.03, -0.04, 0.63, 0.75, 16.17, 1.29, 0.34, 10.55, 2.03]} \ No newline at end of file diff --git a/annotations_filtered/rU3GNIhA7fk_filtered.json b/annotations_filtered/rU3GNIhA7fk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f270ae99eb4d0cd61a90498d88b0dca7f798e7d5 --- /dev/null +++ b/annotations_filtered/rU3GNIhA7fk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.27], [7.0, 8.73], [13.0, 13.41], [16.0, 16.01], [17.0, 17.12], [20.0, 21.32], [28.0, 49.06], [50.0, 55.02], [71.0, 72.12], [73.0, 74.55], [91.0, 90.83], [92.0, 92.87], [94.0, 94.66], [96.0, 96.96], [100.0, 100.75], [110.0, 110.76]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.18, 38.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 24.17], ["hum", 20.0], ["mains hum", 15.24]], [["music", 36.53], ["hum", 20.18], ["throbbing", 13.24]], null, null, null, null, null, null, null, null], "duration": [0.27, 1.73, 0.41, 0.01, 0.12, 1.32, 21.06, 5.02, 1.12, 1.55, -0.17, 0.87, 0.66, 0.96, 0.75, 0.76]} \ No newline at end of file diff --git a/annotations_filtered/rU8cUBCZn9c_filtered.json b/annotations_filtered/rU8cUBCZn9c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6424dcfdc2ed9417db0586fda5d73ae7ea046f1b --- /dev/null +++ b/annotations_filtered/rU8cUBCZn9c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.36], [12.0, 11.91], [14.0, 14.15], [14.0, 14.79], [19.0, 18.66], [19.0, 19.85], [34.0, 35.06], [36.0, 37.18], [38.0, 37.93], [38.0, 47.65], [48.0, 50.13], [50.0, 50.35], [53.0, 53.18], [54.0, 53.77], [54.0, 53.94], [54.0, 53.97], [54.0, 54.01], [58.0, 74.01], [78.0, 79.81], [89.0, 89.24], [91.0, 91.5], [92.0, 92.21], [109.0, 110.05], [113.0, 112.95], [127.0, 129.61]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.52, 35.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.5], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 50.81], ["speech", 6.92], ["percussion", 6.05]], [["speech", 34.18], ["boing", 33.51], ["hum", 4.87]], null, null, null, null, null, null, [["speech", 65.7], ["music", 4.32], ["beatboxing", 2.84]], null, null, null, null, null, null, [["speech", 63.25], ["beatboxing", 4.79], ["male speech, man speaking", 2.26]]], "duration": [0.36, -0.09, 0.15, 0.79, -0.34, 0.85, 1.06, 1.18, -0.07, 9.65, 2.13, 0.35, 0.18, -0.23, -0.06, -0.03, 0.01, 16.01, 1.81, 0.24, 0.5, 0.21, 1.05, -0.05, 2.61]} \ No newline at end of file diff --git a/annotations_filtered/rUbY9uikvWc_filtered.json b/annotations_filtered/rUbY9uikvWc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..87fbd04d847f1fe539f382a506dbc62a33a48f43 --- /dev/null +++ b/annotations_filtered/rUbY9uikvWc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.59], [6.0, 6.54], [7.0, 8.56], [10.0, 10.77], [17.0, 17.07], [20.0, 19.97], [23.0, 23.23], [27.0, 27.87], [41.0, 41.82], [45.0, 44.85], [50.0, 50.08], [52.0, 51.93], [57.0, 57.6], [58.0, 59.32], [61.0, 62.65], [65.0, 65.69], [72.0, 75.51], [81.0, 81.36], [84.0, 84.57], [86.0, 90.0], [94.0, 95.18], [109.0, 111.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.43, 0.0, 0.0, 71.14, 0.0, 98.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.59, 0.54, 1.56, 0.77, 0.07, -0.03, 0.23, 0.87, 0.82, -0.15, 0.08, -0.07, 0.6, 1.32, 1.65, 0.69, 3.51, 0.36, 0.57, 4.0, 1.18, 2.4]} \ No newline at end of file diff --git a/annotations_filtered/rUczpTPATyU_filtered.json b/annotations_filtered/rUczpTPATyU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8215d75958c2a498bf982a1f3cce9233d468275d --- /dev/null +++ b/annotations_filtered/rUczpTPATyU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.27], [3.0, 3.67], [5.0, 5.05], [6.0, 7.86], [8.0, 43.01], [44.0, 44.1], [46.0, 47.09], [53.0, 55.34], [57.0, 59.43], [60.0, 65.91], [71.0, 71.69], [75.0, 75.02], [76.0, 75.96], [77.0, 83.74], [88.0, 89.46], [92.0, 93.34], [96.0, 96.96], [98.0, 101.8], [103.0, 125.34], [126.0, 126.89], [130.0, 130.15], [131.0, 162.08], [162.0, 162.89], [164.0, 176.03], [177.0, 178.04], [181.0, 181.48]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.08, 48.06, 43.66, 0.0, 0.0, 0.0, 39.09, 0.0, 0.0, 0.0, 44.55, 50.21, 0.0, 0.0, 0.0, 0.0, 36.81, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 28.0], ["speech", 24.58], ["theremin", 11.04]], [["music", 58.29], ["synthesizer", 7.78], ["theremin", 5.87]], [["music", 56.7], ["throbbing", 7.25], ["hum", 6.07]], null, null, null, [["music", 74.17], ["musical instrument", 3.11], ["theremin", 2.63]], null, null, null, [["music", 68.73], ["synthesizer", 6.66], ["boing", 3.54]], null, null, null, null, null, [["music", 56.23], ["throbbing", 12.68], ["hum", 10.07]], null, null], "duration": [0.27, 0.67, 0.05, 1.86, 35.01, 0.1, 1.09, 2.34, 2.43, 5.91, 0.69, 0.02, -0.04, 6.74, 1.46, 1.34, 0.96, 3.8, 22.34, 0.89, 0.15, 31.08, 0.89, 12.03, 1.04, 0.48]} \ No newline at end of file diff --git a/annotations_filtered/rV4DxcJOCLs_filtered.json b/annotations_filtered/rV4DxcJOCLs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3374918c00b5087b86b9fa655ff66b934d52473 --- /dev/null +++ b/annotations_filtered/rV4DxcJOCLs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.34], [11.0, 11.25], [21.0, 22.71], [31.0, 32.26], [38.0, 43.07], [60.0, 61.96], [67.0, 68.55], [75.0, 75.61], [77.0, 78.22], [88.0, 91.1], [92.0, 93.34], [94.0, 97.68], [100.0, 100.48], [103.0, 104.43], [106.0, 105.73], [107.0, 109.04], [115.0, 116.67]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 33.32, 0.0, 0.0, 0.0, 0.0, 31.19, 0.0, 37.12, 0.0, 0.0, 0.0, 47.82, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 14.18], ["humming", 11.9], ["male singing", 11.09]], null, null, null, null, [["humming", 38.39], ["music", 24.39], ["singing", 4.79]], null, [["speech", 68.22], ["whale vocalization", 3.4], ["fart", 2.48]], null, null, null, [["music", 19.46], ["boing", 13.69], ["humming", 7.42]], null], "duration": [0.34, 0.25, 1.71, 1.26, 5.07, 1.96, 1.55, 0.61, 1.22, 3.1, 1.34, 3.68, 0.48, 1.43, -0.27, 2.04, 1.67]} \ No newline at end of file diff --git a/annotations_filtered/rVFi-yeTe5g_filtered.json b/annotations_filtered/rVFi-yeTe5g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6811e62f5b2d12bcb15549ef554468fe1fe76e9b --- /dev/null +++ b/annotations_filtered/rVFi-yeTe5g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.76], [4.0, 5.27], [6.0, 6.56], [8.0, 8.73], [13.0, 13.8], [16.0, 17.14], [19.0, 19.55], [22.0, 22.84], [26.0, 25.69], [31.0, 31.29], [35.0, 35.19], [41.0, 41.25], [44.0, 44.54], [45.0, 45.81], [51.0, 52.56], [54.0, 55.21], [57.0, 57.54], [68.0, 69.18], [70.0, 71.39], [72.0, 72.96], [74.0, 75.09], [76.0, 78.46], [81.0, 81.84], [85.0, 85.58], [88.0, 89.45], [91.0, 91.66], [92.0, 94.37], [98.0, 98.02], [100.0, 102.07], [104.0, 105.0], [108.0, 108.26], [113.0, 113.88], [116.0, 116.78], [119.0, 120.38], [122.0, 122.77], [125.0, 127.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.85, 0.0, 0.0, 0.0, 0.0, 67.63, 0.0, 81.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.45], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 57.0], ["speech", 17.3], ["dial tone", 2.95]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 43.96], ["echo", 7.04], ["ding", 4.14]]], "duration": [0.76, 1.27, 0.56, 0.73, 0.8, 1.14, 0.55, 0.84, -0.31, 0.29, 0.19, 0.25, 0.54, 0.81, 1.56, 1.21, 0.54, 1.18, 1.39, 0.96, 1.09, 2.46, 0.84, 0.58, 1.45, 0.66, 2.37, 0.02, 2.07, 1.0, 0.26, 0.88, 0.78, 1.38, 0.77, 2.97]} \ No newline at end of file diff --git a/annotations_filtered/rW1_EfZ2pWU_filtered.json b/annotations_filtered/rW1_EfZ2pWU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..51a9d9dbb3944b3a8ac5437ad3c2c02732022142 --- /dev/null +++ b/annotations_filtered/rW1_EfZ2pWU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.15], [12.0, 12.56], [13.0, 13.8], [21.0, 21.56], [24.0, 24.27], [26.0, 26.43], [29.0, 29.22], [37.0, 37.62], [40.0, 41.12], [43.0, 44.02], [48.0, 48.17], [50.0, 50.94], [52.0, 52.35], [55.0, 55.16], [58.0, 58.75], [60.0, 60.66], [63.0, 63.56], [70.0, 72.76], [76.0, 76.77], [78.0, 78.07], [79.0, 79.07], [82.0, 82.76], [86.0, 87.81], [89.0, 91.84], [94.0, 94.27], [96.0, 96.94], [101.0, 102.3], [104.0, 104.9], [107.0, 106.86], [109.0, 109.83], [111.0, 110.98], [113.0, 113.09], [115.0, 114.88], [116.0, 116.24], [117.0, 118.49], [120.0, 120.6], [124.0, 124.56], [134.0, 135.06], [136.0, 135.89], [136.0, 137.32], [139.0, 145.05], [146.0, 146.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.35, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.95, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["noise", 27.21], ["frog", 16.15], ["grunt", 7.88]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.15, 0.56, 0.8, 0.56, 0.27, 0.43, 0.22, 0.62, 1.12, 1.02, 0.17, 0.94, 0.35, 0.16, 0.75, 0.66, 0.56, 2.76, 0.77, 0.07, 0.07, 0.76, 1.81, 2.84, 0.27, 0.94, 1.3, 0.9, -0.14, 0.83, -0.02, 0.09, -0.12, 0.24, 1.49, 0.6, 0.56, 1.06, -0.11, 1.32, 6.05, 0.89]} \ No newline at end of file diff --git a/annotations_filtered/rW23RsUTb2Y_filtered.json b/annotations_filtered/rW23RsUTb2Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..33982bf31ad889861760135188b3d67f3d14124e --- /dev/null +++ b/annotations_filtered/rW23RsUTb2Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.66], [22.0, 25.56], [32.0, 32.17], [35.0, 35.43], [36.0, 46.89], [48.0, 49.84], [54.0, 54.78], [56.0, 62.28], [64.0, 64.72], [66.0, 66.28], [67.0, 67.98], [69.0, 77.62], [80.0, 80.59], [81.0, 81.46], [84.0, 84.25], [85.0, 85.38], [88.0, 89.34], [90.0, 101.22], [106.0, 137.66], [138.0, 156.57], [159.0, 159.76], [162.0, 162.92]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 62.89, 0.0, 0.0, 36.78, 0.0, 0.0, 58.55, 0.0, 0.0, 0.0, 36.79, 0.0, 0.0, 0.0, 0.0, 0.0, 57.48, 0.0, 32.53, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["whale vocalization", 56.63], ["speech", 6.99], ["animal", 2.99]], null, null, null, null, null, null, [["speech", 59.9], ["explosion", 7.39], ["vehicle", 3.39]], null, null, null, null, null, null, null, [["speech", 25.5], ["eruption", 8.07], ["vehicle", 6.91]], null, null], "duration": [0.66, 3.56, 0.17, 0.43, 10.89, 1.84, 0.78, 6.28, 0.72, 0.28, 0.98, 8.62, 0.59, 0.46, 0.25, 0.38, 1.34, 11.22, 31.66, 18.57, 0.76, 0.92]} \ No newline at end of file diff --git a/annotations_filtered/rW59kLTHdBE_filtered.json b/annotations_filtered/rW59kLTHdBE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1ccd073e5b4f7de8b579075303c154e994ce939e --- /dev/null +++ b/annotations_filtered/rW59kLTHdBE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 44.29], [48.0, 77.06], [80.0, 84.18], [86.0, 87.61]], "keep_status": [true, false, false, false], "silence_prob": [29.03, 29.25, 36.86, 0.0], "audiomae_on_audioset": [[["music", 36.22], ["speech", 24.54], ["groan", 3.71]], [["music", 92.51], ["timpani", 0.5], ["hum", 0.48]], [["music", 54.81], ["didgeridoo", 15.16], ["speech", 7.15]], null], "duration": [23.29, 29.06, 4.18, 1.61]} \ No newline at end of file diff --git a/annotations_filtered/rWGj8MCBBnc_filtered.json b/annotations_filtered/rWGj8MCBBnc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1bfdc949f3c0efbe42e265b61f9af99ec4187c34 --- /dev/null +++ b/annotations_filtered/rWGj8MCBBnc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.69], [14.0, 17.2], [20.0, 20.98], [22.0, 22.89], [24.0, 27.55], [32.0, 38.03], [40.0, 40.44], [43.0, 44.12], [45.0, 47.61], [52.0, 62.48], [66.0, 70.34], [76.0, 76.67], [78.0, 77.8], [79.0, 79.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 95.09, 0.0, 0.0, 97.92, 84.43, 0.0, 0.0, 97.43, 100.0, 65.44, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.69, 3.2, 0.98, 0.89, 3.55, 6.03, 0.44, 1.12, 2.61, 10.48, 4.34, 0.67, -0.2, 0.68]} \ No newline at end of file diff --git a/annotations_filtered/rWe5nzPq1JA_filtered.json b/annotations_filtered/rWe5nzPq1JA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c36bdb7dd99cba604f0c87c5c489167f7df81218 --- /dev/null +++ b/annotations_filtered/rWe5nzPq1JA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.15], [12.0, 15.92], [20.0, 20.68], [23.0, 23.82], [26.0, 27.03], [34.0, 36.61], [40.0, 40.12], [47.0, 48.02], [49.0, 54.35], [55.0, 56.27], [58.0, 64.45], [65.0, 65.47], [70.0, 72.66], [77.0, 78.6], [80.0, 80.82], [87.0, 91.29], [93.0, 94.39], [96.0, 97.78]], "keep_status": [false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 49.92, 0.0, 0.0, 0.0, 70.44, 0.0, 0.0, 71.57, 0.0, 41.68, 0.0, 64.41, 0.0, 0.0, 99.26, 0.0, 0.0], "audiomae_on_audioset": [null, [["electric shaver, electric razor", 21.04], ["hum", 9.4], ["mains hum", 8.67]], null, null, null, null, null, null, null, null, [["speech", 38.29], ["fly, housefly", 12.15], ["bee, wasp, etc.", 10.22]], null, null, null, null, null, null, null], "duration": [1.15, 3.92, 0.68, 0.82, 1.03, 2.61, 0.12, 1.02, 5.35, 1.27, 6.45, 0.47, 2.66, 1.6, 0.82, 4.29, 1.39, 1.78]} \ No newline at end of file diff --git a/annotations_filtered/rWeaYCoh1qk_filtered.json b/annotations_filtered/rWeaYCoh1qk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3c825485f90edda68242435c5a34327a8e323f03 --- /dev/null +++ b/annotations_filtered/rWeaYCoh1qk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.64], [13.0, 13.22], [17.0, 16.85], [17.0, 17.59], [30.0, 29.91], [38.0, 37.79], [38.0, 38.8], [42.0, 42.11], [46.0, 48.15], [54.0, 55.65], [58.0, 60.3], [61.0, 63.46], [68.0, 68.64], [69.0, 69.35], [83.0, 86.85], [89.0, 90.46], [91.0, 92.15], [94.0, 95.32], [96.0, 98.02], [100.0, 101.26], [104.0, 103.92], [107.0, 107.76], [113.0, 112.97], [119.0, 121.51], [122.0, 122.59], [125.0, 126.06], [129.0, 128.9], [130.0, 130.71], [131.0, 131.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 100.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.64, 0.22, -0.15, 0.59, -0.09, -0.21, 0.8, 0.11, 2.15, 1.65, 2.3, 2.46, 0.64, 0.35, 3.85, 1.46, 1.15, 1.32, 2.02, 1.26, -0.08, 0.76, -0.03, 2.51, 0.59, 1.06, -0.1, 0.71, 0.72]} \ No newline at end of file diff --git a/annotations_filtered/rWlFWMR9MfY_filtered.json b/annotations_filtered/rWlFWMR9MfY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..796b0bca04731b8bf732386665fe5d400198cb7d --- /dev/null +++ b/annotations_filtered/rWlFWMR9MfY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.12], [4.0, 3.74], [5.0, 6.99], [14.0, 15.52], [27.0, 27.35], [32.0, 31.97], [33.0, 33.81], [47.0, 49.08], [52.0, 52.27], [65.0, 65.77], [74.0, 73.79], [82.0, 82.65], [91.0, 94.8], [96.0, 102.78], [106.0, 106.79], [120.0, 127.4], [130.0, 132.19], [135.0, 148.12], [150.0, 150.72], [154.0, 155.19], [159.0, 159.83], [161.0, 165.42], [167.0, 180.93]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, true, true, true, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.33, 0.0, 0.0, 0.0, 0.0, 29.23, 28.97, 0.0, 29.0, 31.46, 29.02, 0.0, 0.0, 0.0, 29.55, 28.59], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["roar", 22.34], ["speech", 18.76], ["music", 12.83]], null, null, null, null, [["music", 46.66], ["sound effect", 10.63], ["reverberation", 8.15]], [["music", 38.63], ["hum", 24.59], ["throbbing", 15.29]], null, [["music", 43.96], ["didgeridoo", 5.49], ["hum", 4.45]], [["music", 18.22], ["musical instrument", 5.16], ["trombone", 4.99]], [["music", 10.08], ["whack, thwack", 7.65], ["speech", 6.6]], null, null, null, [["speech", 41.49], ["rumble", 11.6], ["whoosh, swoosh, swish", 6.1]], [["music", 21.65], ["speech", 19.45], ["buzz", 7.18]]], "duration": [0.12, -0.26, 1.99, 1.52, 0.35, -0.03, 0.81, 2.08, 0.27, 0.77, -0.21, 0.65, 3.8, 6.78, 0.79, 7.4, 2.19, 13.12, 0.72, 1.19, 0.83, 4.42, 13.93]} \ No newline at end of file diff --git a/annotations_filtered/rWqVoaYxgRs_filtered.json b/annotations_filtered/rWqVoaYxgRs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..461534ee5000ec5cdef418561f6e459d178fc393 --- /dev/null +++ b/annotations_filtered/rWqVoaYxgRs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 23.26], [23.0, 23.45], [26.0, 26.62], [27.0, 35.4], [37.0, 37.81], [38.0, 39.09], [40.0, 63.54], [64.0, 76.08], [77.0, 77.94], [83.0, 89.02], [92.0, 122.4], [125.0, 127.55], [130.0, 144.95], [147.0, 148.0]], "keep_status": [false, false, false, false, false, false, true, false, false, true, false, true, true, false], "silence_prob": [67.13, 0.0, 0.0, 70.44, 0.0, 0.0, 32.68, 30.37, 0.0, 37.12, 0.0, 40.45, 38.42, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["whale vocalization", 57.33], ["music", 7.1], ["theremin", 3.59]], [["music", 33.46], ["didgeridoo", 29.39], ["mains hum", 9.54]], null, [["music", 47.62], ["speech", 7.75], ["synthesizer", 5.89]], null, [["insect", 17.37], ["sidetone", 15.49], ["hum", 12.85]], [["music", 12.91], ["mosquito", 6.09], ["musical instrument", 5.63]], null], "duration": [15.26, 0.45, 0.62, 8.4, 0.81, 1.09, 23.54, 12.08, 0.94, 6.02, 30.4, 2.55, 14.95, 1.0]} \ No newline at end of file diff --git a/annotations_filtered/rWvIBJO8T_Y_filtered.json b/annotations_filtered/rWvIBJO8T_Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bc0e928bdcdfff5e2cbbcb6bcf0431f7b0691b31 --- /dev/null +++ b/annotations_filtered/rWvIBJO8T_Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.54], [6.0, 7.18], [8.0, 39.97], [41.0, 43.09], [44.0, 47.92], [48.0, 55.53], [57.0, 88.62]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 99.87, 98.44, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [0.54, 1.18, 31.97, 2.09, 3.92, 7.53, 31.62]} \ No newline at end of file diff --git a/annotations_filtered/rWvqkw0_xFA_filtered.json b/annotations_filtered/rWvqkw0_xFA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b83c6c208ec6ebd3398667e3d05545b79049f1b1 --- /dev/null +++ b/annotations_filtered/rWvqkw0_xFA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.67], [8.0, 10.23], [12.0, 15.38], [18.0, 21.73], [23.0, 24.9], [26.0, 26.42], [27.0, 30.3], [32.0, 53.92], [54.0, 54.14], [54.0, 62.36], [64.0, 64.88], [66.0, 67.44], [68.0, 73.06], [74.0, 87.02], [89.0, 170.61], [171.0, 177.18], [178.0, 193.53]], "keep_status": [false, false, false, false, false, false, false, true, false, true, false, false, true, false, false, false, true], "silence_prob": [82.43, 83.16, 99.92, 85.17, 0.0, 0.0, 98.27, 30.52, 0.0, 31.39, 0.0, 0.0, 31.35, 54.97, 0.0, 75.55, 33.12], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["hum", 31.14], ["mains hum", 17.47], ["speech", 14.6]], null, [["speech", 30.03], ["mains hum", 19.71], ["music", 14.0]], null, null, [["music", 33.76], ["synthesizer", 7.59], ["speech", 6.15]], null, null, null, [["thunk", 33.18], ["music", 27.05], ["door", 7.25]]], "duration": [4.67, 2.23, 3.38, 3.73, 1.9, 0.42, 3.3, 21.92, 0.14, 8.36, 0.88, 1.44, 5.06, 13.02, 81.61, 6.18, 15.53]} \ No newline at end of file diff --git a/annotations_filtered/rX6oUNKUbI8_filtered.json b/annotations_filtered/rX6oUNKUbI8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d624a28f81c821f7670c690f140fd4cdb1fe401 --- /dev/null +++ b/annotations_filtered/rX6oUNKUbI8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 23.72], [32.0, 32.17], [60.0, 61.01], [69.0, 69.57], [71.0, 71.27], [76.0, 75.68], [91.0, 91.71], [96.0, 95.77], [128.0, 128.07], [130.0, 129.81], [133.0, 135.36], [140.0, 140.22], [160.0, 160.54], [164.0, 164.96], [166.0, 174.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 45.72], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 37.47], ["thunk", 16.49], ["whack, thwack", 13.63]]], "duration": [2.72, 0.17, 1.01, 0.57, 0.27, -0.32, 0.71, -0.23, 0.07, -0.19, 2.36, 0.22, 0.54, 0.96, 8.09]} \ No newline at end of file diff --git a/annotations_filtered/rXpCjDg0RT0_filtered.json b/annotations_filtered/rXpCjDg0RT0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a5853c45c200d4a5378d636c3f3ff9ec838c313 --- /dev/null +++ b/annotations_filtered/rXpCjDg0RT0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.76], [4.0, 6.84], [8.0, 10.84], [12.0, 12.5], [13.0, 15.28], [17.0, 18.52], [20.0, 29.93], [31.0, 50.25], [51.0, 77.87], [81.0, 88.35], [96.0, 101.71], [105.0, 106.24], [107.0, 112.77], [114.0, 114.49], [115.0, 116.01], [119.0, 119.43]], "keep_status": [false, true, false, false, false, false, true, true, true, true, true, false, false, false, false, false], "silence_prob": [0.0, 44.6, 44.96, 0.0, 44.55, 0.0, 31.07, 30.56, 28.52, 47.2, 35.06, 0.0, 97.43, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["rumble", 29.56], ["sine wave", 11.45], ["speech", 7.62]], [["speech", 40.18], ["sine wave", 27.56], ["rumble", 8.47]], null, [["speech", 63.68], ["rumble", 5.18], ["vehicle", 5.05]], null, [["music", 28.91], ["speech", 19.9], ["hum", 11.0]], [["speech", 20.93], ["noise", 11.07], ["rumble", 9.87]], [["speech", 15.29], ["music", 13.38], ["siren", 11.8]], [["hum", 36.29], ["music", 20.03], ["mains hum", 10.72]], [["speech", 30.14], ["animal", 9.58], ["domestic animals, pets", 8.06]], null, null, null, null, null], "duration": [1.76, 2.84, 2.84, 0.5, 2.28, 1.52, 9.93, 19.25, 26.87, 7.35, 5.71, 1.24, 5.77, 0.49, 1.01, 0.43]} \ No newline at end of file diff --git a/annotations_filtered/rXqRZvG5LAQ_filtered.json b/annotations_filtered/rXqRZvG5LAQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a1d6caf2c66b8fd149ed4e424be460b9363d7f4 --- /dev/null +++ b/annotations_filtered/rXqRZvG5LAQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.06], [6.0, 9.88], [13.0, 13.14], [13.0, 13.47], [14.0, 15.21], [16.0, 16.75], [22.0, 50.85], [55.0, 56.27], [57.0, 61.7], [64.0, 64.5], [66.0, 80.2], [84.0, 84.4], [88.0, 88.82], [92.0, 112.53], [114.0, 113.86], [115.0, 118.25], [119.0, 119.77], [121.0, 122.15], [129.0, 128.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 38.03, 0.0, 0.0, 0.0, 0.0, 35.3, 0.0, 53.78, 0.0, 45.52, 0.0, 0.0, 34.98, 0.0, 70.86, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 38.52], ["gunshot, gunfire", 23.03], ["machine gun", 21.66]], null, null, null, null, [["music", 54.69], ["throbbing", 25.31], ["hum", 6.08]], null, null, null, [["throbbing", 65.65], ["music", 15.02], ["hum", 5.39]], null, null, [["throbbing", 36.55], ["music", 35.19], ["hum", 10.7]], null, null, null, null, null], "duration": [0.06, 3.88, 0.14, 0.47, 1.21, 0.75, 28.85, 1.27, 4.7, 0.5, 14.2, 0.4, 0.82, 20.53, -0.14, 3.25, 0.77, 1.15, -0.05]} \ No newline at end of file diff --git a/annotations_filtered/rXs41JvueZY_filtered.json b/annotations_filtered/rXs41JvueZY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0370c3acb9967c88c44508be01a304db6704188e --- /dev/null +++ b/annotations_filtered/rXs41JvueZY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.38], [13.0, 15.75], [17.0, 18.44], [20.0, 21.36], [22.0, 23.25], [27.0, 27.57], [28.0, 28.98], [32.0, 33.62], [35.0, 35.99], [38.0, 39.83], [41.0, 40.95], [42.0, 41.74], [43.0, 43.8], [46.0, 46.94], [53.0, 55.43], [58.0, 59.1], [60.0, 60.24], [63.0, 63.83], [72.0, 72.5], [76.0, 76.49], [79.0, 78.7], [80.0, 82.19], [86.0, 88.11], [92.0, 92.69], [95.0, 95.61], [100.0, 101.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 99.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.25, 34.36, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["theremin", 26.87], ["music", 23.39], ["wind instrument, woodwind instrument", 16.45]], null, null, null], "duration": [0.38, 2.75, 1.44, 1.36, 1.25, 0.57, 0.98, 1.62, 0.99, 1.83, -0.05, -0.26, 0.8, 0.94, 2.43, 1.1, 0.24, 0.83, 0.5, 0.49, -0.3, 2.19, 2.11, 0.69, 0.61, 1.14]} \ No newline at end of file diff --git a/annotations_filtered/rXwdnHnLvms_filtered.json b/annotations_filtered/rXwdnHnLvms_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..03d94718eb5927194c101ba0644b4236535f57a5 --- /dev/null +++ b/annotations_filtered/rXwdnHnLvms_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.16], [20.0, 21.1], [22.0, 22.42], [39.0, 38.91], [45.0, 44.95], [76.0, 76.77], [83.0, 83.47], [95.0, 96.47], [105.0, 106.17], [110.0, 111.18], [113.0, 112.94], [116.0, 116.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.16, 1.1, 0.42, -0.09, -0.05, 0.77, 0.47, 1.47, 1.17, 1.18, -0.06, 0.16]} \ No newline at end of file diff --git a/annotations_filtered/rXxBQRh89AA_filtered.json b/annotations_filtered/rXxBQRh89AA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b2033a4fd3e114e9e0ed5d9b25422792b53d7e6e --- /dev/null +++ b/annotations_filtered/rXxBQRh89AA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.43], [11.0, 12.24], [13.0, 15.03], [18.0, 19.58], [20.0, 20.85], [27.0, 28.14], [30.0, 30.89], [33.0, 34.21], [35.0, 35.67], [37.0, 38.57], [41.0, 42.7], [44.0, 45.13], [46.0, 47.63], [49.0, 49.18], [49.0, 51.0], [57.0, 57.21], [57.0, 58.09], [61.0, 64.56], [68.0, 68.57], [69.0, 70.87], [71.0, 73.25], [75.0, 75.76], [76.0, 76.6], [78.0, 79.25], [81.0, 82.49], [84.0, 86.27], [89.0, 90.51], [92.0, 97.36], [98.0, 99.52], [100.0, 102.09], [103.0, 104.79], [106.0, 106.91], [108.0, 109.98], [110.0, 121.14], [122.0, 122.18], [123.0, 127.08], [130.0, 132.39], [133.0, 134.77], [142.0, 142.28], [148.0, 152.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 76.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.37, 0.0, 0.0, 53.53, 0.0, 0.0, 36.98, 0.0, 0.0, 0.0, 0.0, 78.21, 0.0, 62.37, 0.0, 38.55, 0.0, 0.0, 0.0, 45.62, 0.0, 48.02, 53.28, 0.0, 0.0, 72.16], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 35.27], ["music", 21.16], ["hum", 3.91]], null, null, null, null, null, null, null, null, [["speech", 21.7], ["hum", 20.31], ["mains hum", 13.22]], null, null, null, [["fly, housefly", 23.76], ["insect", 14.04], ["speech", 11.62]], null, [["fart", 13.97], ["rumble", 12.78], ["buzz", 9.42]], null, null, null, null], "duration": [1.43, 1.24, 2.03, 1.58, 0.85, 1.14, 0.89, 1.21, 0.67, 1.57, 1.7, 1.13, 1.63, 0.18, 2.0, 0.21, 1.09, 3.56, 0.57, 1.87, 2.25, 0.76, 0.6, 1.25, 1.49, 2.27, 1.51, 5.36, 1.52, 2.09, 1.79, 0.91, 1.98, 11.14, 0.18, 4.08, 2.39, 1.77, 0.28, 4.69]} \ No newline at end of file diff --git a/annotations_filtered/rXyyr3kSB3s_filtered.json b/annotations_filtered/rXyyr3kSB3s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..491923f4c2a7e36884fc1248dc69c448fb7e3b8e --- /dev/null +++ b/annotations_filtered/rXyyr3kSB3s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 18.91], [19.0, 30.62], [32.0, 34.55], [37.0, 40.2], [41.0, 47.36], [52.0, 57.18], [58.0, 58.29], [59.0, 64.83], [66.0, 66.7], [68.0, 69.87], [74.0, 76.08], [78.0, 81.16], [83.0, 105.44], [107.0, 108.55], [111.0, 113.19], [114.0, 122.12], [123.0, 124.63], [125.0, 129.79]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [58.72, 77.53, 97.92, 45.18, 88.64, 57.01, 0.0, 90.78, 0.0, 0.0, 54.5, 31.3, 46.94, 0.0, 89.19, 59.42, 0.0, 55.53], "audiomae_on_audioset": [null, null, null, [["heart sounds, heartbeat", 33.38], ["sheep", 9.68], ["throbbing", 5.53]], null, null, null, null, null, null, null, [["speech", 63.12], ["hum", 5.0], ["clang", 2.43]], [["whale vocalization", 92.37], ["animal", 1.59], ["roar", 0.78]], null, null, null, null, null], "duration": [3.91, 11.62, 2.55, 3.2, 6.36, 5.18, 0.29, 5.83, 0.7, 1.87, 2.08, 3.16, 22.44, 1.55, 2.19, 8.12, 1.63, 4.79]} \ No newline at end of file diff --git a/annotations_filtered/rYGWG2_PB_Q_filtered.json b/annotations_filtered/rYGWG2_PB_Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2d30516b35dd699ff403021e775164d38a01f3a --- /dev/null +++ b/annotations_filtered/rYGWG2_PB_Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[75.0, 94.51]], "keep_status": [true], "silence_prob": [31.13], "audiomae_on_audioset": [[["hum", 35.37], ["mains hum", 20.71], ["music", 8.82]]], "duration": [19.51]} \ No newline at end of file diff --git a/annotations_filtered/rYHCZi-tmTE_filtered.json b/annotations_filtered/rYHCZi-tmTE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9af77bc8770939f1ce4c4ecab377a619c075cb1c --- /dev/null +++ b/annotations_filtered/rYHCZi-tmTE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.97], [5.0, 5.71], [7.0, 8.6], [11.0, 14.98], [16.0, 16.36], [18.0, 19.11], [20.0, 20.65], [21.0, 22.01], [37.0, 37.49], [44.0, 44.07], [49.0, 49.3], [65.0, 65.2], [74.0, 76.42], [80.0, 81.18], [82.0, 83.91], [90.0, 90.58], [94.0, 93.97], [95.0, 95.08], [96.0, 97.19], [101.0, 109.48], [138.0, 139.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.87, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.97, 0.71, 1.6, 3.98, 0.36, 1.11, 0.65, 1.01, 0.49, 0.07, 0.3, 0.2, 2.42, 1.18, 1.91, 0.58, -0.03, 0.08, 1.19, 8.48, 1.06]} \ No newline at end of file diff --git a/annotations_filtered/rYS9mUCFOAk_filtered.json b/annotations_filtered/rYS9mUCFOAk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..831cebef585827996df2f215afff83b90bbe2cb2 --- /dev/null +++ b/annotations_filtered/rYS9mUCFOAk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [34.0, 34.13], [36.0, 35.75], [40.0, 41.07], [45.0, 45.94], [56.0, 56.49], [64.0, 65.16], [74.0, 74.34], [77.0, 77.35], [86.0, 86.04], [93.0, 94.05], [95.0, 94.91], [96.0, 96.74], [98.0, 99.22], [101.0, 102.39], [104.0, 104.36], [113.0, 113.41], [119.0, 119.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 0.13, -0.25, 1.07, 0.94, 0.49, 1.16, 0.34, 0.35, 0.04, 1.05, -0.09, 0.74, 1.22, 1.39, 0.36, 0.41, 0.91]} \ No newline at end of file diff --git a/annotations_filtered/rYVsdfE_Wh8_filtered.json b/annotations_filtered/rYVsdfE_Wh8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..071e846da1922729ac0b8744f47e763dba00a52c --- /dev/null +++ b/annotations_filtered/rYVsdfE_Wh8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.52], [7.0, 7.3], [25.0, 25.34], [39.0, 40.05], [43.0, 43.53], [46.0, 45.79], [72.0, 72.4], [75.0, 76.11], [76.0, 76.86], [83.0, 85.72], [87.0, 90.91], [91.0, 92.58], [94.0, 95.84], [97.0, 98.63], [99.0, 101.11], [102.0, 103.32], [104.0, 107.59], [108.0, 109.54], [111.0, 112.6], [114.0, 115.62], [127.0, 127.74], [131.0, 130.96], [143.0, 144.14], [146.0, 150.09], [152.0, 154.04], [154.0, 154.23], [154.0, 154.95], [156.0, 160.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 99.98, 0.0, 0.0, 0.0, 99.82, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.65, 99.21, 0.0, 0.0, 96.66], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.52, 0.3, 0.34, 1.05, 0.53, -0.21, 0.4, 1.11, 0.86, 2.72, 3.91, 1.58, 1.84, 1.63, 2.11, 1.32, 3.59, 1.54, 1.6, 1.62, 0.74, -0.04, 1.14, 4.09, 2.04, 0.23, 0.95, 4.73]} \ No newline at end of file diff --git a/annotations_filtered/rYXDky5UYks_filtered.json b/annotations_filtered/rYXDky5UYks_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..35a3dceea9f10d43d04eaf54696fa125432d1f5a --- /dev/null +++ b/annotations_filtered/rYXDky5UYks_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 36.17], [40.0, 55.32], [57.0, 63.07], [64.0, 64.45], [66.0, 69.2], [74.0, 74.58], [76.0, 89.63], [90.0, 89.87], [90.0, 89.95], [90.0, 101.88], [102.0, 103.72], [104.0, 105.92], [108.0, 110.07], [112.0, 112.45], [116.0, 116.33], [118.0, 118.07], [119.0, 119.11], [120.0, 120.61]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 91.64, 59.96, 0.0, 72.31, 0.0, 34.01, 0.0, 0.0, 47.78, 0.0, 0.0, 97.73, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["hum", 28.44], ["music", 22.92], ["mains hum", 13.03]], null, null, [["music", 66.47], ["squish", 3.03], ["glass", 2.87]], null, null, null, null, null, null, null, null], "duration": [32.17, 15.32, 6.07, 0.45, 3.2, 0.58, 13.63, -0.13, -0.05, 11.88, 1.72, 1.92, 2.07, 0.45, 0.33, 0.07, 0.11, 0.61]} \ No newline at end of file diff --git a/annotations_filtered/rYjtudWe7O0_filtered.json b/annotations_filtered/rYjtudWe7O0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..208e837c1f2579f301a662658295177cc9e56f83 --- /dev/null +++ b/annotations_filtered/rYjtudWe7O0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.94], [13.0, 14.5], [20.0, 22.06], [24.0, 25.61], [29.0, 30.13], [33.0, 41.59], [42.0, 43.5], [44.0, 45.57], [48.0, 56.93], [58.0, 58.45], [58.0, 58.95], [60.0, 62.18], [64.0, 78.26], [79.0, 81.75], [82.0, 83.94], [86.0, 90.07], [94.0, 94.12], [99.0, 99.49], [110.0, 111.99], [115.0, 117.78], [119.0, 120.01], [123.0, 124.07], [125.0, 127.84], [129.0, 129.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.08, 0.0, 0.0, 99.68, 0.0, 0.0, 98.86, 0.0, 0.0, 30.94, 99.82, 99.52, 0.0, 99.88, 0.0, 0.0, 0.0, 99.92, 0.0, 0.0, 98.01, 0.0], "audiomae_on_audioset": [null, null, [["speech", 53.8], ["gunshot, gunfire", 12.06], ["artillery fire", 6.32]], null, null, null, null, null, null, null, null, [["ding", 17.29], ["sound effect", 13.49], ["breaking", 12.79]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.94, 1.5, 2.06, 1.61, 1.13, 8.59, 1.5, 1.57, 8.93, 0.45, 0.95, 2.18, 14.26, 2.75, 1.94, 4.07, 0.12, 0.49, 1.99, 2.78, 1.01, 1.07, 2.84, 0.88]} \ No newline at end of file diff --git a/annotations_filtered/rZ-_UsEBT5E_filtered.json b/annotations_filtered/rZ-_UsEBT5E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..401fca97602ae5fac093e637d1cb6f4f21d7e3f2 --- /dev/null +++ b/annotations_filtered/rZ-_UsEBT5E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.56], [6.0, 10.18], [13.0, 12.9], [17.0, 18.71], [23.0, 25.95], [27.0, 28.56], [30.0, 34.03]], "keep_status": [false, false, false, false, true, false, true], "silence_prob": [77.2, 81.0, 0.0, 0.0, 34.63, 0.0, 39.43], "audiomae_on_audioset": [null, null, null, null, [["mains hum", 21.87], ["hum", 15.97], ["speech", 10.4]], null, [["sine wave", 28.2], ["chirp tone", 9.59], ["tuning fork", 6.76]]], "duration": [2.56, 4.18, -0.1, 1.71, 2.95, 1.56, 4.03]} \ No newline at end of file diff --git a/annotations_filtered/rZlzxsrv4ow_filtered.json b/annotations_filtered/rZlzxsrv4ow_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d0697ed8bdcf57b0596b470b958eed776bbdf483 --- /dev/null +++ b/annotations_filtered/rZlzxsrv4ow_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.53], [20.0, 40.09], [42.0, 72.33], [72.0, 103.44], [105.0, 107.06], [109.0, 112.99], [115.0, 116.48], [117.0, 118.27], [120.0, 121.56]], "keep_status": [false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 35.99, 0.0, 0.0, 35.1, 37.63, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 37.64], ["throbbing", 18.75], ["hum", 12.89]], null, null, [["music", 43.82], ["hum", 17.23], ["throbbing", 13.26]], [["music", 41.64], ["speech", 26.95], ["whack, thwack", 3.39]], null, null, null], "duration": [0.53, 20.09, 30.33, 31.44, 2.06, 3.99, 1.48, 1.27, 1.56]} \ No newline at end of file diff --git a/annotations_filtered/rZpeepxXh7I_filtered.json b/annotations_filtered/rZpeepxXh7I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e1add10aedc242a867bd6301909a3491482c0d6 --- /dev/null +++ b/annotations_filtered/rZpeepxXh7I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.42], [4.0, 7.2], [7.0, 14.27], [17.0, 17.07], [20.0, 23.06], [25.0, 25.42], [28.0, 28.12], [30.0, 30.69], [32.0, 32.9], [35.0, 35.01], [39.0, 41.34], [43.0, 43.56], [45.0, 45.15], [47.0, 51.0], [52.0, 53.74], [56.0, 64.99], [66.0, 66.78], [68.0, 68.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 68.41, 59.51, 0.0, 98.8, 0.0, 0.0, 0.0, 0.0, 0.0, 67.13, 0.0, 0.0, 74.29, 0.0, 33.25, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 16.75], ["explosion", 13.36], ["burst, pop", 9.06]], null, null], "duration": [0.42, 3.2, 7.27, 0.07, 3.06, 0.42, 0.12, 0.69, 0.9, 0.01, 2.34, 0.56, 0.15, 4.0, 1.74, 8.99, 0.78, 0.82]} \ No newline at end of file diff --git a/annotations_filtered/rZs0ZkhzpsI_filtered.json b/annotations_filtered/rZs0ZkhzpsI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..edc6c419c04d21da56967843f42bc915c09bc86a --- /dev/null +++ b/annotations_filtered/rZs0ZkhzpsI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 22.03], [22.0, 25.47], [27.0, 34.2], [36.0, 37.3], [38.0, 38.6], [45.0, 47.75], [53.0, 57.59], [58.0, 60.15], [62.0, 64.69], [66.0, 66.21], [67.0, 68.88], [71.0, 76.01], [76.0, 77.36], [79.0, 84.97], [87.0, 89.04], [94.0, 100.4], [101.0, 103.05], [107.0, 108.57], [109.0, 110.73], [112.0, 113.9], [117.0, 119.79], [121.0, 124.23]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 47.35, 63.64, 0.0, 0.0, 39.37, 98.86, 84.43, 96.77, 0.0, 0.0, 89.9, 0.0, 95.23, 98.27, 98.93, 99.87, 0.0, 0.0, 0.0, 69.88, 68.28], "audiomae_on_audioset": [null, [["music", 10.12], ["speech", 8.05], ["wood", 6.54]], null, null, null, [["speech", 50.52], ["music", 14.22], ["synthesizer", 5.36]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.03, 3.47, 7.2, 1.3, 0.6, 2.75, 4.59, 2.15, 2.69, 0.21, 1.88, 5.01, 1.36, 5.97, 2.04, 6.4, 2.05, 1.57, 1.73, 1.9, 2.79, 3.23]} \ No newline at end of file diff --git a/annotations_filtered/rZsQJGk__DQ_filtered.json b/annotations_filtered/rZsQJGk__DQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ad8a0ffc38d99d4f3fb8690523a45f17aee7584 --- /dev/null +++ b/annotations_filtered/rZsQJGk__DQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.47], [3.0, 3.75], [5.0, 6.03], [9.0, 39.6], [41.0, 60.29], [61.0, 61.8]], "keep_status": [false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 33.49, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 28.31], ["hum", 12.48], ["mains hum", 10.27]], null], "duration": [0.47, 0.75, 1.03, 30.6, 19.29, 0.8]} \ No newline at end of file diff --git a/annotations_filtered/rZuHQ94ES6U_filtered.json b/annotations_filtered/rZuHQ94ES6U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f30372f9e893c0fb8a5fe9c7287d83832e29d05c --- /dev/null +++ b/annotations_filtered/rZuHQ94ES6U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.94], [9.0, 54.31], [57.0, 57.99], [60.0, 59.9], [64.0, 65.03], [67.0, 72.74], [73.0, 74.63], [78.0, 93.87], [101.0, 101.51], [102.0, 102.51]], "keep_status": [false, false, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 42.08, 0.0, 37.17, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 33.88], ["music", 24.13], ["sidetone", 7.57]], null, [["music", 24.32], ["livestock, farm animals, working animals", 23.96], ["cattle, bovinae", 19.63]], null, null], "duration": [0.94, 45.31, 0.99, -0.1, 1.03, 5.74, 1.63, 15.87, 0.51, 0.51]} \ No newline at end of file diff --git a/annotations_filtered/rZyjko9lXo0_filtered.json b/annotations_filtered/rZyjko9lXo0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d19bf08fdfdb0c43955c0f544ec0ee2ae827816 --- /dev/null +++ b/annotations_filtered/rZyjko9lXo0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.59], [24.0, 25.15], [31.0, 33.54], [43.0, 44.27], [47.0, 47.78], [53.0, 55.26], [68.0, 68.98], [75.0, 76.18], [77.0, 78.09], [79.0, 80.59], [84.0, 85.8], [90.0, 91.88], [92.0, 93.26], [98.0, 100.33], [102.0, 102.91], [104.0, 108.9], [112.0, 111.87], [114.0, 114.61], [118.0, 122.59], [129.0, 129.03], [131.0, 132.54], [135.0, 135.48], [137.0, 140.78], [143.0, 146.04], [149.0, 149.4], [150.0, 151.92], [153.0, 156.05], [159.0, 160.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 99.16, 0.0, 0.0, 79.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.91, 0.0, 63.96, 0.0, 0.0, 82.97, 0.0, 0.0, 0.0, 74.6, 49.45, 0.0, 0.0, 89.72, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 26.02], ["throbbing", 12.68], ["music", 10.65]], null, null, null, null], "duration": [0.59, 1.15, 2.54, 1.27, 0.78, 2.26, 0.98, 1.18, 1.09, 1.59, 1.8, 1.88, 1.26, 2.33, 0.91, 4.9, -0.13, 0.61, 4.59, 0.03, 1.54, 0.48, 3.78, 3.04, 0.4, 1.92, 3.05, 1.34]} \ No newline at end of file diff --git a/annotations_filtered/r_3ofu2x8qM_filtered.json b/annotations_filtered/r_3ofu2x8qM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1dfc9c62e11ce199bda64243b76b6a14b5d5a166 --- /dev/null +++ b/annotations_filtered/r_3ofu2x8qM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 23.58], [26.0, 26.55], [30.0, 30.47], [31.0, 31.4], [34.0, 104.4], [105.0, 106.47], [109.0, 109.8], [110.0, 111.54], [112.0, 112.41], [120.0, 129.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.51], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [1.58, 0.55, 0.47, 0.4, 70.4, 1.47, 0.8, 1.54, 0.41, 9.63]} \ No newline at end of file diff --git a/annotations_filtered/r_3r5f1W1Oo_filtered.json b/annotations_filtered/r_3r5f1W1Oo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e4af82c8efbf3ac00f1e0bb6a45b75faf5769b0 --- /dev/null +++ b/annotations_filtered/r_3r5f1W1Oo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.16], [8.0, 9.19], [11.0, 14.27], [22.0, 23.31], [31.0, 40.39], [45.0, 52.66], [64.0, 65.03], [68.0, 75.42], [79.0, 98.52], [99.0, 99.12], [103.0, 102.71], [104.0, 111.86], [114.0, 117.48], [122.0, 122.3], [125.0, 127.26]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 34.83, 0.0, 42.44, 43.77, 0.0, 89.72, 47.9, 0.0, 0.0, 48.87, 37.41, 0.0, 63.1], "audiomae_on_audioset": [null, null, [["music", 60.0], ["speech", 9.65], ["throbbing", 8.07]], null, [["music", 69.91], ["synthesizer", 3.43], ["didgeridoo", 2.72]], [["music", 65.19], ["vibraphone", 5.58], ["glockenspiel", 1.9]], null, null, [["music", 48.14], ["speech", 11.55], ["guitar", 6.72]], null, null, [["music", 65.09], ["didgeridoo", 7.46], ["double bass", 1.94]], [["music", 78.12], ["electronic music", 1.94], ["musical instrument", 1.86]], null, null], "duration": [1.16, 1.19, 3.27, 1.31, 9.39, 7.66, 1.03, 7.42, 19.52, 0.12, -0.29, 7.86, 3.48, 0.3, 2.26]} \ No newline at end of file diff --git a/annotations_filtered/r_9PgiNuwDc_filtered.json b/annotations_filtered/r_9PgiNuwDc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e5bcdd138794cb0c46b5e0bd3fd41da0ffdcecf6 --- /dev/null +++ b/annotations_filtered/r_9PgiNuwDc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.59], [5.0, 4.72], [11.0, 21.39], [22.0, 22.52], [24.0, 24.43], [25.0, 25.64], [26.0, 26.81], [28.0, 27.94], [29.0, 29.67], [37.0, 39.95], [41.0, 41.49], [43.0, 44.71], [48.0, 49.87], [52.0, 53.15], [56.0, 56.54], [58.0, 59.02], [60.0, 61.2], [63.0, 63.09], [66.0, 67.58], [69.0, 70.28], [72.0, 73.35], [75.0, 77.06], [78.0, 80.45], [82.0, 85.73]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.49, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.88, 72.46, 71.0], "audiomae_on_audioset": [null, null, [["noise", 17.73], ["music", 9.71], ["buzz", 8.98]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.59, -0.28, 10.39, 0.52, 0.43, 0.64, 0.81, -0.06, 0.67, 2.95, 0.49, 1.71, 1.87, 1.15, 0.54, 1.02, 1.2, 0.09, 1.58, 1.28, 1.35, 2.06, 2.45, 3.73]} \ No newline at end of file diff --git a/annotations_filtered/r_Bdli4c8TA_filtered.json b/annotations_filtered/r_Bdli4c8TA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..80f55373020912da820fd7ef0d2dee14672a1a56 --- /dev/null +++ b/annotations_filtered/r_Bdli4c8TA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 46.45], [52.0, 53.22], [57.0, 65.94], [67.0, 75.29], [77.0, 83.71], [86.0, 87.66], [95.0, 109.16]], "keep_status": [false, false, true, true, false, false, true], "silence_prob": [0.0, 0.0, 34.45, 34.75, 83.16, 0.0, 36.4], "audiomae_on_audioset": [null, null, [["speech", 55.08], ["music", 8.69], ["vehicle", 6.18]], [["speech", 45.46], ["gunshot, gunfire", 10.82], ["music", 10.43]], null, null, [["music", 57.3], ["gong", 4.42], ["hum", 4.03]]], "duration": [32.45, 1.22, 8.94, 8.29, 6.71, 1.66, 14.16]} \ No newline at end of file diff --git a/annotations_filtered/r_O3k-RpV2c_filtered.json b/annotations_filtered/r_O3k-RpV2c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca594c07ee9b974be5606e741a320bfe5c4d1e68 --- /dev/null +++ b/annotations_filtered/r_O3k-RpV2c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.03], [10.0, 11.82], [14.0, 14.62], [19.0, 20.95], [23.0, 24.04], [25.0, 27.51], [35.0, 39.33], [41.0, 42.3], [44.0, 43.82], [46.0, 50.04]], "keep_status": [false, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 47.66, 37.69, 0.0, 0.0, 31.41], "audiomae_on_audioset": [null, null, null, null, null, [["music", 23.35], ["speech", 21.17], ["electric shaver, electric razor", 8.14]], [["mains hum", 42.01], ["hum", 39.57], ["music", 7.01]], null, null, [["sidetone", 26.52], ["music", 19.71], ["speech", 13.54]]], "duration": [1.03, 1.82, 0.62, 1.95, 1.04, 2.51, 4.33, 1.3, -0.18, 4.04]} \ No newline at end of file diff --git a/annotations_filtered/r_U2p-bdeww_filtered.json b/annotations_filtered/r_U2p-bdeww_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e60ea79c157d5236aca6dc4d916e629716326634 --- /dev/null +++ b/annotations_filtered/r_U2p-bdeww_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.0], [11.0, 11.18], [13.0, 14.5], [18.0, 18.76], [19.0, 20.73], [24.0, 26.96], [33.0, 36.02], [39.0, 43.7], [45.0, 48.59], [54.0, 62.26], [68.0, 81.4], [89.0, 91.44], [100.0, 102.46], [103.0, 104.79], [107.0, 111.05], [116.0, 116.43], [118.0, 118.69], [124.0, 124.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 45.69, 73.51, 33.71, 30.32, 30.42, 29.5, 37.77, 37.45, 0.0, 37.25, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 75.4], ["rumble", 6.63], ["hum", 3.04]], null, [["music", 73.0], ["synthesizer", 6.53], ["drum machine", 4.05]], [["music", 76.53], ["musical instrument", 4.82], ["livestock, farm animals, working animals", 2.76]], [["music", 63.39], ["drum machine", 10.61], ["musical instrument", 5.78]], [["music", 75.15], ["hum", 2.94], ["synthesizer", 2.66]], [["music", 56.0], ["speech", 13.36], ["musical instrument", 2.56]], [["mains hum", 34.04], ["hum", 29.76], ["speech", 10.41]], null, [["hum", 39.84], ["mains hum", 17.94], ["noise", 13.75]], null, null, null], "duration": [0.0, 0.18, 1.5, 0.76, 1.73, 2.96, 3.02, 4.7, 3.59, 8.26, 13.4, 2.44, 2.46, 1.79, 4.05, 0.43, 0.69, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/r_a34DBcwCE_filtered.json b/annotations_filtered/r_a34DBcwCE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..239e3cbcca3722be7bf6736a7e0dfb79dc9c225a --- /dev/null +++ b/annotations_filtered/r_a34DBcwCE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.8], [2.0, 6.64], [8.0, 31.33], [34.0, 35.45], [39.0, 40.19], [41.0, 41.1], [42.0, 42.26], [47.0, 47.38], [49.0, 49.54], [50.0, 51.27], [52.0, 53.86], [55.0, 56.35], [57.0, 58.04], [61.0, 60.81], [62.0, 62.73], [64.0, 64.84], [85.0, 85.48], [86.0, 86.71], [89.0, 89.92], [94.0, 94.78], [96.0, 102.17], [104.0, 104.7], [105.0, 105.7], [107.0, 107.2], [108.0, 108.38], [113.0, 113.1], [119.0, 121.49], [123.0, 123.84]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 50.31, 43.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.94, 0.0, 0.0, 0.0, 0.0, 0.0, 48.23, 0.0], "audiomae_on_audioset": [null, null, [["speech", 26.0], ["sidetone", 16.3], ["radio", 11.5]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["gong", 74.36], ["music", 3.66], ["eruption", 2.25]], null, null, null, null, null, [["music", 48.86], ["theremin", 24.55], ["musical instrument", 2.72]], null], "duration": [0.8, 4.64, 23.33, 1.45, 1.19, 0.1, 0.26, 0.38, 0.54, 1.27, 1.86, 1.35, 1.04, -0.19, 0.73, 0.84, 0.48, 0.71, 0.92, 0.78, 6.17, 0.7, 0.7, 0.2, 0.38, 0.1, 2.49, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/r_ckU9PkTbM_filtered.json b/annotations_filtered/r_ckU9PkTbM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..416bef00fc88e38ea267fafc8d5ea082da17402a --- /dev/null +++ b/annotations_filtered/r_ckU9PkTbM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.14], [13.0, 14.67], [21.0, 21.37], [22.0, 21.96], [23.0, 24.7], [26.0, 26.18], [28.0, 28.8], [31.0, 31.67], [34.0, 34.3], [36.0, 37.22], [37.0, 37.99], [47.0, 49.11], [55.0, 55.83], [57.0, 56.86], [59.0, 59.81], [61.0, 64.89], [65.0, 66.93], [72.0, 71.9], [73.0, 74.04], [78.0, 78.71], [79.0, 80.15], [81.0, 81.14], [82.0, 82.51], [83.0, 83.84], [87.0, 88.25], [89.0, 96.96], [97.0, 115.13], [116.0, 118.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.93, 0.0, 0.0, 0.0, 99.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.72, 53.78, 68.41], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 37.1], ["music", 10.44], ["buzz", 7.6]], null, null], "duration": [0.14, 1.67, 0.37, -0.04, 1.7, 0.18, 0.8, 0.67, 0.3, 1.22, 0.99, 2.11, 0.83, -0.14, 0.81, 3.89, 1.93, -0.1, 1.04, 0.71, 1.15, 0.14, 0.51, 0.84, 1.25, 7.96, 18.13, 2.61]} \ No newline at end of file diff --git a/annotations_filtered/r_tl6PA-Rd4_filtered.json b/annotations_filtered/r_tl6PA-Rd4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c326956edef9238d66673bf87bb0ae9bb9e8a76 --- /dev/null +++ b/annotations_filtered/r_tl6PA-Rd4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.85], [3.0, 2.73], [4.0, 7.2], [8.0, 8.51], [14.0, 15.82], [20.0, 20.24], [21.0, 23.04], [24.0, 24.68], [26.0, 26.81], [29.0, 30.2], [31.0, 33.61], [37.0, 39.85], [43.0, 43.7], [44.0, 47.75], [50.0, 51.09], [54.0, 54.73], [57.0, 57.65], [59.0, 61.06], [63.0, 63.42], [64.0, 69.26], [70.0, 69.77], [70.0, 86.44], [88.0, 88.38], [95.0, 100.45], [105.0, 105.66], [108.0, 108.62], [109.0, 109.34], [110.0, 111.11], [113.0, 114.62], [115.0, 119.64], [122.0, 122.71]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 46.5, 0.0, 0.0, 0.0, 53.59, 0.0, 0.0, 0.0, 48.52, 45.24, 0.0, 32.22, 0.0, 0.0, 0.0, 30.05, 0.0, 31.55, 0.0, 31.18, 0.0, 50.76, 0.0, 0.0, 0.0, 0.0, 0.0, 49.73, 0.0], "audiomae_on_audioset": [null, null, [["music", 33.21], ["didgeridoo", 21.21], ["theremin", 8.0]], null, null, null, null, null, null, null, [["music", 49.93], ["didgeridoo", 29.12], ["musical instrument", 2.96]], [["music", 9.91], ["animal", 5.62], ["dog", 5.04]], null, [["music", 65.63], ["speech", 15.57], ["musical instrument", 2.9]], null, null, null, [["music", 69.56], ["musical instrument", 4.34], ["carnatic music", 3.73]], null, [["music", 55.38], ["brass instrument", 11.42], ["musical instrument", 7.11]], null, [["music", 64.21], ["effects unit", 2.26], ["didgeridoo", 2.17]], null, null, null, null, null, null, null, [["bee, wasp, etc.", 24.5], ["speech", 23.42], ["fly, housefly", 20.7]], null], "duration": [-0.15, -0.27, 3.2, 0.51, 1.82, 0.24, 2.04, 0.68, 0.81, 1.2, 2.61, 2.85, 0.7, 3.75, 1.09, 0.73, 0.65, 2.06, 0.42, 5.26, -0.23, 16.44, 0.38, 5.45, 0.66, 0.62, 0.34, 1.11, 1.62, 4.64, 0.71]} \ No newline at end of file diff --git a/annotations_filtered/ra42YS4NRlY_filtered.json b/annotations_filtered/ra42YS4NRlY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..59bc49d0d5a82843a8d5bdea2b81c1c5e9b3e3b7 --- /dev/null +++ b/annotations_filtered/ra42YS4NRlY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.78], [6.0, 6.49], [8.0, 7.7], [8.0, 15.09], [23.0, 27.46], [40.0, 40.96], [47.0, 46.89], [49.0, 50.5], [52.0, 52.69], [59.0, 58.89], [60.0, 61.28], [65.0, 65.47], [73.0, 76.65], [77.0, 77.23], [79.0, 81.95], [84.0, 84.5], [87.0, 90.61], [96.0, 96.87], [97.0, 98.68], [99.0, 99.69], [100.0, 100.75], [101.0, 101.61], [106.0, 118.37], [119.0, 123.96], [127.0, 127.14], [129.0, 131.77], [135.0, 135.75]], "keep_status": [false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [54.5, 0.0, 0.0, 40.17, 34.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.37, 0.0, 41.3, 0.0, 32.88, 0.0, 0.0, 0.0, 0.0, 0.0, 40.75, 32.45, 0.0, 37.3, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 40.47], ["bass guitar", 8.63], ["hum", 6.35]], [["music", 21.7], ["hum", 19.6], ["mains hum", 16.35]], null, null, null, null, null, null, null, [["music", 64.35], ["musical instrument", 4.87], ["didgeridoo", 4.75]], null, [["music", 49.5], ["speech", 32.98], ["explosion", 1.6]], null, [["music", 62.07], ["hum", 5.83], ["throbbing", 5.15]], null, null, null, null, null, [["music", 32.71], ["speech", 12.53], ["hum", 10.19]], [["speech", 44.92], ["music", 28.39], ["boing", 8.01]], null, [["hum", 30.02], ["speech", 17.29], ["music", 14.79]], null], "duration": [2.78, 0.49, -0.3, 7.09, 4.46, 0.96, -0.11, 1.5, 0.69, -0.11, 1.28, 0.47, 3.65, 0.23, 2.95, 0.5, 3.61, 0.87, 1.68, 0.69, 0.75, 0.61, 12.37, 4.96, 0.14, 2.77, 0.75]} \ No newline at end of file diff --git a/annotations_filtered/ra9UQb-OVqQ_filtered.json b/annotations_filtered/ra9UQb-OVqQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb1b419207e0aa81850985644bb51acbe87772a4 --- /dev/null +++ b/annotations_filtered/ra9UQb-OVqQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.87], [10.0, 16.88], [22.0, 21.84], [23.0, 23.5], [24.0, 29.86], [31.0, 30.75], [38.0, 41.81], [48.0, 51.61], [53.0, 55.59], [58.0, 61.08], [62.0, 62.95], [66.0, 68.45], [77.0, 77.95]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, true, false], "silence_prob": [34.28, 36.15, 0.0, 0.0, 31.04, 0.0, 33.79, 34.65, 94.22, 46.12, 0.0, 48.65, 0.0], "audiomae_on_audioset": [[["music", 40.28], ["speech", 29.37], ["busy signal", 2.56]], [["music", 53.15], ["speech", 17.1], ["throbbing", 2.56]], null, null, [["music", 52.91], ["speech", 24.68], ["boing", 3.22]], null, [["music", 24.99], ["hum", 16.15], ["mains hum", 10.17]], [["music", 53.55], ["throbbing", 13.4], ["hum", 12.5]], null, [["thunk", 38.05], ["arrow", 29.26], ["animal", 2.88]], null, [["music", 40.8], ["animal", 8.2], ["livestock, farm animals, working animals", 7.64]], null], "duration": [4.87, 6.88, -0.16, 0.5, 5.86, -0.25, 3.81, 3.61, 2.59, 3.08, 0.95, 2.45, 0.95]} \ No newline at end of file diff --git a/annotations_filtered/raDWhK7iSqU_filtered.json b/annotations_filtered/raDWhK7iSqU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..463a145617ebbbe425141dae61b6c14a69ae7144 --- /dev/null +++ b/annotations_filtered/raDWhK7iSqU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 11.67], [14.0, 22.77], [33.0, 32.9], [33.0, 34.28], [35.0, 35.77], [37.0, 47.71], [50.0, 52.17], [59.0, 59.31], [60.0, 62.23], [68.0, 79.32], [79.0, 81.63], [83.0, 84.08], [92.0, 96.04], [97.0, 97.02], [98.0, 99.55], [102.0, 102.61], [103.0, 124.82], [132.0, 151.97], [153.0, 153.54], [154.0, 154.7]], "keep_status": [true, false, false, false, false, false, true, false, true, true, true, false, true, false, false, false, false, false, false, false], "silence_prob": [35.28, 35.65, 0.0, 0.0, 0.0, 35.47, 33.07, 0.0, 35.67, 35.18, 33.81, 0.0, 42.79, 0.0, 0.0, 0.0, 34.05, 35.56, 0.0, 0.0], "audiomae_on_audioset": [[["music", 15.24], ["mosquito", 13.2], ["fly, housefly", 10.75]], [["music", 67.48], ["animal", 4.96], ["quack", 2.07]], null, null, null, [["speech", 30.97], ["music", 23.19], ["groan", 16.47]], [["hum", 41.25], ["throbbing", 20.79], ["noise", 5.78]], null, [["music", 28.68], ["groan", 14.52], ["didgeridoo", 9.54]], [["music", 33.21], ["fly, housefly", 8.99], ["moo", 6.36]], [["fly, housefly", 31.21], ["insect", 11.02], ["music", 9.59]], null, [["theremin", 39.08], ["music", 13.45], ["speech", 7.53]], null, null, null, [["music", 58.33], ["didgeridoo", 9.29], ["insect", 4.63]], [["music", 66.08], ["sonar", 16.94], ["didgeridoo", 2.24]], null, null], "duration": [4.67, 8.77, -0.1, 1.28, 0.77, 10.71, 2.17, 0.31, 2.23, 11.32, 2.63, 1.08, 4.04, 0.02, 1.55, 0.61, 21.82, 19.97, 0.54, 0.7]} \ No newline at end of file diff --git a/annotations_filtered/raIdZiSZ970_filtered.json b/annotations_filtered/raIdZiSZ970_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fadac450732616f1393fd9077060b005d73245ff --- /dev/null +++ b/annotations_filtered/raIdZiSZ970_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 28.49], [29.0, 30.06], [32.0, 32.71], [34.0, 35.06], [37.0, 39.92], [44.0, 44.25], [46.0, 46.25], [48.0, 48.56], [50.0, 50.55], [51.0, 52.14], [53.0, 54.53], [55.0, 55.92], [59.0, 65.31], [66.0, 74.19], [76.0, 76.47], [79.0, 87.37], [90.0, 90.14], [91.0, 91.37], [92.0, 92.35], [95.0, 97.78], [98.0, 98.61], [99.0, 99.79], [101.0, 101.14], [105.0, 104.87], [105.0, 107.97], [109.0, 109.68], [110.0, 110.74], [112.0, 112.04], [115.0, 115.69]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, true, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.31, 33.37, 0.0, 39.8, 0.0, 0.0, 0.0, 34.58, 0.0, 0.0, 0.0, 0.0, 35.32, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 47.44], ["baby laughter", 10.61], ["laughter", 8.73]], null, null, null, null, null, null, null, [["music", 40.73], ["didgeridoo", 13.87], ["synthesizer", 6.74]], [["speech", 16.15], ["music", 14.21], ["whack, thwack", 5.48]], null, [["speech", 30.59], ["cattle, bovinae", 10.86], ["livestock, farm animals, working animals", 8.77]], null, null, null, [["cattle, bovinae", 40.22], ["moo", 26.05], ["speech", 9.61]], null, null, null, null, [["livestock, farm animals, working animals", 48.44], ["cattle, bovinae", 20.65], ["moo", 11.92]], null, null, null, null], "duration": [0.49, 1.06, 0.71, 1.06, 2.92, 0.25, 0.25, 0.56, 0.55, 1.14, 1.53, 0.92, 6.31, 8.19, 0.47, 8.37, 0.14, 0.37, 0.35, 2.78, 0.61, 0.79, 0.14, -0.13, 2.97, 0.68, 0.74, 0.04, 0.69]} \ No newline at end of file diff --git a/annotations_filtered/raM63LAHuwo_filtered.json b/annotations_filtered/raM63LAHuwo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0cf627c1076824bf396a08966a7982e513d3c08c --- /dev/null +++ b/annotations_filtered/raM63LAHuwo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.08], [5.0, 7.3], [10.0, 11.1], [14.0, 19.09], [20.0, 22.2], [23.0, 23.46], [25.0, 31.33], [31.0, 32.8], [35.0, 35.87], [37.0, 38.11], [40.0, 40.78], [44.0, 45.0], [48.0, 49.01], [51.0, 51.44], [52.0, 52.74], [54.0, 56.4], [58.0, 68.59], [70.0, 74.82], [76.0, 79.05], [79.0, 85.06], [85.0, 89.5], [91.0, 91.69], [93.0, 93.29], [94.0, 95.98], [97.0, 97.46], [98.0, 98.52], [100.0, 100.75], [107.0, 107.22], [110.0, 111.03], [112.0, 112.89], [113.0, 113.95], [115.0, 115.65], [118.0, 118.81], [120.0, 145.15], [147.0, 148.93], [151.0, 162.53], [165.0, 164.86], [166.0, 175.29], [176.0, 176.54], [177.0, 177.77], [178.0, 178.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 94.52, 0.0, 97.92, 99.96, 0.0, 95.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.37, 94.95, 83.34, 98.36, 86.82, 71.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 51.28, 0.0, 50.91, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.08, 2.3, 1.1, 5.09, 2.2, 0.46, 6.33, 1.8, 0.87, 1.11, 0.78, 1.0, 1.01, 0.44, 0.74, 2.4, 10.59, 4.82, 3.05, 6.06, 4.5, 0.69, 0.29, 1.98, 0.46, 0.52, 0.75, 0.22, 1.03, 0.89, 0.95, 0.65, 0.81, 25.15, 1.93, 11.53, -0.14, 9.29, 0.54, 0.77, 0.12]} \ No newline at end of file diff --git a/annotations_filtered/raSWINBYtuc_filtered.json b/annotations_filtered/raSWINBYtuc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..088a863688a7557b0320d4fc2458b68d8310ac53 --- /dev/null +++ b/annotations_filtered/raSWINBYtuc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 31.87], [33.0, 33.81], [44.0, 45.25], [52.0, 52.37], [54.0, 54.14], [56.0, 56.27], [60.0, 76.77], [79.0, 82.46], [83.0, 84.81], [86.0, 118.5], [119.0, 119.87], [121.0, 124.34], [130.0, 131.38], [134.0, 148.12], [149.0, 149.17], [151.0, 150.99], [158.0, 158.31], [163.0, 164.17], [165.0, 166.5], [172.0, 173.37]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [30.52, 0.0, 0.0, 0.0, 0.0, 0.0, 29.65, 28.98, 0.0, 0.0, 0.0, 31.05, 0.0, 32.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["throbbing", 39.19], ["hum", 25.86], ["music", 21.01]], null, null, null, null, null, [["music", 36.46], ["throbbing", 23.47], ["hum", 15.81]], [["music", 24.94], ["speech", 23.86], ["explosion", 17.8]], null, null, null, [["music", 44.47], ["mains hum", 10.47], ["didgeridoo", 7.43]], null, [["hum", 48.7], ["mains hum", 42.09], ["buzz", 3.17]], null, null, null, null, null, null], "duration": [15.87, 0.81, 1.25, 0.37, 0.14, 0.27, 16.77, 3.46, 1.81, 32.5, 0.87, 3.34, 1.38, 14.12, 0.17, -0.01, 0.31, 1.17, 1.5, 1.37]} \ No newline at end of file diff --git a/annotations_filtered/raVKed5rdgM_filtered.json b/annotations_filtered/raVKed5rdgM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e3c4ba90180f3cffefde98d359fb6563a6dc3cdd --- /dev/null +++ b/annotations_filtered/raVKed5rdgM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.17], [34.0, 35.33], [38.0, 39.09], [40.0, 40.36], [52.0, 54.33], [63.0, 65.91], [72.0, 72.22], [84.0, 86.02], [88.0, 88.91], [89.0, 90.26], [91.0, 93.21], [95.0, 96.38], [97.0, 99.64], [100.0, 115.26]], "keep_status": [false, false, false, false, true, false, false, true, false, false, true, false, false, true], "silence_prob": [56.4, 0.0, 0.0, 0.0, 40.5, 36.31, 0.0, 31.04, 0.0, 0.0, 48.74, 0.0, 68.41, 43.13], "audiomae_on_audioset": [null, null, null, null, [["speech", 26.23], ["sidetone", 20.57], ["throbbing", 5.4]], [["hum", 38.48], ["mains hum", 26.97], ["music", 9.11]], null, [["speech", 19.73], ["clip-clop", 11.46], ["horse", 11.09]], null, null, [["noise", 24.55], ["crushing", 16.55], ["thunk", 9.32]], null, null, [["speech", 37.74], ["music", 18.05], ["electric shaver, electric razor", 4.83]]], "duration": [2.17, 1.33, 1.09, 0.36, 2.33, 2.91, 0.22, 2.02, 0.91, 1.26, 2.21, 1.38, 2.64, 15.26]} \ No newline at end of file diff --git a/annotations_filtered/rbFIs5-Rn_Y_filtered.json b/annotations_filtered/rbFIs5-Rn_Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4704bd22330676ce323d11f979684e77384ce1de --- /dev/null +++ b/annotations_filtered/rbFIs5-Rn_Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 2.02], [4.0, 5.29], [8.0, 9.98], [11.0, 14.0], [16.0, 17.95], [18.0, 19.7], [21.0, 22.33], [23.0, 24.68], [25.0, 32.21], [34.0, 37.62], [40.0, 43.85], [46.0, 47.34], [50.0, 50.82], [54.0, 55.26], [62.0, 63.69], [66.0, 67.63], [70.0, 70.92], [72.0, 73.28], [74.0, 75.24], [76.0, 76.54], [77.0, 78.56], [79.0, 79.52], [83.0, 84.6], [87.0, 88.01], [91.0, 92.84], [93.0, 92.92], [93.0, 93.06], [94.0, 94.88], [100.0, 100.74], [103.0, 104.19], [105.0, 106.39], [108.0, 108.46], [111.0, 110.91], [115.0, 122.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [93.29, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 86.82, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.02, 1.29, 1.98, 3.0, 1.95, 1.7, 1.33, 1.68, 7.21, 3.62, 3.85, 1.34, 0.82, 1.26, 1.69, 1.63, 0.92, 1.28, 1.24, 0.54, 1.56, 0.52, 1.6, 1.01, 1.84, -0.08, 0.06, 0.88, 0.74, 1.19, 1.39, 0.46, -0.09, 7.84]} \ No newline at end of file diff --git a/annotations_filtered/rbYJb_i2czc_filtered.json b/annotations_filtered/rbYJb_i2czc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f493d2425f651fd91e9771ce892001cbaf89f649 --- /dev/null +++ b/annotations_filtered/rbYJb_i2czc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.85], [24.0, 25.51], [26.0, 28.43], [34.0, 46.47], [47.0, 47.65], [56.0, 55.92], [57.0, 69.72], [71.0, 71.56], [76.0, 77.89], [79.0, 80.5], [81.0, 87.72], [89.0, 90.69]], "keep_status": [false, false, false, false, false, false, true, false, false, false, true, false], "silence_prob": [0.0, 0.0, 29.42, 30.06, 0.0, 0.0, 30.72, 0.0, 0.0, 0.0, 39.72, 0.0], "audiomae_on_audioset": [null, null, [["music", 33.66], ["hum", 26.0], ["mains hum", 19.21]], [["music", 54.68], ["throbbing", 24.99], ["hum", 8.42]], null, null, [["speech", 20.51], ["thump, thud", 15.29], ["music", 13.4]], null, null, null, [["hum", 31.37], ["speech", 18.7], ["music", 15.32]], null], "duration": [1.85, 1.51, 2.43, 12.47, 0.65, -0.08, 12.72, 0.56, 1.89, 1.5, 6.72, 1.69]} \ No newline at end of file diff --git a/annotations_filtered/rba9NiqG9PI_filtered.json b/annotations_filtered/rba9NiqG9PI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/rba9NiqG9PI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/rbhNKSWKWwU_filtered.json b/annotations_filtered/rbhNKSWKWwU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fddce614a447c49650d76419aedce21bfb71397a --- /dev/null +++ b/annotations_filtered/rbhNKSWKWwU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.37], [8.0, 10.76], [19.0, 19.4], [32.0, 32.17], [56.0, 56.19], [57.0, 61.7], [63.0, 71.07], [73.0, 73.52], [77.0, 78.58], [87.0, 93.6], [108.0, 110.15], [117.0, 118.54], [120.0, 121.44], [124.0, 128.58], [130.0, 129.73], [142.0, 149.35], [152.0, 153.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false], "silence_prob": [45.92, 82.25, 0.0, 0.0, 0.0, 31.54, 38.7, 0.0, 0.0, 46.12, 31.99, 0.0, 0.0, 31.16, 0.0, 28.73, 0.0], "audiomae_on_audioset": [[["chirp tone", 44.59], ["sine wave", 29.59], ["hum", 7.29]], null, null, null, null, [["music", 71.01], ["speech", 12.62], ["musical instrument", 3.36]], [["chirp tone", 33.98], ["busy signal", 31.48], ["sine wave", 21.35]], null, null, [["chirp tone", 48.19], ["sine wave", 18.68], ["speech", 6.24]], [["speech", 46.24], ["whale vocalization", 10.09], ["hum", 5.71]], null, null, [["speech", 37.67], ["music", 27.12], ["didgeridoo", 6.86]], null, [["speech", 27.59], ["music", 13.04], ["sound effect", 8.09]], null], "duration": [4.37, 2.76, 0.4, 0.17, 0.19, 4.7, 8.07, 0.52, 1.58, 6.6, 2.15, 1.54, 1.44, 4.58, -0.27, 7.35, 1.15]} \ No newline at end of file diff --git a/annotations_filtered/rbrIQjVNl0E_filtered.json b/annotations_filtered/rbrIQjVNl0E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2dacc2e2e1da8a2792ee72d2b302c00e03379732 --- /dev/null +++ b/annotations_filtered/rbrIQjVNl0E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.87], [7.0, 7.57], [10.0, 18.01], [23.0, 23.82], [26.0, 34.45], [36.0, 36.59], [37.0, 38.1], [41.0, 41.47], [42.0, 89.43], [91.0, 93.28], [99.0, 99.64], [102.0, 111.0], [119.0, 132.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 29.88, 0.0, 29.75, 0.0, 0.0, 0.0, 0.0, 30.0, 0.0, 31.62, 30.88], "audiomae_on_audioset": [null, null, [["music", 61.15], ["throbbing", 6.42], ["sidetone", 5.97]], null, [["speech", 40.4], ["music", 33.59], ["throbbing", 6.51]], null, null, null, null, [["music", 35.57], ["didgeridoo", 25.45], ["speech", 10.62]], null, [["music", 38.5], ["hum", 23.34], ["throbbing", 10.46]], [["music", 45.3], ["hum", 20.59], ["mains hum", 8.48]]], "duration": [-0.13, 0.57, 8.01, 0.82, 8.45, 0.59, 1.1, 0.47, 47.43, 2.28, 0.64, 9.0, 13.88]} \ No newline at end of file diff --git a/annotations_filtered/rbsrjcXynlg_filtered.json b/annotations_filtered/rbsrjcXynlg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e71fe658c4476dc1ba283dfebbf2f61088bde695 --- /dev/null +++ b/annotations_filtered/rbsrjcXynlg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.62], [11.0, 12.26], [13.0, 13.24], [18.0, 22.77], [25.0, 32.76]], "keep_status": [false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 29.23, 31.09], "audiomae_on_audioset": [null, null, null, [["speech", 28.12], ["music", 18.83], ["whale vocalization", 7.32]], [["livestock, farm animals, working animals", 43.34], ["cattle, bovinae", 25.49], ["moo", 8.6]]], "duration": [0.62, 1.26, 0.24, 4.77, 7.76]} \ No newline at end of file diff --git a/annotations_filtered/rcA0MBnPPM8_filtered.json b/annotations_filtered/rcA0MBnPPM8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e5d10a77b6e74be3b0428c36cfd566498f9e61e9 --- /dev/null +++ b/annotations_filtered/rcA0MBnPPM8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.55], [18.0, 22.92], [27.0, 27.75], [35.0, 36.21], [49.0, 55.83]], "keep_status": [false, false, false, false, false], "silence_prob": [33.67, 36.22, 0.0, 0.0, 35.54], "audiomae_on_audioset": [[["music", 60.35], ["didgeridoo", 10.83], ["speech", 4.94]], [["music", 50.67], ["speech", 10.67], ["didgeridoo", 8.77]], null, null, [["music", 56.07], ["didgeridoo", 10.2], ["speech", 9.34]]], "duration": [3.55, 4.92, 0.75, 1.21, 6.83]} \ No newline at end of file diff --git a/annotations_filtered/rcIfzdLjjxU_filtered.json b/annotations_filtered/rcIfzdLjjxU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..615ecfd5b337268ca9cdb0c623d47d48bf201bef --- /dev/null +++ b/annotations_filtered/rcIfzdLjjxU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.56], [10.0, 10.89], [11.0, 15.92], [18.0, 18.44], [19.0, 25.51], [27.0, 28.43], [29.0, 32.56], [36.0, 39.26], [40.0, 46.3], [49.0, 49.62], [52.0, 53.35], [55.0, 56.05], [58.0, 59.51], [61.0, 62.06], [63.0, 64.79], [66.0, 67.27], [69.0, 70.16], [72.0, 72.2], [76.0, 76.0], [79.0, 79.27], [79.0, 79.51], [81.0, 81.67], [83.0, 83.29], [86.0, 87.56], [89.0, 92.2], [92.0, 95.81], [97.0, 97.73], [99.0, 99.37], [102.0, 102.25], [103.0, 103.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 35.08, 0.0, 47.31, 0.0, 95.23, 44.6, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.01, 49.36, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["sidetone", 47.8], ["music", 21.99], ["speech", 10.24]], null, [["hum", 28.03], ["throbbing", 26.38], ["music", 16.64]], null, null, [["speech", 66.34], ["hum", 2.99], ["outside, rural or natural", 2.85]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 61.11], ["mains hum", 10.51], ["throbbing", 10.04]], null, null, null, null], "duration": [0.56, 0.89, 4.92, 0.44, 6.51, 1.43, 3.56, 3.26, 6.3, 0.62, 1.35, 1.05, 1.51, 1.06, 1.79, 1.27, 1.16, 0.2, 0.0, 0.27, 0.51, 0.67, 0.29, 1.56, 3.2, 3.81, 0.73, 0.37, 0.25, 0.54]} \ No newline at end of file diff --git a/annotations_filtered/rcJ5q5BdJi4_filtered.json b/annotations_filtered/rcJ5q5BdJi4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f65a1e360545a004c515140de5b45044174977ed --- /dev/null +++ b/annotations_filtered/rcJ5q5BdJi4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.43], [8.0, 9.24], [13.0, 14.71], [15.0, 17.27], [21.0, 22.74], [23.0, 25.69], [31.0, 32.05], [34.0, 35.28], [39.0, 40.17], [45.0, 45.69], [46.0, 48.02], [50.0, 52.37], [54.0, 54.36], [65.0, 67.41], [69.0, 71.14], [72.0, 74.58], [89.0, 91.2], [93.0, 94.04], [95.0, 95.77], [97.0, 99.06], [100.0, 100.79], [105.0, 106.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, false, true, true, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 44.26, 0.0, 65.44, 0.0, 0.0, 0.0, 0.0, 41.22, 43.38, 0.0, 42.53, 37.66, 37.17, 49.22, 0.0, 0.0, 40.54, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 83.3], ["mechanical fan", 1.63], ["hum", 1.58]], null, null, null, null, null, null, [["hum", 28.56], ["speech", 18.91], ["mains hum", 14.8]], [["noise", 19.42], ["hum", 13.32], ["cacophony", 4.85]], null, [["hum", 24.63], ["throbbing", 10.06], ["mains hum", 9.19]], [["hum", 22.24], ["throbbing", 6.81], ["music", 6.68]], [["music", 18.2], ["synthesizer", 12.07], ["hum", 11.7]], [["speech", 59.65], ["hum", 7.24], ["music", 6.08]], null, null, [["hum", 28.07], ["speech", 18.67], ["throbbing", 14.18]], null, null], "duration": [1.43, 1.24, 1.71, 2.27, 1.74, 2.69, 1.05, 1.28, 1.17, 0.69, 2.02, 2.37, 0.36, 2.41, 2.14, 2.58, 2.2, 1.04, 0.77, 2.06, 0.79, 1.29]} \ No newline at end of file diff --git a/annotations_filtered/rcgygxfcywM_filtered.json b/annotations_filtered/rcgygxfcywM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7374a34dab525fefb4eab19582b9764ce8f02fd6 --- /dev/null +++ b/annotations_filtered/rcgygxfcywM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.5], [7.0, 15.33], [16.0, 31.23], [31.0, 33.34], [35.0, 35.09], [37.0, 62.72], [67.0, 87.54], [93.0, 96.28]], "keep_status": [false, true, true, true, false, true, true, false], "silence_prob": [0.0, 30.83, 31.96, 37.05, 0.0, 32.33, 44.26, 39.78], "audiomae_on_audioset": [null, [["fly, housefly", 22.38], ["music", 15.86], ["buzz", 15.53]], [["music", 29.76], ["livestock, farm animals, working animals", 14.21], ["cattle, bovinae", 9.47]], [["music", 45.59], ["speech", 9.92], ["theremin", 2.48]], null, [["music", 60.61], ["smash, crash", 3.69], ["speech", 3.4]], [["hum", 14.12], ["mains hum", 13.87], ["music", 10.8]], [["music", 75.29], ["musical instrument", 3.65], ["guitar", 2.81]]], "duration": [0.5, 8.33, 15.23, 2.34, 0.09, 25.72, 20.54, 3.28]} \ No newline at end of file diff --git a/annotations_filtered/rcjujixxfdY_filtered.json b/annotations_filtered/rcjujixxfdY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7432065cc1b98965ba58d3713e2910af670b43d6 --- /dev/null +++ b/annotations_filtered/rcjujixxfdY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.63], [10.0, 11.58], [13.0, 13.96], [27.0, 31.41], [34.0, 35.92], [36.0, 37.3], [42.0, 42.6], [45.0, 46.62], [49.0, 49.4], [52.0, 52.44], [53.0, 53.67], [57.0, 58.06], [63.0, 63.34], [65.0, 67.02], [69.0, 69.94], [71.0, 72.2]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.41, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.57, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 28.4], ["music", 18.25], ["knock", 12.46]], null, null, null, null, null, null, null, null, null, [["music", 55.04], ["synthesizer", 2.36], ["speech", 2.11]], null, null], "duration": [0.63, 1.58, 0.96, 4.41, 1.92, 1.3, 0.6, 1.62, 0.4, 0.44, 0.67, 1.06, 0.34, 2.02, 0.94, 1.2]} \ No newline at end of file diff --git a/annotations_filtered/rczP7CJB4Hs_filtered.json b/annotations_filtered/rczP7CJB4Hs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af285f03f218a71630dcecd57760e81635c7d3b5 --- /dev/null +++ b/annotations_filtered/rczP7CJB4Hs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.89], [20.0, 21.0], [69.0, 69.13], [79.0, 79.78], [86.0, 86.66], [105.0, 105.61]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [-0.11, 1.0, 0.13, 0.78, 0.66, 0.61]} \ No newline at end of file diff --git a/annotations_filtered/rd8JDPjEoE0_filtered.json b/annotations_filtered/rd8JDPjEoE0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..087ed14d1e2cc1f398e2c414800348665722212e --- /dev/null +++ b/annotations_filtered/rd8JDPjEoE0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.57], [4.0, 8.63], [11.0, 18.76], [20.0, 61.16], [64.0, 88.7], [93.0, 105.36], [107.0, 109.93], [115.0, 150.06], [151.0, 152.66], [153.0, 161.57], [164.0, 175.53]], "keep_status": [false, true, true, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 28.68, 29.98, 0.0, 28.48, 32.86, 30.37, 0.0, 0.0, 65.79, 56.78], "audiomae_on_audioset": [null, [["speech", 57.99], ["vehicle", 8.59], ["car", 3.24]], [["speech", 33.63], ["hum", 23.96], ["music", 11.62]], null, [["speech", 19.17], ["music", 15.77], ["vehicle", 5.7]], [["music", 37.86], ["hum", 29.85], ["mains hum", 16.28]], [["music", 35.66], ["hum", 11.95], ["scary music", 10.51]], null, null, null, null], "duration": [0.57, 4.63, 7.76, 41.16, 24.7, 12.36, 2.93, 35.06, 1.66, 8.57, 11.53]} \ No newline at end of file diff --git a/annotations_filtered/rdEbjNy5BNs_filtered.json b/annotations_filtered/rdEbjNy5BNs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7667d9870a1bd73bc5e4c0b8c4df7461ae3df4b --- /dev/null +++ b/annotations_filtered/rdEbjNy5BNs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.38], [3.0, 2.98], [5.0, 5.63], [7.0, 7.21], [9.0, 14.71], [16.0, 15.96], [17.0, 18.08], [18.0, 21.64], [24.0, 24.36], [27.0, 27.23], [28.0, 27.95], [31.0, 32.16], [36.0, 37.12], [38.0, 49.81], [51.0, 127.62], [129.0, 131.43], [133.0, 139.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 50.97, 0.0, 0.0, 68.93, 0.0, 0.0, 0.0, 0.0, 0.0, 99.21, 0.0, 32.21, 31.57], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 49.91], ["music", 13.92], ["boing", 2.28]], [["music", 31.95], ["didgeridoo", 11.19], ["cattle, bovinae", 3.33]]], "duration": [0.38, -0.02, 0.63, 0.21, 5.71, -0.04, 1.08, 3.64, 0.36, 0.23, -0.05, 1.16, 1.12, 11.81, 76.62, 2.43, 6.73]} \ No newline at end of file diff --git a/annotations_filtered/rdWIo5R10CM_filtered.json b/annotations_filtered/rdWIo5R10CM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4567c4d28cd345645ec095c09cf50fb1593191a0 --- /dev/null +++ b/annotations_filtered/rdWIo5R10CM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.06], [9.0, 10.29], [12.0, 42.69], [43.0, 55.92], [60.0, 60.52], [65.0, 65.3], [72.0, 129.02], [131.0, 139.82]], "keep_status": [false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 28.46, 0.0, 0.0, 0.0, 30.75], "audiomae_on_audioset": [null, null, null, [["music", 51.62], ["didgeridoo", 10.88], ["throbbing", 9.93]], null, null, null, [["speech", 34.55], ["radio", 5.33], ["livestock, farm animals, working animals", 4.51]]], "duration": [1.06, 1.29, 30.69, 12.92, 0.52, 0.3, 57.02, 8.82]} \ No newline at end of file diff --git a/annotations_filtered/rdzVVp7e_0Y_filtered.json b/annotations_filtered/rdzVVp7e_0Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac45c7c89459b8fa9d7e38d8437f91b45a6e60e4 --- /dev/null +++ b/annotations_filtered/rdzVVp7e_0Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 20.92], [23.0, 66.07], [66.0, 70.21], [74.0, 83.79], [90.0, 95.25], [101.0, 104.06]], "keep_status": [false, false, true, true, true, true], "silence_prob": [30.26, 0.0, 33.94, 30.26, 28.68, 33.82], "audiomae_on_audioset": [[["music", 44.24], ["speech", 27.79], ["didgeridoo", 7.46]], null, [["music", 22.73], ["didgeridoo", 22.18], ["speech", 14.99]], [["speech", 40.13], ["music", 10.28], ["hum", 6.47]], [["explosion", 19.64], ["speech", 12.51], ["mains hum", 11.1]], [["sine wave", 14.58], ["hum", 10.97], ["music", 10.84]]], "duration": [4.92, 43.07, 4.21, 9.79, 5.25, 3.06]} \ No newline at end of file diff --git a/annotations_filtered/re0xt6hDdqE_filtered.json b/annotations_filtered/re0xt6hDdqE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8dbc0421a726b7b9d94351620a6c1968b38378e9 --- /dev/null +++ b/annotations_filtered/re0xt6hDdqE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.45], [5.0, 6.44], [9.0, 9.73], [10.0, 10.42], [12.0, 14.13], [15.0, 15.36], [16.0, 17.25], [20.0, 21.95], [23.0, 25.42], [27.0, 28.49], [29.0, 29.59], [32.0, 32.54], [33.0, 33.81], [34.0, 36.09], [43.0, 44.0], [45.0, 46.33], [48.0, 48.79], [54.0, 54.7], [69.0, 69.43], [77.0, 77.09], [78.0, 78.93], [80.0, 80.57], [83.0, 83.59], [87.0, 87.51], [90.0, 92.21], [98.0, 98.88], [101.0, 102.25], [104.0, 104.19], [105.0, 112.89], [114.0, 116.43], [118.0, 126.66], [128.0, 128.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 72.01, 0.0, 0.0, 0.0, 38.54, 0.0, 0.0, 0.0, 0.0, 61.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.97, 0.0, 0.0, 0.0, 88.28, 78.04, 76.53, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 65.3], ["sidetone", 18.87], ["radio", 2.38]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.45, 1.44, 0.73, 0.42, 2.13, 0.36, 1.25, 1.95, 2.42, 1.49, 0.59, 0.54, 0.81, 2.09, 1.0, 1.33, 0.79, 0.7, 0.43, 0.09, 0.93, 0.57, 0.59, 0.51, 2.21, 0.88, 1.25, 0.19, 7.89, 2.43, 8.66, 0.31]} \ No newline at end of file diff --git a/annotations_filtered/re5veV2F7eY_filtered.json b/annotations_filtered/re5veV2F7eY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b1275b3c3a54eb4b274042fdd01a5df0d9207037 --- /dev/null +++ b/annotations_filtered/re5veV2F7eY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.95], [9.0, 8.87], [15.0, 16.34], [17.0, 18.74], [23.0, 23.5], [25.0, 25.3], [28.0, 27.78], [55.0, 63.07], [71.0, 71.44]], "keep_status": [false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.9, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 48.98], ["speech", 7.01], ["guitar", 6.61]], null], "duration": [0.95, -0.13, 1.34, 1.74, 0.5, 0.3, -0.22, 8.07, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/re8jdVlrltA_filtered.json b/annotations_filtered/re8jdVlrltA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52f8ab4a805c824d0b0decb29bfe2cc508885ee0 --- /dev/null +++ b/annotations_filtered/re8jdVlrltA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.82], [11.0, 20.33], [21.0, 31.11], [32.0, 32.93], [37.0, 37.39], [42.0, 42.55], [45.0, 45.62], [47.0, 47.82], [49.0, 49.79], [53.0, 53.4], [56.0, 57.0], [59.0, 59.75], [62.0, 63.41], [65.0, 66.61], [68.0, 69.58], [71.0, 72.54], [74.0, 75.39], [77.0, 79.79], [81.0, 83.93], [85.0, 87.0], [88.0, 90.12], [92.0, 92.77], [93.0, 94.39], [96.0, 97.23], [99.0, 99.91], [101.0, 103.6], [104.0, 108.57], [110.0, 111.05], [112.0, 112.4], [127.0, 128.31], [129.0, 129.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [96.42, 98.1, 98.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.36, 100.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 89.36, 97.33, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.82, 9.33, 10.11, 0.93, 0.39, 0.55, 0.62, 0.82, 0.79, 0.4, 1.0, 0.75, 1.41, 1.61, 1.58, 1.54, 1.39, 2.79, 2.93, 2.0, 2.12, 0.77, 1.39, 1.23, 0.91, 2.6, 4.57, 1.05, 0.4, 1.31, 0.07]} \ No newline at end of file diff --git a/annotations_filtered/reIyMTBfEwQ_filtered.json b/annotations_filtered/reIyMTBfEwQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b48c618f2285ac760f5428f29f8398e58387f128 --- /dev/null +++ b/annotations_filtered/reIyMTBfEwQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.48], [4.0, 4.7], [5.0, 6.2], [9.0, 8.87], [10.0, 10.54], [16.0, 16.75], [23.0, 23.62], [24.0, 25.69], [26.0, 28.27], [30.0, 32.0], [34.0, 35.04], [36.0, 37.02], [38.0, 39.14], [44.0, 44.25], [47.0, 47.22], [51.0, 51.24], [56.0, 56.13], [57.0, 57.75], [59.0, 59.93], [61.0, 61.15], [64.0, 63.93], [66.0, 66.48], [68.0, 68.27], [70.0, 70.87], [73.0, 73.47], [80.0, 82.17], [89.0, 90.39], [96.0, 102.63], [107.0, 120.33], [128.0, 128.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.93, 86.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 96.04, 91.81, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.48, 0.7, 1.2, -0.13, 0.54, 0.75, 0.62, 1.69, 2.27, 2.0, 1.04, 1.02, 1.14, 0.25, 0.22, 0.24, 0.13, 0.75, 0.93, 0.15, -0.07, 0.48, 0.27, 0.87, 0.47, 2.17, 1.39, 6.63, 13.33, 0.98]} \ No newline at end of file diff --git a/annotations_filtered/reJAzTE980s_filtered.json b/annotations_filtered/reJAzTE980s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed03bd7116f221b5fd6bd3ed49b4886ae0796711 --- /dev/null +++ b/annotations_filtered/reJAzTE980s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.52], [4.0, 4.18], [7.0, 7.05], [10.0, 10.62], [12.0, 12.68], [14.0, 14.71], [19.0, 19.25], [20.0, 20.82], [22.0, 22.89], [27.0, 27.41], [29.0, 29.22], [30.0, 29.78], [31.0, 31.68], [35.0, 35.7], [36.0, 36.46], [37.0, 37.52], [38.0, 38.3], [39.0, 39.33], [41.0, 41.07], [41.0, 41.74], [42.0, 42.6], [46.0, 47.46], [50.0, 50.6], [53.0, 54.72], [55.0, 55.09], [55.0, 56.61], [65.0, 65.2], [66.0, 66.9], [70.0, 69.97], [71.0, 71.85], [76.0, 76.45], [77.0, 79.14], [81.0, 81.82], [82.0, 82.92], [84.0, 85.36], [90.0, 90.0], [91.0, 91.05], [91.0, 92.26], [94.0, 95.79], [99.0, 98.74], [102.0, 102.15], [106.0, 106.89], [108.0, 108.4], [108.0, 110.46], [114.0, 114.61], [117.0, 125.31], [128.0, 129.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.02, 0.0, 29.32, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 87.84], ["whack, thwack", 4.2], ["explosion", 1.43]], null], "duration": [0.52, 0.18, 0.05, 0.62, 0.68, 0.71, 0.25, 0.82, 0.89, 0.41, 0.22, -0.22, 0.68, 0.7, 0.46, 0.52, 0.3, 0.33, 0.07, 0.74, 0.6, 1.46, 0.6, 1.72, 0.09, 1.61, 0.2, 0.9, -0.03, 0.85, 0.45, 2.14, 0.82, 0.92, 1.36, 0.0, 0.05, 1.26, 1.79, -0.26, 0.15, 0.89, 0.4, 2.46, 0.61, 8.31, 1.56]} \ No newline at end of file diff --git a/annotations_filtered/reKMIuxFqzY_filtered.json b/annotations_filtered/reKMIuxFqzY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f53165a93c61fbe47060dab7eca6e3bc570db4e --- /dev/null +++ b/annotations_filtered/reKMIuxFqzY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[107.0, 117.07], [117.0, 117.26], [117.0, 120.24], [121.0, 122.44], [128.0, 136.02], [141.0, 142.99]], "keep_status": [false, false, false, false, false, false], "silence_prob": [39.44, 0.0, 97.92, 0.0, 74.6, 0.0], "audiomae_on_audioset": [[["music", 77.26], ["didgeridoo", 3.67], ["gong", 3.31]], null, null, null, null, null], "duration": [10.07, 0.26, 3.24, 1.44, 8.02, 1.99]} \ No newline at end of file diff --git a/annotations_filtered/reQPn8oDC2c_filtered.json b/annotations_filtered/reQPn8oDC2c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f05db32460f8c279a48c40358a4d4ee95b80ad9 --- /dev/null +++ b/annotations_filtered/reQPn8oDC2c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 65.1], [67.0, 70.58], [71.0, 72.23], [73.0, 80.28], [82.0, 89.04], [90.0, 92.13]], "keep_status": [false, false, false, true, false, false], "silence_prob": [0.0, 33.46, 0.0, 32.59, 31.8, 34.26], "audiomae_on_audioset": [null, [["speech", 43.18], ["music", 26.4], ["radio", 4.47]], null, [["music", 52.41], ["synthesizer", 8.09], ["electronic music", 7.46]], [["music", 78.16], ["didgeridoo", 7.71], ["electronic music", 3.19]], [["music", 59.43], ["ambient music", 7.05], ["hum", 3.77]]], "duration": [61.1, 3.58, 1.23, 7.28, 7.04, 2.13]} \ No newline at end of file diff --git a/annotations_filtered/reYcW3bp8gg_filtered.json b/annotations_filtered/reYcW3bp8gg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..57b29577c75f7e96144a371acac49843ef58bd5d --- /dev/null +++ b/annotations_filtered/reYcW3bp8gg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.83], [9.0, 9.48], [16.0, 16.5], [22.0, 23.97], [26.0, 26.33], [29.0, 29.89], [33.0, 33.35], [36.0, 36.68], [40.0, 41.98], [43.0, 44.27], [47.0, 47.7], [49.0, 49.79], [56.0, 56.22], [66.0, 69.48], [70.0, 74.12], [83.0, 86.73], [92.0, 92.01], [93.0, 93.24], [107.0, 108.62], [109.0, 110.62], [113.0, 114.91], [116.0, 117.95], [119.0, 120.85], [122.0, 122.86], [124.0, 129.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.5, 49.78, 44.69, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.72], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 19.55], ["white noise", 16.38], ["hum", 9.69]], [["livestock, farm animals, working animals", 41.71], ["moo", 24.76], ["cattle, bovinae", 21.62]], [["hum", 42.9], ["mains hum", 15.8], ["throbbing", 8.41]], null, null, null, null, null, null, null, null, [["hum", 42.52], ["mains hum", 22.06], ["throbbing", 8.83]]], "duration": [-0.17, 0.48, 0.5, 1.97, 0.33, 0.89, 0.35, 0.68, 1.98, 1.27, 0.7, 0.79, 0.22, 3.48, 4.12, 3.73, 0.01, 0.24, 1.62, 1.62, 1.91, 1.95, 1.85, 0.86, 5.76]} \ No newline at end of file diff --git a/annotations_filtered/re_liKgRGew_filtered.json b/annotations_filtered/re_liKgRGew_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef44432b0ca1585bf1f2904bc34647961c2d2349 --- /dev/null +++ b/annotations_filtered/re_liKgRGew_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.1], [9.0, 51.19], [52.0, 53.4], [54.0, 54.67], [59.0, 58.97], [61.0, 61.8], [63.0, 64.13], [65.0, 66.66], [69.0, 69.45], [70.0, 71.12], [72.0, 72.69], [75.0, 75.52], [84.0, 84.74], [86.0, 87.27], [89.0, 89.14], [90.0, 90.71], [93.0, 93.11], [94.0, 95.0], [99.0, 99.18], [101.0, 102.63], [105.0, 105.53], [107.0, 108.26], [109.0, 113.75], [115.0, 115.5], [118.0, 119.91], [121.0, 123.84], [133.0, 142.74], [143.0, 144.54], [148.0, 149.15], [150.0, 151.43], [152.0, 153.17], [155.0, 155.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.84, 0.0, 0.0, 39.74, 32.44, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["whack, thwack", 29.81], ["speech", 11.39], ["burst, pop", 8.15]], null, null, [["music", 45.46], ["synthesizer", 22.38], ["drum machine", 5.87]], [["music", 47.11], ["boing", 6.92], ["electric shaver, electric razor", 3.81]], null, null, null, null, null], "duration": [0.1, 42.19, 1.4, 0.67, -0.03, 0.8, 1.13, 1.66, 0.45, 1.12, 0.69, 0.52, 0.74, 1.27, 0.14, 0.71, 0.11, 1.0, 0.18, 1.63, 0.53, 1.26, 4.75, 0.5, 1.91, 2.84, 9.74, 1.54, 1.15, 1.43, 1.17, 0.65]} \ No newline at end of file diff --git a/annotations_filtered/refu69Hu5R0_filtered.json b/annotations_filtered/refu69Hu5R0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..baee76e0625b0d0643cd6650478850ea4d2d17b4 --- /dev/null +++ b/annotations_filtered/refu69Hu5R0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.02], [4.0, 12.19], [14.0, 14.03], [15.0, 15.99], [24.0, 24.6], [26.0, 28.76], [30.0, 32.46], [35.0, 35.82], [38.0, 38.23], [40.0, 43.66], [45.0, 45.72], [51.0, 56.61], [57.0, 65.1], [66.0, 67.31], [69.0, 69.13], [70.0, 70.09], [73.0, 73.82], [75.0, 74.95], [78.0, 78.02], [81.0, 82.26], [83.0, 83.79], [84.0, 84.89], [86.0, 86.41], [90.0, 93.33], [94.0, 94.85], [96.0, 97.12], [99.0, 98.96], [100.0, 102.17], [104.0, 105.36], [106.0, 106.74], [108.0, 108.21], [110.0, 112.83], [113.0, 116.07], [118.0, 118.81], [119.0, 119.33], [125.0, 125.25], [126.0, 126.64], [128.0, 129.47], [130.0, 130.72], [132.0, 133.02], [137.0, 142.5], [144.0, 144.83], [146.0, 147.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 35.67, 0.0, 0.0, 0.0, 61.57, 99.21, 0.0, 0.0, 47.05, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 79.07, 97.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.8, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 64.17], ["explosion", 4.69], ["music", 4.58]], null, null, null, null, null, null, null, [["speech", 57.71], ["whale vocalization", 11.84], ["fart", 2.21]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["explosion", 27.31], ["burst, pop", 15.22], ["glass", 8.03]], null, null], "duration": [0.02, 8.19, 0.03, 0.99, 0.6, 2.76, 2.46, 0.82, 0.23, 3.66, 0.72, 5.61, 8.1, 1.31, 0.13, 0.09, 0.82, -0.05, 0.02, 1.26, 0.79, 0.89, 0.41, 3.33, 0.85, 1.12, -0.04, 2.17, 1.36, 0.74, 0.21, 2.83, 3.07, 0.81, 0.33, 0.25, 0.64, 1.47, 0.72, 1.02, 5.5, 0.83, 1.02]} \ No newline at end of file diff --git a/annotations_filtered/relfjwjhscE_filtered.json b/annotations_filtered/relfjwjhscE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..07e7f449b8715c746248cf7bc28dd49289128018 --- /dev/null +++ b/annotations_filtered/relfjwjhscE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 83.39], [84.0, 95.44], [97.0, 101.11]], "keep_status": [false, true, true], "silence_prob": [0.0, 30.02, 37.61], "audiomae_on_audioset": [null, [["hum", 29.82], ["mains hum", 20.67], ["music", 14.54]], [["hum", 26.22], ["music", 17.18], ["throbbing", 14.89]]], "duration": [66.39, 11.44, 4.11]} \ No newline at end of file diff --git a/annotations_filtered/reyTknNqDjA_filtered.json b/annotations_filtered/reyTknNqDjA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8df0ab15fdd44980c4f7cedcf1a967bbf2c1aa07 --- /dev/null +++ b/annotations_filtered/reyTknNqDjA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 50.46], [52.0, 93.63]], "keep_status": [false, false], "silence_prob": [34.1, 0.0], "audiomae_on_audioset": [[["music", 75.59], ["throbbing", 7.8], ["hum", 2.37]], null], "duration": [14.46, 41.63]} \ No newline at end of file diff --git a/annotations_filtered/rey_J7jIvno_filtered.json b/annotations_filtered/rey_J7jIvno_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a561a1cd14041b85e852f833ccc8ea006f1e491 --- /dev/null +++ b/annotations_filtered/rey_J7jIvno_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 14.74], [16.0, 61.32], [62.0, 133.05]], "keep_status": [false, false, false], "silence_prob": [33.04, 0.0, 0.0], "audiomae_on_audioset": [[["mains hum", 38.02], ["hum", 33.94], ["music", 15.5]], null, null], "duration": [6.74, 45.32, 71.05]} \ No newline at end of file diff --git a/annotations_filtered/rezZBgaJGoM_filtered.json b/annotations_filtered/rezZBgaJGoM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d4db5b6159f7adb7eabcdeb2704575bf16b4f2c9 --- /dev/null +++ b/annotations_filtered/rezZBgaJGoM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.48], [34.0, 34.7], [36.0, 36.83], [37.0, 38.58], [42.0, 44.04], [48.0, 49.08], [52.0, 52.32], [73.0, 73.52], [80.0, 87.62], [99.0, 99.39], [104.0, 106.84], [115.0, 115.57]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 73.36, 0.0, 0.0, 0.0, 30.29, 0.0, 48.61, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["whip", 32.72], ["speech", 19.42], ["whack, thwack", 12.91]], null, [["speech", 29.02], ["sidetone", 17.51], ["sine wave", 14.28]], null], "duration": [0.48, 0.7, 0.83, 1.58, 2.04, 1.08, 0.32, 0.52, 7.62, 0.39, 2.84, 0.57]} \ No newline at end of file diff --git a/annotations_filtered/rfdF7LBQ8Ic_filtered.json b/annotations_filtered/rfdF7LBQ8Ic_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c0d9baaecf1aa8a44fee773477b59f8dc8aba594 --- /dev/null +++ b/annotations_filtered/rfdF7LBQ8Ic_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.06], [13.0, 13.64], [21.0, 22.69], [34.0, 34.1], [35.0, 35.6], [62.0, 62.65], [63.0, 64.02]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [1.06, 0.64, 1.69, 0.1, 0.6, 0.65, 1.02]} \ No newline at end of file diff --git a/annotations_filtered/rfeKwl7Dyg0_filtered.json b/annotations_filtered/rfeKwl7Dyg0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/rfeKwl7Dyg0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/rfix60WuBxs_filtered.json b/annotations_filtered/rfix60WuBxs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7703a69a44c91ee1e1498c4cdf724d8377b4b6a6 --- /dev/null +++ b/annotations_filtered/rfix60WuBxs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.69], [13.0, 13.73], [14.0, 16.53], [20.0, 22.18]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 56.7, 34.7], "audiomae_on_audioset": [null, null, null, [["speech", 76.95], ["radio", 5.13], ["telephone", 1.89]]], "duration": [1.69, 0.73, 2.53, 2.18]} \ No newline at end of file diff --git a/annotations_filtered/rgQjzIVzoh4_filtered.json b/annotations_filtered/rgQjzIVzoh4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a17bbdb1a8cdb7bb75077debc878a92c0c37ee20 --- /dev/null +++ b/annotations_filtered/rgQjzIVzoh4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 24.54], [27.0, 27.24], [29.0, 29.22], [38.0, 38.58], [46.0, 46.68], [47.0, 48.3], [50.0, 50.82], [56.0, 56.61], [63.0, 63.37], [64.0, 64.83], [68.0, 68.67], [78.0, 78.27], [80.0, 81.3], [83.0, 84.52], [86.0, 88.16], [89.0, 95.67], [97.0, 102.03], [104.0, 103.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.21, 55.18, 37.99, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 62.94], ["livestock, farm animals, working animals", 4.13], ["radio", 4.12]], null], "duration": [0.54, 0.24, 0.22, 0.58, 0.68, 1.3, 0.82, 0.61, 0.37, 0.83, 0.67, 0.27, 1.3, 1.52, 2.16, 6.67, 5.03, -0.36]} \ No newline at end of file diff --git a/annotations_filtered/rgd8TC1Q09g_filtered.json b/annotations_filtered/rgd8TC1Q09g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..64b6cbe789e6e4957242950898fb62ab85bda8da --- /dev/null +++ b/annotations_filtered/rgd8TC1Q09g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.06], [15.0, 19.79], [22.0, 28.32], [38.0, 40.68], [58.0, 58.56], [65.0, 66.24], [70.0, 71.07]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [89.19, 99.82, 99.62, 100.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [4.06, 4.79, 6.32, 2.68, 0.56, 1.24, 1.07]} \ No newline at end of file diff --git a/annotations_filtered/rglfoXHFty8_filtered.json b/annotations_filtered/rglfoXHFty8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..35f9aa9a8a0d74237b702524851fd5075ff05d97 --- /dev/null +++ b/annotations_filtered/rglfoXHFty8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.09], [6.0, 7.57], [19.0, 20.98], [26.0, 27.24], [29.0, 34.48], [38.0, 38.7], [39.0, 39.6], [51.0, 98.1], [98.0, 100.13], [100.0, 100.5], [101.0, 101.49], [111.0, 111.67], [113.0, 146.01], [148.0, 149.27], [151.0, 153.1], [156.0, 156.07], [161.0, 161.35], [163.0, 163.24], [166.0, 167.39], [169.0, 168.76]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.82, 0.0, 0.0, 0.0, 30.47, 0.0, 0.0, 0.0, 0.0, 0.0, 45.21, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 20.59], ["music", 14.36], ["electric shaver, electric razor", 14.35]], null, null, null, [["music", 65.38], ["speech", 4.57], ["hum", 3.2]], null, null, null, null, null, [["music", 51.81], ["throbbing", 16.52], ["electronic music", 4.42]], null, null, null, null, null], "duration": [1.09, 1.57, 1.98, 1.24, 5.48, 0.7, 0.6, 47.1, 2.13, 0.5, 0.49, 0.67, 33.01, 1.27, 2.1, 0.07, 0.35, 0.24, 1.39, -0.24]} \ No newline at end of file diff --git a/annotations_filtered/rgmKJYrtmkw_filtered.json b/annotations_filtered/rgmKJYrtmkw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3996f4cb359e7ec100fa6e786434a781511ad7b7 --- /dev/null +++ b/annotations_filtered/rgmKJYrtmkw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.82], [5.0, 5.49], [6.0, 6.47], [8.0, 8.33], [10.0, 10.1], [10.0, 10.64], [12.0, 14.82], [17.0, 19.16], [21.0, 25.61], [27.0, 27.08], [32.0, 39.93], [49.0, 52.51], [55.0, 56.12], [60.0, 61.08], [73.0, 77.62], [78.0, 77.65], [86.0, 87.03], [89.0, 94.93], [118.0, 118.3], [141.0, 142.16]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.94, 100.0, 48.91, 0.0, 39.22, 46.83, 0.0, 0.0, 64.86, 0.0, 0.0, 39.77, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 33.74], ["music", 12.75], ["frog", 12.09]], null, [["speech", 54.19], ["thunk", 26.48], ["music", 5.23]], [["music", 42.52], ["didgeridoo", 7.01], ["animal", 5.66]], null, null, null, null, null, [["music", 39.01], ["speech", 12.27], ["throbbing", 10.22]], null, null], "duration": [1.82, 0.49, 0.47, 0.33, 0.1, 0.64, 2.82, 2.16, 4.61, 0.08, 7.93, 3.51, 1.12, 1.08, 4.62, -0.35, 1.03, 5.93, 0.3, 1.16]} \ No newline at end of file diff --git a/annotations_filtered/rh8OdlSXiDo_filtered.json b/annotations_filtered/rh8OdlSXiDo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d2839ad1d52acb3298380bb59ab8e392e6cf9f2 --- /dev/null +++ b/annotations_filtered/rh8OdlSXiDo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.57], [7.0, 8.01], [9.0, 10.08], [26.0, 26.65], [53.0, 55.43], [65.0, 65.79], [76.0, 76.89], [80.0, 109.92], [110.0, 111.11]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 95.09, 0.0, 0.0, 37.65, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 92.02], ["musical instrument", 1.68], ["bass guitar", 0.43]], null], "duration": [0.57, 1.01, 1.08, 0.65, 2.43, 0.79, 0.89, 29.92, 1.11]} \ No newline at end of file diff --git a/annotations_filtered/rhFw9HYTReY_filtered.json b/annotations_filtered/rhFw9HYTReY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..edb1ed206b83e6f3217134a63cfe4b84c19a0f49 --- /dev/null +++ b/annotations_filtered/rhFw9HYTReY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 49.82], [54.0, 104.82]], "keep_status": [false, false], "silence_prob": [30.97, 0.0], "audiomae_on_audioset": [[["music", 42.86], ["didgeridoo", 37.02], ["trombone", 2.53]], null], "duration": [14.82, 50.82]} \ No newline at end of file diff --git a/annotations_filtered/rhNty595BeI_filtered.json b/annotations_filtered/rhNty595BeI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ff5642c08c89db8a6b7fbe5347d9485d7ab9864e --- /dev/null +++ b/annotations_filtered/rhNty595BeI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.22], [11.0, 14.17], [16.0, 26.54], [28.0, 30.55], [34.0, 38.16], [38.0, 53.25], [54.0, 55.05], [56.0, 59.36], [62.0, 62.26], [63.0, 63.86], [67.0, 68.81], [70.0, 71.39], [73.0, 75.74], [77.0, 78.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 50.41, 99.85, 100.0, 100.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 99.95, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.22, 3.17, 10.54, 2.55, 4.16, 15.25, 1.05, 3.36, 0.26, 0.86, 1.81, 1.39, 2.74, 1.22]} \ No newline at end of file diff --git a/annotations_filtered/rhQ5dWLFLPM_filtered.json b/annotations_filtered/rhQ5dWLFLPM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a8f1d67fb13536648d76a948019db727e600841d --- /dev/null +++ b/annotations_filtered/rhQ5dWLFLPM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.91], [12.0, 14.5], [15.0, 16.46], [17.0, 17.68], [19.0, 22.82], [23.0, 23.82], [26.0, 26.33], [28.0, 28.8], [34.0, 34.75], [47.0, 48.14], [50.0, 50.3], [51.0, 52.84], [54.0, 54.53], [55.0, 56.46], [57.0, 57.82], [58.0, 59.24], [60.0, 61.67], [62.0, 64.79], [66.0, 67.17], [68.0, 69.16], [71.0, 73.48], [75.0, 76.47], [83.0, 84.03], [94.0, 95.3], [96.0, 96.25], [98.0, 107.03], [108.0, 108.62], [110.0, 111.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.97, 0.0, 0.0, 95.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.36, 0.0, 0.0, 99.95, 0.0, 0.0, 0.0, 0.0, 77.7, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.91, 2.5, 1.46, 0.68, 3.82, 0.82, 0.33, 0.8, 0.75, 1.14, 0.3, 1.84, 0.53, 1.46, 0.82, 1.24, 1.67, 2.79, 1.17, 1.16, 2.48, 1.47, 1.03, 1.3, 0.25, 9.03, 0.62, 1.03]} \ No newline at end of file diff --git a/annotations_filtered/rhTGE6TQdSc_filtered.json b/annotations_filtered/rhTGE6TQdSc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed273304989fac24067d4b74a3d3cab7d916ae61 --- /dev/null +++ b/annotations_filtered/rhTGE6TQdSc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.06], [9.0, 27.62], [28.0, 28.85], [29.0, 29.93], [31.0, 35.53], [36.0, 40.93], [42.0, 47.83]], "keep_status": [false, false, false, false, true, false, false], "silence_prob": [61.27, 83.88, 0.0, 0.0, 39.04, 54.5, 52.8], "audiomae_on_audioset": [null, null, null, null, [["music", 47.69], ["grunt", 6.29], ["didgeridoo", 3.89]], null, null], "duration": [4.06, 18.62, 0.85, 0.93, 4.53, 4.93, 5.83]} \ No newline at end of file diff --git a/annotations_filtered/rhc_Ds85lG0_filtered.json b/annotations_filtered/rhc_Ds85lG0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..04681d64bd3cf193080294ecd542adaa93e4a6f2 --- /dev/null +++ b/annotations_filtered/rhc_Ds85lG0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.18], [25.0, 25.39], [29.0, 29.61], [32.0, 34.7], [41.0, 41.89], [47.0, 47.43], [50.0, 50.01], [54.0, 53.77], [55.0, 55.68], [59.0, 61.38], [64.0, 67.98], [80.0, 102.09]], "keep_status": [false, false, false, true, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 33.18, 0.0, 0.0, 0.0, 0.0, 0.0, 33.98, 37.07, 34.36], "audiomae_on_audioset": [null, null, null, [["music", 30.33], ["didgeridoo", 25.1], ["musical instrument", 4.86]], null, null, null, null, null, [["speech", 30.61], ["cattle, bovinae", 24.37], ["moo", 18.69]], [["speech", 26.69], ["music", 21.67], ["animal", 7.0]], [["speech", 48.77], ["fart", 20.3], ["music", 3.3]]], "duration": [0.18, 0.39, 0.61, 2.7, 0.89, 0.43, 0.01, -0.23, 0.68, 2.38, 3.98, 22.09]} \ No newline at end of file diff --git a/annotations_filtered/rhfBzC5A79o_filtered.json b/annotations_filtered/rhfBzC5A79o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f7385a0480d688d86b5fa64148aad09260f37ac --- /dev/null +++ b/annotations_filtered/rhfBzC5A79o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 31.83], [34.0, 35.14], [42.0, 41.67], [44.0, 43.8], [48.0, 51.61], [52.0, 54.01], [54.0, 54.09], [54.0, 56.05], [57.0, 62.06], [65.0, 65.6], [70.0, 83.66], [87.0, 89.75], [91.0, 98.25], [102.0, 105.09], [107.0, 106.83], [108.0, 108.97], [110.0, 110.74], [112.0, 113.32], [115.0, 118.3], [119.0, 122.62]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [87.37, 0.0, 0.0, 0.0, 99.84, 37.32, 0.0, 37.02, 33.41, 0.0, 98.99, 99.85, 95.09, 44.55, 0.0, 0.0, 0.0, 0.0, 99.84, 42.42], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 48.63], ["busy signal", 22.3], ["sine wave", 12.56]], null, [["speech", 29.49], ["noise", 12.99], ["sidetone", 6.85]], [["speech", 55.03], ["whimper", 4.21], ["laughter", 3.79]], null, null, null, null, [["speech", 53.28], ["busy signal", 20.92], ["dial tone", 8.39]], null, null, null, null, null, [["speech", 35.37], ["dial tone", 29.72], ["sine wave", 25.65]]], "duration": [2.83, 1.14, -0.33, -0.2, 3.61, 2.01, 0.09, 2.05, 5.06, 0.6, 13.66, 2.75, 7.25, 3.09, -0.17, 0.97, 0.74, 1.32, 3.3, 3.62]} \ No newline at end of file diff --git a/annotations_filtered/rhkkbjKcaJ0_filtered.json b/annotations_filtered/rhkkbjKcaJ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2e9d98b29c726c68302e6b77bf5d396821cac6bd --- /dev/null +++ b/annotations_filtered/rhkkbjKcaJ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.29], [10.0, 11.77], [12.0, 13.78], [15.0, 17.56], [19.0, 23.38], [25.0, 112.89], [116.0, 138.23], [140.0, 172.22]], "keep_status": [true, false, false, false, true, false, false, false], "silence_prob": [49.22, 0.0, 0.0, 56.63, 43.45, 0.0, 30.86, 0.0], "audiomae_on_audioset": [[["speech", 27.43], ["hum", 12.71], ["mains hum", 6.69]], null, null, null, [["music", 48.21], ["throbbing", 4.78], ["hum", 4.73]], null, [["hum", 50.08], ["mains hum", 28.26], ["music", 5.87]], null], "duration": [2.29, 1.77, 1.78, 2.56, 4.38, 87.89, 22.23, 32.22]} \ No newline at end of file diff --git a/annotations_filtered/rhnCmErsnYA_filtered.json b/annotations_filtered/rhnCmErsnYA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..809e3c0deb2f22e0d7fc4e2431b5606a539fe773 --- /dev/null +++ b/annotations_filtered/rhnCmErsnYA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.96], [14.0, 14.79], [17.0, 19.55], [21.0, 23.46], [24.0, 35.68], [42.0, 44.44], [44.0, 44.51], [45.0, 44.61], [45.0, 55.53], [60.0, 75.36], [77.0, 77.7], [79.0, 82.32], [84.0, 84.08], [86.0, 88.65], [92.0, 128.33], [132.0, 134.45], [136.0, 141.4], [141.0, 141.44], [144.0, 148.14]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 53.72, 31.42, 30.97, 30.53, 0.0, 0.0, 30.62, 30.15, 0.0, 34.18, 0.0, 32.56, 0.0, 30.15, 29.86, 0.0, 31.71], "audiomae_on_audioset": [null, null, null, [["music", 59.41], ["throbbing", 10.16], ["hum", 7.45]], [["music", 79.49], ["electronic music", 3.03], ["speech", 2.28]], [["music", 42.9], ["didgeridoo", 21.09], ["musical instrument", 5.15]], null, null, [["speech", 39.75], ["music", 29.66], ["whack, thwack", 5.17]], [["music", 36.97], ["speech", 33.85], ["whack, thwack", 3.44]], null, [["music", 47.87], ["boing", 19.22], ["synthesizer", 7.29]], null, [["moo", 42.46], ["cattle, bovinae", 38.77], ["livestock, farm animals, working animals", 16.39]], null, [["moo", 36.99], ["livestock, farm animals, working animals", 32.1], ["cattle, bovinae", 29.87]], [["boing", 39.13], ["music", 34.17], ["speech", 11.7]], null, [["speech", 30.72], ["music", 29.89], ["throbbing", 6.45]]], "duration": [1.96, 0.79, 2.55, 2.46, 11.68, 2.44, 0.51, -0.39, 10.53, 15.36, 0.7, 3.32, 0.08, 2.65, 36.33, 2.45, 5.4, 0.44, 4.14]} \ No newline at end of file diff --git a/annotations_filtered/rhtLoA3X21s_filtered.json b/annotations_filtered/rhtLoA3X21s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48d8ac31c8024ff94c744da2eb737b93436873c5 --- /dev/null +++ b/annotations_filtered/rhtLoA3X21s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.54], [10.0, 11.58], [12.0, 13.09], [16.0, 17.36], [20.0, 21.19], [42.0, 42.77], [45.0, 45.4], [51.0, 52.68]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.54, 1.58, 1.09, 1.36, 1.19, 0.77, 0.4, 1.68]} \ No newline at end of file diff --git a/annotations_filtered/ri44Zx810p0_filtered.json b/annotations_filtered/ri44Zx810p0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ea3784e67e3bea9f0b97e12957ebcbfa338f74c --- /dev/null +++ b/annotations_filtered/ri44Zx810p0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.23], [7.0, 22.71], [25.0, 26.81], [30.0, 32.16], [32.0, 32.21], [32.0, 32.24], [34.0, 34.62], [35.0, 35.53], [37.0, 39.9], [41.0, 43.71], [45.0, 95.72], [98.0, 98.61], [100.0, 100.4], [101.0, 106.29], [107.0, 109.66], [111.0, 115.13], [116.0, 122.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [48.74, 56.4, 0.0, 81.71, 0.0, 0.0, 0.0, 0.0, 99.56, 98.8, 0.0, 0.0, 0.0, 99.59, 99.48, 99.1, 99.16], "audiomae_on_audioset": [[["mains hum", 37.65], ["hum", 22.23], ["music", 12.24]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.23, 15.71, 1.81, 2.16, 0.21, 0.24, 0.62, 0.53, 2.9, 2.71, 50.72, 0.61, 0.4, 5.29, 2.66, 4.13, 6.37]} \ No newline at end of file diff --git a/annotations_filtered/ri8WqeTAUDE_filtered.json b/annotations_filtered/ri8WqeTAUDE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..abfa6453dcc3160309d8511c88b9d783390978d9 --- /dev/null +++ b/annotations_filtered/ri8WqeTAUDE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.86], [6.0, 6.51], [11.0, 15.94], [16.0, 21.2], [24.0, 25.2], [27.0, 27.68], [30.0, 30.64], [39.0, 38.85], [50.0, 50.55], [54.0, 54.45], [71.0, 72.27], [75.0, 75.22], [75.0, 76.13], [77.0, 77.8], [79.0, 79.56], [81.0, 88.55], [89.0, 93.56], [100.0, 99.93], [103.0, 103.45], [104.0, 104.11], [106.0, 106.07], [108.0, 111.99], [120.0, 120.56], [128.0, 128.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 65.32, 98.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.81, 99.05, 0.0, 0.0, 0.0, 0.0, 97.64, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.86, 0.51, 4.94, 5.2, 1.2, 0.68, 0.64, -0.15, 0.55, 0.45, 1.27, 0.22, 1.13, 0.8, 0.56, 7.55, 4.56, -0.07, 0.45, 0.11, 0.07, 3.99, 0.56, 0.82]} \ No newline at end of file diff --git a/annotations_filtered/riDe28hGBuo_filtered.json b/annotations_filtered/riDe28hGBuo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e0b1f772ab99ec350772abe037dd44f361f5f0bd --- /dev/null +++ b/annotations_filtered/riDe28hGBuo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.66], [15.0, 15.6], [17.0, 17.79], [23.0, 83.29], [89.0, 120.11], [123.0, 126.12], [128.0, 151.77], [152.0, 179.88]], "keep_status": [false, false, false, false, false, true, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 43.98, 29.83, 30.39], "audiomae_on_audioset": [null, null, null, null, null, [["music", 47.99], ["whale vocalization", 8.7], ["ambient music", 4.62]], [["music", 34.71], ["hum", 22.54], ["mains hum", 11.62]], [["music", 52.77], ["fly, housefly", 4.69], ["fart", 4.58]]], "duration": [0.66, 0.6, 0.79, 60.29, 31.11, 3.12, 23.77, 27.88]} \ No newline at end of file diff --git a/annotations_filtered/riJRHpcshE0_filtered.json b/annotations_filtered/riJRHpcshE0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c043a44710d88b8b7acb1f3eb4d3de9a6dc47c1e --- /dev/null +++ b/annotations_filtered/riJRHpcshE0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 14.55], [18.0, 22.69], [23.0, 27.43], [30.0, 38.52], [41.0, 41.79], [42.0, 43.29], [44.0, 45.0], [46.0, 47.78], [52.0, 54.73], [56.0, 58.51], [62.0, 66.72], [67.0, 76.32], [77.0, 77.94], [78.0, 78.61], [79.0, 80.54], [82.0, 88.25], [89.0, 88.53], [89.0, 103.01], [105.0, 124.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 100.0, 99.95, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 100.0, 99.1, 0.0, 0.0, 0.0, 99.26, 0.0, 99.96, 99.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.55, 4.69, 4.43, 8.52, 0.79, 1.29, 1.0, 1.78, 2.73, 2.51, 4.72, 9.32, 0.94, 0.61, 1.54, 6.25, -0.47, 14.01, 19.7]} \ No newline at end of file diff --git a/annotations_filtered/riSEerXD6nE_filtered.json b/annotations_filtered/riSEerXD6nE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba1b2831d6959126a0d1df55d07f20dbf6d8e9f0 --- /dev/null +++ b/annotations_filtered/riSEerXD6nE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.39], [11.0, 11.55], [14.0, 15.13], [20.0, 28.66], [30.0, 31.16], [32.0, 32.12], [33.0, 34.21], [37.0, 38.57], [44.0, 45.71], [52.0, 53.47], [56.0, 56.13], [59.0, 60.76], [61.0, 62.18], [64.0, 63.93], [67.0, 68.67], [69.0, 70.02], [76.0, 77.28], [78.0, 77.7], [78.0, 78.06], [80.0, 80.99], [82.0, 83.81], [85.0, 86.14], [88.0, 87.98], [91.0, 91.86], [92.0, 97.04], [98.0, 98.46], [104.0, 112.35], [113.0, 113.68], [115.0, 119.4], [121.0, 123.89], [124.0, 124.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 71.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.18, 0.0, 86.64, 0.0, 99.94, 30.01, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 44.66], ["musical instrument", 8.93], ["cough", 8.43]], null], "duration": [1.39, 0.55, 1.13, 8.66, 1.16, 0.12, 1.21, 1.57, 1.71, 1.47, 0.13, 1.76, 1.18, -0.07, 1.67, 1.02, 1.28, -0.3, 0.06, 0.99, 1.81, 1.14, -0.02, 0.86, 5.04, 0.46, 8.35, 0.68, 4.4, 2.89, 0.92]} \ No newline at end of file diff --git a/annotations_filtered/riXp9rJ90Xw_filtered.json b/annotations_filtered/riXp9rJ90Xw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9eedb43d8645a85f71b5cc204998a3efc791e39c --- /dev/null +++ b/annotations_filtered/riXp9rJ90Xw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 15.18], [20.0, 20.44], [24.0, 24.27], [28.0, 28.68], [32.0, 32.0], [33.0, 38.28], [39.0, 39.83], [46.0, 77.89], [78.0, 78.44], [78.0, 78.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [87.37, 0.0, 0.0, 0.0, 0.0, 57.72, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [2.18, 0.44, 0.27, 0.68, 0.0, 5.28, 0.83, 31.89, 0.44, 0.6]} \ No newline at end of file diff --git a/annotations_filtered/riYhck-Z9tw_filtered.json b/annotations_filtered/riYhck-Z9tw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48978624715b52d6fc4e702f48c27cb019ed8d7d --- /dev/null +++ b/annotations_filtered/riYhck-Z9tw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 13.14], [64.0, 64.71], [95.0, 97.39], [103.0, 104.84]], "keep_status": [true, false, false, false], "silence_prob": [29.54, 0.0, 32.65, 0.0], "audiomae_on_audioset": [[["music", 33.22], ["noise", 6.51], ["synthesizer", 6.46]], null, [["fly, housefly", 48.92], ["insect", 32.42], ["speech", 4.82]], null], "duration": [7.14, 0.71, 2.39, 1.84]} \ No newline at end of file diff --git a/annotations_filtered/riicefV6xiI_filtered.json b/annotations_filtered/riicefV6xiI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec23550ced92b737d74dfce12b173a40668618a8 --- /dev/null +++ b/annotations_filtered/riicefV6xiI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.74], [11.0, 11.35], [16.0, 16.77], [19.0, 22.06], [25.0, 25.52], [32.0, 32.39], [37.0, 37.96], [41.0, 41.91], [43.0, 43.77], [47.0, 50.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 36.94, 0.0, 0.0, 0.0, 0.0, 0.0, 38.91], "audiomae_on_audioset": [null, null, null, [["music", 70.2], ["synthesizer", 6.33], ["electric piano", 2.08]], null, null, null, null, null, [["music", 58.34], ["didgeridoo", 8.13], ["synthesizer", 6.93]]], "duration": [0.74, 0.35, 0.77, 3.06, 0.52, 0.39, 0.96, 0.91, 0.77, 3.77]} \ No newline at end of file diff --git a/annotations_filtered/rilZTyv9RLo_filtered.json b/annotations_filtered/rilZTyv9RLo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f65d2808bd2641dac797b359252613ef389916af --- /dev/null +++ b/annotations_filtered/rilZTyv9RLo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.59], [15.0, 19.11], [20.0, 20.51], [25.0, 25.3], [29.0, 29.52], [41.0, 44.74], [49.0, 49.86], [52.0, 54.35], [56.0, 58.78], [60.0, 62.45], [77.0, 78.0], [86.0, 87.18], [91.0, 92.35], [100.0, 102.22], [118.0, 118.54], [120.0, 120.26], [131.0, 131.19]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, false, true, false, false, false], "silence_prob": [42.51, 41.58, 0.0, 0.0, 0.0, 33.17, 0.0, 53.78, 40.12, 31.23, 0.0, 0.0, 0.0, 29.75, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["boing", 59.51], ["music", 17.71], ["speech", 10.73]], [["music", 49.82], ["speech", 34.95], ["scratching (performance technique)", 3.36]], null, null, null, [["music", 56.15], ["theremin", 14.87], ["didgeridoo", 3.38]], null, null, [["music", 26.68], ["synthesizer", 19.76], ["noise", 7.52]], [["speech", 27.35], ["music", 16.91], ["fart", 15.94]], null, null, null, [["music", 35.16], ["speech", 19.89], ["didgeridoo", 6.08]], null, null, null], "duration": [2.59, 4.11, 0.51, 0.3, 0.52, 3.74, 0.86, 2.35, 2.78, 2.45, 1.0, 1.18, 1.35, 2.22, 0.54, 0.26, 0.19]} \ No newline at end of file diff --git a/annotations_filtered/rj7e6WvyClY_filtered.json b/annotations_filtered/rj7e6WvyClY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a7d427dfd981d96f77a7157afb7b9f66e29dd33 --- /dev/null +++ b/annotations_filtered/rj7e6WvyClY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.63], [10.0, 10.25], [10.0, 10.44], [25.0, 24.87], [28.0, 29.13], [30.0, 31.29], [32.0, 33.67], [34.0, 57.69], [59.0, 59.51], [61.0, 61.86], [63.0, 63.31], [65.0, 65.58], [67.0, 66.93], [69.0, 71.05], [74.0, 74.38], [77.0, 76.79], [79.0, 82.65], [83.0, 84.42], [86.0, 87.12], [90.0, 90.59], [92.0, 93.23], [94.0, 95.59], [96.0, 97.55], [99.0, 99.67], [101.0, 102.81], [104.0, 105.14], [106.0, 112.92], [113.0, 120.99], [121.0, 123.11], [124.0, 124.19], [139.0, 139.23], [142.0, 143.14], [148.0, 148.26], [149.0, 149.13], [152.0, 152.44], [155.0, 159.87], [161.0, 162.57], [165.0, 176.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.16, 0.0, 0.0, 0.0, 0.0, 0.0, 71.43, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 99.62, 98.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.0, 0.0, 99.56], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.63, 0.25, 0.44, -0.13, 1.13, 1.29, 1.67, 23.69, 0.51, 0.86, 0.31, 0.58, -0.07, 2.05, 0.38, -0.21, 3.65, 1.42, 1.12, 0.59, 1.23, 1.59, 1.55, 0.67, 1.81, 1.14, 6.92, 7.99, 2.11, 0.19, 0.23, 1.14, 0.26, 0.13, 0.44, 4.87, 1.57, 11.27]} \ No newline at end of file diff --git a/annotations_filtered/rjnLGy6uWKc_filtered.json b/annotations_filtered/rjnLGy6uWKc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d1763f0436597ca70ac4704b1c9f292069696084 --- /dev/null +++ b/annotations_filtered/rjnLGy6uWKc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.48], [16.0, 16.9], [19.0, 19.79], [28.0, 30.7], [32.0, 33.25], [36.0, 36.69], [42.0, 42.84], [44.0, 45.93], [48.0, 48.52], [55.0, 55.11], [59.0, 60.07], [100.0, 99.96], [101.0, 103.74], [106.0, 109.04], [132.0, 133.64], [135.0, 135.21]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [75.39, 0.0, 0.0, 37.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.67, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 32.76], ["speech", 14.21], ["mosquito", 9.8]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.48, 0.9, 0.79, 2.7, 1.25, 0.69, 0.84, 1.93, 0.52, 0.11, 1.07, -0.04, 2.74, 3.04, 1.64, 0.21]} \ No newline at end of file diff --git a/annotations_filtered/rkPT_6JWenQ_filtered.json b/annotations_filtered/rkPT_6JWenQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f50c13a48c4d6cc0cc7f304b73456dee7897f95b --- /dev/null +++ b/annotations_filtered/rkPT_6JWenQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.18], [11.0, 14.34], [19.0, 20.07], [23.0, 23.23], [25.0, 25.74], [35.0, 37.23], [41.0, 47.14], [47.0, 47.34], [47.0, 53.4], [55.0, 55.29], [64.0, 74.7], [76.0, 104.94], [106.0, 113.59], [114.0, 114.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [62.47, 56.86, 0.0, 0.0, 0.0, 97.73, 77.7, 0.0, 63.74, 0.0, 32.45, 37.9, 50.76, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 14.69], ["breaking", 9.92], ["whack, thwack", 8.26]], [["speech", 16.51], ["music", 10.53], ["hum", 10.3]], null, null], "duration": [3.18, 3.34, 1.07, 0.23, 0.74, 2.23, 6.14, 0.34, 6.4, 0.29, 10.7, 28.94, 7.59, 0.93]} \ No newline at end of file diff --git a/annotations_filtered/rkaXuC5hrCE_filtered.json b/annotations_filtered/rkaXuC5hrCE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..846fe257d1e18bd5da81f3bce1d3bda958eca36f --- /dev/null +++ b/annotations_filtered/rkaXuC5hrCE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.59], [4.0, 4.95], [10.0, 13.41], [21.0, 22.99], [25.0, 43.93], [52.0, 54.06]], "keep_status": [false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 51.5, 0.0, 32.12, 45.98], "audiomae_on_audioset": [null, null, null, null, [["hum", 26.41], ["music", 24.84], ["mains hum", 20.51]], [["music", 27.15], ["sine wave", 12.01], ["rumble", 10.15]]], "duration": [0.59, 0.95, 3.41, 1.99, 18.93, 2.06]} \ No newline at end of file diff --git a/annotations_filtered/rku6u5PmiZ4_filtered.json b/annotations_filtered/rku6u5PmiZ4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3e03a35ad94481814bb3e48487713d1f63b9047 --- /dev/null +++ b/annotations_filtered/rku6u5PmiZ4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.75], [16.0, 18.01], [20.0, 19.99], [20.0, 24.48], [26.0, 32.44], [34.0, 35.55], [36.0, 43.41], [44.0, 52.46], [53.0, 53.65], [55.0, 70.33], [71.0, 71.54], [73.0, 73.5], [76.0, 94.86], [95.0, 95.03], [95.0, 95.08], [95.0, 95.13], [95.0, 95.44], [96.0, 95.64], [99.0, 100.01], [102.0, 104.62], [105.0, 106.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 99.99, 100.0, 0.0, 99.94, 100.0, 0.0, 97.33, 0.0, 0.0, 36.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.67, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["firecracker", 41.89], ["explosion", 11.84], ["burst, pop", 7.5]], null, null, null, null, null, null, null, null], "duration": [1.75, 2.01, -0.01, 4.48, 6.44, 1.55, 7.41, 8.46, 0.65, 15.33, 0.54, 0.5, 18.86, 0.03, 0.08, 0.13, 0.44, -0.36, 1.01, 2.62, 1.79]} \ No newline at end of file diff --git a/annotations_filtered/rlMANFZdCkk_filtered.json b/annotations_filtered/rlMANFZdCkk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cdf3e07829e561f27d3080de0d8994aa58d2e67c --- /dev/null +++ b/annotations_filtered/rlMANFZdCkk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 26.99], [31.0, 30.77], [31.0, 31.77], [33.0, 33.67], [45.0, 63.14], [76.0, 76.54], [77.0, 78.17], [80.0, 81.55], [82.0, 83.05], [85.0, 85.21], [85.0, 85.6], [98.0, 99.94], [104.0, 104.73], [116.0, 117.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 87.74], ["funk", 0.9], ["musical instrument", 0.79]], null, null, null, null, null, null, null, null, null], "duration": [0.99, -0.23, 0.77, 0.67, 18.14, 0.54, 1.17, 1.55, 1.05, 0.21, 0.6, 1.94, 0.73, 1.09]} \ No newline at end of file diff --git a/annotations_filtered/rlX19RmlimM_filtered.json b/annotations_filtered/rlX19RmlimM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6e4e4d0cfef2bc64bac5ba9c30e161b91cf25235 --- /dev/null +++ b/annotations_filtered/rlX19RmlimM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.98], [7.0, 12.43], [13.0, 26.74], [30.0, 31.01], [50.0, 59.1], [61.0, 61.11], [63.0, 66.33]], "keep_status": [false, true, true, false, false, false, false], "silence_prob": [0.0, 38.06, 31.15, 0.0, 41.54, 0.0, 66.76], "audiomae_on_audioset": [null, [["applause", 24.23], ["crowd", 7.43], ["whale vocalization", 6.35]], [["music", 20.72], ["fly, housefly", 15.97], ["insect", 9.47]], null, [["music", 55.79], ["speech", 19.2], ["bleat", 2.57]], null, null], "duration": [-0.02, 5.43, 13.74, 1.01, 9.1, 0.11, 3.33]} \ No newline at end of file diff --git a/annotations_filtered/rlXKgVlILbM_filtered.json b/annotations_filtered/rlXKgVlILbM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b610c144b5c14d27e61761c1676e887a8b877561 --- /dev/null +++ b/annotations_filtered/rlXKgVlILbM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.61], [2.0, 2.79], [3.0, 3.7], [7.0, 8.31], [16.0, 16.14], [18.0, 18.66], [20.0, 20.82], [25.0, 25.07], [32.0, 33.81], [35.0, 35.09], [37.0, 42.04], [42.0, 42.94], [47.0, 47.55], [62.0, 62.45], [64.0, 65.92], [68.0, 68.55], [73.0, 73.8], [90.0, 89.65], [92.0, 92.57], [108.0, 108.51], [113.0, 112.99], [116.0, 116.19], [117.0, 117.51], [119.0, 118.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.57, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.61, 0.79, 0.7, 1.31, 0.14, 0.66, 0.82, 0.07, 1.81, 0.09, 5.04, 0.94, 0.55, 0.45, 1.92, 0.55, 0.8, -0.35, 0.57, 0.51, -0.01, 0.19, 0.51, -0.09]} \ No newline at end of file diff --git a/annotations_filtered/rlaRlCFXUqk_filtered.json b/annotations_filtered/rlaRlCFXUqk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..709eaa661c602afe8cdb0333e22b13bc69b1ff77 --- /dev/null +++ b/annotations_filtered/rlaRlCFXUqk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.62], [6.0, 6.07], [7.0, 8.07], [9.0, 14.08], [15.0, 15.03], [17.0, 18.42], [19.0, 20.02], [21.0, 28.71], [31.0, 31.11], [37.0, 36.69], [43.0, 44.49], [54.0, 55.14], [56.0, 57.1], [67.0, 67.2], [76.0, 77.11], [81.0, 80.92], [81.0, 88.8], [91.0, 91.1], [92.0, 94.61], [99.0, 103.76], [107.0, 108.11], [113.0, 116.16], [121.0, 121.91], [133.0, 133.71], [140.0, 142.97], [145.0, 145.37], [147.0, 147.7], [151.0, 151.82], [155.0, 156.83], [158.0, 159.27], [163.0, 163.0], [166.0, 167.16], [171.0, 172.59]], "keep_status": [false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 38.54, 0.0, 0.0, 0.0, 49.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.26, 0.0, 65.2, 45.92, 0.0, 49.18, 0.0, 0.0, 66.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 19.79], ["hum", 7.49], ["mains hum", 5.55]], null, null, null, [["hum", 26.06], ["music", 19.06], ["rumble", 18.96]], null, null, null, null, null, null, null, null, [["mains hum", 38.56], ["hum", 31.08], ["speech", 10.8]], null, null, [["music", 44.58], ["electronic music", 10.38], ["gong", 9.96]], null, [["music", 31.05], ["sonar", 9.21], ["ambient music", 7.24]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.62, 0.07, 1.07, 5.08, 0.03, 1.42, 1.02, 7.71, 0.11, -0.31, 1.49, 1.14, 1.1, 0.2, 1.11, -0.08, 7.8, 0.1, 2.61, 4.76, 1.11, 3.16, 0.91, 0.71, 2.97, 0.37, 0.7, 0.82, 1.83, 1.27, 0.0, 1.16, 1.59]} \ No newline at end of file diff --git a/annotations_filtered/rllKhsQXZXI_filtered.json b/annotations_filtered/rllKhsQXZXI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5a79dffbea418c7c9e1e8c1e18bd9fe2bc68064f --- /dev/null +++ b/annotations_filtered/rllKhsQXZXI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 23.01], [24.0, 27.84], [29.0, 29.44], [30.0, 32.31], [34.0, 52.93], [55.0, 55.95], [56.0, 56.1], [56.0, 84.86], [85.0, 102.81]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 99.88, 0.0, 100.0, 95.78, 0.0, 0.0, 99.8, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [2.01, 3.84, 0.44, 2.31, 18.93, 0.95, 0.1, 28.86, 17.81]} \ No newline at end of file diff --git a/annotations_filtered/rm49NpSVgo4_filtered.json b/annotations_filtered/rm49NpSVgo4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..23e0ef087477bd26ab234def09b6762a12ce14b9 --- /dev/null +++ b/annotations_filtered/rm49NpSVgo4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.54], [3.0, 3.67], [13.0, 13.34], [15.0, 15.23], [18.0, 18.62], [21.0, 21.24], [26.0, 26.22], [38.0, 39.26], [48.0, 48.74]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.54, 0.67, 0.34, 0.23, 0.62, 0.24, 0.22, 1.26, 0.74]} \ No newline at end of file diff --git a/annotations_filtered/rmE6nTzmDqI_filtered.json b/annotations_filtered/rmE6nTzmDqI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..28c48cc68b5e71b544465b388dca07d3c1d832a4 --- /dev/null +++ b/annotations_filtered/rmE6nTzmDqI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.48], [11.0, 12.21], [16.0, 16.34], [21.0, 22.22], [25.0, 25.29], [27.0, 28.56], [32.0, 32.63], [37.0, 37.83], [39.0, 69.35], [70.0, 73.08], [74.0, 80.45], [81.0, 87.94], [89.0, 101.65], [104.0, 103.91], [105.0, 105.6], [107.0, 108.8], [110.0, 112.92], [118.0, 119.53], [123.0, 124.7], [126.0, 128.56], [130.0, 139.38], [141.0, 143.83], [145.0, 145.77], [146.0, 149.89], [150.0, 156.17], [160.0, 163.27], [166.0, 166.14], [168.0, 169.45], [171.0, 178.82]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, true, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [99.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.51, 39.54, 36.62, 47.27, 0.0, 0.0, 0.0, 64.07, 0.0, 0.0, 93.76, 47.54, 75.72, 0.0, 51.66, 54.63, 87.55, 0.0, 0.0, 85.9], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 29.08], ["synthesizer", 11.46], ["speech", 6.4]], [["music", 23.19], ["synthesizer", 16.03], ["hum", 9.72]], [["music", 30.74], ["hum", 16.56], ["synthesizer", 10.25]], [["speech", 24.52], ["music", 18.94], ["mains hum", 17.2]], null, null, null, null, null, null, null, [["speech", 27.66], ["mains hum", 25.63], ["hum", 14.03]], null, null, null, null, null, null, null, null], "duration": [3.48, 1.21, 0.34, 1.22, 0.29, 1.56, 0.63, 0.83, 30.35, 3.08, 6.45, 6.94, 12.65, -0.09, 0.6, 1.8, 2.92, 1.53, 1.7, 2.56, 9.38, 2.83, 0.77, 3.89, 6.17, 3.27, 0.14, 1.45, 7.82]} \ No newline at end of file diff --git a/annotations_filtered/rmpFmJfEZXs_filtered.json b/annotations_filtered/rmpFmJfEZXs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e613c599b6357b000c1996d76facac3076fb1de --- /dev/null +++ b/annotations_filtered/rmpFmJfEZXs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[44.0, 46.43], [46.0, 47.95], [65.0, 69.11], [69.0, 70.04], [71.0, 71.44], [74.0, 74.56], [75.0, 77.57], [81.0, 81.24], [85.0, 85.24], [86.0, 86.59], [89.0, 89.13], [90.0, 89.87], [107.0, 107.87], [111.0, 121.2], [139.0, 139.38], [140.0, 144.91], [181.0, 187.69], [190.0, 194.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [66.76, 0.0, 88.1, 0.0, 0.0, 0.0, 99.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.83, 0.0, 43.9, 38.11, 33.66], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 28.08], ["whack, thwack", 10.52], ["hammer", 8.84]], null, [["music", 66.68], ["didgeridoo", 8.57], ["musical instrument", 6.08]], [["speech", 31.91], ["music", 30.03], ["crushing", 13.91]], [["fly, housefly", 39.02], ["music", 21.21], ["mosquito", 14.93]]], "duration": [2.43, 1.95, 4.11, 1.04, 0.44, 0.56, 2.57, 0.24, 0.24, 0.59, 0.13, -0.13, 0.87, 10.2, 0.38, 4.91, 6.69, 4.66]} \ No newline at end of file diff --git a/annotations_filtered/rnTrWINYDsM_filtered.json b/annotations_filtered/rnTrWINYDsM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f5b72683d849200b19871acceef0ab655461a5c1 --- /dev/null +++ b/annotations_filtered/rnTrWINYDsM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.23], [12.0, 13.07], [18.0, 18.3], [30.0, 36.98], [38.0, 52.25], [70.0, 71.46], [73.0, 73.41], [77.0, 78.43], [79.0, 80.35], [86.0, 87.94], [90.0, 90.05], [92.0, 94.95], [98.0, 98.17], [104.0, 105.22], [108.0, 108.84], [112.0, 112.87], [122.0, 125.59], [137.0, 137.64], [140.0, 141.54], [149.0, 151.39], [156.0, 157.77], [163.0, 168.93], [170.0, 170.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 70.86, 50.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.87, 0.0, 0.0, 0.0, 0.0, 31.15, 0.0, 0.0, 45.02, 0.0, 34.8, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 41.05], ["music", 33.49], ["sidetone", 2.26]], null, null, null, null, [["music", 33.73], ["synthesizer", 7.35], ["hum", 6.64]], null, null, [["music", 86.5], ["sampler", 1.21], ["synthesizer", 0.88]], null, [["music", 62.83], ["throbbing", 7.23], ["electronic music", 6.53]], null], "duration": [0.23, 1.07, 0.3, 6.98, 14.25, 1.46, 0.41, 1.43, 1.35, 1.94, 0.05, 2.95, 0.17, 1.22, 0.84, 0.87, 3.59, 0.64, 1.54, 2.39, 1.77, 5.93, 0.24]} \ No newline at end of file diff --git a/annotations_filtered/rnaCi4rBfqw_filtered.json b/annotations_filtered/rnaCi4rBfqw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d28e6859714c6c7f66f9ba8bf0f97c0f6e3d4e07 --- /dev/null +++ b/annotations_filtered/rnaCi4rBfqw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.7], [18.0, 18.67], [21.0, 22.0], [22.0, 23.41], [24.0, 24.73], [27.0, 27.6], [35.0, 36.21], [37.0, 37.71], [43.0, 43.19], [43.0, 45.62], [48.0, 48.91], [50.0, 62.58], [65.0, 103.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.15, 0.0, 33.5, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 55.78], ["trombone", 14.21], ["brass instrument", 9.45]], null, [["music", 68.89], ["musical instrument", 7.66], ["effects unit", 2.4]], null], "duration": [0.7, 0.67, 1.0, 1.41, 0.73, 0.6, 1.21, 0.71, 0.19, 2.62, 0.91, 12.58, 38.5]} \ No newline at end of file diff --git a/annotations_filtered/rnbDA4wKrg0_filtered.json b/annotations_filtered/rnbDA4wKrg0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ddd48e4b6fda94a75f7d539b507b7cfc35e86686 --- /dev/null +++ b/annotations_filtered/rnbDA4wKrg0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.4], [10.0, 9.81], [13.0, 14.45], [15.0, 17.36], [19.0, 22.79], [23.0, 25.83], [26.0, 28.43], [30.0, 32.61], [34.0, 36.02], [37.0, 38.69], [44.0, 46.79], [48.0, 52.02], [53.0, 63.04], [70.0, 70.09], [72.0, 72.12], [76.0, 76.11], [77.0, 77.08], [79.0, 78.75], [79.0, 80.52], [82.0, 82.54], [85.0, 85.46], [87.0, 90.83], [94.0, 95.4], [98.0, 99.06], [101.0, 101.82], [104.0, 103.77], [105.0, 105.11], [106.0, 106.76], [111.0, 110.62], [112.0, 112.4], [113.0, 113.54], [117.0, 118.56], [119.0, 119.42], [123.0, 123.9], [125.0, 125.22], [126.0, 126.64], [132.0, 132.49], [133.0, 134.3], [135.0, 136.09], [137.0, 137.4], [138.0, 138.86], [140.0, 140.56], [142.0, 142.77], [143.0, 146.01], [146.0, 147.87], [148.0, 150.82], [154.0, 155.21], [156.0, 158.04], [161.0, 161.01], [164.0, 166.18], [168.0, 168.18]], "keep_status": [false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false], "silence_prob": [86.27, 0.0, 0.0, 99.87, 99.78, 52.1, 32.13, 47.05, 100.0, 0.0, 29.87, 100.0, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.59, 0.0, 38.03, 0.0, 100.0, 0.0, 47.43, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 48.35], ["busy signal", 34.24], ["dial tone", 7.88]], [["speech", 45.05], ["dial tone", 5.83], ["telephone", 3.82]], null, null, [["boing", 25.87], ["animal", 13.76], ["echo", 5.69]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 42.29], ["sine wave", 13.22], ["sidetone", 10.77]], null, null, null, [["speech", 35.65], ["frog", 11.71], ["croak", 5.33]], null], "duration": [2.4, -0.19, 1.45, 2.36, 3.79, 2.83, 2.43, 2.61, 2.02, 1.69, 2.79, 4.02, 10.04, 0.09, 0.12, 0.11, 0.08, -0.25, 1.52, 0.54, 0.46, 3.83, 1.4, 1.06, 0.82, -0.23, 0.11, 0.76, -0.38, 0.4, 0.54, 1.56, 0.42, 0.9, 0.22, 0.64, 0.49, 1.3, 1.09, 0.4, 0.86, 0.56, 0.77, 3.01, 1.87, 2.82, 1.21, 2.04, 0.01, 2.18, 0.18]} \ No newline at end of file diff --git a/annotations_filtered/rngwd6ExGmc_filtered.json b/annotations_filtered/rngwd6ExGmc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..233c297f9e21f72de4881b30402d202ca3f1d882 --- /dev/null +++ b/annotations_filtered/rngwd6ExGmc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.72], [5.0, 5.68], [8.0, 8.67], [11.0, 11.94], [12.0, 13.22], [17.0, 17.2], [18.0, 19.45], [21.0, 21.25], [27.0, 29.0]], "keep_status": [false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.4], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 28.39], ["speech", 8.97], ["musical instrument", 7.62]]], "duration": [0.72, 0.68, 0.67, 0.94, 1.22, 0.2, 1.45, 0.25, 2.0]} \ No newline at end of file diff --git a/annotations_filtered/rnnt0KYtwFc_filtered.json b/annotations_filtered/rnnt0KYtwFc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e0a9f4a245cf2a7c8a77d367f1a9eaf6458aac3d --- /dev/null +++ b/annotations_filtered/rnnt0KYtwFc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.36], [16.0, 17.85], [19.0, 22.79], [27.0, 31.53], [35.0, 36.75], [40.0, 44.64], [47.0, 52.62], [54.0, 61.82], [64.0, 68.82], [71.0, 71.88], [75.0, 75.57], [78.0, 78.33], [81.0, 88.45], [92.0, 93.34], [98.0, 99.55], [103.0, 105.48]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 79.07, 94.66, 0.0, 91.47, 32.79, 40.88, 70.44, 0.0, 0.0, 0.0, 76.2, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 30.18], ["ding", 18.09], ["clang", 17.05]], [["music", 30.0], ["speech", 23.76], ["fly, housefly", 6.55]], null, null, null, null, null, null, null, null], "duration": [0.36, 1.85, 3.79, 4.53, 1.75, 4.64, 5.62, 7.82, 4.82, 0.88, 0.57, 0.33, 7.45, 1.34, 1.55, 2.48]} \ No newline at end of file diff --git a/annotations_filtered/rny3UdYPDn0_filtered.json b/annotations_filtered/rny3UdYPDn0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d4ba822bf3ebb78fcb22ae69c0ed2cc8fbc2ae8 --- /dev/null +++ b/annotations_filtered/rny3UdYPDn0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.17], [12.0, 29.74], [34.0, 35.56], [38.0, 40.41], [44.0, 44.61], [49.0, 49.72], [50.0, 50.13], [63.0, 63.51], [74.0, 74.93], [95.0, 96.96], [102.0, 101.97], [113.0, 115.11], [116.0, 116.65], [121.0, 121.51], [123.0, 123.74], [124.0, 134.87], [136.0, 137.2], [138.0, 138.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [46.19, 43.3, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.8, 0.0, 0.0, 0.0, 35.14, 0.0, 0.0], "audiomae_on_audioset": [[["music", 67.15], ["throbbing", 4.18], ["hum", 3.92]], [["throbbing", 56.52], ["hum", 23.27], ["music", 9.81]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 35.08], ["insect", 15.36], ["music", 12.6]], null, null], "duration": [4.17, 17.74, 1.56, 2.41, 0.61, 0.72, 0.13, 0.51, 0.93, 1.96, -0.03, 2.11, 0.65, 0.51, 0.74, 10.87, 1.2, 0.59]} \ No newline at end of file diff --git a/annotations_filtered/ro74_tScvSA_filtered.json b/annotations_filtered/ro74_tScvSA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cfbf54087f3ac6326796a1afd3a2a9570a8767d0 --- /dev/null +++ b/annotations_filtered/ro74_tScvSA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.5], [6.0, 5.7], [7.0, 6.93], [10.0, 11.48], [14.0, 14.84], [15.0, 19.21], [40.0, 39.93], [43.0, 44.12], [53.0, 54.48], [56.0, 62.99], [67.0, 71.14], [73.0, 74.21], [75.0, 77.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 44.18, 0.0, 0.0, 0.0, 69.74, 77.03, 0.0, 33.74], "audiomae_on_audioset": [null, null, null, null, null, [["fly, housefly", 28.9], ["insect", 21.16], ["music", 20.01]], null, null, null, null, null, null, [["music", 52.6], ["speech", 15.05], ["whack, thwack", 4.07]]], "duration": [1.5, -0.3, -0.07, 1.48, 0.84, 4.21, -0.07, 1.12, 1.48, 6.99, 4.14, 1.21, 2.73]} \ No newline at end of file diff --git a/annotations_filtered/roA5fvzJsho_filtered.json b/annotations_filtered/roA5fvzJsho_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd52a2a947c8b3d6fcf45507a2e8ef473dfb520a --- /dev/null +++ b/annotations_filtered/roA5fvzJsho_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.2], [7.0, 18.67], [20.0, 26.89], [27.0, 28.21], [33.0, 34.65], [37.0, 38.96], [45.0, 47.22], [48.0, 50.57]], "keep_status": [false, true, false, false, false, false, false, false], "silence_prob": [90.25, 35.11, 58.81, 0.0, 0.0, 0.0, 88.28, 78.55], "audiomae_on_audioset": [null, [["speech", 26.9], ["hum", 19.78], ["rumble", 10.6]], null, null, null, null, null, null], "duration": [3.2, 11.67, 6.89, 1.21, 1.65, 1.96, 2.22, 2.57]} \ No newline at end of file diff --git a/annotations_filtered/roLboEc4M-w_filtered.json b/annotations_filtered/roLboEc4M-w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..62b5c3c33709c26f73dc94f3525c65a3dd13c076 --- /dev/null +++ b/annotations_filtered/roLboEc4M-w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.84], [9.0, 9.54], [12.0, 13.46], [14.0, 14.25], [14.0, 14.52], [15.0, 14.61], [18.0, 19.38], [28.0, 33.2], [34.0, 36.37], [37.0, 38.31], [40.0, 41.82], [43.0, 44.22], [45.0, 47.06], [52.0, 53.42], [55.0, 56.0], [64.0, 64.35], [67.0, 68.34], [73.0, 73.63], [76.0, 76.38], [77.0, 79.88], [83.0, 83.22], [84.0, 84.82], [86.0, 88.87], [92.0, 92.52], [95.0, 102.32], [105.0, 106.1], [108.0, 109.76], [111.0, 111.4], [113.0, 113.24], [115.0, 115.25], [116.0, 116.8], [119.0, 124.28], [125.0, 126.01], [128.0, 128.61], [129.0, 129.76], [132.0, 133.68], [136.0, 137.46], [138.0, 144.24], [150.0, 151.66], [153.0, 153.91], [160.0, 161.49], [162.0, 163.31], [164.0, 165.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.82, 76.53, 0.0, 0.0, 0.0, 48.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.39, 0.0, 0.0, 47.12, 0.0, 49.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.42, 0.0, 0.0, 0.0, 0.0, 0.0, 76.2, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 35.84], ["hum", 11.08], ["whale vocalization", 8.36]], null, null, null, null, null, null, null, null, null, [["speech", 29.4], ["music", 25.6], ["hum", 4.96]], null, [["music", 54.85], ["hum", 7.71], ["mains hum", 7.27]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.84, 0.54, 1.46, 0.25, 0.52, -0.39, 1.38, 5.2, 2.37, 1.31, 1.82, 1.22, 2.06, 1.42, 1.0, 0.35, 1.34, 0.63, 0.38, 2.88, 0.22, 0.82, 2.87, 0.52, 7.32, 1.1, 1.76, 0.4, 0.24, 0.25, 0.8, 5.28, 1.01, 0.61, 0.76, 1.68, 1.46, 6.24, 1.66, 0.91, 1.49, 1.31, 1.52]} \ No newline at end of file diff --git a/annotations_filtered/roST4TM0ccM_filtered.json b/annotations_filtered/roST4TM0ccM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5398246235d982e2ab0f68faf99b4a57377e035c --- /dev/null +++ b/annotations_filtered/roST4TM0ccM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.48], [0.0, 1.09], [2.0, 8.43], [9.0, 13.76], [14.0, 14.5], [15.0, 16.07], [17.0, 35.38], [38.0, 37.81], [40.0, 45.17], [54.0, 56.24], [57.0, 57.1], [58.0, 57.96], [65.0, 65.64], [67.0, 73.92], [77.0, 93.21], [99.0, 108.82], [112.0, 112.14], [114.0, 114.0], [115.0, 132.29], [135.0, 136.11], [136.0, 136.95], [139.0, 153.81], [157.0, 157.27], [158.0, 162.3], [163.0, 171.31], [183.0, 193.94]], "keep_status": [false, false, true, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false], "silence_prob": [0.0, 0.0, 35.58, 38.35, 0.0, 0.0, 35.68, 0.0, 30.23, 68.8, 0.0, 0.0, 0.0, 40.77, 31.1, 31.45, 0.0, 0.0, 29.19, 0.0, 0.0, 30.43, 0.0, 35.39, 44.55, 51.66], "audiomae_on_audioset": [null, null, [["speech", 17.14], ["livestock, farm animals, working animals", 14.84], ["moo", 12.4]], [["fire", 19.25], ["speech", 12.85], ["rain", 10.11]], null, null, [["music", 30.12], ["speech", 25.34], ["theremin", 15.81]], null, [["speech", 25.41], ["music", 17.4], ["livestock, farm animals, working animals", 5.37]], null, null, null, null, [["throbbing", 34.13], ["hum", 27.63], ["mains hum", 11.46]], [["music", 55.81], ["fart", 7.92], ["groan", 7.91]], [["music", 55.93], ["speech", 18.68], ["throbbing", 4.42]], null, null, [["music", 37.9], ["speech", 27.92], ["whack, thwack", 8.34]], null, null, [["music", 57.27], ["sidetone", 2.88], ["speech", 2.87]], null, [["speech", 37.13], ["music", 22.16], ["noise", 6.26]], [["hum", 35.54], ["mains hum", 17.89], ["music", 15.31]], null], "duration": [0.48, 1.09, 6.43, 4.76, 0.5, 1.07, 18.38, -0.19, 5.17, 2.24, 0.1, -0.04, 0.64, 6.92, 16.21, 9.82, 0.14, 0.0, 17.29, 1.11, 0.95, 14.81, 0.27, 4.3, 8.31, 10.94]} \ No newline at end of file diff --git a/annotations_filtered/roaWSb9xc8I_filtered.json b/annotations_filtered/roaWSb9xc8I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..96d5c23e76df7f6713c785a5c35956338a172c3c --- /dev/null +++ b/annotations_filtered/roaWSb9xc8I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[44.0, 45.45], [49.0, 53.01], [54.0, 56.08], [57.0, 76.64], [79.0, 81.06], [83.0, 89.46], [91.0, 107.7], [111.0, 157.47]], "keep_status": [false, false, false, false, false, true, false, false], "silence_prob": [0.0, 69.61, 66.39, 50.66, 65.09, 29.42, 33.13, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 43.59], ["hum", 9.92], ["machine gun", 9.58]], [["music", 73.43], ["hum", 8.42], ["electronic music", 4.58]], null], "duration": [1.45, 4.01, 2.08, 19.64, 2.06, 6.46, 16.7, 46.47]} \ No newline at end of file diff --git a/annotations_filtered/roeLoZuFI1I_filtered.json b/annotations_filtered/roeLoZuFI1I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f39298ac0c482c1d8f08a29787480ad618f61ad --- /dev/null +++ b/annotations_filtered/roeLoZuFI1I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 28.14]], "keep_status": [true], "silence_prob": [29.79], "audiomae_on_audioset": [[["music", 23.78], ["speech", 18.75], ["hum", 15.78]]], "duration": [22.14]} \ No newline at end of file diff --git a/annotations_filtered/roxNsu1YELE_filtered.json b/annotations_filtered/roxNsu1YELE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b8545fd83051f04d965999d3d4763e966878221e --- /dev/null +++ b/annotations_filtered/roxNsu1YELE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 40.86], [42.0, 65.06]], "keep_status": [true, false], "silence_prob": [30.77, 31.29], "audiomae_on_audioset": [[["music", 44.27], ["throbbing", 14.56], ["hum", 6.48]], [["throbbing", 45.41], ["music", 19.61], ["hum", 11.87]]], "duration": [12.86, 23.06]} \ No newline at end of file diff --git a/annotations_filtered/rp4nf7xR9Uk_filtered.json b/annotations_filtered/rp4nf7xR9Uk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b00dc08d29260241691f94a8dec0293c39226a18 --- /dev/null +++ b/annotations_filtered/rp4nf7xR9Uk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.18], [7.0, 7.67], [9.0, 11.52], [13.0, 14.25], [17.0, 20.38], [21.0, 23.18], [24.0, 25.08], [26.0, 26.92], [29.0, 29.89], [31.0, 32.24], [35.0, 36.42], [37.0, 38.26], [39.0, 42.77], [44.0, 53.91], [55.0, 58.04], [59.0, 60.12], [61.0, 63.26], [66.0, 67.81], [83.0, 83.17], [83.0, 83.34], [86.0, 86.0], [94.0, 95.39], [97.0, 97.78], [102.0, 103.62], [105.0, 106.39], [108.0, 109.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 67.38, 0.0, 72.01, 80.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.13, 44.78, 54.23, 0.0, 54.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["singing bowl", 16.79], ["sine wave", 11.13], ["music", 10.12]], [["music", 32.19], ["hum", 23.89], ["mains hum", 14.38]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.18, 0.67, 2.52, 1.25, 3.38, 2.18, 1.08, 0.92, 0.89, 1.24, 1.42, 1.26, 3.77, 9.91, 3.04, 1.12, 2.26, 1.81, 0.17, 0.34, 0.0, 1.39, 0.78, 1.62, 1.39, 1.68]} \ No newline at end of file diff --git a/annotations_filtered/rpPm4pAJQbc_filtered.json b/annotations_filtered/rpPm4pAJQbc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..83e2b4ca1e669867ccfa799871290e3c825c9b47 --- /dev/null +++ b/annotations_filtered/rpPm4pAJQbc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 24.66], [46.0, 45.66], [46.0, 46.84], [66.0, 66.26], [79.0, 79.2], [79.0, 79.27], [79.0, 79.39], [87.0, 86.71], [89.0, 89.45], [99.0, 99.25]], "keep_status": [true, false, false, false, false, false, false, false, false, false], "silence_prob": [28.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 52.05], ["trombone", 13.73], ["musical instrument", 2.66]], null, null, null, null, null, null, null, null, null], "duration": [13.66, -0.34, 0.84, 0.26, 0.2, 0.27, 0.39, -0.29, 0.45, 0.25]} \ No newline at end of file diff --git a/annotations_filtered/rpUPWSqadTo_filtered.json b/annotations_filtered/rpUPWSqadTo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b0ab89d814a2b6354254b92163ce78234e2cad0 --- /dev/null +++ b/annotations_filtered/rpUPWSqadTo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.9], [6.0, 7.4], [13.0, 15.01], [31.0, 31.18], [32.0, 33.08], [38.0, 48.83], [51.0, 54.16], [57.0, 61.99], [84.0, 85.77], [86.0, 87.13], [90.0, 96.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 98.93, 0.0, 0.0, 98.66, 98.36, 99.48, 0.0, 0.0, 96.77], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [1.9, 1.4, 2.01, 0.18, 1.08, 10.83, 3.16, 4.99, 1.77, 1.13, 6.52]} \ No newline at end of file diff --git a/annotations_filtered/rpdnpip1X4A_filtered.json b/annotations_filtered/rpdnpip1X4A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cfd9710e55e491f0f2d010bcf60a2c14b22e9119 --- /dev/null +++ b/annotations_filtered/rpdnpip1X4A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.28], [6.0, 7.38], [10.0, 10.23], [11.0, 12.43], [15.0, 16.06], [17.0, 17.46], [19.0, 19.26], [21.0, 24.83], [27.0, 28.44], [30.0, 30.86], [32.0, 37.89], [41.0, 41.59], [43.0, 44.36], [46.0, 46.31], [48.0, 48.49], [50.0, 56.07], [57.0, 57.03], [58.0, 59.04], [59.0, 61.6], [66.0, 66.34], [67.0, 67.61], [75.0, 75.79], [76.0, 76.77], [78.0, 78.11], [80.0, 81.09], [83.0, 84.06], [85.0, 85.82], [88.0, 88.7], [90.0, 92.4], [93.0, 93.75], [95.0, 95.96], [97.0, 98.1], [100.0, 99.99], [105.0, 105.38], [106.0, 106.71], [108.0, 107.74], [109.0, 109.39], [111.0, 113.02], [114.0, 114.66], [115.0, 115.4], [116.0, 116.82], [120.0, 121.0], [125.0, 125.59], [128.0, 129.14], [133.0, 133.32], [134.0, 134.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.04, 0.0, 0.0, 45.36, 0.0, 0.0, 0.0, 0.0, 59.68, 0.0, 0.0, 62.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 67.38], ["didgeridoo", 12.73], ["musical instrument", 5.26]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.28, 1.38, 0.23, 1.43, 1.06, 0.46, 0.26, 3.83, 1.44, 0.86, 5.89, 0.59, 1.36, 0.31, 0.49, 6.07, 0.03, 1.04, 2.6, 0.34, 0.61, 0.79, 0.77, 0.11, 1.09, 1.06, 0.82, 0.7, 2.4, 0.75, 0.96, 1.1, -0.01, 0.38, 0.71, -0.26, 0.39, 2.02, 0.66, 0.4, 0.82, 1.0, 0.59, 1.14, 0.32, 0.55]} \ No newline at end of file diff --git a/annotations_filtered/rpp930f_fhU_filtered.json b/annotations_filtered/rpp930f_fhU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..861d9ccde7bafdf928f0ffdcd31fed8eb1c9b5d1 --- /dev/null +++ b/annotations_filtered/rpp930f_fhU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.88], [5.0, 9.61], [11.0, 12.43], [14.0, 19.2], [20.0, 20.97], [21.0, 22.13], [23.0, 27.23], [28.0, 28.51], [29.0, 32.44], [33.0, 34.08], [35.0, 35.58], [36.0, 35.61], [36.0, 35.7], [36.0, 40.19], [41.0, 41.15], [42.0, 42.57], [44.0, 44.69], [45.0, 46.08], [46.0, 47.19], [48.0, 47.88], [49.0, 49.0], [50.0, 50.19], [51.0, 52.15], [53.0, 58.73], [60.0, 60.83], [62.0, 73.87], [74.0, 75.03], [76.0, 76.76], [78.0, 79.1], [81.0, 81.41], [83.0, 82.76], [84.0, 84.6], [86.0, 86.78], [88.0, 88.42], [92.0, 93.88], [95.0, 95.34], [96.0, 97.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 94.37, 0.0, 51.94, 0.0, 0.0, 65.91, 0.0, 85.17, 0.0, 0.0, 0.0, 0.0, 46.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.14, 0.0, 33.06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["fart", 24.33], ["hum", 13.7], ["mains hum", 9.08]], null, null, null, null, null, null, null, null, null, [["noise", 15.99], ["fart", 10.08], ["cough", 9.44]], null, [["music", 83.76], ["guitar", 4.14], ["plucked string instrument", 1.94]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.88, 4.61, 1.43, 5.2, 0.97, 1.13, 4.23, 0.51, 3.44, 1.08, 0.58, -0.39, -0.3, 4.19, 0.15, 0.57, 0.69, 1.08, 1.19, -0.12, 0.0, 0.19, 1.15, 5.73, 0.83, 11.87, 1.03, 0.76, 1.1, 0.41, -0.24, 0.6, 0.78, 0.42, 1.88, 0.34, 1.21]} \ No newline at end of file diff --git a/annotations_filtered/rpqgDDBcmcI_filtered.json b/annotations_filtered/rpqgDDBcmcI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..12a3c2106328d982d207deec6dd1704a4df221df --- /dev/null +++ b/annotations_filtered/rpqgDDBcmcI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.33], [6.0, 6.3], [16.0, 22.62], [24.0, 24.66], [26.0, 26.18], [27.0, 36.98], [40.0, 41.49], [42.0, 79.12], [79.0, 79.64], [91.0, 94.83], [95.0, 99.4], [101.0, 111.2], [112.0, 112.89], [116.0, 118.08], [119.0, 128.9], [129.0, 131.95], [133.0, 133.14], [141.0, 160.41], [161.0, 161.3]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, true, false, false, true, false, false, false, false], "silence_prob": [36.33, 0.0, 29.0, 0.0, 0.0, 29.11, 0.0, 0.0, 0.0, 31.33, 31.41, 29.99, 0.0, 28.99, 29.27, 28.73, 0.0, 29.78, 0.0], "audiomae_on_audioset": [[["music", 50.97], ["throbbing", 18.91], ["hum", 11.56]], null, [["music", 52.95], ["speech", 9.14], ["throbbing", 8.65]], null, null, [["music", 57.68], ["throbbing", 7.67], ["electronic music", 5.97]], null, null, null, [["music", 48.32], ["hum", 8.0], ["throbbing", 5.96]], [["music", 36.18], ["throbbing", 12.82], ["hum", 10.2]], [["speech", 38.29], ["hum", 12.26], ["mains hum", 9.1]], null, [["music", 75.47], ["throbbing", 2.15], ["cacophony", 1.97]], [["vehicle", 34.67], ["car", 16.92], ["music", 16.54]], [["music", 63.03], ["electronic music", 4.24], ["hum", 3.29]], null, [["hum", 42.17], ["throbbing", 16.1], ["mains hum", 12.93]], null], "duration": [3.33, 0.3, 6.62, 0.66, 0.18, 9.98, 1.49, 37.12, 0.64, 3.83, 4.4, 10.2, 0.89, 2.08, 9.9, 2.95, 0.14, 19.41, 0.3]} \ No newline at end of file diff --git a/annotations_filtered/rpvLdqBrY8s_filtered.json b/annotations_filtered/rpvLdqBrY8s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8f17935fd9bde03c1157c55a44b6d996db965e00 --- /dev/null +++ b/annotations_filtered/rpvLdqBrY8s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.65], [17.0, 16.88], [17.0, 18.55], [23.0, 22.72], [25.0, 25.22], [31.0, 31.82], [34.0, 34.37]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [0.65, -0.12, 1.55, -0.28, 0.22, 0.82, 0.37]} \ No newline at end of file diff --git a/annotations_filtered/rpy7vhvX8jw_filtered.json b/annotations_filtered/rpy7vhvX8jw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7405725b12817c190c4de45871afc71307d7b6cc --- /dev/null +++ b/annotations_filtered/rpy7vhvX8jw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.61], [7.0, 7.62], [11.0, 11.8], [14.0, 16.33], [18.0, 20.02], [23.0, 24.76], [26.0, 28.56], [31.0, 31.7], [33.0, 35.11], [36.0, 38.06], [41.0, 42.21], [48.0, 51.7], [53.0, 53.94], [58.0, 61.8], [63.0, 63.91], [67.0, 67.93], [69.0, 68.96], [72.0, 76.45], [79.0, 79.0], [82.0, 84.1], [88.0, 88.21], [91.0, 93.18], [94.0, 94.73], [99.0, 100.45], [104.0, 104.18], [104.0, 104.62], [109.0, 110.91], [113.0, 122.18], [123.0, 124.53], [125.0, 128.55], [129.0, 133.64], [136.0, 138.4], [140.0, 140.61], [142.0, 141.84], [144.0, 147.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.16, 89.36, 0.0, 95.23, 0.0, 86.09, 79.94, 0.0, 98.99, 0.0, 68.41, 0.0, 0.0, 0.0, 99.97, 0.0, 97.64, 0.0, 99.16, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 88.64, 99.91, 0.0, 0.0, 96.54], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.61, 0.62, 0.8, 2.33, 2.02, 1.76, 2.56, 0.7, 2.11, 2.06, 1.21, 3.7, 0.94, 3.8, 0.91, 0.93, -0.04, 4.45, 0.0, 2.1, 0.21, 2.18, 0.73, 1.45, 0.18, 0.62, 1.91, 9.18, 1.53, 3.55, 4.64, 2.4, 0.61, -0.16, 3.24]} \ No newline at end of file diff --git a/annotations_filtered/rqKaJ4Yp_oU_filtered.json b/annotations_filtered/rqKaJ4Yp_oU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa37dd148f00cf33f39bced5aaaf6c8c7c8cb345 --- /dev/null +++ b/annotations_filtered/rqKaJ4Yp_oU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 12.41], [14.0, 14.35], [17.0, 16.85], [18.0, 19.99], [21.0, 22.54], [23.0, 24.63], [25.0, 32.78], [34.0, 53.84], [57.0, 88.67], [89.0, 89.5], [90.0, 91.57], [92.0, 93.04], [96.0, 96.87], [104.0, 111.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [87.37, 0.0, 0.0, 0.0, 0.0, 0.0, 78.72, 36.25, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 83.94], ["musical instrument", 1.63], ["fart", 1.36]], null, null, null, null, null, null], "duration": [3.41, 0.35, -0.15, 1.99, 1.54, 1.63, 7.78, 19.84, 31.67, 0.5, 1.57, 1.04, 0.87, 7.92]} \ No newline at end of file diff --git a/annotations_filtered/rqS6CaouXwE_filtered.json b/annotations_filtered/rqS6CaouXwE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e0dda79ee062a6c5c3028d8a06cd78c0d7d4767 --- /dev/null +++ b/annotations_filtered/rqS6CaouXwE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 13.41], [16.0, 17.17], [18.0, 18.47], [21.0, 22.74], [23.0, 23.84], [25.0, 80.91], [82.0, 116.26]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [99.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [9.41, 1.17, 0.47, 1.74, 0.84, 55.91, 34.26]} \ No newline at end of file diff --git a/annotations_filtered/rqT82hS-rMw_filtered.json b/annotations_filtered/rqT82hS-rMw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..33f032f675a8fe20c59a99a73e5ca129c964d5d6 --- /dev/null +++ b/annotations_filtered/rqT82hS-rMw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.93], [4.0, 6.03], [20.0, 20.7], [25.0, 25.42], [28.0, 28.48], [30.0, 30.05], [32.0, 32.88], [37.0, 37.99], [43.0, 43.44], [55.0, 55.54], [62.0, 62.85], [65.0, 65.55], [71.0, 72.44], [80.0, 79.89], [81.0, 81.51], [88.0, 88.53], [89.0, 90.39], [94.0, 94.41], [96.0, 97.63], [99.0, 99.03], [109.0, 109.86], [111.0, 110.78], [112.0, 112.73], [114.0, 115.33], [116.0, 116.87], [120.0, 120.19], [121.0, 122.08]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 30.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 14.49], ["music", 10.71], ["hum", 10.18]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.93, 2.03, 0.7, 0.42, 0.48, 0.05, 0.88, 0.99, 0.44, 0.54, 0.85, 0.55, 1.44, -0.11, 0.51, 0.53, 1.39, 0.41, 1.63, 0.03, 0.86, -0.22, 0.73, 1.33, 0.87, 0.19, 1.08]} \ No newline at end of file diff --git a/annotations_filtered/rqVI2DmLI2Q_filtered.json b/annotations_filtered/rqVI2DmLI2Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92f0904c858ee4ea0b947a4df19b9054c9c457f2 --- /dev/null +++ b/annotations_filtered/rqVI2DmLI2Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 39.26], [55.0, 54.8], [60.0, 61.57], [66.0, 66.75], [77.0, 77.5], [78.0, 79.08], [80.0, 81.03], [83.0, 83.84], [86.0, 86.53], [87.0, 89.94], [92.0, 92.18], [93.0, 94.56], [96.0, 97.01], [100.0, 99.76], [107.0, 107.86]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [38.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.13, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 48.33], ["fart", 26.75], ["beatboxing", 2.57]], null, null, null, null, null, null, null, null, [["music", 35.77], ["groan", 18.01], ["grunt", 6.71]], null, null, null, null, null], "duration": [22.26, -0.2, 1.57, 0.75, 0.5, 1.08, 1.03, 0.84, 0.53, 2.94, 0.18, 1.56, 1.01, -0.24, 0.86]} \ No newline at end of file diff --git a/annotations_filtered/rqWz0oKJQ5E_filtered.json b/annotations_filtered/rqWz0oKJQ5E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b1a7f8db3be7db9ed173240816a0008c28a8be9d --- /dev/null +++ b/annotations_filtered/rqWz0oKJQ5E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 13.32], [15.0, 21.02], [22.0, 22.22], [23.0, 30.94], [34.0, 43.14], [46.0, 49.4], [54.0, 54.48], [56.0, 61.53], [62.0, 62.31]], "keep_status": [false, true, false, false, false, false, false, true, false], "silence_prob": [37.88, 30.03, 0.0, 30.26, 31.23, 69.61, 0.0, 43.96, 0.0], "audiomae_on_audioset": [[["music", 62.33], ["ambient music", 12.97], ["synthesizer", 2.59]], [["music", 38.35], ["brass instrument", 9.69], ["clarinet", 5.94]], null, [["music", 66.92], ["speech", 4.82], ["brass instrument", 3.33]], [["trombone", 37.58], ["music", 22.12], ["brass instrument", 21.77]], null, null, [["speech", 39.34], ["hum", 14.02], ["throbbing", 10.03]], null], "duration": [3.32, 6.02, 0.22, 7.94, 9.14, 3.4, 0.48, 5.53, 0.31]} \ No newline at end of file diff --git a/annotations_filtered/rqdEaDM2PWM_filtered.json b/annotations_filtered/rqdEaDM2PWM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c12fd68262e7c609ea14d7e405d4930704af7ba --- /dev/null +++ b/annotations_filtered/rqdEaDM2PWM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.63], [18.0, 41.96], [43.0, 44.34], [44.0, 45.71], [48.0, 52.54], [54.0, 62.46], [63.0, 64.44], [66.0, 77.55], [82.0, 83.17], [90.0, 93.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 36.31, 0.0, 0.0, 97.54, 54.63, 0.0, 64.75, 0.0, 99.82], "audiomae_on_audioset": [null, [["music", 60.75], ["sidetone", 21.58], ["thunk", 3.84]], null, null, null, null, null, null, null, null], "duration": [0.63, 23.96, 1.34, 1.71, 4.54, 8.46, 1.44, 11.55, 1.17, 3.77]} \ No newline at end of file diff --git a/annotations_filtered/rr6eufh4DA4_filtered.json b/annotations_filtered/rr6eufh4DA4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92013b80c2fce5d581e483bc076db399a65e94f1 --- /dev/null +++ b/annotations_filtered/rr6eufh4DA4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.32], [7.0, 9.69], [11.0, 11.28], [13.0, 16.02], [17.0, 20.98], [22.0, 25.56], [26.0, 27.87], [29.0, 30.74], [32.0, 34.84], [36.0, 36.75], [38.0, 38.45], [40.0, 45.5], [46.0, 62.11], [72.0, 74.33], [99.0, 99.33], [102.0, 102.86], [103.0, 103.11], [104.0, 104.65], [109.0, 109.11], [110.0, 110.52], [113.0, 113.09], [121.0, 121.8], [124.0, 123.94], [130.0, 131.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [90.6, 97.11, 0.0, 100.0, 100.0, 99.36, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 45.27, 85.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 53.88], ["telephone", 12.38], ["inside, small room", 10.96]], null, null, null, null, null, null, null, null, null, null, null], "duration": [4.32, 2.69, 0.28, 3.02, 3.98, 3.56, 1.87, 1.74, 2.84, 0.75, 0.45, 5.5, 16.11, 2.33, 0.33, 0.86, 0.11, 0.65, 0.11, 0.52, 0.09, 0.8, -0.06, 1.48]} \ No newline at end of file diff --git a/annotations_filtered/rrMvGHoW7aw_filtered.json b/annotations_filtered/rrMvGHoW7aw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9a77a0f61cfeac108d82299279d7b83be9878ec --- /dev/null +++ b/annotations_filtered/rrMvGHoW7aw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 8.88], [12.0, 12.66], [46.0, 46.36], [47.0, 47.16], [67.0, 67.47], [71.0, 71.32], [106.0, 106.68], [109.0, 109.34], [133.0, 133.51], [136.0, 136.56], [146.0, 149.12], [150.0, 151.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.7, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.12, 0.66, 0.36, 0.16, 0.47, 0.32, 0.68, 0.34, 0.51, 0.56, 3.12, 1.31]} \ No newline at end of file diff --git a/annotations_filtered/rrWLFKZafAc_filtered.json b/annotations_filtered/rrWLFKZafAc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f257af3f3a26be2309b0a677096a95de4d11adc8 --- /dev/null +++ b/annotations_filtered/rrWLFKZafAc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 67.15], [68.0, 89.85], [91.0, 91.56], [93.0, 93.72], [97.0, 98.0], [99.0, 100.87], [103.0, 102.95], [116.0, 116.24]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 30.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 43.93], ["speech", 20.15], ["throbbing", 8.12]], null, null, null, null, null, null], "duration": [62.15, 21.85, 0.56, 0.72, 1.0, 1.87, -0.05, 0.24]} \ No newline at end of file diff --git a/annotations_filtered/rrbEQDRYpy8_filtered.json b/annotations_filtered/rrbEQDRYpy8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6565ce911e0969272c343a3fa167f2e31d5efc51 --- /dev/null +++ b/annotations_filtered/rrbEQDRYpy8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.25], [8.0, 8.97], [11.0, 11.55], [14.0, 14.5], [33.0, 32.68], [40.0, 41.1], [42.0, 42.7], [46.0, 46.68], [48.0, 48.59], [53.0, 53.81], [55.0, 55.86], [57.0, 57.4], [59.0, 59.12], [60.0, 60.45], [62.0, 63.34], [75.0, 75.71], [76.0, 77.08], [78.0, 79.05], [80.0, 81.26], [95.0, 94.93], [96.0, 97.12], [100.0, 101.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.25, 0.97, 0.55, 0.5, -0.32, 1.1, 0.7, 0.68, 0.59, 0.81, 0.86, 0.4, 0.12, 0.45, 1.34, 0.71, 1.08, 1.05, 1.26, -0.07, 1.12, 1.16]} \ No newline at end of file diff --git a/annotations_filtered/rrejfviNpqE_filtered.json b/annotations_filtered/rrejfviNpqE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d0f0890b845848a26cdc48789ceaf0ddab91f27 --- /dev/null +++ b/annotations_filtered/rrejfviNpqE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.05], [33.0, 33.99], [35.0, 37.3], [40.0, 43.02], [44.0, 44.39], [51.0, 51.31], [52.0, 56.24], [59.0, 61.01], [65.0, 65.35], [68.0, 87.18], [90.0, 91.18], [93.0, 107.13], [111.0, 119.38], [121.0, 122.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 61.27, 79.24, 0.0, 0.0, 73.36, 51.71, 0.0, 51.82, 0.0, 34.1, 30.04, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 63.41], ["musical instrument", 6.23], ["didgeridoo", 4.41]], [["music", 67.26], ["speech", 10.64], ["boing", 3.97]], null], "duration": [0.05, 0.99, 2.3, 3.02, 0.39, 0.31, 4.24, 2.01, 0.35, 19.18, 1.18, 14.13, 8.38, 1.22]} \ No newline at end of file diff --git a/annotations_filtered/rroHhssQbok_filtered.json b/annotations_filtered/rroHhssQbok_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..81b14f10dae14cc82ff476739da72065380fb384 --- /dev/null +++ b/annotations_filtered/rroHhssQbok_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.25], [18.0, 20.51], [22.0, 22.62], [26.0, 27.04], [29.0, 28.75], [30.0, 30.48], [38.0, 38.92], [44.0, 44.88], [46.0, 47.78], [65.0, 65.96], [68.0, 68.49], [70.0, 71.02], [72.0, 72.69], [82.0, 82.58], [84.0, 84.57], [85.0, 87.15], [98.0, 99.77], [104.0, 104.75], [107.0, 108.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 93.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.59, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.25, 2.51, 0.62, 1.04, -0.25, 0.48, 0.92, 0.88, 1.78, 0.96, 0.49, 1.02, 0.69, 0.58, 0.57, 2.15, 1.77, 0.75, 1.55]} \ No newline at end of file diff --git a/annotations_filtered/rroMPRc4flw_filtered.json b/annotations_filtered/rroMPRc4flw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/rroMPRc4flw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/rsT1bLR2sfM_filtered.json b/annotations_filtered/rsT1bLR2sfM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c8f975a40c29f2419092f37aca0cd587d1c9ea0 --- /dev/null +++ b/annotations_filtered/rsT1bLR2sfM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.36], [8.0, 8.67], [11.0, 14.62], [16.0, 17.51], [18.0, 18.37], [22.0, 23.68], [26.0, 26.69], [28.0, 28.27], [37.0, 37.34], [39.0, 39.26], [44.0, 44.81], [49.0, 49.35], [50.0, 50.84], [52.0, 53.43], [53.0, 53.47], [57.0, 58.09], [61.0, 61.23], [62.0, 62.97], [66.0, 66.29], [67.0, 67.98], [69.0, 70.07], [71.0, 71.59], [73.0, 72.94], [74.0, 75.44], [78.0, 78.8], [79.0, 85.11], [88.0, 88.45], [91.0, 92.79], [95.0, 94.96], [97.0, 102.44], [108.0, 108.36], [109.0, 110.1], [115.0, 116.04], [117.0, 118.13], [120.0, 122.23], [126.0, 126.59], [131.0, 134.37], [136.0, 137.74], [140.0, 141.59], [145.0, 145.5], [147.0, 147.56], [149.0, 151.68], [154.0, 155.17], [156.0, 156.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 62.68, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 99.96, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.36, 0.67, 3.62, 1.51, 0.37, 1.68, 0.69, 0.27, 0.34, 0.26, 0.81, 0.35, 0.84, 1.43, 0.47, 1.09, 0.23, 0.97, 0.29, 0.98, 1.07, 0.59, -0.06, 1.44, 0.8, 6.11, 0.45, 1.79, -0.04, 5.44, 0.36, 1.1, 1.04, 1.13, 2.23, 0.59, 3.37, 1.74, 1.59, 0.5, 0.56, 2.68, 1.17, 0.57]} \ No newline at end of file diff --git a/annotations_filtered/rsi2WcPIcQ0_filtered.json b/annotations_filtered/rsi2WcPIcQ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..19159bb357689b8d114da24c54523b8382864e2e --- /dev/null +++ b/annotations_filtered/rsi2WcPIcQ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.83], [8.0, 10.22], [11.0, 13.81], [18.0, 21.27], [23.0, 25.95], [26.0, 26.87], [27.0, 28.88], [30.0, 31.26], [32.0, 32.54], [33.0, 34.05], [34.0, 42.11], [43.0, 45.47], [49.0, 50.25], [53.0, 54.87], [61.0, 61.35], [62.0, 62.24], [63.0, 63.96], [69.0, 70.82], [71.0, 71.54], [73.0, 73.84], [93.0, 93.72], [96.0, 95.86], [112.0, 129.36], [130.0, 131.38], [133.0, 134.1], [136.0, 138.75], [140.0, 141.56], [143.0, 151.95], [153.0, 155.76], [157.0, 158.13], [160.0, 164.91], [166.0, 169.48], [174.0, 175.14]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 99.95, 35.26, 100.0, 56.1, 0.0, 0.0, 0.0, 0.0, 0.0, 53.91, 56.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.26, 0.0, 0.0, 44.34, 0.0, 33.29, 35.63, 0.0, 31.09, 100.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 58.72], ["hum", 5.28], ["music", 3.8]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 50.01], ["drum", 11.69], ["percussion", 6.44]], null, null, [["music", 65.25], ["electronic music", 6.16], ["synthesizer", 5.66]], null, [["music", 75.13], ["speech", 5.63], ["throbbing", 3.36]], [["music", 63.03], ["throbbing", 13.22], ["electronic music", 3.86]], null, [["music", 46.86], ["whack, thwack", 15.3], ["thunk", 5.47]], null, null], "duration": [-0.17, 2.22, 2.81, 3.27, 2.95, 0.87, 1.88, 1.26, 0.54, 1.05, 8.11, 2.47, 1.25, 1.87, 0.35, 0.24, 0.96, 1.82, 0.54, 0.84, 0.72, -0.14, 17.36, 1.38, 1.1, 2.75, 1.56, 8.95, 2.76, 1.13, 4.91, 3.48, 1.14]} \ No newline at end of file diff --git a/annotations_filtered/rsktGDtzKhg_filtered.json b/annotations_filtered/rsktGDtzKhg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b93de1f58be9c2f815256867cab91b837c1a17c1 --- /dev/null +++ b/annotations_filtered/rsktGDtzKhg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 11.16], [31.0, 35.29], [35.0, 38.23], [38.0, 40.15], [56.0, 57.54], [70.0, 73.89], [98.0, 101.9], [123.0, 124.04], [130.0, 131.3], [136.0, 136.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [72.16, 35.13, 32.57, 32.5, 0.0, 31.15, 32.68, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 69.28], ["musical instrument", 1.66], ["guitar", 1.55]], [["music", 68.56], ["funny music", 8.03], ["singing", 4.47]], [["music", 80.2], ["reggae", 1.44], ["funny music", 1.16]], null, [["music", 78.04], ["swing music", 12.92], ["funny music", 2.05]], [["music", 61.92], ["musical instrument", 5.49], ["drum machine", 4.82]], null, null, null], "duration": [5.16, 4.29, 3.23, 2.15, 1.54, 3.89, 3.9, 1.04, 1.3, 0.73]} \ No newline at end of file diff --git a/annotations_filtered/rsmsMeT8EYs_filtered.json b/annotations_filtered/rsmsMeT8EYs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b850180cbcb0d8a6ffb03ca05e5ca937e6853f26 --- /dev/null +++ b/annotations_filtered/rsmsMeT8EYs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.21], [6.0, 8.07], [9.0, 9.88], [14.0, 16.43], [22.0, 22.45], [24.0, 24.58], [26.0, 25.73], [30.0, 30.47], [31.0, 32.24], [40.0, 41.67], [43.0, 44.95], [47.0, 48.03], [50.0, 50.97], [52.0, 55.14], [56.0, 56.42], [60.0, 62.5], [64.0, 65.03], [69.0, 68.88], [71.0, 79.84], [82.0, 82.11], [87.0, 87.22], [97.0, 97.16], [98.0, 98.25], [102.0, 102.47], [103.0, 104.41], [107.0, 108.63], [113.0, 113.76], [115.0, 115.3], [118.0, 120.06], [121.0, 122.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 88.1, 0.0, 52.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.25, 0.0, 87.37, 0.0, 0.0, 94.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.62, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.21, 2.07, 0.88, 2.43, 0.45, 0.58, -0.27, 0.47, 1.24, 1.67, 1.95, 1.03, 0.97, 3.14, 0.42, 2.5, 1.03, -0.12, 8.84, 0.11, 0.22, 0.16, 0.25, 0.47, 1.41, 1.63, 0.76, 0.3, 2.06, 1.17]} \ No newline at end of file diff --git a/annotations_filtered/rsnLwzzkF_Q_filtered.json b/annotations_filtered/rsnLwzzkF_Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a2ec11656e510edd952eb50db78676295c23674 --- /dev/null +++ b/annotations_filtered/rsnLwzzkF_Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.66], [3.0, 3.15], [5.0, 11.74], [18.0, 19.06], [23.0, 51.95], [55.0, 55.59], [66.0, 69.3], [70.0, 70.09], [71.0, 70.61], [71.0, 82.05], [83.0, 144.19]], "keep_status": [false, false, true, false, true, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 40.14, 0.0, 28.98, 0.0, 29.15, 0.0, 0.0, 28.53, 0.0], "audiomae_on_audioset": [null, null, [["music", 41.39], ["hum", 18.45], ["synthesizer", 7.18]], null, [["music", 32.33], ["frog", 21.89], ["croak", 5.06]], null, [["music", 33.02], ["roar", 19.01], ["livestock, farm animals, working animals", 3.86]], null, null, [["music", 45.15], ["smash, crash", 12.15], ["whack, thwack", 7.84]], null], "duration": [1.66, 0.15, 6.74, 1.06, 28.95, 0.59, 3.3, 0.09, -0.39, 11.05, 61.19]} \ No newline at end of file diff --git a/annotations_filtered/rsuNowyCF0c_filtered.json b/annotations_filtered/rsuNowyCF0c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ee2f3717b29f9ac8e561b5c181d1e3233fb5a866 --- /dev/null +++ b/annotations_filtered/rsuNowyCF0c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.13], [6.0, 8.33], [11.0, 11.08], [12.0, 14.1], [15.0, 16.41], [16.0, 20.12], [26.0, 31.63], [35.0, 35.43], [37.0, 37.74], [38.0, 39.01], [40.0, 42.63], [44.0, 76.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 80.64, 0.0, 71.0, 0.0, 34.79, 39.25, 0.0, 0.0, 0.0, 42.84, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 36.14], ["music", 27.38], ["hum", 13.24]], [["music", 49.28], ["speech", 22.12], ["electronic music", 6.97]], null, null, null, [["music", 59.26], ["throbbing", 7.61], ["electronic music", 5.64]], null], "duration": [0.13, 2.33, 0.08, 2.1, 1.41, 4.12, 5.63, 0.43, 0.74, 1.01, 2.63, 32.84]} \ No newline at end of file diff --git a/annotations_filtered/rt3FEbzjM3o_filtered.json b/annotations_filtered/rt3FEbzjM3o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bf9797a2ad4f2fd3d4ab9888fe6d772c7b52cce4 --- /dev/null +++ b/annotations_filtered/rt3FEbzjM3o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 5.1], [8.0, 9.31], [10.0, 12.97], [14.0, 16.53], [19.0, 32.61], [34.0, 33.83], [35.0, 38.31], [39.0, 40.19], [40.0, 57.23], [59.0, 60.56], [62.0, 63.21], [65.0, 65.48], [75.0, 76.82], [78.0, 79.68], [82.0, 87.47], [90.0, 96.94], [98.0, 104.63], [106.0, 108.62], [109.0, 113.66], [119.0, 129.03]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, true, true, true], "silence_prob": [56.03, 0.0, 72.16, 91.47, 36.09, 0.0, 64.75, 0.0, 51.39, 0.0, 0.0, 0.0, 0.0, 0.0, 42.58, 96.17, 72.9, 46.64, 39.4, 36.48], "audiomae_on_audioset": [null, null, null, null, [["hum", 30.87], ["music", 14.74], ["throbbing", 14.37]], null, null, null, null, null, null, null, null, null, [["music", 41.54], ["synthesizer", 9.29], ["ambient music", 7.65]], null, null, [["music", 32.9], ["hum", 9.16], ["didgeridoo", 7.42]], [["music", 41.51], ["hum", 6.29], ["throbbing", 6.06]], [["sine wave", 33.39], ["music", 16.27], ["sidetone", 7.09]]], "duration": [4.1, 1.31, 2.97, 2.53, 13.61, -0.17, 3.31, 1.19, 17.23, 1.56, 1.21, 0.48, 1.82, 1.68, 5.47, 6.94, 6.63, 2.62, 4.66, 10.03]} \ No newline at end of file diff --git a/annotations_filtered/rtYKhaQStZE_filtered.json b/annotations_filtered/rtYKhaQStZE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84bbc44d5ca2b31da0c740b6628a239a2f586090 --- /dev/null +++ b/annotations_filtered/rtYKhaQStZE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 20.87], [22.0, 22.52], [23.0, 24.21], [27.0, 27.55], [34.0, 34.57], [35.0, 35.87], [37.0, 38.04], [39.0, 40.2], [44.0, 44.05], [46.0, 46.25], [49.0, 49.01], [53.0, 57.91], [60.0, 63.19], [65.0, 65.06], [68.0, 69.25], [71.0, 72.1], [77.0, 78.06], [79.0, 79.54], [88.0, 88.43], [94.0, 100.87], [102.0, 102.74], [104.0, 105.29], [116.0, 115.97], [117.0, 117.73], [119.0, 119.97], [122.0, 123.65], [125.0, 128.9], [133.0, 133.78], [134.0, 134.99], [136.0, 137.19], [138.0, 139.58], [143.0, 143.75], [145.0, 147.56], [148.0, 148.91], [150.0, 150.63], [154.0, 156.69], [160.0, 162.48], [167.0, 168.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.36, 38.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.51, 0.0, 0.0, 0.0, 0.0, 0.0, 52.33, 0.0, 0.0, 42.67, 38.2, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["throbbing", 45.55], ["music", 25.03], ["hum", 20.16]], [["throbbing", 21.68], ["hum", 21.49], ["mains hum", 13.47]], null, null, null, null, null, null, [["hum", 43.98], ["mains hum", 16.19], ["buzz", 13.68]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 53.44], ["hum", 13.78], ["throbbing", 5.44]], [["hum", 38.31], ["throbbing", 14.03], ["music", 10.43]], null], "duration": [-0.13, 0.52, 1.21, 0.55, 0.57, 0.87, 1.04, 1.2, 0.05, 0.25, 0.01, 4.91, 3.19, 0.06, 1.25, 1.1, 1.06, 0.54, 0.43, 6.87, 0.74, 1.29, -0.03, 0.73, 0.97, 1.65, 3.9, 0.78, 0.99, 1.19, 1.58, 0.75, 2.56, 0.91, 0.63, 2.69, 2.48, 1.91]} \ No newline at end of file diff --git a/annotations_filtered/rthHSISkM7A_filtered.json b/annotations_filtered/rthHSISkM7A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..44696e1c8e870a8eb103d16e172e9823b23630d4 --- /dev/null +++ b/annotations_filtered/rthHSISkM7A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.15], [16.0, 27.35], [28.0, 80.77], [96.0, 97.46], [98.0, 122.55], [123.0, 123.7], [125.0, 127.67]], "keep_status": [false, true, false, false, true, false, true], "silence_prob": [0.0, 31.15, 0.0, 0.0, 30.69, 0.0, 31.58], "audiomae_on_audioset": [null, [["burst, pop", 19.44], ["explosion", 17.38], ["speech", 15.1]], null, null, [["music", 33.6], ["speech", 10.52], ["throbbing", 7.98]], null, [["speech", 31.83], ["hum", 21.59], ["horse", 11.2]]], "duration": [1.15, 11.35, 52.77, 1.46, 24.55, 0.7, 2.67]} \ No newline at end of file diff --git a/annotations_filtered/rtkI87FeqOY_filtered.json b/annotations_filtered/rtkI87FeqOY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f9ed4aab56208afd2efab7ca0ac9eaa6127da224 --- /dev/null +++ b/annotations_filtered/rtkI87FeqOY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.88], [6.0, 9.09], [11.0, 11.72], [14.0, 15.45], [17.0, 17.54], [18.0, 19.4], [21.0, 24.36], [27.0, 27.46], [34.0, 35.5], [37.0, 38.06], [39.0, 44.83], [51.0, 52.17], [56.0, 56.79], [60.0, 65.45], [67.0, 69.13], [77.0, 77.75], [88.0, 89.61], [98.0, 98.27]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 33.1, 0.0, 0.0, 0.0, 0.0, 39.82, 0.0, 0.0, 0.0, 57.4, 0.0, 0.0, 32.23, 73.97, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 81.58], ["radio", 5.42], ["sidetone", 1.84]], null, null, null, null, [["speech", 50.53], ["fart", 9.93], ["hum", 6.99]], null, null, null, null, null, null, [["speech", 26.53], ["moo", 20.69], ["cattle, bovinae", 18.76]], null, null, null, null], "duration": [0.88, 3.09, 0.72, 1.45, 0.54, 1.4, 3.36, 0.46, 1.5, 1.06, 5.83, 1.17, 0.79, 5.45, 2.13, 0.75, 1.61, 0.27]} \ No newline at end of file diff --git a/annotations_filtered/rtn4-lDSB80_filtered.json b/annotations_filtered/rtn4-lDSB80_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d39dad5d6f717d795e60054a228241f82e32135f --- /dev/null +++ b/annotations_filtered/rtn4-lDSB80_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 21.56], [24.0, 59.68], [60.0, 106.34]], "keep_status": [false, false, false], "silence_prob": [61.97, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [7.56, 35.68, 46.34]} \ No newline at end of file diff --git a/annotations_filtered/rtqgJvhrswY_filtered.json b/annotations_filtered/rtqgJvhrswY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..590f00fad1aac85a4e571d549b0111d3c1805566 --- /dev/null +++ b/annotations_filtered/rtqgJvhrswY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[55.0, 58.72], [61.0, 61.48], [62.0, 64.3], [65.0, 67.31], [68.0, 68.59], [69.0, 70.09], [71.0, 71.81]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [98.44, 0.0, 99.82, 100.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [3.72, 0.48, 2.3, 2.31, 0.59, 1.09, 0.81]} \ No newline at end of file diff --git a/annotations_filtered/rtsis0lgx7k_filtered.json b/annotations_filtered/rtsis0lgx7k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c1901db1aeea06ac3e223b35fe7b970b139251c5 --- /dev/null +++ b/annotations_filtered/rtsis0lgx7k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.33], [5.0, 7.53], [9.0, 17.24], [20.0, 21.27], [25.0, 25.47], [28.0, 32.58], [34.0, 35.83], [37.0, 37.35], [38.0, 39.6], [41.0, 43.41], [45.0, 45.55], [50.0, 52.59], [53.0, 54.57], [55.0, 56.69], [57.0, 60.84], [62.0, 64.29], [66.0, 66.97], [68.0, 72.69], [74.0, 79.1], [79.0, 80.69], [81.0, 83.54], [86.0, 90.14], [92.0, 95.89], [97.0, 99.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 74.44, 52.16, 0.0, 0.0, 49.36, 0.0, 0.0, 0.0, 69.61, 0.0, 84.43, 0.0, 0.0, 61.37, 67.63, 0.0, 61.37, 58.47, 0.0, 46.86, 57.97, 54.9, 40.36], "audiomae_on_audioset": [null, null, null, null, null, [["shofar", 61.31], ["wind instrument, woodwind instrument", 33.02], ["music", 1.59]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["whale vocalization", 47.28], ["sidetone", 21.63], ["speech", 12.45]], null, null, [["sidetone", 56.14], ["radio", 8.97], ["rumble", 6.43]]], "duration": [1.33, 2.53, 8.24, 1.27, 0.47, 4.58, 1.83, 0.35, 1.6, 2.41, 0.55, 2.59, 1.57, 1.69, 3.84, 2.29, 0.97, 4.69, 5.1, 1.69, 2.54, 4.14, 3.89, 2.1]} \ No newline at end of file diff --git a/annotations_filtered/ruCFlIoCpJ8_filtered.json b/annotations_filtered/ruCFlIoCpJ8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fd9aeec8887d80f9b832c986188d53b830715115 --- /dev/null +++ b/annotations_filtered/ruCFlIoCpJ8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.45], [5.0, 9.14], [11.0, 12.11], [14.0, 19.23], [20.0, 21.1], [24.0, 24.68], [25.0, 25.86], [36.0, 37.44], [40.0, 41.0], [43.0, 45.27], [47.0, 49.55], [56.0, 55.86], [58.0, 58.41], [60.0, 60.96], [66.0, 66.43], [67.0, 67.81], [71.0, 76.42], [78.0, 80.16], [87.0, 87.66], [90.0, 91.39], [98.0, 103.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 74.76, 0.0, 75.39, 0.0, 0.0, 0.0, 0.0, 0.0, 51.34, 44.9, 0.0, 0.0, 0.0, 0.0, 0.0, 45.08, 62.17, 0.0, 0.0, 30.68], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 24.83], ["snicker", 6.79], ["fart", 6.38]], null, null, null, null, null, [["burping, eructation", 47.67], ["speech", 12.11], ["sidetone", 6.1]], null, null, null, [["speech", 80.78], ["whack, thwack", 5.39], ["burst, pop", 1.99]]], "duration": [0.45, 4.14, 1.11, 5.23, 1.1, 0.68, 0.86, 1.44, 1.0, 2.27, 2.55, -0.14, 0.41, 0.96, 0.43, 0.81, 5.42, 2.16, 0.66, 1.39, 5.69]} \ No newline at end of file diff --git a/annotations_filtered/ruOXWHbyfjo_filtered.json b/annotations_filtered/ruOXWHbyfjo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..087e69cbc6fce00e60356afa0eef0d72335cced2 --- /dev/null +++ b/annotations_filtered/ruOXWHbyfjo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.48], [8.0, 9.22], [10.0, 20.87], [22.0, 25.86], [27.0, 39.28], [44.0, 46.2], [47.0, 47.88], [50.0, 52.08], [54.0, 54.06], [57.0, 58.85], [66.0, 66.34], [67.0, 68.47], [76.0, 77.41], [80.0, 84.25], [85.0, 86.37], [88.0, 90.37], [103.0, 105.07], [106.0, 107.6], [108.0, 110.59], [113.0, 113.91], [115.0, 116.87], [117.0, 119.79], [122.0, 122.35], [123.0, 123.69], [127.0, 128.01], [131.0, 130.82], [132.0, 132.88], [143.0, 144.04], [147.0, 149.42], [152.0, 153.69], [154.0, 156.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 58.64, 87.74, 90.95, 93.13, 0.0, 89.36, 0.0, 0.0, 0.0, 0.0, 0.0, 94.52, 0.0, 88.64, 91.81, 0.0, 92.8, 0.0, 0.0, 84.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.35, 0.0, 51.02], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.48, 1.22, 10.87, 3.86, 12.28, 2.2, 0.88, 2.08, 0.06, 1.85, 0.34, 1.47, 1.41, 4.25, 1.37, 2.37, 2.07, 1.6, 2.59, 0.91, 1.87, 2.79, 0.35, 0.69, 1.01, -0.18, 0.88, 1.04, 2.42, 1.69, 2.32]} \ No newline at end of file diff --git a/annotations_filtered/ru_PLKD7w4c_filtered.json b/annotations_filtered/ru_PLKD7w4c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9848b60563cde7549589fbd821fc167af361629b --- /dev/null +++ b/annotations_filtered/ru_PLKD7w4c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[45.0, 59.76], [60.0, 107.69], [108.0, 110.59]], "keep_status": [false, false, true], "silence_prob": [33.01, 0.0, 30.95], "audiomae_on_audioset": [[["speech", 59.68], ["music", 14.62], ["groan", 4.83]], null, [["music", 16.52], ["drum", 14.62], ["musical instrument", 5.94]]], "duration": [14.76, 47.69, 2.59]} \ No newline at end of file diff --git a/annotations_filtered/rukUxz5J7qg_filtered.json b/annotations_filtered/rukUxz5J7qg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c4175a09a90f951c658664271eee81a457c6a02c --- /dev/null +++ b/annotations_filtered/rukUxz5J7qg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.75], [4.0, 4.82], [8.0, 7.6], [10.0, 10.37], [12.0, 12.51], [13.0, 14.67], [17.0, 25.79], [30.0, 34.08], [39.0, 44.66], [47.0, 47.97], [48.0, 48.02], [49.0, 66.58], [67.0, 70.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.19, 30.21, 31.79, 0.0, 0.0, 30.92, 55.81], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 76.41], ["speech", 8.9], ["sidetone", 4.05]], [["music", 45.05], ["speech", 23.77], ["electronic music", 4.16]], [["music", 60.67], ["throbbing", 14.94], ["hum", 11.52]], null, null, [["music", 46.38], ["throbbing", 26.86], ["hum", 12.27]], null], "duration": [-0.25, 0.82, -0.4, 0.37, 0.51, 1.67, 8.79, 4.08, 5.66, 0.97, 0.02, 17.58, 3.85]} \ No newline at end of file diff --git a/annotations_filtered/ruwbVFvdfco_filtered.json b/annotations_filtered/ruwbVFvdfco_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dc1559363584897d6bb790adc08d4f34df288250 --- /dev/null +++ b/annotations_filtered/ruwbVFvdfco_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 20.22], [23.0, 26.65], [36.0, 37.57], [40.0, 42.55], [55.0, 58.55], [62.0, 64.52], [73.0, 73.08], [74.0, 74.29], [76.0, 81.35], [82.0, 99.45], [102.0, 102.27], [104.0, 104.77], [106.0, 106.3], [108.0, 108.82], [110.0, 110.24], [111.0, 112.92], [116.0, 119.15], [123.0, 124.12], [125.0, 125.71], [128.0, 133.93], [137.0, 137.42], [139.0, 142.84]], "keep_status": [false, true, false, false, true, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.23, 29.08, 0.0, 42.91, 30.14, 29.53, 0.0, 0.0, 30.91, 28.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.25, 0.0, 0.0, 67.51, 0.0, 87.74], "audiomae_on_audioset": [[["mains hum", 39.9], ["hum", 34.89], ["music", 6.93]], [["speech", 48.73], ["sidetone", 8.95], ["music", 5.48]], null, [["music", 58.17], ["throbbing", 10.48], ["hum", 9.36]], [["hum", 26.05], ["mains hum", 25.28], ["music", 6.92]], [["mains hum", 28.64], ["hum", 24.69], ["music", 16.66]], null, null, [["music", 56.39], ["train horn", 4.32], ["hum", 3.89]], [["hum", 32.82], ["music", 19.8], ["mains hum", 19.39]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.22, 3.65, 1.57, 2.55, 3.55, 2.52, 0.08, 0.29, 5.35, 17.45, 0.27, 0.77, 0.3, 0.82, 0.24, 1.92, 3.15, 1.12, 0.71, 5.93, 0.42, 3.84]} \ No newline at end of file diff --git a/annotations_filtered/rvOq4hFIRJg_filtered.json b/annotations_filtered/rvOq4hFIRJg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b53822cd2cb6a2530bf602a3f4aa10e10efb698 --- /dev/null +++ b/annotations_filtered/rvOq4hFIRJg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.01], [9.0, 10.05], [12.0, 12.51], [20.0, 20.53], [21.0, 46.77], [48.0, 49.99], [51.0, 53.0], [53.0, 61.48], [63.0, 70.58], [86.0, 86.14], [96.0, 100.58], [106.0, 107.43], [113.0, 113.24], [123.0, 123.84], [126.0, 127.52], [130.0, 130.33], [131.0, 132.19], [133.0, 133.69], [137.0, 137.89], [138.0, 140.09], [156.0, 156.81], [158.0, 159.66], [161.0, 165.15], [183.0, 183.64], [184.0, 184.71]], "keep_status": [false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.34, 0.0, 98.93, 88.64, 29.77, 0.0, 29.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.83, 0.0, 0.0, 45.36, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 12.61], ["burst, pop", 9.45], ["explosion", 7.9]], null, null, null, [["sonar", 30.97], ["music", 14.57], ["rumble", 8.12]], null, [["hum", 40.98], ["mains hum", 25.96], ["throbbing", 21.18]], null, null, null, null, null, null, null, null, [["speech", 36.58], ["music", 28.61], ["insect", 4.61]], null, null, [["mains hum", 18.12], ["hum", 14.72], ["gasp", 9.31]], null, null], "duration": [1.01, 1.05, 0.51, 0.53, 25.77, 1.99, 2.0, 8.48, 7.58, 0.14, 4.58, 1.43, 0.24, 0.84, 1.52, 0.33, 1.19, 0.69, 0.89, 2.09, 0.81, 1.66, 4.15, 0.64, 0.71]} \ No newline at end of file diff --git a/annotations_filtered/rvQZ6MdHSEk_filtered.json b/annotations_filtered/rvQZ6MdHSEk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce319c45c956ba7033c7f8440b0717198bc9e774 --- /dev/null +++ b/annotations_filtered/rvQZ6MdHSEk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.61], [16.0, 17.15], [19.0, 53.42], [54.0, 61.33], [63.0, 63.69], [65.0, 64.79], [65.0, 67.36], [73.0, 82.83], [86.0, 87.69], [91.0, 91.27], [93.0, 93.34]], "keep_status": [false, false, false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 33.57, 0.0, 0.0, 34.22, 30.02, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 29.21], ["throbbing", 21.75], ["speech", 18.02]], null, null, [["music", 47.61], ["dubstep", 5.14], ["electronic music", 4.21]], [["speech", 43.71], ["music", 23.85], ["sidetone", 7.35]], null, null, null], "duration": [1.61, 1.15, 34.42, 7.33, 0.69, -0.21, 2.36, 9.83, 1.69, 0.27, 0.34]} \ No newline at end of file diff --git a/annotations_filtered/rvjVIwMPxqA_filtered.json b/annotations_filtered/rvjVIwMPxqA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..521bc05d38d809e3bb316ea9d783b2af0c99947e --- /dev/null +++ b/annotations_filtered/rvjVIwMPxqA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 27.75], [29.0, 32.14], [36.0, 37.34], [38.0, 38.82], [39.0, 43.51], [47.0, 48.96], [55.0, 64.47], [65.0, 64.86], [76.0, 78.95], [81.0, 85.06], [86.0, 89.06], [89.0, 101.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 100.0, 0.0, 0.0, 93.29, 0.0, 100.0, 0.0, 98.8, 100.0, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.75, 3.14, 1.34, 0.82, 4.51, 1.96, 9.47, -0.14, 2.95, 4.06, 3.06, 12.46]} \ No newline at end of file diff --git a/annotations_filtered/rvqm61CcOLo_filtered.json b/annotations_filtered/rvqm61CcOLo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6dfebefd02234e13ced301cdfaff6e27262522e5 --- /dev/null +++ b/annotations_filtered/rvqm61CcOLo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 13.14], [16.0, 17.51], [18.0, 21.73], [23.0, 24.22], [27.0, 40.29], [42.0, 115.06], [119.0, 158.92]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [51.28, 0.0, 51.39, 0.0, 39.24, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 76.01], ["scary music", 6.2], ["hum", 3.57]], null, null], "duration": [4.14, 1.51, 3.73, 1.22, 13.29, 73.06, 39.92]} \ No newline at end of file diff --git a/annotations_filtered/rwDDgGuCVS0_filtered.json b/annotations_filtered/rwDDgGuCVS0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/rwDDgGuCVS0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/rwd5hlQnu0I_filtered.json b/annotations_filtered/rwd5hlQnu0I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..35d8a0d2974aaade7db4e8e52fa5c70b70ff4aa9 --- /dev/null +++ b/annotations_filtered/rwd5hlQnu0I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 22.37], [24.0, 24.41], [28.0, 28.75], [30.0, 34.35], [35.0, 49.72], [53.0, 53.18], [66.0, 66.45], [73.0, 73.36], [76.0, 80.7], [82.0, 87.47], [88.0, 117.91], [122.0, 128.22], [130.0, 134.59], [135.0, 138.03], [140.0, 142.96], [144.0, 146.74], [155.0, 155.09], [157.0, 167.17], [167.0, 167.78], [169.0, 169.35], [170.0, 170.63], [171.0, 172.49]], "keep_status": [true, false, false, true, false, false, false, false, false, false, false, true, true, false, true, false, false, true, false, false, false, false], "silence_prob": [31.9, 0.0, 0.0, 34.04, 31.58, 0.0, 0.0, 0.0, 39.54, 35.57, 39.86, 38.6, 37.11, 41.81, 40.48, 55.74, 0.0, 39.64, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 23.47], ["music", 23.02], ["throbbing", 13.52]], null, null, [["music", 46.48], ["throbbing", 13.47], ["hum", 5.12]], [["music", 48.27], ["speech", 17.35], ["throbbing", 14.14]], null, null, null, [["throbbing", 35.52], ["music", 23.55], ["hum", 20.14]], [["throbbing", 39.71], ["music", 26.02], ["hum", 19.8]], [["music", 60.87], ["hum", 10.83], ["throbbing", 9.17]], [["noise", 16.12], ["speech", 9.97], ["effects unit", 9.72]], [["animal", 15.78], ["roar", 14.56], ["hum", 9.04]], [["mains hum", 44.37], ["hum", 33.63], ["buzz", 4.03]], [["hum", 30.03], ["throbbing", 10.58], ["rumble", 10.55]], null, null, [["hum", 39.61], ["burping, eructation", 14.99], ["mains hum", 11.47]], null, null, null, null], "duration": [2.37, 0.41, 0.75, 4.35, 14.72, 0.18, 0.45, 0.36, 4.7, 5.47, 29.91, 6.22, 4.59, 3.03, 2.96, 2.74, 0.09, 10.17, 0.78, 0.35, 0.63, 1.49]} \ No newline at end of file diff --git a/annotations_filtered/rwk6Obqrj9M_filtered.json b/annotations_filtered/rwk6Obqrj9M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b9c3a02fca2b4da07307f94bbaf2751e3173a448 --- /dev/null +++ b/annotations_filtered/rwk6Obqrj9M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [4.0, 5.59], [8.0, 11.04], [11.0, 15.74], [19.0, 23.28], [28.0, 31.67], [34.0, 36.29], [41.0, 47.12], [49.0, 54.14], [63.0, 64.4], [69.0, 70.06], [74.0, 75.83], [79.0, 79.73], [83.0, 84.37]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 61.37, 35.2, 68.54, 68.41, 58.05, 36.5, 33.39, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 51.3], ["speech", 15.46], ["synthesizer", 12.73]], null, null, null, [["throbbing", 36.66], ["music", 17.66], ["hum", 13.82]], [["music", 43.65], ["throbbing", 20.93], ["hum", 13.6]], null, null, null, null, null], "duration": [0.5, 1.59, 3.04, 4.74, 4.28, 3.67, 2.29, 6.12, 5.14, 1.4, 1.06, 1.83, 0.73, 1.37]} \ No newline at end of file diff --git a/annotations_filtered/rwr1IzFzjqA_filtered.json b/annotations_filtered/rwr1IzFzjqA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9eb358cb9ed9467b7b2914d2dd9f3de4349cfad7 --- /dev/null +++ b/annotations_filtered/rwr1IzFzjqA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.89], [7.0, 8.46], [13.0, 13.49], [14.0, 14.94], [16.0, 16.31], [27.0, 27.82], [30.0, 31.41], [34.0, 34.2], [37.0, 36.95], [43.0, 45.96], [49.0, 49.67], [55.0, 55.58], [57.0, 57.59], [68.0, 67.86], [78.0, 80.89], [82.0, 82.75], [85.0, 85.7], [92.0, 92.3], [93.0, 93.85], [98.0, 97.93], [102.0, 103.42], [104.0, 103.94], [105.0, 105.43], [106.0, 106.07], [112.0, 111.82], [113.0, 113.86], [114.0, 114.62], [115.0, 115.53], [117.0, 117.31], [118.0, 118.03], [130.0, 130.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 87.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.89, 1.46, 0.49, 0.94, 0.31, 0.82, 1.41, 0.2, -0.05, 2.96, 0.67, 0.58, 0.59, -0.14, 2.89, 0.75, 0.7, 0.3, 0.85, -0.07, 1.42, -0.06, 0.43, 0.07, -0.18, 0.86, 0.62, 0.53, 0.31, 0.03, 0.71]} \ No newline at end of file diff --git a/annotations_filtered/rwwMn3Y6rUA_filtered.json b/annotations_filtered/rwwMn3Y6rUA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..686a49f2fac0a9efbd599b44d97aa9faf229e8e2 --- /dev/null +++ b/annotations_filtered/rwwMn3Y6rUA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.01], [12.0, 12.01], [20.0, 21.24], [29.0, 30.1], [34.0, 35.31], [42.0, 43.44], [50.0, 51.81], [54.0, 54.97], [63.0, 72.98], [74.0, 75.27], [86.0, 86.58], [88.0, 90.81], [94.0, 101.8], [103.0, 104.97], [107.0, 116.26], [118.0, 118.76], [119.0, 121.36], [122.0, 125.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.75, 0.0, 0.0, 44.66, 39.99, 0.0, 33.04, 0.0, 36.56, 40.02], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 76.57], ["hum", 3.56], ["throbbing", 3.25]], null, null, [["music", 44.37], ["hum", 12.52], ["throbbing", 11.45]], [["music", 73.72], ["didgeridoo", 11.46], ["throbbing", 3.46]], null, [["music", 82.81], ["musical instrument", 2.22], ["sampler", 1.86]], null, [["music", 42.07], ["speech", 26.99], ["musical instrument", 4.1]], [["music", 60.92], ["throbbing", 6.11], ["hum", 4.88]]], "duration": [1.01, 0.01, 1.24, 1.1, 1.31, 1.44, 1.81, 0.97, 9.98, 1.27, 0.58, 2.81, 7.8, 1.97, 9.26, 0.76, 2.36, 3.31]} \ No newline at end of file diff --git a/annotations_filtered/rwzNpFWiOTg_filtered.json b/annotations_filtered/rwzNpFWiOTg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42e0d40f3826ae20087b00ed3953e0cf86026494 --- /dev/null +++ b/annotations_filtered/rwzNpFWiOTg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.83], [5.0, 5.97], [6.0, 9.04], [20.0, 21.2], [24.0, 28.49], [31.0, 35.09], [38.0, 49.1], [52.0, 52.83], [56.0, 58.06], [62.0, 80.18], [81.0, 80.96], [81.0, 81.3], [84.0, 87.24]], "keep_status": [false, false, true, false, false, true, true, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 38.12, 0.0, 32.18, 32.76, 32.1, 0.0, 34.45, 31.69, 0.0, 0.0, 36.24], "audiomae_on_audioset": [null, null, [["music", 36.37], ["speech", 11.38], ["theremin", 4.99]], null, [["insect", 43.93], ["fly, housefly", 39.26], ["frog", 5.9]], [["speech", 29.12], ["music", 18.84], ["whale vocalization", 9.92]], [["speech", 26.29], ["music", 21.05], ["animal", 7.39]], null, [["music", 62.29], ["whack, thwack", 3.2], ["crushing", 2.33]], [["speech", 43.09], ["music", 21.8], ["mosquito", 7.24]], null, null, [["music", 23.29], ["speech", 14.35], ["fart", 6.16]]], "duration": [-0.17, 0.97, 3.04, 1.2, 4.49, 4.09, 11.1, 0.83, 2.06, 18.18, -0.04, 0.3, 3.24]} \ No newline at end of file diff --git a/annotations_filtered/rx4sKoITt-Q_filtered.json b/annotations_filtered/rx4sKoITt-Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc4c2cf0dc7ac804d4fb8eac9c48bebd44a553e6 --- /dev/null +++ b/annotations_filtered/rx4sKoITt-Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.56], [6.0, 7.23], [19.0, 20.85], [25.0, 25.69], [33.0, 33.12], [34.0, 34.23], [35.0, 36.61], [38.0, 37.61], [42.0, 42.58], [44.0, 44.02], [50.0, 49.71], [51.0, 52.03], [54.0, 55.7], [65.0, 70.33], [73.0, 80.91], [81.0, 81.01], [81.0, 84.69], [86.0, 86.83], [89.0, 90.81], [93.0, 97.93], [104.0, 105.51], [109.0, 109.81], [112.0, 114.2], [119.0, 120.8], [127.0, 129.22], [133.0, 135.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 87.19, 0.0, 55.89, 0.0, 0.0, 100.0, 0.0, 0.0, 99.76, 0.0, 90.95, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.56, 1.23, 1.85, 0.69, 0.12, 0.23, 1.61, -0.39, 0.58, 0.02, -0.29, 1.03, 1.7, 5.33, 7.91, 0.01, 3.69, 0.83, 1.81, 4.93, 1.51, 0.81, 2.2, 1.8, 2.22, 2.78]} \ No newline at end of file diff --git a/annotations_filtered/rxC2ZWU4IPo_filtered.json b/annotations_filtered/rxC2ZWU4IPo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3580a8ff363a5a51c708034a0b8aac3323931daf --- /dev/null +++ b/annotations_filtered/rxC2ZWU4IPo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.02], [14.0, 14.12], [15.0, 16.48], [22.0, 23.89], [25.0, 29.94], [52.0, 53.87], [60.0, 60.64], [65.0, 65.62], [67.0, 68.94], [73.0, 72.94], [74.0, 74.19], [76.0, 80.96], [86.0, 85.78], [89.0, 89.46], [90.0, 90.78], [92.0, 95.32], [98.0, 100.3], [109.0, 109.53], [110.0, 111.23], [112.0, 113.44], [129.0, 134.16], [135.0, 135.65], [140.0, 141.45], [145.0, 146.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 45.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.76, 0.0, 0.0, 0.0, 77.87, 98.1, 0.0, 0.0, 0.0, 99.93, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["boing", 96.4], ["speech", 1.71], ["music", 0.72]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.02, 0.12, 1.48, 1.89, 4.94, 1.87, 0.64, 0.62, 1.94, -0.06, 0.19, 4.96, -0.22, 0.46, 0.78, 3.32, 2.3, 0.53, 1.23, 1.44, 5.16, 0.65, 1.45, 1.31]} \ No newline at end of file diff --git a/annotations_filtered/rxCuYueuyxM_filtered.json b/annotations_filtered/rxCuYueuyxM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..27389c2354d1e56a5d82e8df70387dd15818bb0b --- /dev/null +++ b/annotations_filtered/rxCuYueuyxM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 11.84], [19.0, 20.07], [24.0, 57.94], [58.0, 59.48], [61.0, 66.9], [72.0, 72.67], [73.0, 73.92], [75.0, 77.65], [87.0, 92.33], [93.0, 101.26], [104.0, 112.9], [114.0, 114.18], [117.0, 116.88], [126.0, 126.86], [127.0, 127.03], [127.0, 127.94], [129.0, 128.97], [129.0, 132.36], [137.0, 138.11], [151.0, 154.92], [155.0, 155.11]], "keep_status": [true, false, false, false, false, false, false, true, true, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.53, 0.0, 0.0, 0.0, 33.34, 0.0, 0.0, 44.49, 31.37, 38.38, 34.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.75, 0.0, 34.22, 0.0], "audiomae_on_audioset": [[["music", 28.37], ["vehicle", 11.29], ["didgeridoo", 8.67]], null, null, null, [["speech", 53.38], ["music", 12.35], ["radio", 7.36]], null, null, [["moo", 27.59], ["cattle, bovinae", 27.17], ["livestock, farm animals, working animals", 11.84]], [["music", 26.14], ["sound effect", 15.26], ["effects unit", 7.18]], [["speech", 29.92], ["sidetone", 14.36], ["whale vocalization", 9.59]], [["livestock, farm animals, working animals", 30.86], ["cattle, bovinae", 12.42], ["animal", 11.62]], null, null, null, null, null, null, [["speech", 73.05], ["fart", 5.78], ["music", 3.73]], null, [["speech", 51.64], ["fart", 11.92], ["music", 6.92]], null], "duration": [9.84, 1.07, 33.94, 1.48, 5.9, 0.67, 0.92, 2.65, 5.33, 8.26, 8.9, 0.18, -0.12, 0.86, 0.03, 0.94, -0.03, 3.36, 1.11, 3.92, 0.11]} \ No newline at end of file diff --git a/annotations_filtered/rxGjeoSRNQU_filtered.json b/annotations_filtered/rxGjeoSRNQU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e75be966c5a73aef90f3084d2806bfe372b0f541 --- /dev/null +++ b/annotations_filtered/rxGjeoSRNQU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.5], [17.0, 19.06], [20.0, 25.84], [33.0, 33.91], [37.0, 37.2], [43.0, 43.85], [54.0, 55.46], [59.0, 59.7], [63.0, 63.54], [71.0, 72.59], [73.0, 72.67], [73.0, 72.71], [77.0, 81.08], [82.0, 86.0], [88.0, 94.44], [109.0, 109.14], [111.0, 112.14], [126.0, 127.52], [136.0, 136.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false], "silence_prob": [63.31, 97.92, 82.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.1, 34.86, 33.16, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 7.33], ["fly, housefly", 7.05], ["mosquito", 6.75]], [["speech", 58.52], ["music", 2.85], ["fart", 2.8]], [["speech", 56.15], ["music", 7.11], ["hum", 5.15]], null, null, null, null], "duration": [3.5, 2.06, 5.84, 0.91, 0.2, 0.85, 1.46, 0.7, 0.54, 1.59, -0.33, -0.29, 4.08, 4.0, 6.44, 0.14, 1.14, 1.52, 0.29]} \ No newline at end of file diff --git a/annotations_filtered/rxJiE5EKnD0_filtered.json b/annotations_filtered/rxJiE5EKnD0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/rxJiE5EKnD0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/rxM8oCm4TnM_filtered.json b/annotations_filtered/rxM8oCm4TnM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4092cbd2b31aab7f6c1907a78aac54c501be2535 --- /dev/null +++ b/annotations_filtered/rxM8oCm4TnM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.11], [11.0, 10.83], [12.0, 13.46], [16.0, 17.05], [18.0, 18.66], [19.0, 20.44], [23.0, 23.09], [26.0, 26.96], [29.0, 29.46], [30.0, 30.99], [32.0, 33.3], [36.0, 36.53], [40.0, 40.61], [41.0, 42.23], [45.0, 45.05], [46.0, 47.36], [50.0, 54.09], [59.0, 59.34], [61.0, 61.52], [62.0, 62.34], [64.0, 64.61], [66.0, 68.17], [77.0, 76.89], [79.0, 88.45], [90.0, 96.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.79, 0.0, 0.0, 0.0, 0.0, 34.69, 0.0, 31.36, 29.46], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["animal", 16.42], ["dog", 8.38], ["speech", 8.09]], null, [["music", 22.72], ["animal", 17.03], ["howl", 15.43]], [["livestock, farm animals, working animals", 43.72], ["cattle, bovinae", 33.08], ["moo", 13.41]]], "duration": [1.11, -0.17, 1.46, 1.05, 0.66, 1.44, 0.09, 0.96, 0.46, 0.99, 1.3, 0.53, 0.61, 1.23, 0.05, 1.36, 4.09, 0.34, 0.52, 0.34, 0.61, 2.17, -0.11, 9.45, 6.09]} \ No newline at end of file diff --git a/annotations_filtered/rxWQfQcLAUA_filtered.json b/annotations_filtered/rxWQfQcLAUA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d52e6b4724a3d193f278deb2f715641b94d9b940 --- /dev/null +++ b/annotations_filtered/rxWQfQcLAUA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.87], [21.0, 20.85], [21.0, 22.03], [22.0, 23.72], [26.0, 26.49], [29.0, 29.56], [33.0, 34.89], [43.0, 44.44], [51.0, 55.24], [60.0, 64.79], [66.0, 69.62], [89.0, 91.77], [95.0, 95.94], [102.0, 109.07], [118.0, 126.13], [130.0, 131.14], [133.0, 133.69]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.38, 29.56, 30.26, 28.88, 0.0, 29.5, 30.38, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 51.03], ["a capella", 10.86], ["vocal music", 9.96]], [["music", 56.08], ["singing", 5.69], ["musical instrument", 5.33]], [["music", 66.7], ["musical instrument", 3.53], ["middle eastern music", 2.65]], [["music", 59.82], ["musical instrument", 6.08], ["synthesizer", 5.6]], null, [["music", 51.19], ["theremin", 7.57], ["didgeridoo", 6.88]], [["music", 53.34], ["tabla", 8.92], ["carnatic music", 5.7]], null, null], "duration": [1.87, -0.15, 1.03, 1.72, 0.49, 0.56, 1.89, 1.44, 4.24, 4.79, 3.62, 2.77, 0.94, 7.07, 8.13, 1.14, 0.69]} \ No newline at end of file diff --git a/annotations_filtered/rxX-JLi1FB0_filtered.json b/annotations_filtered/rxX-JLi1FB0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1cd698e5584fc16b6d86bcd052824e8ee52b9b3d --- /dev/null +++ b/annotations_filtered/rxX-JLi1FB0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.45], [7.0, 7.47], [8.0, 8.46], [13.0, 13.88], [15.0, 16.14], [18.0, 18.77], [20.0, 20.31], [21.0, 23.58], [25.0, 26.52], [28.0, 35.45], [36.0, 36.26], [37.0, 38.6], [40.0, 40.07], [40.0, 57.87], [61.0, 72.3], [72.0, 76.89], [78.0, 78.49], [80.0, 82.16], [84.0, 84.59], [90.0, 90.71], [92.0, 95.82], [96.0, 105.73], [107.0, 116.46], [118.0, 119.92], [121.0, 127.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.07, 0.0, 62.99, 0.0, 0.0, 0.0, 49.27, 36.84, 36.32, 0.0, 32.11, 0.0, 0.0, 33.63, 44.15, 46.79, 0.0, 40.5], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 25.74], ["throbbing", 15.24], ["sine wave", 13.86]], [["speech", 72.34], ["telephone", 5.94], ["electric shaver, electric razor", 3.6]], [["speech", 35.05], ["radio", 28.18], ["sidetone", 27.16]], null, [["speech", 46.79], ["sidetone", 15.08], ["radio", 4.82]], null, null, [["speech", 73.9], ["dial tone", 8.35], ["sidetone", 5.34]], [["speech", 76.69], ["sidetone", 6.72], ["stomach rumble", 2.51]], [["sidetone", 45.63], ["speech", 34.34], ["telephone", 4.06]], null, [["sidetone", 82.21], ["speech", 8.77], ["radio", 4.19]]], "duration": [0.45, 0.47, 0.46, 0.88, 1.14, 0.77, 0.31, 2.58, 1.52, 7.45, 0.26, 1.6, 0.07, 17.87, 11.3, 4.89, 0.49, 2.16, 0.59, 0.71, 3.82, 9.73, 9.46, 1.92, 6.94]} \ No newline at end of file diff --git a/annotations_filtered/rxZc0tyTqEg_filtered.json b/annotations_filtered/rxZc0tyTqEg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..96e8e1b3fbb34038251a26b1ffedb1b4d8199158 --- /dev/null +++ b/annotations_filtered/rxZc0tyTqEg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.11], [5.0, 5.66], [7.0, 7.97], [10.0, 10.4], [14.0, 29.02], [30.0, 31.55], [41.0, 55.34], [59.0, 81.23], [82.0, 83.08]], "keep_status": [false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 35.07, 0.0, 30.33, 37.11, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 37.1], ["music", 27.82], ["crack", 9.87]], null, [["music", 42.27], ["speech", 8.9], ["throbbing", 6.66]], [["music", 15.41], ["rumble", 9.28], ["sound effect", 8.93]], null], "duration": [0.11, 0.66, 0.97, 0.4, 15.02, 1.55, 14.34, 22.23, 1.08]} \ No newline at end of file diff --git a/annotations_filtered/rxkB20Tpvx0_filtered.json b/annotations_filtered/rxkB20Tpvx0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..579ad4072185addf3a726a25e2068bd6926eed91 --- /dev/null +++ b/annotations_filtered/rxkB20Tpvx0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.42], [5.0, 8.43], [18.0, 20.83], [23.0, 23.94], [25.0, 26.94], [39.0, 39.48], [44.0, 46.45], [48.0, 50.38], [56.0, 69.9], [71.0, 72.52], [82.0, 85.31], [90.0, 91.84], [95.0, 95.17], [98.0, 98.39], [104.0, 104.7], [108.0, 107.91], [110.0, 111.18], [117.0, 145.84], [150.0, 155.44]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 98.19, 34.92, 0.0, 0.0, 0.0, 30.88, 31.48, 31.6, 0.0, 30.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.39, 36.25], "audiomae_on_audioset": [null, null, [["music", 49.34], ["speech", 25.26], ["effects unit", 3.22]], null, null, null, [["music", 40.83], ["didgeridoo", 37.86], ["speech", 4.23]], [["music", 49.52], ["theremin", 18.23], ["musical instrument", 7.71]], [["music", 38.51], ["didgeridoo", 8.2], ["cattle, bovinae", 7.67]], null, [["mains hum", 25.67], ["hum", 19.09], ["fly, housefly", 12.75]], null, null, null, null, null, null, [["theremin", 61.67], ["music", 31.33], ["musical instrument", 0.88]], [["music", 33.19], ["foghorn", 20.06], ["brass instrument", 7.48]]], "duration": [1.42, 3.43, 2.83, 0.94, 1.94, 0.48, 2.45, 2.38, 13.9, 1.52, 3.31, 1.84, 0.17, 0.39, 0.7, -0.09, 1.18, 28.84, 5.44]} \ No newline at end of file diff --git a/annotations_filtered/rxme5eLoK5E_filtered.json b/annotations_filtered/rxme5eLoK5E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e679594f4424524cba051a985e3cd205764446bf --- /dev/null +++ b/annotations_filtered/rxme5eLoK5E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.44], [3.0, 6.27], [7.0, 11.74], [13.0, 15.13], [17.0, 19.5], [20.0, 21.44], [22.0, 28.41], [30.0, 30.69], [31.0, 39.21], [41.0, 43.85], [46.0, 46.74], [48.0, 67.0], [69.0, 71.31], [73.0, 86.0], [87.0, 88.64], [89.0, 137.1], [138.0, 140.14], [141.0, 150.6], [155.0, 158.35], [159.0, 162.72]], "keep_status": [false, false, true, true, true, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 40.41, 48.44, 43.35, 45.92, 0.0, 41.38, 0.0, 42.08, 45.52, 0.0, 52.62, 96.42, 89.19, 0.0, 0.0, 74.13, 84.07, 97.54, 94.95], "audiomae_on_audioset": [null, [["hum", 33.06], ["whale vocalization", 29.16], ["music", 8.95]], [["hum", 38.73], ["mains hum", 15.95], ["music", 14.72]], [["music", 44.1], ["hum", 18.97], ["mains hum", 6.62]], [["music", 36.97], ["throbbing", 7.91], ["hum", 5.95]], null, [["music", 51.04], ["hum", 12.87], ["singing bowl", 4.65]], null, [["hum", 34.12], ["mains hum", 28.31], ["music", 17.86]], [["music", 37.08], ["livestock, farm animals, working animals", 8.64], ["hum", 6.55]], null, null, null, null, null, null, null, null, null, null], "duration": [1.44, 3.27, 4.74, 2.13, 2.5, 1.44, 6.41, 0.69, 8.21, 2.85, 0.74, 19.0, 2.31, 13.0, 1.64, 48.1, 2.14, 9.6, 3.35, 3.72]} \ No newline at end of file diff --git a/annotations_filtered/rxno2wz0eKc_filtered.json b/annotations_filtered/rxno2wz0eKc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e72f82131a098dab5748cae2df48610cc2d304e8 --- /dev/null +++ b/annotations_filtered/rxno2wz0eKc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.46], [3.0, 6.03], [10.0, 10.49], [12.0, 13.24], [18.0, 19.63], [27.0, 29.02], [31.0, 30.86], [32.0, 32.27], [33.0, 33.61], [34.0, 34.69], [37.0, 37.83], [40.0, 40.26], [41.0, 42.63], [48.0, 48.73], [50.0, 50.41], [60.0, 60.78], [63.0, 63.83], [65.0, 66.16], [67.0, 68.64], [69.0, 72.84], [77.0, 76.76], [78.0, 77.99], [82.0, 90.8], [93.0, 98.59], [101.0, 102.93], [104.0, 104.45], [105.0, 107.72], [110.0, 118.34], [119.0, 121.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 87.55, 0.0, 0.0, 0.0, 77.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.95, 0.0, 0.0, 44.18, 49.0, 0.0, 0.0, 45.98, 33.12, 39.15], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 83.08], ["musical instrument", 2.92], ["synthesizer", 2.73]], null, null, [["music", 53.64], ["brass instrument", 12.02], ["trombone", 6.78]], [["music", 78.93], ["thunk", 2.92], ["brass instrument", 2.67]], null, null, [["music", 71.73], ["didgeridoo", 7.42], ["musical instrument", 3.77]], [["music", 34.42], ["speech", 26.62], ["screaming", 8.59]], [["didgeridoo", 47.01], ["music", 36.78], ["musical instrument", 4.71]]], "duration": [0.46, 3.03, 0.49, 1.24, 1.63, 2.02, -0.14, 0.27, 0.61, 0.69, 0.83, 0.26, 1.63, 0.73, 0.41, 0.78, 0.83, 1.16, 1.64, 3.84, -0.24, -0.01, 8.8, 5.59, 1.93, 0.45, 2.72, 8.34, 2.46]} \ No newline at end of file diff --git a/annotations_filtered/rxwADdYa0YM_filtered.json b/annotations_filtered/rxwADdYa0YM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9775c69e1520a8ddfd810683442d316645538663 --- /dev/null +++ b/annotations_filtered/rxwADdYa0YM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.79], [11.0, 11.38], [14.0, 15.03], [20.0, 22.47], [27.0, 28.17], [36.0, 36.63], [45.0, 45.54], [47.0, 47.39], [48.0, 51.38], [53.0, 53.13], [60.0, 65.11], [77.0, 78.8], [100.0, 103.03], [104.0, 104.89], [106.0, 106.34], [108.0, 114.0], [115.0, 116.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 80.64, 0.0, 0.0, 0.0, 0.0, 35.07, 0.0, 35.69, 0.0, 37.97, 0.0, 0.0, 35.52, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 47.44], ["foghorn", 19.09], ["theremin", 12.77]], null, [["music", 78.18], ["lullaby", 1.66], ["humming", 1.55]], null, [["music", 41.67], ["theremin", 22.28], ["speech", 5.17]], null, null, [["music", 58.91], ["theremin", 29.65], ["singing", 1.66]], null], "duration": [0.79, 0.38, 1.03, 2.47, 1.17, 0.63, 0.54, 0.39, 3.38, 0.13, 5.11, 1.8, 3.03, 0.89, 0.34, 6.0, 1.09]} \ No newline at end of file diff --git a/annotations_filtered/ry55--J4_VQ_filtered.json b/annotations_filtered/ry55--J4_VQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb2127313177d7dc4fb1ba12a7513e594d905af0 --- /dev/null +++ b/annotations_filtered/ry55--J4_VQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 25.68], [33.0, 33.03], [36.0, 45.13], [48.0, 49.03], [51.0, 51.04], [52.0, 52.98], [55.0, 56.03], [57.0, 59.48]], "keep_status": [true, false, false, false, false, false, false, true], "silence_prob": [48.44, 0.0, 32.1, 0.0, 0.0, 0.0, 0.0, 48.39], "audiomae_on_audioset": [[["hum", 28.76], ["mains hum", 12.25], ["throbbing", 11.98]], null, [["speech", 67.93], ["sidetone", 7.0], ["music", 4.74]], null, null, null, null, [["hum", 17.05], ["music", 15.52], ["mains hum", 7.55]]], "duration": [2.68, 0.03, 9.13, 1.03, 0.04, 0.98, 1.03, 2.48]} \ No newline at end of file diff --git a/annotations_filtered/ry88dGpJKZk_filtered.json b/annotations_filtered/ry88dGpJKZk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84776da1ba44cb54f5166ff5e90d411a62b04570 --- /dev/null +++ b/annotations_filtered/ry88dGpJKZk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.96], [10.0, 14.84], [17.0, 22.76], [25.0, 39.31], [40.0, 48.52], [50.0, 51.85], [54.0, 58.13], [60.0, 67.31], [76.0, 77.06], [84.0, 84.59], [85.0, 85.53], [87.0, 93.82], [95.0, 97.68], [99.0, 102.37], [103.0, 108.43], [109.0, 110.54], [112.0, 120.58], [122.0, 124.04], [125.0, 129.78], [132.0, 139.87]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.73, 80.29, 88.28, 99.62, 0.0, 42.51, 100.0, 0.0, 0.0, 0.0, 94.81, 99.59, 100.0, 100.0, 0.0, 99.96, 99.98, 100.0, 100.0], "audiomae_on_audioset": [null, [["civil defense siren", 18.41], ["livestock, farm animals, working animals", 15.57], ["moo", 6.73]], null, null, null, null, [["livestock, farm animals, working animals", 35.36], ["moo", 32.69], ["cattle, bovinae", 31.89]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.96, 4.84, 5.76, 14.31, 8.52, 1.85, 4.13, 7.31, 1.06, 0.59, 0.53, 6.82, 2.68, 3.37, 5.43, 1.54, 8.58, 2.04, 4.78, 7.87]} \ No newline at end of file diff --git a/annotations_filtered/ry9yNbMVeMQ_filtered.json b/annotations_filtered/ry9yNbMVeMQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fd3b368c488068e49e42464d333d80bf142223cf --- /dev/null +++ b/annotations_filtered/ry9yNbMVeMQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 31.75], [33.0, 36.44], [38.0, 78.14], [81.0, 113.26]], "keep_status": [false, true, false, false], "silence_prob": [31.91, 30.3, 0.0, 0.0], "audiomae_on_audioset": [[["music", 30.43], ["hum", 28.91], ["mains hum", 27.85]], [["mains hum", 26.37], ["hum", 20.15], ["music", 15.23]], null, null], "duration": [27.75, 3.44, 40.14, 32.26]} \ No newline at end of file diff --git a/annotations_filtered/ryRzxiWudaA_filtered.json b/annotations_filtered/ryRzxiWudaA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eb49a703bd11965c047a9c595adbbf7bc40f3d83 --- /dev/null +++ b/annotations_filtered/ryRzxiWudaA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.67], [3.0, 15.69], [19.0, 30.62], [33.0, 72.57], [75.0, 81.67], [87.0, 106.83], [111.0, 134.35], [138.0, 171.41], [175.0, 175.95]], "keep_status": [false, false, true, false, true, false, true, false, false], "silence_prob": [0.0, 38.16, 30.91, 0.0, 30.82, 31.31, 32.46, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 48.57], ["throbbing", 20.51], ["mains hum", 12.78]], [["mains hum", 18.87], ["hum", 17.4], ["music", 15.44]], null, [["speech", 30.22], ["music", 26.14], ["didgeridoo", 11.26]], [["mains hum", 53.39], ["hum", 41.06], ["throbbing", 2.54]], [["hum", 24.7], ["mains hum", 19.12], ["speech", 18.07]], null, null], "duration": [0.67, 12.69, 11.62, 39.57, 6.67, 19.83, 23.35, 33.41, 0.95]} \ No newline at end of file diff --git a/annotations_filtered/ryqyAX_lA7w_filtered.json b/annotations_filtered/ryqyAX_lA7w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b20b5c86e9965444088ea98aa801946a2a60101 --- /dev/null +++ b/annotations_filtered/ryqyAX_lA7w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[81.0, 106.37], [108.0, 116.83]], "keep_status": [false, true], "silence_prob": [46.5, 44.26], "audiomae_on_audioset": [[["music", 60.49], ["hum", 8.45], ["ambient music", 3.64]], [["music", 57.87], ["singing bowl", 5.41], ["theremin", 5.32]]], "duration": [25.37, 8.83]} \ No newline at end of file diff --git a/annotations_filtered/ryvvNrcMh-c_filtered.json b/annotations_filtered/ryvvNrcMh-c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f27280d34b8da68546562a80bbae85ef95a33d63 --- /dev/null +++ b/annotations_filtered/ryvvNrcMh-c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.23], [5.0, 5.86], [7.0, 7.16], [10.0, 14.54], [16.0, 17.39], [19.0, 21.88], [24.0, 26.28], [29.0, 31.87], [35.0, 37.05], [40.0, 41.66], [42.0, 43.71], [46.0, 47.22], [48.0, 49.52], [50.0, 51.11], [52.0, 53.7], [55.0, 64.61], [66.0, 68.25], [70.0, 70.85], [73.0, 74.49], [75.0, 76.38], [81.0, 82.21], [85.0, 90.14], [91.0, 103.77], [105.0, 105.41], [107.0, 109.05], [111.0, 119.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.48, 0.0, 99.1, 99.82, 99.9, 99.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.52, 79.41, 0.0, 0.0, 0.0, 0.0, 48.14, 38.2, 0.0, 60.42, 51.23], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 27.28], ["mains hum", 17.95], ["hum", 15.89]], [["speech", 34.79], ["hum", 19.96], ["mains hum", 19.95]], null, null, null], "duration": [1.23, 0.86, 0.16, 4.54, 1.39, 2.88, 2.28, 2.87, 2.05, 1.66, 1.71, 1.22, 1.52, 1.11, 1.7, 9.61, 2.25, 0.85, 1.49, 1.38, 1.21, 5.14, 12.77, 0.41, 2.05, 8.62]} \ No newline at end of file diff --git a/annotations_filtered/ryyEEyKD9EU_filtered.json b/annotations_filtered/ryyEEyKD9EU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1bec1e41e9edf6b86c8ada2f3598afb6d0daecdd --- /dev/null +++ b/annotations_filtered/ryyEEyKD9EU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.98], [10.0, 9.86], [12.0, 12.11], [14.0, 13.91], [18.0, 20.26], [27.0, 28.02], [31.0, 31.56], [34.0, 34.18], [35.0, 35.02], [37.0, 38.3], [39.0, 40.56], [42.0, 43.16], [45.0, 46.45], [47.0, 47.8], [52.0, 52.39], [54.0, 54.18], [61.0, 61.72], [64.0, 65.31], [72.0, 73.47], [83.0, 83.1], [85.0, 86.73], [89.0, 90.53], [93.0, 93.24], [94.0, 95.23], [97.0, 111.32], [112.0, 115.23], [117.0, 118.49], [123.0, 124.01], [128.0, 129.52], [131.0, 132.93], [134.0, 135.6], [138.0, 138.52], [139.0, 142.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 86.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.47, 60.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.38], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.98, -0.14, 0.11, -0.09, 2.26, 1.02, 0.56, 0.18, 0.02, 1.3, 1.56, 1.16, 1.45, 0.8, 0.39, 0.18, 0.72, 1.31, 1.47, 0.1, 1.73, 1.53, 0.24, 1.23, 14.32, 3.23, 1.49, 1.01, 1.52, 1.93, 1.6, 0.52, 3.16]} \ No newline at end of file diff --git a/annotations_filtered/rz2FxTVVJi4_filtered.json b/annotations_filtered/rz2FxTVVJi4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..34ae7171da1b392b0f712ef009cc32a211d28373 --- /dev/null +++ b/annotations_filtered/rz2FxTVVJi4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.8], [11.0, 11.06], [11.0, 11.37], [15.0, 14.84], [28.0, 29.12], [35.0, 36.26], [37.0, 38.35], [44.0, 43.95], [56.0, 56.54], [89.0, 89.82], [90.0, 90.93], [97.0, 98.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.8, 0.06, 0.37, -0.16, 1.12, 1.26, 1.35, -0.05, 0.54, 0.82, 0.93, 1.1]} \ No newline at end of file diff --git a/annotations_filtered/rz41nM47q7Y_filtered.json b/annotations_filtered/rz41nM47q7Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f9398cef0c08730708148cba0a9901bddd749ae8 --- /dev/null +++ b/annotations_filtered/rz41nM47q7Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 46.94], [48.0, 48.02], [50.0, 56.08], [56.0, 56.13], [57.0, 62.38], [63.0, 71.63]], "keep_status": [true, false, true, false, true, true], "silence_prob": [29.56, 0.0, 30.4, 0.0, 31.24, 29.16], "audiomae_on_audioset": [[["music", 53.74], ["throbbing", 7.39], ["hum", 3.57]], null, [["explosion", 47.34], ["burst, pop", 11.77], ["speech", 7.28]], null, [["explosion", 25.4], ["music", 23.0], ["burst, pop", 9.88]], [["fly, housefly", 21.34], ["mosquito", 14.84], ["whip", 14.76]]], "duration": [23.94, 0.02, 6.08, 0.13, 5.38, 8.63]} \ No newline at end of file diff --git a/annotations_filtered/rzCeSHk3aVY_filtered.json b/annotations_filtered/rzCeSHk3aVY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0c6ca616965008ce3356b9592fcd2d112a99fb46 --- /dev/null +++ b/annotations_filtered/rzCeSHk3aVY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.13], [3.0, 4.06], [7.0, 7.65], [10.0, 12.21], [18.0, 27.11], [31.0, 31.83], [39.0, 39.38], [42.0, 42.35], [46.0, 45.72], [63.0, 64.91], [66.0, 68.17], [71.0, 71.04], [73.0, 74.31], [75.0, 87.29], [89.0, 97.39], [99.0, 100.47], [109.0, 111.97], [114.0, 115.43], [118.0, 122.42], [124.0, 128.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 98.99, 64.75, 0.0, 0.0, 0.0, 0.0, 0.0, 53.78, 0.0, 0.0, 40.38, 61.67, 0.0, 58.38, 0.0, 31.31, 29.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 20.32], ["electronic music", 14.11], ["hum", 12.83]], null, null, null, null, [["music", 48.32], ["buzz", 4.87], ["mosquito", 3.17]], [["music", 38.04], ["throbbing", 6.68], ["hum", 5.45]]], "duration": [0.13, 1.06, 0.65, 2.21, 9.11, 0.83, 0.38, 0.35, -0.28, 1.91, 2.17, 0.04, 1.31, 12.29, 8.39, 1.47, 2.97, 1.43, 4.42, 4.65]} \ No newline at end of file diff --git a/annotations_filtered/rzG2L4Nbm3E_filtered.json b/annotations_filtered/rzG2L4Nbm3E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ced8c56de01436227c15d283285a41116b6531bd --- /dev/null +++ b/annotations_filtered/rzG2L4Nbm3E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.33], [32.0, 32.21], [35.0, 53.11], [56.0, 56.08], [57.0, 59.19], [62.0, 61.79], [65.0, 65.45], [65.0, 65.91]], "keep_status": [false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 35.69, 0.0, 49.59, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 83.21], ["synthesizer", 4.13], ["musical instrument", 1.26]], null, [["hum", 28.54], ["speech", 16.6], ["mains hum", 12.37]], null, null, null], "duration": [0.33, 0.21, 18.11, 0.08, 2.19, -0.21, 0.45, 0.91]} \ No newline at end of file diff --git a/annotations_filtered/rzIs51GUVgg_filtered.json b/annotations_filtered/rzIs51GUVgg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43f8e8b03562d664a7133de3ddf31cfe75e11880 --- /dev/null +++ b/annotations_filtered/rzIs51GUVgg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.22], [14.0, 14.61], [31.0, 33.96], [39.0, 40.83], [58.0, 59.0], [62.0, 62.87], [65.0, 65.96], [67.0, 68.05], [70.0, 70.17], [79.0, 80.25], [82.0, 83.64], [86.0, 86.73], [89.0, 89.38], [93.0, 94.04], [97.0, 98.42], [102.0, 102.46], [131.0, 131.92]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [40.55, 0.0, 33.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["echo", 19.98], ["moo", 10.31], ["cattle, bovinae", 5.65]], null, [["music", 44.4], ["didgeridoo", 10.43], ["singing", 3.73]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.22, 0.61, 2.96, 1.83, 1.0, 0.87, 0.96, 1.05, 0.17, 1.25, 1.64, 0.73, 0.38, 1.04, 1.42, 0.46, 0.92]} \ No newline at end of file diff --git a/annotations_filtered/rzXNFMVS7PM_filtered.json b/annotations_filtered/rzXNFMVS7PM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1cdda06c4870320e6e416a8a10703596b449bc2c --- /dev/null +++ b/annotations_filtered/rzXNFMVS7PM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.34], [2.0, 3.0], [4.0, 4.53], [6.0, 6.25], [12.0, 12.38], [19.0, 19.58], [20.0, 20.75], [27.0, 26.96], [28.0, 30.06], [47.0, 48.54], [49.0, 50.36], [51.0, 52.0], [53.0, 53.64], [56.0, 56.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.05, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.34, 1.0, 0.53, 0.25, 0.38, 0.58, 0.75, -0.04, 2.06, 1.54, 1.36, 1.0, 0.64, 0.32]} \ No newline at end of file diff --git a/annotations_filtered/rzs0681gdf0_filtered.json b/annotations_filtered/rzs0681gdf0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..863d77eba0e9b71eeb93db3f022ebd2eb2ca3e04 --- /dev/null +++ b/annotations_filtered/rzs0681gdf0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 40.74], [42.0, 43.51], [44.0, 61.91], [64.0, 73.55], [75.0, 75.64], [78.0, 80.18], [81.0, 81.7], [83.0, 82.88], [84.0, 86.29], [87.0, 87.29], [88.0, 90.14], [91.0, 91.32], [93.0, 93.12], [94.0, 95.22], [106.0, 108.19], [110.0, 112.11], [113.0, 113.91], [116.0, 116.19], [117.0, 118.18], [123.0, 123.28], [125.0, 125.42], [127.0, 127.23], [128.0, 129.27], [130.0, 130.64]], "keep_status": [true, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [39.04, 0.0, 37.53, 34.57, 0.0, 90.25, 0.0, 0.0, 98.01, 0.0, 99.1, 0.0, 0.0, 0.0, 99.99, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 11.1], ["throbbing", 9.62], ["music", 8.6]], null, [["hum", 26.76], ["speech", 9.18], ["mains hum", 8.35]], [["livestock, farm animals, working animals", 20.18], ["frog", 9.12], ["moo", 8.88]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [15.74, 1.51, 17.91, 9.55, 0.64, 2.18, 0.7, -0.12, 2.29, 0.29, 2.14, 0.32, 0.12, 1.22, 2.19, 2.11, 0.91, 0.19, 1.18, 0.28, 0.42, 0.23, 1.27, 0.64]} \ No newline at end of file diff --git a/annotations_filtered/rzuN9uvnsZI_filtered.json b/annotations_filtered/rzuN9uvnsZI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb56548e0251d3a6e5b3f8f5f5083e4ba04302c2 --- /dev/null +++ b/annotations_filtered/rzuN9uvnsZI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.73], [6.0, 6.34], [11.0, 11.43], [17.0, 16.66], [22.0, 22.22], [28.0, 29.88], [30.0, 32.32], [33.0, 38.21], [39.0, 83.35], [84.0, 96.45], [98.0, 114.07], [115.0, 125.14], [126.0, 165.21], [167.0, 167.83], [170.0, 171.44], [173.0, 173.87], [177.0, 178.38], [180.0, 189.19], [191.0, 191.67], [192.0, 203.52], [207.0, 209.01], [210.0, 212.18], [213.0, 219.3], [221.0, 236.58], [243.0, 244.34], [247.0, 249.1], [255.0, 255.9], [264.0, 264.56]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false, true, false, true, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.31, 39.15, 0.0, 28.4, 28.26, 28.43, 0.0, 0.0, 0.0, 0.0, 0.0, 28.84, 0.0, 29.75, 33.97, 37.65, 34.09, 51.71, 0.0, 90.08, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["sidetone", 90.73], ["speech", 3.77], ["radio", 3.05]], null, [["speech", 13.29], ["music", 11.18], ["hum", 7.81]], [["buzz", 24.98], ["electric shaver, electric razor", 9.09], ["noise", 4.57]], [["speech", 44.44], ["vehicle", 11.9], ["aircraft", 6.57]], null, null, null, null, null, [["mains hum", 30.33], ["hum", 17.7], ["music", 12.11]], null, [["music", 41.59], ["synthesizer", 13.89], ["noise", 10.13]], [["music", 43.59], ["hum", 6.6], ["electronic music", 4.97]], [["music", 42.3], ["didgeridoo", 34.0], ["musical instrument", 4.07]], [["speech", 33.81], ["music", 30.23], ["didgeridoo", 13.97]], null, null, null, null, null], "duration": [0.73, 0.34, 0.43, -0.34, 0.22, 1.88, 2.32, 5.21, 44.35, 12.45, 16.07, 10.14, 39.21, 0.83, 1.44, 0.87, 1.38, 9.19, 0.67, 11.52, 2.01, 2.18, 6.3, 15.58, 1.34, 2.1, 0.9, 0.56]} \ No newline at end of file diff --git a/annotations_filtered/s-EheX9m-dE_filtered.json b/annotations_filtered/s-EheX9m-dE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4ccf313d831f9c04e3f0c803304da372b7e50c73 --- /dev/null +++ b/annotations_filtered/s-EheX9m-dE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.1], [3.0, 3.42], [5.0, 5.53], [7.0, 7.82], [8.0, 10.08], [13.0, 14.22], [16.0, 17.39], [25.0, 25.71], [27.0, 68.05], [70.0, 72.13], [75.0, 76.79], [78.0, 79.88], [84.0, 89.28], [90.0, 94.02], [96.0, 97.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 58.3, 0.0, 0.0, 0.0, 0.0, 63.31, 0.0, 0.0, 38.2, 50.66, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 26.57], ["fly, housefly", 16.56], ["insect", 7.9]], null, null], "duration": [1.1, 0.42, 0.53, 0.82, 2.08, 1.22, 1.39, 0.71, 41.05, 2.13, 1.79, 1.88, 5.28, 4.02, 1.28]} \ No newline at end of file diff --git a/annotations_filtered/s-Sx_dMw8oA_filtered.json b/annotations_filtered/s-Sx_dMw8oA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b91609f694cb6547ce2be90a1fd8c76c58e3a4d4 --- /dev/null +++ b/annotations_filtered/s-Sx_dMw8oA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.12], [15.0, 16.68], [19.0, 26.64], [31.0, 31.6], [33.0, 33.96], [36.0, 36.64], [37.0, 54.48], [56.0, 56.88], [59.0, 59.7], [61.0, 63.24], [65.0, 68.0], [72.0, 73.35], [78.0, 82.53], [83.0, 90.19], [93.0, 93.29], [93.0, 93.33], [96.0, 104.43]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [34.01, 0.0, 34.26, 0.0, 0.0, 0.0, 34.82, 0.0, 0.0, 49.87, 38.23, 0.0, 39.5, 34.17, 0.0, 0.0, 33.81], "audiomae_on_audioset": [[["music", 60.08], ["synthesizer", 12.0], ["musical instrument", 3.51]], null, [["music", 55.22], ["theremin", 11.49], ["didgeridoo", 6.15]], null, null, null, [["music", 49.38], ["synthesizer", 18.25], ["theremin", 7.13]], null, null, [["music", 41.89], ["didgeridoo", 9.14], ["musical instrument", 5.61]], [["music", 79.19], ["musical instrument", 2.58], ["synthesizer", 2.13]], null, [["music", 62.51], ["synthesizer", 8.5], ["musical instrument", 4.5]], [["music", 73.52], ["musical instrument", 7.38], ["drum", 2.68]], null, null, [["music", 46.51], ["speech", 19.31], ["musical instrument", 6.65]]], "duration": [2.12, 1.68, 7.64, 0.6, 0.96, 0.64, 17.48, 0.88, 0.7, 2.24, 3.0, 1.35, 4.53, 7.19, 0.29, 0.33, 8.43]} \ No newline at end of file diff --git a/annotations_filtered/s-kucHjKbG4_filtered.json b/annotations_filtered/s-kucHjKbG4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b1a7173a531a43783e23075e09ff74b5457155d0 --- /dev/null +++ b/annotations_filtered/s-kucHjKbG4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.72], [5.0, 6.17], [6.0, 8.68], [9.0, 10.32], [11.0, 11.82], [13.0, 12.92], [13.0, 15.55], [18.0, 18.4], [22.0, 22.5], [23.0, 23.25], [28.0, 28.51], [31.0, 31.8], [33.0, 33.96], [36.0, 36.0], [40.0, 40.44], [44.0, 45.79], [47.0, 49.59], [55.0, 61.48], [62.0, 62.38], [65.0, 65.3], [66.0, 67.96], [89.0, 89.88], [95.0, 96.5], [97.0, 99.57], [103.0, 104.65], [107.0, 107.0], [110.0, 109.78], [112.0, 112.83], [113.0, 115.1], [115.0, 116.94], [119.0, 121.14], [124.0, 124.83], [127.0, 127.36]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 51.82, 0.0, 0.0, 0.0, 39.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.96, 50.86, 0.0, 0.0, 0.0, 0.0, 0.0, 36.06, 0.0, 0.0, 0.0, 0.0, 33.35, 0.0, 40.47, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 41.85], ["whale vocalization", 3.25], ["burping, eructation", 2.83]], null, null, null, null, null, null, null, null, null, [["speech", 47.9], ["dial tone", 11.07], ["busy signal", 8.03]], null, null, null, null, null, null, [["speech", 62.06], ["sidetone", 10.72], ["chirp tone", 3.16]], null, null, null, null, [["speech", 39.35], ["busy signal", 14.78], ["throbbing", 8.68]], null, [["sine wave", 19.01], ["chirp tone", 18.44], ["speech", 16.61]], null, null], "duration": [1.72, 1.17, 2.68, 1.32, 0.82, -0.08, 2.55, 0.4, 0.5, 0.25, 0.51, 0.8, 0.96, 0.0, 0.44, 1.79, 2.59, 6.48, 0.38, 0.3, 1.96, 0.88, 1.5, 2.57, 1.65, 0.0, -0.22, 0.83, 2.1, 1.94, 2.14, 0.83, 0.36]} \ No newline at end of file diff --git a/annotations_filtered/s-pgK_Rvuwc_filtered.json b/annotations_filtered/s-pgK_Rvuwc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b8238636dae110671b04b5e4c128c7be9ac131f9 --- /dev/null +++ b/annotations_filtered/s-pgK_Rvuwc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[50.0, 50.35], [52.0, 52.98], [54.0, 54.48], [56.0, 60.44], [61.0, 61.82], [63.0, 63.75], [71.0, 70.98], [74.0, 74.41], [78.0, 81.8], [83.0, 91.1], [92.0, 101.46], [110.0, 112.95]], "keep_status": [false, false, false, true, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 33.34, 0.0, 0.0, 0.0, 0.0, 30.45, 30.03, 30.95, 30.1], "audiomae_on_audioset": [null, null, null, [["music", 31.39], ["didgeridoo", 14.11], ["theremin", 9.09]], null, null, null, null, [["music", 47.57], ["speech", 15.81], ["throbbing", 4.49]], [["speech", 41.93], ["music", 35.42], ["theremin", 4.35]], [["music", 54.88], ["speech", 25.8], ["thunk", 2.7]], [["speech", 28.34], ["didgeridoo", 24.69], ["music", 16.8]]], "duration": [0.35, 0.98, 0.48, 4.44, 0.82, 0.75, -0.02, 0.41, 3.8, 8.1, 9.46, 2.95]} \ No newline at end of file diff --git a/annotations_filtered/s-rl8q9jezU_filtered.json b/annotations_filtered/s-rl8q9jezU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2af9c3910d18265d2f1059063eb26c54fc4b08c7 --- /dev/null +++ b/annotations_filtered/s-rl8q9jezU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 13.0], [17.0, 17.49], [23.0, 23.31], [27.0, 37.42], [40.0, 40.19], [42.0, 54.48], [56.0, 67.83], [71.0, 72.96], [76.0, 76.77], [78.0, 80.96], [82.0, 84.37], [86.0, 89.34], [98.0, 97.9], [98.0, 104.06], [110.0, 117.44], [125.0, 125.44], [126.0, 127.7], [128.0, 130.37], [134.0, 137.27], [138.0, 138.65], [140.0, 142.25], [143.0, 143.94], [144.0, 145.84], [147.0, 152.12], [155.0, 155.92], [159.0, 164.51], [168.0, 169.15]], "keep_status": [true, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [37.25, 0.0, 0.0, 32.36, 0.0, 34.56, 37.14, 0.0, 0.0, 40.88, 40.88, 39.07, 0.0, 31.87, 32.19, 0.0, 0.0, 48.82, 43.82, 0.0, 45.98, 0.0, 0.0, 36.29, 0.0, 38.78, 0.0], "audiomae_on_audioset": [[["music", 26.37], ["whale vocalization", 13.09], ["hum", 5.44]], null, null, [["buzz", 71.07], ["music", 9.32], ["fly, housefly", 5.29]], null, [["music", 68.93], ["synthesizer", 4.74], ["effects unit", 3.88]], [["music", 44.14], ["hum", 17.77], ["mains hum", 12.62]], null, null, [["music", 54.23], ["bleat", 7.39], ["sheep", 6.72]], [["music", 28.73], ["speech", 19.54], ["hum", 15.63]], [["music", 50.94], ["speech", 16.8], ["mains hum", 7.7]], null, [["mains hum", 39.94], ["hum", 28.42], ["music", 21.08]], [["music", 50.13], ["whale vocalization", 14.7], ["theremin", 5.99]], null, null, [["mains hum", 46.55], ["hum", 19.33], ["music", 7.14]], [["music", 68.29], ["speech", 3.26], ["grunt", 1.87]], null, [["music", 40.37], ["theremin", 16.34], ["ambient music", 5.9]], null, null, [["music", 55.34], ["throbbing", 9.42], ["hum", 6.77]], null, [["music", 55.31], ["whale vocalization", 11.51], ["ambient music", 5.71]], null], "duration": [5.0, 0.49, 0.31, 10.42, 0.19, 12.48, 11.83, 1.96, 0.77, 2.96, 2.37, 3.34, -0.1, 6.06, 7.44, 0.44, 1.7, 2.37, 3.27, 0.65, 2.25, 0.94, 1.84, 5.12, 0.92, 5.51, 1.15]} \ No newline at end of file diff --git a/annotations_filtered/s-vP7WgMkpA_filtered.json b/annotations_filtered/s-vP7WgMkpA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3429ea54609483e0952e11f2da2f7a4c2089a61f --- /dev/null +++ b/annotations_filtered/s-vP7WgMkpA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[45.0, 45.44]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [0.44]} \ No newline at end of file diff --git a/annotations_filtered/s039YJGaP-Y_filtered.json b/annotations_filtered/s039YJGaP-Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1834680fa447d5518ee9955c9291df9d769df82d --- /dev/null +++ b/annotations_filtered/s039YJGaP-Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.14], [1.0, 2.84], [10.0, 10.12], [19.0, 19.53], [22.0, 22.6], [23.0, 23.19], [35.0, 35.73], [40.0, 40.91], [44.0, 44.95], [47.0, 47.16], [50.0, 52.07], [54.0, 54.55], [59.0, 78.14], [81.0, 85.09], [88.0, 88.74], [92.0, 96.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.21, 0.0, 64.41, 52.16, 0.0, 39.28], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 54.02], ["sidetone", 12.84], ["radio", 3.7]], null, null, null, null, [["music", 24.71], ["hum", 12.54], ["mains hum", 9.34]]], "duration": [0.14, 1.84, 0.12, 0.53, 0.6, 0.19, 0.73, 0.91, 0.95, 0.16, 2.07, 0.55, 19.14, 4.09, 0.74, 4.72]} \ No newline at end of file diff --git a/annotations_filtered/s0EAZmF0k6g_filtered.json b/annotations_filtered/s0EAZmF0k6g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cff4cef91cf6aec9a04f67c7467c830795e19478 --- /dev/null +++ b/annotations_filtered/s0EAZmF0k6g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[130.0, 130.71]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [0.71]} \ No newline at end of file diff --git a/annotations_filtered/s0_sBamhlIs_filtered.json b/annotations_filtered/s0_sBamhlIs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..191179aa13a10068fe7068ce5c36e49fb86ad317 --- /dev/null +++ b/annotations_filtered/s0_sBamhlIs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.53], [11.0, 11.85], [14.0, 16.75], [17.0, 18.06], [23.0, 23.13], [23.0, 23.58], [24.0, 24.46], [25.0, 25.25], [26.0, 33.59], [35.0, 34.87], [35.0, 35.72], [36.0, 36.66], [41.0, 41.35], [45.0, 46.28], [47.0, 53.59], [57.0, 58.23], [62.0, 62.7], [64.0, 80.94], [82.0, 82.9], [85.0, 91.08], [97.0, 116.24], [117.0, 117.48], [117.0, 117.51], [118.0, 119.5]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [90.43, 0.0, 44.34, 0.0, 0.0, 0.0, 0.0, 0.0, 48.02, 0.0, 0.0, 0.0, 0.0, 0.0, 34.6, 0.0, 0.0, 39.35, 0.0, 35.9, 36.95, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["didgeridoo", 23.07], ["music", 16.93], ["effects unit", 13.94]], null, null, null, null, null, [["music", 72.4], ["didgeridoo", 2.8], ["musical instrument", 2.7]], null, null, null, null, null, [["music", 69.95], ["musical instrument", 5.86], ["theremin", 3.94]], null, null, [["music", 57.3], ["speech", 18.67], ["musical instrument", 3.33]], null, [["music", 55.25], ["musical instrument", 4.2], ["effects unit", 2.96]], [["music", 65.02], ["musical instrument", 5.64], ["trombone", 3.37]], null, null, null], "duration": [3.53, 0.85, 2.75, 1.06, 0.13, 0.58, 0.46, 0.25, 7.59, -0.13, 0.72, 0.66, 0.35, 1.28, 6.59, 1.23, 0.7, 16.94, 0.9, 6.08, 19.24, 0.48, 0.51, 1.5]} \ No newline at end of file diff --git a/annotations_filtered/s0bxFcZV40A_filtered.json b/annotations_filtered/s0bxFcZV40A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..948508415abefca4a7a1a0e7eb3286b857627486 --- /dev/null +++ b/annotations_filtered/s0bxFcZV40A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.68], [10.0, 10.52], [14.0, 23.55], [25.0, 25.24], [26.0, 26.23], [26.0, 26.32], [28.0, 28.95], [31.0, 31.56], [34.0, 47.61], [48.0, 49.5], [53.0, 54.3], [55.0, 55.66], [58.0, 60.93], [62.0, 62.9], [65.0, 74.92], [77.0, 92.6], [97.0, 97.39], [102.0, 102.32], [116.0, 116.01], [116.0, 117.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 97.92, 0.0, 0.0, 0.0, 0.0, 0.0, 55.39, 0.0, 0.0, 0.0, 73.36, 0.0, 49.92, 33.22, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 38.53], ["mains hum", 26.18], ["hum", 17.7]], [["music", 40.26], ["hum", 16.55], ["throbbing", 4.98]], null, null, null, null], "duration": [1.68, 0.52, 9.55, 0.24, 0.23, 0.32, 0.95, 0.56, 13.61, 1.5, 1.3, 0.66, 2.93, 0.9, 9.92, 15.6, 0.39, 0.32, 0.01, 1.02]} \ No newline at end of file diff --git a/annotations_filtered/s0eHgfzlrF8_filtered.json b/annotations_filtered/s0eHgfzlrF8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..434ec9175c6d369753b86edfe5924eb58837dd7c --- /dev/null +++ b/annotations_filtered/s0eHgfzlrF8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.28], [17.0, 20.38], [28.0, 28.63], [32.0, 32.73], [36.0, 36.96], [41.0, 44.24], [55.0, 74.01], [76.0, 83.84]], "keep_status": [false, true, false, false, false, false, false, true], "silence_prob": [0.0, 31.51, 0.0, 0.0, 0.0, 31.97, 32.96, 32.13], "audiomae_on_audioset": [null, [["frog", 34.95], ["grunt", 11.01], ["sound effect", 6.32]], null, null, null, [["noise", 52.67], ["music", 22.14], ["cacophony", 3.76]], [["music", 82.02], ["grunt", 4.88], ["speech", 2.3]], [["music", 21.69], ["hum", 12.47], ["mains hum", 10.24]]], "duration": [0.28, 3.38, 0.63, 0.73, 0.96, 3.24, 19.01, 7.84]} \ No newline at end of file diff --git a/annotations_filtered/s0vNsH81YeA_filtered.json b/annotations_filtered/s0vNsH81YeA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f8f0aca15fefc59646472fa95786b7483de2c74 --- /dev/null +++ b/annotations_filtered/s0vNsH81YeA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 21.1], [22.0, 34.64], [35.0, 42.9], [44.0, 62.28], [63.0, 68.5], [72.0, 81.53], [82.0, 83.47], [85.0, 85.56], [88.0, 89.24], [90.0, 91.57], [92.0, 97.38], [99.0, 101.66], [104.0, 106.24], [107.0, 120.19]], "keep_status": [false, true, false, true, false, false, false, false, false, false, true, true, false, true], "silence_prob": [0.0, 43.93, 39.77, 49.64, 64.52, 46.12, 0.0, 0.0, 0.0, 0.0, 34.78, 31.51, 64.29, 33.78], "audiomae_on_audioset": [null, [["music", 39.35], ["speech", 16.22], ["didgeridoo", 5.06]], [["music", 67.02], ["foghorn", 8.31], ["brass instrument", 4.97]], [["speech", 31.88], ["music", 25.48], ["brass instrument", 5.53]], null, [["music", 60.41], ["theremin", 7.25], ["musical instrument", 3.59]], null, null, null, null, [["music", 45.31], ["fly, housefly", 7.92], ["mosquito", 4.36]], [["music", 24.2], ["speech", 20.18], ["cacophony", 4.63]], null, [["music", 23.8], ["speech", 18.54], ["didgeridoo", 17.3]]], "duration": [1.1, 12.64, 7.9, 18.28, 5.5, 9.53, 1.47, 0.56, 1.24, 1.57, 5.38, 2.66, 2.24, 13.19]} \ No newline at end of file diff --git a/annotations_filtered/s1QgQny2o5E_filtered.json b/annotations_filtered/s1QgQny2o5E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..11e98fcd87fea16a646bb5ec1501130f845b8d4a --- /dev/null +++ b/annotations_filtered/s1QgQny2o5E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 29.32], [31.0, 34.11], [37.0, 39.09], [41.0, 44.24], [46.0, 46.9], [49.0, 49.65], [53.0, 53.79], [57.0, 59.64], [63.0, 62.53], [67.0, 71.17], [73.0, 88.57], [89.0, 91.84], [93.0, 94.53], [96.0, 112.19], [114.0, 115.65]], "keep_status": [false, true, true, true, false, false, false, true, false, true, false, true, false, false, false], "silence_prob": [35.73, 34.98, 30.91, 42.28, 0.0, 0.0, 0.0, 38.32, 0.0, 32.7, 29.36, 36.2, 0.0, 32.96, 0.0], "audiomae_on_audioset": [[["music", 41.74], ["hum", 21.17], ["mains hum", 17.4]], [["mains hum", 29.07], ["hum", 19.88], ["music", 9.78]], [["music", 28.04], ["sound effect", 14.85], ["synthesizer", 7.86]], [["music", 29.86], ["gong", 20.4], ["sonar", 7.51]], null, null, null, [["music", 18.71], ["hum", 17.97], ["mains hum", 14.61]], null, [["mains hum", 15.15], ["hum", 12.47], ["speech", 8.57]], [["music", 42.94], ["speech", 24.15], ["hum", 9.26]], [["music", 31.89], ["whale vocalization", 15.45], ["civil defense siren", 11.02]], null, [["music", 78.67], ["scary music", 8.25], ["foghorn", 2.74]], null], "duration": [5.32, 3.11, 2.09, 3.24, 0.9, 0.65, 0.79, 2.64, -0.47, 4.17, 15.57, 2.84, 1.53, 16.19, 1.65]} \ No newline at end of file diff --git a/annotations_filtered/s1Y023ZS4Ms_filtered.json b/annotations_filtered/s1Y023ZS4Ms_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe33d7b3a3897b5b1a5a3ba0a522b0bfbe26aaac --- /dev/null +++ b/annotations_filtered/s1Y023ZS4Ms_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.01], [13.0, 14.3], [27.0, 30.64], [31.0, 36.09], [36.0, 41.32], [42.0, 42.45], [43.0, 43.71], [44.0, 45.82], [47.0, 47.68], [50.0, 52.15], [55.0, 56.32], [59.0, 59.97], [64.0, 64.71], [69.0, 71.61], [73.0, 73.01], [74.0, 75.66]], "keep_status": [false, false, false, true, false, false, false, false, false, true, false, false, false, true, false, false], "silence_prob": [36.5, 0.0, 37.89, 43.53, 47.66, 0.0, 0.0, 0.0, 0.0, 47.2, 0.0, 0.0, 0.0, 38.37, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 81.82], ["fart", 5.44], ["boing", 2.87]], null, [["speech", 56.48], ["music", 11.79], ["animal", 2.89]], [["music", 33.58], ["rumble", 12.64], ["speech", 10.45]], [["speech", 49.4], ["music", 15.72], ["didgeridoo", 6.06]], null, null, null, null, [["music", 34.18], ["synthesizer", 10.31], ["door", 3.48]], null, null, null, [["roaring cats (lions, tigers)", 25.26], ["animal", 13.71], ["wild animals", 9.43]], null, null], "duration": [5.01, 1.3, 3.64, 5.09, 5.32, 0.45, 0.71, 1.82, 0.68, 2.15, 1.32, 0.97, 0.71, 2.61, 0.01, 1.66]} \ No newline at end of file diff --git a/annotations_filtered/s1hs62Is67s_filtered.json b/annotations_filtered/s1hs62Is67s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/s1hs62Is67s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/s1nXXro4Aio_filtered.json b/annotations_filtered/s1nXXro4Aio_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c9527c41a06f4af1df21dfbad8a592baae174560 --- /dev/null +++ b/annotations_filtered/s1nXXro4Aio_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 6.84], [9.0, 9.49], [12.0, 13.2], [15.0, 16.55], [19.0, 36.9], [44.0, 45.2], [50.0, 74.65], [75.0, 89.88], [95.0, 123.89], [125.0, 126.18], [130.0, 131.9], [135.0, 138.38], [141.0, 145.05], [147.0, 155.41]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, true, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 29.84, 0.0, 29.02, 30.21, 28.68, 0.0, 0.0, 30.65, 37.31, 41.5], "audiomae_on_audioset": [null, null, null, null, [["fly, housefly", 54.08], ["insect", 31.68], ["bee, wasp, etc.", 7.99]], null, [["speech", 29.25], ["vehicle", 9.6], ["car", 7.69]], [["speech", 61.59], ["buzz", 5.61], ["hum", 4.56]], [["hum", 37.24], ["music", 29.34], ["throbbing", 15.47]], null, null, [["fly, housefly", 38.82], ["music", 13.03], ["insect", 9.41]], [["music", 48.68], ["speech", 5.47], ["hum", 4.41]], [["hum", 54.09], ["mains hum", 9.25], ["speech", 6.04]]], "duration": [-0.16, 0.49, 1.2, 1.55, 17.9, 1.2, 24.65, 14.88, 28.89, 1.18, 1.9, 3.38, 4.05, 8.41]} \ No newline at end of file diff --git a/annotations_filtered/s1s6SqHLUQA_filtered.json b/annotations_filtered/s1s6SqHLUQA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6050247d23e87cb889f45cff920e13b8975e21df --- /dev/null +++ b/annotations_filtered/s1s6SqHLUQA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.11], [9.0, 67.95], [68.0, 69.5], [70.0, 70.93]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [1.11, 58.95, 1.5, 0.93]} \ No newline at end of file diff --git a/annotations_filtered/s2Tpk6RnkaA_filtered.json b/annotations_filtered/s2Tpk6RnkaA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a923d65123e0d78e39fe093aef8a350e19621d12 --- /dev/null +++ b/annotations_filtered/s2Tpk6RnkaA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.78], [10.0, 9.88], [14.0, 14.07], [18.0, 17.98], [21.0, 22.03], [23.0, 24.17], [27.0, 27.5], [32.0, 33.0], [35.0, 34.82], [37.0, 37.88], [39.0, 41.23], [47.0, 47.31], [48.0, 48.03], [50.0, 50.45], [54.0, 54.89], [56.0, 57.69], [61.0, 61.38], [63.0, 64.37], [65.0, 65.18], [66.0, 66.21], [68.0, 68.52], [70.0, 70.85], [73.0, 73.04], [84.0, 86.86], [88.0, 90.66], [93.0, 94.49], [96.0, 99.25], [100.0, 100.77], [103.0, 103.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.8, 99.85, 0.0, 98.27, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.78, -0.12, 0.07, -0.02, 1.03, 1.17, 0.5, 1.0, -0.18, 0.88, 2.23, 0.31, 0.03, 0.45, 0.89, 1.69, 0.38, 1.37, 0.18, 0.21, 0.52, 0.85, 0.04, 2.86, 2.66, 1.49, 3.25, 0.77, 0.42]} \ No newline at end of file diff --git a/annotations_filtered/s2pqELFTepw_filtered.json b/annotations_filtered/s2pqELFTepw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..772c88fc9ca2908b0655cf5ed9933a38bf128252 --- /dev/null +++ b/annotations_filtered/s2pqELFTepw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.71], [13.0, 15.43], [16.0, 18.35], [20.0, 20.36], [22.0, 22.32], [27.0, 27.04], [28.0, 30.86], [33.0, 34.38], [37.0, 38.03], [41.0, 41.96], [44.0, 45.6], [48.0, 48.81], [54.0, 56.81], [72.0, 71.76], [83.0, 84.43], [88.0, 89.28], [93.0, 95.91], [97.0, 98.04], [101.0, 101.65], [103.0, 103.65], [105.0, 104.84], [111.0, 112.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.85, 79.94, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 93.76, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.71, 2.43, 2.35, 0.36, 0.32, 0.04, 2.86, 1.38, 1.03, 0.96, 1.6, 0.81, 2.81, -0.24, 1.43, 1.28, 2.91, 1.04, 0.65, 0.65, -0.16, 1.9]} \ No newline at end of file diff --git a/annotations_filtered/s2wBtcmE5W8_filtered.json b/annotations_filtered/s2wBtcmE5W8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..299d1b1fe975d08b5726e02b6b154aa7182ad2c2 --- /dev/null +++ b/annotations_filtered/s2wBtcmE5W8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.77], [8.0, 8.19], [10.0, 11.31], [13.0, 17.56], [20.0, 24.81], [26.0, 31.19], [32.0, 32.95], [34.0, 34.47], [35.0, 37.45], [39.0, 39.12], [41.0, 49.62], [51.0, 56.44], [60.0, 69.97], [73.0, 81.41], [82.0, 84.62], [86.0, 87.32], [88.0, 91.1], [93.0, 93.16], [94.0, 95.55], [97.0, 97.77], [98.0, 98.91], [100.0, 100.33], [100.0, 101.16], [102.0, 102.84], [105.0, 105.43], [107.0, 107.32], [108.0, 119.72]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, true, true, true, false, true, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 40.01, 51.12, 50.56, 0.0, 0.0, 51.23, 0.0, 32.74, 33.6, 31.2, 44.57, 44.37, 0.0, 28.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.09], "audiomae_on_audioset": [null, null, null, [["music", 46.83], ["hum", 7.74], ["whale vocalization", 4.85]], null, null, null, null, null, null, [["music", 50.06], ["speech", 18.93], ["whack, thwack", 5.97]], [["speech", 36.75], ["music", 29.92], ["throbbing", 3.55]], [["music", 15.78], ["roar", 15.05], ["animal", 10.91]], [["hum", 31.2], ["music", 14.06], ["throbbing", 12.55]], [["creak", 20.29], ["speech", 19.9], ["telephone bell ringing", 14.12]], null, [["speech", 21.61], ["whack, thwack", 11.32], ["sound effect", 9.39]], null, null, null, null, null, null, null, null, null, [["music", 37.65], ["speech", 19.7], ["mains hum", 9.73]]], "duration": [1.77, 0.19, 1.31, 4.56, 4.81, 5.19, 0.95, 0.47, 2.45, 0.12, 8.62, 5.44, 9.97, 8.41, 2.62, 1.32, 3.1, 0.16, 1.55, 0.77, 0.91, 0.33, 1.16, 0.84, 0.43, 0.32, 11.72]} \ No newline at end of file diff --git a/annotations_filtered/s2xKn06X9cQ_filtered.json b/annotations_filtered/s2xKn06X9cQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b1df1551d1615363b7b91b5fa75a1b04051ac750 --- /dev/null +++ b/annotations_filtered/s2xKn06X9cQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.19], [11.0, 11.58], [13.0, 13.24], [23.0, 24.68], [26.0, 28.39], [33.0, 34.08], [36.0, 37.1], [39.0, 42.31], [43.0, 46.55], [49.0, 50.01], [52.0, 54.95], [56.0, 56.47], [59.0, 62.87], [67.0, 68.57], [70.0, 72.05], [73.0, 74.06], [75.0, 76.27], [77.0, 77.08], [78.0, 78.87], [80.0, 88.53], [90.0, 92.58], [93.0, 97.26]], "keep_status": [false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 38.59, 0.0, 0.0, 42.22, 34.28, 0.0, 45.3, 0.0, 41.87, 0.0, 44.09, 0.0, 0.0, 0.0, 0.0, 32.99, 45.95, 37.55], "audiomae_on_audioset": [null, null, null, null, [["music", 61.39], ["mosquito", 3.92], ["fly, housefly", 3.68]], null, null, [["music", 37.86], ["sidetone", 12.41], ["hum", 9.43]], [["music", 58.32], ["musical instrument", 9.0], ["speech", 8.91]], null, [["music", 49.26], ["throbbing", 26.28], ["hum", 2.74]], null, [["boing", 71.02], ["music", 16.56], ["throbbing", 4.17]], null, [["fly, housefly", 59.52], ["insect", 25.05], ["mosquito", 10.25]], null, null, null, null, [["speech", 44.86], ["music", 29.01], ["electric shaver, electric razor", 3.3]], [["music", 49.76], ["synthesizer", 5.65], ["musical instrument", 3.96]], [["music", 42.28], ["speech", 35.55], ["throbbing", 2.93]]], "duration": [1.19, 0.58, 0.24, 1.68, 2.39, 1.08, 1.1, 3.31, 3.55, 1.01, 2.95, 0.47, 3.87, 1.57, 2.05, 1.06, 1.27, 0.08, 0.87, 8.53, 2.58, 4.26]} \ No newline at end of file diff --git a/annotations_filtered/s33dP0ETrCo_filtered.json b/annotations_filtered/s33dP0ETrCo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..623882ddcaa2c1eb516dff1dc021bc2ca30843fb --- /dev/null +++ b/annotations_filtered/s33dP0ETrCo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.38], [13.0, 19.65], [24.0, 25.12], [29.0, 31.23], [32.0, 33.56], [36.0, 37.52], [40.0, 41.12], [42.0, 43.68], [44.0, 47.06], [51.0, 52.79], [65.0, 65.11], [65.0, 65.8], [73.0, 73.82], [79.0, 79.61], [82.0, 83.86], [87.0, 88.1], [92.0, 92.15], [93.0, 93.6], [95.0, 95.81], [105.0, 105.71], [106.0, 107.18], [112.0, 113.36], [117.0, 117.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 96.04, 0.0, 98.66, 0.0, 0.0, 0.0, 0.0, 93.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.38, 6.65, 1.12, 2.23, 1.56, 1.52, 1.12, 1.68, 3.06, 1.79, 0.11, 0.8, 0.82, 0.61, 1.86, 1.1, 0.15, 0.6, 0.81, 0.71, 1.18, 1.36, 0.54]} \ No newline at end of file diff --git a/annotations_filtered/s3PbszHh8vE_filtered.json b/annotations_filtered/s3PbszHh8vE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d961b419db0e5c3f63bada4852244fb30de95c5 --- /dev/null +++ b/annotations_filtered/s3PbszHh8vE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.08], [14.0, 13.93], [28.0, 28.0], [31.0, 31.94], [48.0, 47.98], [83.0, 85.29], [89.0, 89.07], [94.0, 96.3], [97.0, 97.92], [99.0, 104.38], [106.0, 117.36], [123.0, 123.18], [126.0, 126.59], [131.0, 130.65]], "keep_status": [false, false, false, false, false, true, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 33.4, 0.0, 30.23, 0.0, 29.68, 37.85, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 65.27], ["musical instrument", 2.55], ["yodeling", 1.8]], null, [["mosquito", 40.02], ["fly, housefly", 16.13], ["insect", 12.81]], null, [["speech", 27.16], ["music", 22.83], ["throbbing", 17.93]], [["theremin", 46.84], ["music", 33.25], ["musical instrument", 3.07]], null, null, null], "duration": [0.08, -0.07, 0.0, 0.94, -0.02, 2.29, 0.07, 2.3, 0.92, 5.38, 11.36, 0.18, 0.59, -0.35]} \ No newline at end of file diff --git a/annotations_filtered/s3RNsZvdYZQ_filtered.json b/annotations_filtered/s3RNsZvdYZQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4d8fb3862edc6b5f09c7cdc4df03edd50c8827ac --- /dev/null +++ b/annotations_filtered/s3RNsZvdYZQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.4], [7.0, 8.38], [10.0, 10.05], [11.0, 12.55], [17.0, 17.36], [22.0, 22.17], [24.0, 28.27], [39.0, 39.87], [54.0, 58.02], [60.0, 62.36], [69.0, 70.17], [71.0, 76.35], [80.0, 83.96], [87.0, 88.3], [92.0, 93.09], [96.0, 97.28], [101.0, 101.38], [102.0, 102.74], [105.0, 105.17], [107.0, 110.91], [111.0, 111.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.52, 0.0, 0.0, 0.0, 0.0, 0.0, 99.65, 0.0, 99.98, 91.47, 0.0, 34.25, 94.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.03, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["breaking", 64.01], ["music", 15.83], ["speech", 1.78]], null, null, null, null, null, null, null, null, null], "duration": [4.4, 1.38, 0.05, 1.55, 0.36, 0.17, 4.27, 0.87, 4.02, 2.36, 1.17, 5.35, 3.96, 1.3, 1.09, 1.28, 0.38, 0.74, 0.17, 3.91, 0.52]} \ No newline at end of file diff --git a/annotations_filtered/s3mwDA8sv8I_filtered.json b/annotations_filtered/s3mwDA8sv8I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af9dfbc0fd9e59d81314498bcc3136e9dc95a3a8 --- /dev/null +++ b/annotations_filtered/s3mwDA8sv8I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.64], [10.0, 10.13], [13.0, 13.54], [15.0, 14.77], [19.0, 20.36], [22.0, 24.09], [26.0, 26.82], [28.0, 29.56], [31.0, 32.76], [35.0, 36.48], [38.0, 38.67], [41.0, 41.01], [42.0, 50.87], [52.0, 62.46], [64.0, 64.93], [66.0, 68.77], [69.0, 78.73], [81.0, 81.63], [84.0, 85.8], [87.0, 90.17], [93.0, 95.94], [97.0, 100.53], [102.0, 102.27], [103.0, 104.53], [106.0, 109.14], [112.0, 115.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 93.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.5, 81.35, 0.0, 75.72, 56.33, 0.0, 0.0, 71.29, 64.07, 60.6, 0.0, 0.0, 80.82, 58.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 29.12], ["insect", 18.83], ["speech", 15.73]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.64, 0.13, 0.54, -0.23, 1.36, 2.09, 0.82, 1.56, 1.76, 1.48, 0.67, 0.01, 8.87, 10.46, 0.93, 2.77, 9.73, 0.63, 1.8, 3.17, 2.94, 3.53, 0.27, 1.53, 3.14, 3.3]} \ No newline at end of file diff --git a/annotations_filtered/s3rv0BdxWfM_filtered.json b/annotations_filtered/s3rv0BdxWfM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52e14a144b0ff53214a603b729f776bb11f18e93 --- /dev/null +++ b/annotations_filtered/s3rv0BdxWfM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 17.68], [19.0, 19.67], [20.0, 24.81], [25.0, 32.64], [34.0, 35.68], [38.0, 38.85], [41.0, 42.7], [43.0, 42.8], [44.0, 44.52], [46.0, 48.69], [50.0, 52.44], [53.0, 54.55], [56.0, 57.45], [58.0, 63.07], [64.0, 66.33], [78.0, 79.19], [80.0, 87.47], [89.0, 91.77], [92.0, 97.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.52, 0.0, 95.37, 99.26, 0.0, 0.0, 0.0, 0.0, 0.0, 99.78, 100.0, 0.0, 0.0, 99.44, 100.0, 0.0, 100.0, 100.0, 99.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.68, 0.67, 4.81, 7.64, 1.68, 0.85, 1.7, -0.2, 0.52, 2.69, 2.44, 1.55, 1.45, 5.07, 2.33, 1.19, 7.47, 2.77, 5.73]} \ No newline at end of file diff --git a/annotations_filtered/s3znWXpeLPA_filtered.json b/annotations_filtered/s3znWXpeLPA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b471b030cd344ff27cc3182949e50f866ddb738f --- /dev/null +++ b/annotations_filtered/s3znWXpeLPA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.7], [11.0, 10.84], [11.0, 12.23], [14.0, 13.85], [14.0, 19.26], [20.0, 22.18], [26.0, 27.77], [31.0, 32.53], [36.0, 37.13], [40.0, 41.15], [43.0, 45.27], [48.0, 49.42], [50.0, 51.36], [54.0, 54.5], [61.0, 62.26], [66.0, 67.59], [76.0, 78.51], [82.0, 83.59], [85.0, 86.83], [88.0, 90.02], [95.0, 95.77], [103.0, 104.48], [106.0, 110.3], [112.0, 113.91], [116.0, 116.53], [118.0, 119.79], [121.0, 128.71]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 46.19, 53.4, 0.0, 0.0, 0.0, 0.0, 89.54, 0.0, 0.0, 0.0, 0.0, 0.0, 74.44, 0.0, 0.0, 83.7, 0.0, 0.0, 91.47, 0.0, 0.0, 0.0, 87.55], "audiomae_on_audioset": [null, null, null, null, [["speech", 45.16], ["whale vocalization", 16.26], ["music", 3.28]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.7, -0.16, 1.23, -0.15, 5.26, 2.18, 1.77, 1.53, 1.13, 1.15, 2.27, 1.42, 1.36, 0.5, 1.26, 1.59, 2.51, 1.59, 1.83, 2.02, 0.77, 1.48, 4.3, 1.91, 0.53, 1.79, 7.71]} \ No newline at end of file diff --git a/annotations_filtered/s43ARFFNrz0_filtered.json b/annotations_filtered/s43ARFFNrz0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d843ae51f27a09060ed2838e088385c26bd3e2a --- /dev/null +++ b/annotations_filtered/s43ARFFNrz0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 15.42], [19.0, 19.08], [20.0, 20.63], [21.0, 21.83], [26.0, 26.32], [52.0, 54.18], [60.0, 60.29], [71.0, 76.4], [77.0, 77.82], [79.0, 88.03]], "keep_status": [true, false, false, false, false, true, false, false, false, false], "silence_prob": [45.59, 0.0, 0.0, 0.0, 0.0, 43.33, 0.0, 62.07, 0.0, 62.47], "audiomae_on_audioset": [[["raindrop", 24.44], ["rain on surface", 16.42], ["rain", 14.5]], null, null, null, null, [["rain on surface", 24.23], ["rain", 16.14], ["raindrop", 12.59]], null, null, null, null], "duration": [3.42, 0.08, 0.63, 0.83, 0.32, 2.18, 0.29, 5.4, 0.82, 9.03]} \ No newline at end of file diff --git a/annotations_filtered/s4AzrUO3D1w_filtered.json b/annotations_filtered/s4AzrUO3D1w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4433fcd76bdeeebe45469f8616bddee144f87b81 --- /dev/null +++ b/annotations_filtered/s4AzrUO3D1w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.38], [2.0, 2.08], [3.0, 3.45], [8.0, 8.14], [10.0, 10.76], [12.0, 12.26], [14.0, 13.91], [15.0, 14.84], [15.0, 16.34], [17.0, 17.15], [19.0, 19.53], [20.0, 21.17], [22.0, 22.64], [38.0, 38.58], [39.0, 39.33], [40.0, 40.68], [42.0, 42.16], [43.0, 43.87], [45.0, 46.3], [51.0, 51.04], [53.0, 54.46], [59.0, 60.99], [81.0, 84.57], [95.0, 118.66], [119.0, 118.94], [119.0, 123.79], [126.0, 128.34], [130.0, 132.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.08, 49.0, 0.0, 90.78, 81.71, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 48.83], ["speech", 10.07], ["musical instrument", 4.0]], [["speech", 30.54], ["buzz", 6.38], ["bleat", 5.3]], null, null, null, null], "duration": [0.38, 0.08, 0.45, 0.14, 0.76, 0.26, -0.09, -0.16, 1.34, 0.15, 0.53, 1.17, 0.64, 0.58, 0.33, 0.68, 0.16, 0.87, 1.3, 0.04, 1.46, 1.99, 3.57, 23.66, -0.06, 4.79, 2.34, 2.63]} \ No newline at end of file diff --git a/annotations_filtered/s4esaE679Wg_filtered.json b/annotations_filtered/s4esaE679Wg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c92efb29a57712b5c18b0f7cb6c7a3a2a38b46ca --- /dev/null +++ b/annotations_filtered/s4esaE679Wg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 22.92], [24.0, 27.82], [30.0, 35.09], [46.0, 46.65], [47.0, 47.68], [52.0, 53.59], [56.0, 59.9], [61.0, 62.09], [65.0, 66.02], [68.0, 68.82], [72.0, 84.32], [86.0, 96.48], [96.0, 96.52], [97.0, 96.77], [97.0, 101.75], [103.0, 124.07], [125.0, 165.86], [166.0, 166.45], [167.0, 167.44], [167.0, 167.59]], "keep_status": [true, true, true, false, false, false, true, false, false, false, false, true, false, false, true, true, false, false, false, false], "silence_prob": [27.82, 27.77, 28.68, 0.0, 0.0, 0.0, 31.55, 0.0, 0.0, 0.0, 27.81, 28.01, 0.0, 0.0, 28.17, 27.98, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["livestock, farm animals, working animals", 31.73], ["cattle, bovinae", 11.59], ["animal", 8.43]], [["vehicle", 20.08], ["car", 14.77], ["skidding", 12.77]], [["music", 13.86], ["noise", 9.43], ["sound effect", 9.23]], null, null, null, [["music", 56.84], ["cattle, bovinae", 7.04], ["didgeridoo", 5.51]], null, null, null, [["speech", 68.8], ["vehicle", 5.95], ["motorcycle", 3.03]], [["speech", 35.1], ["vehicle", 6.55], ["music", 6.16]], null, null, [["music", 45.72], ["noise", 13.11], ["musical instrument", 7.32]], [["music", 52.24], ["buzz", 5.51], ["fly, housefly", 3.17]], null, null, null, null], "duration": [14.92, 3.82, 5.09, 0.65, 0.68, 1.59, 3.9, 1.09, 1.02, 0.82, 12.32, 10.48, 0.52, -0.23, 4.75, 21.07, 40.86, 0.45, 0.44, 0.59]} \ No newline at end of file diff --git a/annotations_filtered/s4heu0mPm-I_filtered.json b/annotations_filtered/s4heu0mPm-I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f853631c471b37507050eb110ae75611c2de68b4 --- /dev/null +++ b/annotations_filtered/s4heu0mPm-I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.58], [9.0, 11.08], [13.0, 16.53], [17.0, 16.93], [17.0, 18.23], [19.0, 20.58], [24.0, 28.07], [29.0, 28.76], [33.0, 35.6]], "keep_status": [false, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 45.95, 53.22, 0.0, 0.0, 0.0, 51.39, 0.0, 42.37], "audiomae_on_audioset": [null, [["speech", 38.2], ["hum", 12.0], ["throbbing", 7.09]], null, null, null, null, null, null, [["speech", 36.92], ["hum", 17.73], ["throbbing", 14.87]]], "duration": [1.58, 2.08, 3.53, -0.07, 1.23, 1.58, 4.07, -0.24, 2.6]} \ No newline at end of file diff --git a/annotations_filtered/s4veow_qEDk_filtered.json b/annotations_filtered/s4veow_qEDk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..89b4e610610c2ab3a36033eee066dfbf02d7c0d1 --- /dev/null +++ b/annotations_filtered/s4veow_qEDk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.56], [8.0, 8.18], [11.0, 10.69], [14.0, 14.66], [18.0, 18.33], [24.0, 24.68], [28.0, 30.81], [38.0, 38.43], [51.0, 51.63], [56.0, 56.73], [58.0, 59.04], [64.0, 64.72], [73.0, 73.47], [75.0, 74.71], [76.0, 76.27], [81.0, 83.57], [85.0, 86.12], [87.0, 87.57], [90.0, 90.63], [94.0, 94.12], [95.0, 95.69], [100.0, 100.33], [104.0, 105.46], [108.0, 108.26], [110.0, 110.54], [111.0, 112.08], [112.0, 112.77], [115.0, 115.08], [118.0, 118.72], [123.0, 124.29], [127.0, 127.92], [132.0, 132.88], [134.0, 134.59], [138.0, 138.15], [147.0, 147.8], [149.0, 149.05], [152.0, 152.47], [157.0, 156.66], [160.0, 161.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 71.81], ["sidetone", 22.75], ["radio", 3.3]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.56, 0.18, -0.31, 0.66, 0.33, 0.68, 2.81, 0.43, 0.63, 0.73, 1.04, 0.72, 0.47, -0.29, 0.27, 2.57, 1.12, 0.57, 0.63, 0.12, 0.69, 0.33, 1.46, 0.26, 0.54, 1.08, 0.77, 0.08, 0.72, 1.29, 0.92, 0.88, 0.59, 0.15, 0.8, 0.05, 0.47, -0.34, 1.28]} \ No newline at end of file diff --git a/annotations_filtered/s59yqpV0ICo_filtered.json b/annotations_filtered/s59yqpV0ICo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60ad41bd5601cb0b96b48212abbdfbd5194c575f --- /dev/null +++ b/annotations_filtered/s59yqpV0ICo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 6.89], [11.0, 11.37], [14.0, 14.47], [17.0, 18.25], [32.0, 32.46], [34.0, 34.01], [46.0, 46.23], [47.0, 48.3], [54.0, 54.63], [84.0, 84.65], [86.0, 88.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.11, 0.37, 0.47, 1.25, 0.46, 0.01, 0.23, 1.3, 0.63, 0.65, 2.48]} \ No newline at end of file diff --git a/annotations_filtered/s5D8jf0k_1k_filtered.json b/annotations_filtered/s5D8jf0k_1k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43064d3d407d573a84644b6d0f123c516439cd74 --- /dev/null +++ b/annotations_filtered/s5D8jf0k_1k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.71], [8.0, 8.9], [10.0, 11.6], [13.0, 13.04], [14.0, 16.26], [17.0, 22.18], [23.0, 31.24], [35.0, 36.69], [38.0, 43.68]], "keep_status": [false, false, false, false, false, false, false, false, true], "silence_prob": [96.04, 0.0, 0.0, 0.0, 60.32, 71.72, 57.72, 0.0, 37.93], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["hum", 19.91], ["whip", 18.56], ["music", 9.41]]], "duration": [2.71, 0.9, 1.6, 0.04, 2.26, 5.18, 8.24, 1.69, 5.68]} \ No newline at end of file diff --git a/annotations_filtered/s5XdRd5SQIw_filtered.json b/annotations_filtered/s5XdRd5SQIw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..343bfc9ae172e98caf4a1675b8d71add8a30e348 --- /dev/null +++ b/annotations_filtered/s5XdRd5SQIw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.22], [9.0, 9.49], [14.0, 14.13], [16.0, 16.01], [19.0, 20.01], [24.0, 25.86], [27.0, 28.0], [32.0, 32.44], [37.0, 37.45], [39.0, 39.92], [40.0, 41.37], [45.0, 45.79], [47.0, 48.61], [49.0, 50.97], [51.0, 59.78], [66.0, 66.58], [74.0, 73.87], [77.0, 78.22], [80.0, 95.39], [96.0, 96.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.31, 0.0, 0.0, 0.0, 99.95, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.22, 0.49, 0.13, 0.01, 1.01, 1.86, 1.0, 0.44, 0.45, 0.92, 1.37, 0.79, 1.61, 1.97, 8.78, 0.58, -0.13, 1.22, 15.39, 0.33]} \ No newline at end of file diff --git a/annotations_filtered/s5jDTz07buw_filtered.json b/annotations_filtered/s5jDTz07buw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5fae84b127bcc1482a8a971aacd2e52032322016 --- /dev/null +++ b/annotations_filtered/s5jDTz07buw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.31], [5.0, 5.91], [8.0, 11.33], [12.0, 14.12], [15.0, 16.01], [17.0, 18.25], [20.0, 23.99], [25.0, 28.81], [31.0, 31.35], [38.0, 38.35], [39.0, 39.04], [41.0, 42.4], [45.0, 45.94], [47.0, 51.19], [54.0, 54.62], [56.0, 56.42], [58.0, 65.35], [66.0, 65.87], [67.0, 68.23], [68.0, 68.42], [68.0, 71.0], [71.0, 72.72], [73.0, 72.93], [73.0, 80.49], [82.0, 84.05], [85.0, 86.07], [88.0, 89.23], [89.0, 91.07], [92.0, 92.84], [94.0, 95.4], [104.0, 104.52], [106.0, 121.24], [122.0, 127.23], [128.0, 128.76], [130.0, 130.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 76.7, 0.0, 0.0, 100.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 97.54, 0.0, 0.0, 0.0, 99.4, 0.0, 0.0, 98.8, 99.96, 0.0, 0.0, 69.88, 0.0, 0.0, 0.0, 96.17, 99.98, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.31, 0.91, 3.33, 2.12, 1.01, 1.25, 3.99, 3.81, 0.35, 0.35, 0.04, 1.4, 0.94, 4.19, 0.62, 0.42, 7.35, -0.13, 1.23, 0.42, 3.0, 1.72, -0.07, 7.49, 2.05, 1.07, 1.23, 2.07, 0.84, 1.4, 0.52, 15.24, 5.23, 0.76, 0.23]} \ No newline at end of file diff --git a/annotations_filtered/s6DlYFmuJXw_filtered.json b/annotations_filtered/s6DlYFmuJXw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b7f18eb88294c3ed98d672eab6099052cd172df7 --- /dev/null +++ b/annotations_filtered/s6DlYFmuJXw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.94], [4.0, 6.08], [9.0, 11.33], [13.0, 13.27], [14.0, 14.27], [15.0, 25.05], [25.0, 26.47], [27.0, 29.17], [30.0, 30.54], [31.0, 33.66], [34.0, 35.58], [36.0, 44.14], [44.0, 44.44], [44.0, 45.93], [49.0, 58.94], [62.0, 62.8], [68.0, 70.75], [73.0, 93.23], [95.0, 95.93], [97.0, 98.46], [100.0, 104.4], [108.0, 108.26], [109.0, 110.15], [116.0, 121.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [98.27, 68.8, 72.46, 0.0, 0.0, 78.55, 0.0, 86.64, 0.0, 75.72, 0.0, 59.77, 0.0, 0.0, 50.26, 0.0, 61.37, 53.59, 0.0, 0.0, 34.73, 0.0, 0.0, 33.92], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 71.05], ["carnatic music", 6.39], ["musical instrument", 3.67]], null, null, [["music", 51.01], ["hum", 8.46], ["throbbing", 6.73]]], "duration": [2.94, 2.08, 2.33, 0.27, 0.27, 10.05, 1.47, 2.17, 0.54, 2.66, 1.58, 8.14, 0.44, 1.93, 9.94, 0.8, 2.75, 20.23, 0.93, 1.46, 4.4, 0.26, 1.15, 5.74]} \ No newline at end of file diff --git a/annotations_filtered/s6JmX_n5oeo_filtered.json b/annotations_filtered/s6JmX_n5oeo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a2b2cfe2e3ff960c1a82feb87092f08e041cd86 --- /dev/null +++ b/annotations_filtered/s6JmX_n5oeo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 16.5], [17.0, 20.61], [22.0, 23.23], [26.0, 26.86], [31.0, 31.6], [38.0, 38.6], [40.0, 42.11], [45.0, 45.37], [47.0, 50.92], [55.0, 58.9], [64.0, 65.64], [66.0, 67.63], [71.0, 76.84], [78.0, 79.35], [81.0, 81.55], [82.0, 82.17], [84.0, 83.67], [84.0, 86.64], [88.0, 92.64], [95.0, 95.15], [98.0, 98.91], [99.0, 99.94], [100.0, 102.24], [103.0, 116.09]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [73.82, 99.59, 0.0, 0.0, 0.0, 0.0, 99.31, 0.0, 47.08, 79.41, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 76.86, 99.26, 0.0, 0.0, 0.0, 72.01, 41.62], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["stomach rumble", 16.21], ["hum", 13.88], ["throbbing", 7.86]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 17.13], ["tuning fork", 10.93], ["hum", 8.72]]], "duration": [4.5, 3.61, 1.23, 0.86, 0.6, 0.6, 2.11, 0.37, 3.92, 3.9, 1.64, 1.63, 5.84, 1.35, 0.55, 0.17, -0.33, 2.64, 4.64, 0.15, 0.91, 0.94, 2.24, 13.09]} \ No newline at end of file diff --git a/annotations_filtered/s6lrBldtwVk_filtered.json b/annotations_filtered/s6lrBldtwVk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af9b5ff1196d1179778255a37cea95a448e7d6be --- /dev/null +++ b/annotations_filtered/s6lrBldtwVk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[88.0, 88.01], [89.0, 102.14]], "keep_status": [false, true], "silence_prob": [0.0, 29.96], "audiomae_on_audioset": [null, [["fly, housefly", 16.37], ["insect", 13.88], ["speech", 13.1]]], "duration": [0.01, 13.14]} \ No newline at end of file diff --git a/annotations_filtered/s6moLb_ieqA_filtered.json b/annotations_filtered/s6moLb_ieqA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..399feecbce8c04c43ef29e6235188fb44c9f013d --- /dev/null +++ b/annotations_filtered/s6moLb_ieqA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.61], [2.0, 3.16], [5.0, 5.88], [6.0, 7.43], [10.0, 10.45], [22.0, 46.41], [48.0, 48.17], [54.0, 59.73], [65.0, 64.86], [65.0, 65.64], [68.0, 73.28], [74.0, 79.79], [83.0, 83.15], [83.0, 87.74], [93.0, 103.81], [107.0, 107.87], [109.0, 109.02], [111.0, 112.56], [113.0, 117.78], [122.0, 121.71], [122.0, 123.79], [126.0, 127.58], [128.0, 129.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 62.58, 0.0, 50.91, 0.0, 0.0, 100.0, 99.91, 0.0, 47.9, 32.83, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["thunk", 43.18], ["speech", 34.29], ["music", 4.59]], [["music", 42.63], ["thunk", 13.99], ["whack, thwack", 12.09]], null, null, null, null, null, null, null, null], "duration": [-0.39, 1.16, 0.88, 1.43, 0.45, 24.41, 0.17, 5.73, -0.14, 0.64, 5.28, 5.79, 0.15, 4.74, 10.81, 0.87, 0.02, 1.56, 4.78, -0.29, 1.79, 1.58, 1.0]} \ No newline at end of file diff --git a/annotations_filtered/s6n8HGwboO4_filtered.json b/annotations_filtered/s6n8HGwboO4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f3a8e9b9da144c5d24da71ec7ad444b836ed723 --- /dev/null +++ b/annotations_filtered/s6n8HGwboO4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.26], [7.0, 9.46], [39.0, 40.8], [43.0, 43.43], [45.0, 46.23], [49.0, 59.56], [63.0, 68.37], [69.0, 74.98], [76.0, 78.19], [79.0, 81.72], [83.0, 83.47], [84.0, 85.46], [87.0, 88.13], [89.0, 90.46], [91.0, 93.02], [94.0, 95.77], [100.0, 100.92], [107.0, 107.54], [111.0, 112.9], [116.0, 117.54], [120.0, 121.78], [125.0, 127.18], [128.0, 129.63], [134.0, 135.89], [138.0, 138.64], [141.0, 144.04]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 81.89, 0.0, 0.0, 0.0, 47.05, 64.52, 56.55, 70.72, 63.64, 0.0, 0.0, 0.0, 0.0, 83.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.19, 0.0, 0.0, 0.0, 59.07], "audiomae_on_audioset": [null, null, null, null, null, [["cello", 34.32], ["music", 17.79], ["bowed string instrument", 12.19]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 43.22], ["sidetone", 21.66], ["hum", 4.95]], null, null, null, null], "duration": [1.26, 2.46, 1.8, 0.43, 1.23, 10.56, 5.37, 5.98, 2.19, 2.72, 0.47, 1.46, 1.13, 1.46, 2.02, 1.77, 0.92, 0.54, 1.9, 1.54, 1.78, 2.18, 1.63, 1.89, 0.64, 3.04]} \ No newline at end of file diff --git a/annotations_filtered/s6pAWtuEIR8_filtered.json b/annotations_filtered/s6pAWtuEIR8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d7496d68cfe8737c25ccafb8e8a3aa9ae12ce30d --- /dev/null +++ b/annotations_filtered/s6pAWtuEIR8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.79], [4.0, 4.38], [5.0, 5.97], [9.0, 12.39], [13.0, 13.78], [17.0, 17.63], [21.0, 22.23], [24.0, 25.96], [27.0, 27.51], [39.0, 39.06], [40.0, 48.91], [50.0, 50.33], [51.0, 51.95], [53.0, 54.26], [63.0, 64.2], [73.0, 73.74], [78.0, 78.58], [81.0, 81.75], [97.0, 98.95], [100.0, 103.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 71.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.81], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 53.81], ["beatboxing", 27.47], ["fart", 2.99]], null, null, null, null, null, null, null, null, [["speech", 19.91], ["hum", 19.21], ["arrow", 12.62]]], "duration": [1.79, 0.38, 0.97, 3.39, 0.78, 0.63, 1.23, 1.96, 0.51, 0.06, 8.91, 0.33, 0.95, 1.26, 1.2, 0.74, 0.58, 0.75, 1.95, 3.52]} \ No newline at end of file diff --git a/annotations_filtered/s7ougTo-pGg_filtered.json b/annotations_filtered/s7ougTo-pGg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..10e5072149c2a8914c6f6995db0f1d572ae91a70 --- /dev/null +++ b/annotations_filtered/s7ougTo-pGg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.72], [6.0, 7.43], [15.0, 15.43], [17.0, 17.78], [19.0, 20.33], [28.0, 28.78], [33.0, 34.13], [53.0, 53.54], [55.0, 60.93], [62.0, 66.77], [74.0, 74.66], [84.0, 83.67], [88.0, 88.53], [89.0, 107.64], [111.0, 136.17], [139.0, 149.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.02, 34.34, 0.0, 0.0, 0.0, 33.5, 32.91, 43.03], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 51.19], ["sidetone", 21.31], ["electronic music", 4.52]], [["music", 71.47], ["electronic music", 3.16], ["musical instrument", 2.0]], null, null, null, [["music", 43.31], ["cattle, bovinae", 16.24], ["moo", 12.96]], [["music", 67.98], ["electronic music", 6.39], ["cattle, bovinae", 3.07]], [["music", 73.33], ["didgeridoo", 3.37], ["musical instrument", 2.98]]], "duration": [0.72, 1.43, 0.43, 0.78, 1.33, 0.78, 1.13, 0.54, 5.93, 4.77, 0.66, -0.33, 0.53, 18.64, 25.17, 10.37]} \ No newline at end of file diff --git a/annotations_filtered/s8WzJJoKq_4_filtered.json b/annotations_filtered/s8WzJJoKq_4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d081226514e3f4297c4c1e294181718a79156674 --- /dev/null +++ b/annotations_filtered/s8WzJJoKq_4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.98], [4.0, 4.62], [6.0, 6.72], [8.0, 9.88], [11.0, 12.19], [13.0, 14.45], [15.0, 15.55], [16.0, 16.5], [18.0, 18.82], [20.0, 21.27], [23.0, 23.16], [29.0, 29.51], [35.0, 36.56], [43.0, 45.01], [47.0, 47.68], [48.0, 49.15], [51.0, 51.9], [53.0, 54.5], [57.0, 57.91], [59.0, 59.88], [62.0, 63.75], [64.0, 65.04], [70.0, 70.23], [72.0, 74.9], [83.0, 83.2], [101.0, 101.71], [103.0, 104.95], [113.0, 113.32], [116.0, 117.66], [118.0, 119.53], [121.0, 121.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.02, 0.62, 0.72, 1.88, 1.19, 1.45, 0.55, 0.5, 0.82, 1.27, 0.16, 0.51, 1.56, 2.01, 0.68, 1.15, 0.9, 1.5, 0.91, 0.88, 1.75, 1.04, 0.23, 2.9, 0.2, 0.71, 1.95, 0.32, 1.66, 1.53, 0.47]} \ No newline at end of file diff --git a/annotations_filtered/s8cVCsIcGAE_filtered.json b/annotations_filtered/s8cVCsIcGAE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3841a8769336edf6a035a01421ef7969ed6c10ef --- /dev/null +++ b/annotations_filtered/s8cVCsIcGAE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 26.11], [27.0, 27.97], [28.0, 29.52], [30.0, 36.14], [38.0, 45.54], [50.0, 77.38], [80.0, 81.4], [84.0, 85.5], [91.0, 93.53], [99.0, 141.81], [144.0, 148.98]], "keep_status": [false, false, false, true, true, false, false, false, true, false, true], "silence_prob": [30.83, 0.0, 0.0, 29.83, 28.63, 28.65, 0.0, 0.0, 28.39, 0.0, 35.22], "audiomae_on_audioset": [[["hum", 33.73], ["speech", 24.09], ["mains hum", 15.53]], null, null, [["speech", 25.99], ["music", 9.71], ["animal", 6.97]], [["music", 15.29], ["speech", 14.55], ["buzz", 11.2]], [["mains hum", 30.79], ["music", 20.13], ["hum", 19.37]], null, null, [["music", 23.38], ["hum", 17.15], ["throbbing", 12.83]], null, [["music", 44.85], ["hum", 12.76], ["speech", 8.67]]], "duration": [10.11, 0.97, 1.52, 6.14, 7.54, 27.38, 1.4, 1.5, 2.53, 42.81, 4.98]} \ No newline at end of file diff --git a/annotations_filtered/s8hKbzuOAQY_filtered.json b/annotations_filtered/s8hKbzuOAQY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..63728fc0fb586a4efd152268d138a7ce41abf507 --- /dev/null +++ b/annotations_filtered/s8hKbzuOAQY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.31], [9.0, 9.75], [11.0, 10.77], [12.0, 12.63], [17.0, 19.08], [21.0, 21.73], [41.0, 41.22], [42.0, 42.36], [43.0, 44.02], [66.0, 67.37], [69.0, 69.26], [70.0, 70.21], [71.0, 71.81], [74.0, 76.08], [79.0, 79.44], [80.0, 81.6], [82.0, 82.61], [83.0, 83.42], [87.0, 87.39], [113.0, 114.07], [128.0, 128.73], [130.0, 130.13], [130.0, 131.99]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 15.21], ["carnatic music", 8.95], ["speech", 8.75]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.31, 0.75, -0.23, 0.63, 2.08, 0.73, 0.22, 0.36, 1.02, 1.37, 0.26, 0.21, 0.81, 2.08, 0.44, 1.6, 0.61, 0.42, 0.39, 1.07, 0.73, 0.13, 1.99]} \ No newline at end of file diff --git a/annotations_filtered/s8jfw7FxNqA_filtered.json b/annotations_filtered/s8jfw7FxNqA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..39fbac81afed8dde6e0df4576c471bd5fb81fd57 --- /dev/null +++ b/annotations_filtered/s8jfw7FxNqA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[125.0, 125.14], [126.0, 126.39], [127.0, 127.3]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [0.14, 0.39, 0.3]} \ No newline at end of file diff --git a/annotations_filtered/s8tXE43jYho_filtered.json b/annotations_filtered/s8tXE43jYho_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..63dbcf8321b800a76bf0193a03e54adc9ab388d5 --- /dev/null +++ b/annotations_filtered/s8tXE43jYho_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.97], [11.0, 14.18], [17.0, 18.2], [21.0, 23.33], [29.0, 29.02], [32.0, 44.42], [46.0, 48.57], [59.0, 64.37], [66.0, 75.22], [77.0, 84.74], [85.0, 85.02], [86.0, 88.2], [91.0, 91.62], [95.0, 102.9], [106.0, 106.59]], "keep_status": [false, false, false, true, false, false, true, true, false, false, false, true, false, true, false], "silence_prob": [0.0, 99.99, 0.0, 46.33, 0.0, 40.64, 36.55, 45.08, 35.54, 35.13, 0.0, 35.3, 0.0, 36.74, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 44.05], ["musical instrument", 10.29], ["guitar", 3.83]], null, [["music", 54.98], ["theremin", 12.17], ["hum", 5.04]], [["music", 31.45], ["speech", 28.75], ["didgeridoo", 5.0]], [["music", 53.79], ["musical instrument", 7.81], ["hum", 4.57]], [["music", 70.96], ["speech", 14.64], ["effects unit", 1.63]], [["music", 72.67], ["speech", 5.53], ["boing", 4.36]], null, [["speech", 21.59], ["music", 11.57], ["dog", 9.34]], null, [["music", 32.57], ["speech", 15.31], ["guitar", 15.29]], null], "duration": [1.97, 3.18, 1.2, 2.33, 0.02, 12.42, 2.57, 5.37, 9.22, 7.74, 0.02, 2.2, 0.62, 7.9, 0.59]} \ No newline at end of file diff --git a/annotations_filtered/s9FoorJGkrA_filtered.json b/annotations_filtered/s9FoorJGkrA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..12b14cb8f307dd2fb54a34bf592f90e7ccbdfc08 --- /dev/null +++ b/annotations_filtered/s9FoorJGkrA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.0], [12.0, 13.8], [14.0, 14.49], [15.0, 15.3], [16.0, 22.87], [24.0, 24.97], [27.0, 27.36], [29.0, 29.74], [31.0, 31.4], [35.0, 37.64], [38.0, 40.61], [42.0, 43.8], [47.0, 48.44], [49.0, 49.5], [50.0, 49.62], [50.0, 49.98], [51.0, 56.51], [58.0, 64.61], [65.0, 70.01], [72.0, 73.31], [74.0, 97.01], [98.0, 99.2], [104.0, 104.79], [107.0, 107.08], [115.0, 116.65], [121.0, 121.66], [124.0, 124.77], [130.0, 129.78], [133.0, 133.52], [135.0, 135.3], [139.0, 140.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 87.74, 0.0, 0.0, 0.0, 0.0, 97.33, 99.9, 0.0, 0.0, 0.0, 0.0, 0.0, 94.52, 98.66, 98.36, 0.0, 86.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.0, 1.8, 0.49, 0.3, 6.87, 0.97, 0.36, 0.74, 0.4, 2.64, 2.61, 1.8, 1.44, 0.5, -0.38, -0.02, 5.51, 6.61, 5.01, 1.31, 23.01, 1.2, 0.79, 0.08, 1.65, 0.66, 0.77, -0.22, 0.52, 0.3, 1.58]} \ No newline at end of file diff --git a/annotations_filtered/s9IqypZYH6A_filtered.json b/annotations_filtered/s9IqypZYH6A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9295864d812f1fdfa910f7230a321fd151e5015b --- /dev/null +++ b/annotations_filtered/s9IqypZYH6A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.64], [5.0, 4.94], [24.0, 24.14], [33.0, 34.37], [57.0, 57.15], [58.0, 80.15], [83.0, 88.99], [89.0, 90.49], [91.0, 91.72], [105.0, 106.14], [111.0, 111.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 58.72, 100.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [0.64, -0.06, 0.14, 1.37, 0.15, 22.15, 5.99, 1.49, 0.72, 1.14, 0.18]} \ No newline at end of file diff --git a/annotations_filtered/s9JqbCH4aVw_filtered.json b/annotations_filtered/s9JqbCH4aVw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..243653208cc2183b1bfe576ae941b9dac10034e4 --- /dev/null +++ b/annotations_filtered/s9JqbCH4aVw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.43], [13.0, 13.66], [14.0, 15.21], [15.0, 18.0], [19.0, 20.36], [22.0, 22.1], [23.0, 29.69], [30.0, 30.75], [32.0, 33.18], [35.0, 41.82], [42.0, 43.02], [44.0, 46.92], [49.0, 53.23], [54.0, 54.24], [56.0, 56.94], [60.0, 63.24], [64.0, 64.56], [65.0, 65.65], [66.0, 67.12], [69.0, 68.98], [69.0, 71.1], [72.0, 72.25], [74.0, 74.48], [79.0, 81.48], [83.0, 83.79], [85.0, 85.53], [87.0, 90.85], [93.0, 93.14], [95.0, 94.83], [97.0, 98.15], [101.0, 104.3], [107.0, 108.48], [109.0, 110.3], [114.0, 114.76], [115.0, 116.21], [118.0, 118.3], [122.0, 122.62], [124.0, 125.02], [133.0, 133.64], [134.0, 134.15], [134.0, 134.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 54.1, 0.0, 0.0, 42.44, 0.0, 0.0, 61.27, 0.0, 39.85, 38.37, 0.0, 0.0, 32.85, 0.0, 0.0, 0.0, 0.0, 53.1, 0.0, 0.0, 33.76, 0.0, 0.0, 32.78, 0.0, 0.0, 0.0, 97.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 68.39], ["sidetone", 9.4], ["whack, thwack", 2.7]], null, null, null, null, [["music", 33.52], ["musical instrument", 19.71], ["didgeridoo", 6.0]], [["speech", 55.23], ["radio", 38.43], ["telephone", 2.16]], null, null, [["speech", 33.91], ["radio", 30.24], ["sidetone", 21.32]], null, null, null, null, null, null, null, [["fart", 39.27], ["busy signal", 13.63], ["sound effect", 9.34]], null, null, [["moo", 46.84], ["cattle, bovinae", 34.04], ["livestock, farm animals, working animals", 8.68]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.43, 0.66, 1.21, 3.0, 1.36, 0.1, 6.69, 0.75, 1.18, 6.82, 1.02, 2.92, 4.23, 0.24, 0.94, 3.24, 0.56, 0.65, 1.12, -0.02, 2.1, 0.25, 0.48, 2.48, 0.79, 0.53, 3.85, 0.14, -0.17, 1.15, 3.3, 1.48, 1.3, 0.76, 1.21, 0.3, 0.62, 1.02, 0.64, 0.15, 0.33]} \ No newline at end of file diff --git a/annotations_filtered/s9TKR7rSFfA_filtered.json b/annotations_filtered/s9TKR7rSFfA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..83863a81096c0126ce5a686455d25a533343edae --- /dev/null +++ b/annotations_filtered/s9TKR7rSFfA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.86], [4.0, 3.96], [5.0, 6.64], [8.0, 8.82], [10.0, 10.03], [17.0, 19.77], [21.0, 21.61], [22.0, 23.16], [25.0, 25.34], [27.0, 26.67], [28.0, 28.51], [29.0, 33.71], [37.0, 41.99], [44.0, 44.91], [47.0, 47.22], [47.0, 48.98], [51.0, 54.95], [56.0, 56.03], [57.0, 61.79], [63.0, 64.89], [68.0, 69.43], [74.0, 74.55], [76.0, 77.14], [95.0, 94.85], [96.0, 96.6], [98.0, 100.62], [103.0, 103.94], [108.0, 108.11], [108.0, 108.14], [110.0, 115.05], [116.0, 116.28], [118.0, 118.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 62.99, 0.0, 0.0, 0.0, 0.0, 0.0, 77.7, 32.88, 0.0, 0.0, 0.0, 39.08, 0.0, 38.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.75, 0.0, 0.0, 0.0, 83.16, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 24.6], ["noise", 20.02], ["mains hum", 19.38]], null, null, null, [["sidetone", 43.91], ["speech", 27.46], ["hum", 4.22]], null, [["hum", 15.94], ["speech", 15.38], ["mains hum", 12.54]], null, null, null, null, null, null, [["hum", 16.21], ["snicker", 7.6], ["eruption", 6.5]], null, null, null, null, null, null], "duration": [-0.14, -0.04, 1.64, 0.82, 0.03, 2.77, 0.61, 1.16, 0.34, -0.33, 0.51, 4.71, 4.99, 0.91, 0.22, 1.98, 3.95, 0.03, 4.79, 1.89, 1.43, 0.55, 1.14, -0.15, 0.6, 2.62, 0.94, 0.11, 0.14, 5.05, 0.28, 0.34]} \ No newline at end of file diff --git a/annotations_filtered/s9jX0S7mvB8_filtered.json b/annotations_filtered/s9jX0S7mvB8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c41fccd3f1a30cc8328876b4b3d7d5a272464c02 --- /dev/null +++ b/annotations_filtered/s9jX0S7mvB8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.45], [9.0, 9.34], [9.0, 10.99], [11.0, 32.98], [35.0, 37.71], [40.0, 40.9], [45.0, 46.35], [47.0, 52.79], [59.0, 64.25], [66.0, 67.1], [69.0, 69.45], [75.0, 76.71], [77.0, 77.92], [78.0, 80.6], [82.0, 87.05], [90.0, 91.08], [101.0, 104.38], [110.0, 111.62], [114.0, 113.86]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [69.61, 0.0, 0.0, 82.97, 45.52, 0.0, 0.0, 92.97, 82.61, 0.0, 0.0, 0.0, 0.0, 97.0, 95.23, 0.0, 96.54, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["mains hum", 12.07], ["buzz", 9.32], ["rumble", 9.09]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.45, 0.34, 1.99, 21.98, 2.71, 0.9, 1.35, 5.79, 5.25, 1.1, 0.45, 1.71, 0.92, 2.6, 5.05, 1.08, 3.38, 1.62, -0.14]} \ No newline at end of file diff --git a/annotations_filtered/s9k-uO50300_filtered.json b/annotations_filtered/s9k-uO50300_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da291a0f2f412e65b5c535831f86c9de5c4744fd --- /dev/null +++ b/annotations_filtered/s9k-uO50300_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 14.1], [16.0, 18.87], [21.0, 30.4], [32.0, 32.36], [35.0, 37.35], [42.0, 51.46], [52.0, 53.2], [54.0, 63.51], [65.0, 70.21], [71.0, 80.99], [83.0, 91.25], [93.0, 94.88], [97.0, 98.66], [100.0, 100.63], [102.0, 103.11], [105.0, 106.66], [107.0, 109.12], [111.0, 111.72], [113.0, 113.97], [116.0, 125.71], [127.0, 127.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.84, 99.31, 99.82, 0.0, 99.91, 85.35, 0.0, 98.59, 99.99, 99.99, 99.93, 0.0, 0.0, 0.0, 0.0, 0.0, 82.79, 0.0, 0.0, 99.96, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [12.1, 2.87, 9.4, 0.36, 2.35, 9.46, 1.2, 9.51, 5.21, 9.99, 8.25, 1.88, 1.66, 0.63, 1.11, 1.66, 2.12, 0.72, 0.97, 9.71, 0.79]} \ No newline at end of file diff --git a/annotations_filtered/s9nYXJweTPU_filtered.json b/annotations_filtered/s9nYXJweTPU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e0993106213d6f7316d74df39ae88d08f76c9adc --- /dev/null +++ b/annotations_filtered/s9nYXJweTPU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.16], [16.0, 16.63], [28.0, 30.06], [35.0, 42.48], [43.0, 73.09], [74.0, 78.07], [79.0, 93.8], [94.0, 95.71], [104.0, 105.12], [106.0, 106.88], [118.0, 119.8], [127.0, 126.91], [130.0, 130.35], [135.0, 136.0], [138.0, 139.63], [142.0, 142.2], [147.0, 148.9], [164.0, 166.08], [167.0, 169.01], [170.0, 171.49], [173.0, 174.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [88.46, 0.0, 94.95, 85.54, 0.0, 100.0, 75.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.86, 99.65, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.16, 0.63, 2.06, 7.48, 30.09, 4.07, 14.8, 1.71, 1.12, 0.88, 1.8, -0.09, 0.35, 1.0, 1.63, 0.2, 1.9, 2.08, 2.01, 1.49, 1.77]} \ No newline at end of file diff --git a/annotations_filtered/s9prJba2vkw_filtered.json b/annotations_filtered/s9prJba2vkw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3df13a9e2d9965fc594b302cee3627d7cd0cd11c --- /dev/null +++ b/annotations_filtered/s9prJba2vkw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.18], [44.0, 46.52], [47.0, 48.07], [49.0, 51.85], [62.0, 63.39], [64.0, 65.55], [73.0, 73.06], [73.0, 74.24], [79.0, 79.46], [82.0, 83.07], [94.0, 94.31], [102.0, 102.98], [113.0, 113.31], [117.0, 119.15], [120.0, 120.14], [122.0, 122.47], [124.0, 124.16], [125.0, 126.91], [136.0, 136.73], [137.0, 137.83], [140.0, 139.97], [147.0, 149.57], [152.0, 154.41], [155.0, 156.81], [158.0, 159.39], [160.0, 161.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 51.94, 0.0, 99.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.18, 2.52, 1.07, 2.85, 1.39, 1.55, 0.06, 1.24, 0.46, 1.07, 0.31, 0.98, 0.31, 2.15, 0.14, 0.47, 0.16, 1.91, 0.73, 0.83, -0.03, 2.57, 2.41, 1.81, 1.39, 1.87]} \ No newline at end of file diff --git a/annotations_filtered/sA0SngAZcdA_filtered.json b/annotations_filtered/sA0SngAZcdA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b5c305dc69c1c786b39e0a4f746ae15733bdbc88 --- /dev/null +++ b/annotations_filtered/sA0SngAZcdA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.91], [8.0, 10.77], [14.0, 27.73], [30.0, 30.48], [33.0, 35.02], [35.0, 35.99], [43.0, 43.78], [45.0, 45.59], [57.0, 57.72], [62.0, 68.17], [70.0, 70.98], [76.0, 77.55], [79.0, 78.88], [80.0, 87.0], [88.0, 93.95]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [75.55, 97.92, 47.16, 0.0, 35.46, 0.0, 0.0, 0.0, 0.0, 82.25, 0.0, 0.0, 0.0, 92.8, 58.55], "audiomae_on_audioset": [null, null, [["music", 60.24], ["speech", 10.98], ["hum", 2.03]], null, [["speech", 31.56], ["music", 5.78], ["radio", 5.01]], null, null, null, null, null, null, null, null, null, null], "duration": [2.91, 2.77, 13.73, 0.48, 2.02, 0.99, 0.78, 0.59, 0.72, 6.17, 0.98, 1.55, -0.12, 7.0, 5.95]} \ No newline at end of file diff --git a/annotations_filtered/sAO0owc4xeY_filtered.json b/annotations_filtered/sAO0owc4xeY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c6883e6b3af5b7a0f70bb76423e11dc7e0d31028 --- /dev/null +++ b/annotations_filtered/sAO0owc4xeY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.4], [3.0, 3.3], [15.0, 16.6], [18.0, 18.84], [20.0, 27.11], [27.0, 27.48], [28.0, 27.72], [29.0, 39.8], [43.0, 44.64], [48.0, 48.14], [49.0, 49.96], [51.0, 51.53], [52.0, 56.93], [58.0, 57.94], [58.0, 58.01], [58.0, 58.68], [59.0, 59.9], [61.0, 61.7], [62.0, 63.68], [65.0, 66.7], [68.0, 68.5], [69.0, 69.63], [74.0, 75.05], [77.0, 77.23], [80.0, 80.77], [84.0, 85.01], [86.0, 87.66], [89.0, 90.17], [91.0, 91.13], [92.0, 93.92], [95.0, 98.2], [98.0, 99.17], [103.0, 104.63], [107.0, 113.53], [114.0, 114.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 63.42, 0.0, 0.0, 39.57, 0.0, 0.0, 0.0, 0.0, 34.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.45, 0.0, 0.0, 54.76, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["mains hum", 31.43], ["hum", 26.06], ["speech", 14.7]], null, null, null, null, [["fly, housefly", 43.74], ["insect", 30.0], ["bee, wasp, etc.", 17.96]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.4, 0.3, 1.6, 0.84, 7.11, 0.48, -0.28, 10.8, 1.64, 0.14, 0.96, 0.53, 4.93, -0.06, 0.01, 0.68, 0.9, 0.7, 1.68, 1.7, 0.5, 0.63, 1.05, 0.23, 0.77, 1.01, 1.66, 1.17, 0.13, 1.92, 3.2, 1.17, 1.63, 6.53, 0.98]} \ No newline at end of file diff --git a/annotations_filtered/sAgSUFT4cVk_filtered.json b/annotations_filtered/sAgSUFT4cVk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6a517adb06042a6d7cbc1c7fec337df76da0a699 --- /dev/null +++ b/annotations_filtered/sAgSUFT4cVk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.82], [11.0, 10.86], [11.0, 12.12], [13.0, 14.25], [16.0, 16.53], [17.0, 17.93], [26.0, 27.26], [28.0, 29.88], [30.0, 32.59], [35.0, 38.5], [40.0, 40.22], [41.0, 42.25], [44.0, 43.7], [44.0, 48.27], [52.0, 52.15], [55.0, 56.47], [58.0, 58.38], [60.0, 60.45], [63.0, 63.36], [64.0, 64.76], [67.0, 68.71], [72.0, 72.28], [73.0, 75.84], [77.0, 78.83], [83.0, 85.08], [87.0, 90.1], [95.0, 95.32], [96.0, 99.08], [106.0, 106.68], [111.0, 112.16], [115.0, 116.14], [118.0, 118.56], [122.0, 124.02], [127.0, 130.08]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, false, true, false, false, false, false, false, false, false, false, true, false, true, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.4, 39.46, 0.0, 0.0, 0.0, 35.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.07, 0.0, 31.65, 32.11, 0.0, 31.88, 0.0, 0.0, 0.0, 0.0, 28.75, 28.69], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["chirp tone", 32.5], ["music", 29.29], ["sine wave", 5.79]], [["music", 35.3], ["throbbing", 17.31], ["hum", 15.29]], null, null, null, [["throbbing", 21.85], ["music", 18.79], ["hum", 13.32]], null, null, null, null, null, null, null, null, [["music", 21.31], ["throbbing", 14.33], ["hum", 12.79]], null, [["sidetone", 32.15], ["music", 25.56], ["speech", 6.59]], [["sidetone", 35.96], ["music", 27.47], ["speech", 15.7]], null, [["music", 41.44], ["synthesizer", 11.2], ["hum", 10.06]], null, null, null, null, [["music", 48.08], ["hum", 13.82], ["electronic music", 11.85]], [["music", 48.21], ["hum", 10.34], ["throbbing", 5.62]]], "duration": [0.82, -0.14, 1.12, 1.25, 0.53, 0.93, 1.26, 1.88, 2.59, 3.5, 0.22, 1.25, -0.3, 4.27, 0.15, 1.47, 0.38, 0.45, 0.36, 0.76, 1.71, 0.28, 2.84, 1.83, 2.08, 3.1, 0.32, 3.08, 0.68, 1.16, 1.14, 0.56, 2.02, 3.08]} \ No newline at end of file diff --git a/annotations_filtered/sAtsZPmjExo_filtered.json b/annotations_filtered/sAtsZPmjExo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..046cc335a07982b979486650f503fb34f1408866 --- /dev/null +++ b/annotations_filtered/sAtsZPmjExo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.83], [9.0, 9.54], [13.0, 14.39], [21.0, 20.82], [41.0, 45.89], [51.0, 51.38], [54.0, 54.8], [56.0, 61.72], [65.0, 68.08], [70.0, 70.93], [83.0, 83.29], [88.0, 88.1], [88.0, 89.23], [91.0, 92.57], [93.0, 92.8], [93.0, 92.87], [93.0, 93.34], [104.0, 103.94], [112.0, 115.43], [117.0, 117.66], [119.0, 119.53], [121.0, 129.74], [133.0, 143.02], [148.0, 149.28], [152.0, 158.03]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 29.98, 0.0, 0.0, 31.6, 40.06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.97, 0.0, 0.0, 48.78, 38.58, 0.0, 32.15], "audiomae_on_audioset": [null, null, null, null, [["cattle, bovinae", 42.48], ["moo", 31.37], ["livestock, farm animals, working animals", 25.5]], null, null, [["speech", 67.01], ["explosion", 10.66], ["music", 9.76]], [["music", 32.0], ["hum", 11.0], ["synthesizer", 7.92]], null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 58.91], ["throbbing", 16.53], ["music", 12.77]], [["hum", 35.28], ["mains hum", 22.49], ["throbbing", 7.91]], null, [["speech", 85.0], ["vehicle", 2.88], ["car", 2.13]]], "duration": [-0.17, 0.54, 1.39, -0.18, 4.89, 0.38, 0.8, 5.72, 3.08, 0.93, 0.29, 0.1, 1.23, 1.57, -0.2, -0.13, 0.34, -0.06, 3.43, 0.66, 0.53, 8.74, 10.02, 1.28, 6.03]} \ No newline at end of file diff --git a/annotations_filtered/sAvGdule3fA_filtered.json b/annotations_filtered/sAvGdule3fA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef0b1094eaf27534549dda360e2ab5c7a57d96de --- /dev/null +++ b/annotations_filtered/sAvGdule3fA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.89], [13.0, 13.71], [14.0, 14.32], [15.0, 18.52], [19.0, 20.63], [21.0, 22.74], [25.0, 27.75], [28.0, 28.92], [29.0, 30.87], [32.0, 32.32], [33.0, 33.13], [34.0, 38.47], [39.0, 41.89], [42.0, 43.8], [45.0, 46.16], [47.0, 50.3], [51.0, 53.82], [55.0, 56.07], [57.0, 63.29], [64.0, 65.21], [66.0, 68.79], [69.0, 70.92], [73.0, 73.99], [75.0, 76.11], [77.0, 79.71], [80.0, 81.65], [83.0, 85.9], [87.0, 87.42], [88.0, 87.79], [89.0, 90.29], [91.0, 93.31], [95.0, 94.93], [98.0, 101.6], [105.0, 105.19], [109.0, 113.07], [115.0, 115.3], [116.0, 123.06], [125.0, 128.49], [129.0, 134.5], [135.0, 135.3], [136.0, 137.24], [138.0, 138.82], [140.0, 140.63], [141.0, 150.08], [153.0, 155.31], [157.0, 157.67], [161.0, 162.35], [163.0, 164.96], [166.0, 166.97], [168.0, 169.97], [171.0, 171.96], [173.0, 173.21], [177.0, 184.1], [186.0, 188.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 78.21, 0.0, 0.0, 86.82, 0.0, 0.0, 0.0, 0.0, 87.19, 83.88, 0.0, 0.0, 75.88, 76.86, 0.0, 50.06, 0.0, 53.65, 0.0, 0.0, 0.0, 86.09, 0.0, 64.18, 0.0, 0.0, 0.0, 61.57, 0.0, 53.47, 0.0, 40.38, 0.0, 50.97, 42.33, 39.38, 0.0, 0.0, 0.0, 0.0, 39.94, 47.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.52, 37.26], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 36.88], ["music", 22.37], ["hum", 13.93]], null, null, [["music", 26.15], ["organ", 13.49], ["musical instrument", 10.53]], [["music", 49.68], ["theremin", 12.61], ["musical instrument", 5.17]], null, null, null, null, [["music", 43.83], ["speech", 24.39], ["foghorn", 13.96]], [["music", 27.07], ["hum", 8.67], ["mains hum", 8.54]], null, null, null, null, null, null, null, [["music", 45.96], ["theremin", 24.0], ["foghorn", 5.16]], [["music", 56.38], ["didgeridoo", 21.33], ["theremin", 4.84]]], "duration": [0.89, 0.71, 0.32, 3.52, 1.63, 1.74, 2.75, 0.92, 1.87, 0.32, 0.13, 4.47, 2.89, 1.8, 1.16, 3.3, 2.82, 1.07, 6.29, 1.21, 2.79, 1.92, 0.99, 1.11, 2.71, 1.65, 2.9, 0.42, -0.21, 1.29, 2.31, -0.07, 3.6, 0.19, 4.07, 0.3, 7.06, 3.49, 5.5, 0.3, 1.24, 0.82, 0.63, 9.08, 2.31, 0.67, 1.35, 1.96, 0.97, 1.97, 0.96, 0.21, 7.1, 2.5]} \ No newline at end of file diff --git a/annotations_filtered/sAwwDhNJJO0_filtered.json b/annotations_filtered/sAwwDhNJJO0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/sAwwDhNJJO0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/sBDEE3_Z-cw_filtered.json b/annotations_filtered/sBDEE3_Z-cw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..68fe845530d33cb210b31ae54f3cf6a18b6775c4 --- /dev/null +++ b/annotations_filtered/sBDEE3_Z-cw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 24.19], [32.0, 32.32], [38.0, 38.26], [41.0, 53.55], [58.0, 65.31]], "keep_status": [false, false, false, false, true], "silence_prob": [35.27, 0.0, 0.0, 32.05, 30.39], "audiomae_on_audioset": [[["music", 59.11], ["electronic music", 9.5], ["throbbing", 4.21]], null, null, [["music", 71.58], ["electronic music", 6.18], ["throbbing", 4.55]], [["music", 42.77], ["vehicle", 8.21], ["car", 7.75]]], "duration": [2.19, 0.32, 0.26, 12.55, 7.31]} \ No newline at end of file diff --git a/annotations_filtered/sBJ2jguXBes_filtered.json b/annotations_filtered/sBJ2jguXBes_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bf9c9acd0f19e11265b89b576772ea51fa7788c1 --- /dev/null +++ b/annotations_filtered/sBJ2jguXBes_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 33.81], [34.0, 88.01], [88.0, 91.1], [92.0, 94.95], [97.0, 107.08], [110.0, 109.98], [112.0, 116.67], [118.0, 118.67], [119.0, 120.26]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 52.1, 58.3, 41.09, 0.0, 95.91, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["hum", 30.95], ["mains hum", 26.99], ["rumble", 12.71]], null, null, null, null], "duration": [1.81, 54.01, 3.1, 2.95, 10.08, -0.02, 4.67, 0.67, 1.26]} \ No newline at end of file diff --git a/annotations_filtered/sBSibz9xdic_filtered.json b/annotations_filtered/sBSibz9xdic_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..55f5150522772314dd8018009976f376f1e22e68 --- /dev/null +++ b/annotations_filtered/sBSibz9xdic_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 13.85], [21.0, 21.59], [22.0, 22.65], [23.0, 23.79], [27.0, 27.72], [31.0, 39.82], [41.0, 41.64], [42.0, 41.82], [42.0, 42.08], [42.0, 42.89], [54.0, 54.43], [57.0, 60.4], [64.0, 64.74], [78.0, 78.81], [84.0, 84.59], [86.0, 86.49], [87.0, 86.98], [87.0, 88.8], [89.0, 90.04], [94.0, 96.18], [97.0, 97.9], [100.0, 104.48], [108.0, 108.92], [110.0, 110.35], [112.0, 112.29], [114.0, 116.77], [125.0, 125.31]], "keep_status": [true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false], "silence_prob": [44.72, 0.0, 0.0, 0.0, 0.0, 43.08, 0.0, 0.0, 0.0, 0.0, 0.0, 35.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.85, 0.0, 39.18, 0.0, 0.0, 0.0, 32.23, 0.0], "audiomae_on_audioset": [[["speech", 35.59], ["animal", 11.54], ["whale vocalization", 9.97]], null, null, null, null, [["speech", 49.74], ["radio", 13.34], ["explosion", 5.0]], null, null, null, null, null, [["speech", 52.25], ["boing", 18.69], ["clang", 4.31]], null, null, null, null, null, null, null, null, null, [["mains hum", 32.31], ["hum", 25.72], ["fly, housefly", 9.72]], null, null, null, [["whale vocalization", 38.64], ["howl", 10.18], ["animal", 8.33]], null], "duration": [12.85, 0.59, 0.65, 0.79, 0.72, 8.82, 0.64, -0.18, 0.08, 0.89, 0.43, 3.4, 0.74, 0.81, 0.59, 0.49, -0.02, 1.8, 1.04, 2.18, 0.9, 4.48, 0.92, 0.35, 0.29, 2.77, 0.31]} \ No newline at end of file diff --git a/annotations_filtered/sBjNpZ5t9S4_filtered.json b/annotations_filtered/sBjNpZ5t9S4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b9e2a0c7023e12a450903540da11301e3af7c182 --- /dev/null +++ b/annotations_filtered/sBjNpZ5t9S4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.77], [15.0, 17.1], [18.0, 18.59], [21.0, 21.37], [30.0, 34.96], [44.0, 48.27], [56.0, 56.12], [64.0, 65.3], [68.0, 71.85], [79.0, 80.45], [81.0, 81.03], [83.0, 87.27]], "keep_status": [false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 0.0, 46.4, 42.19, 0.0, 0.0, 100.0, 0.0, 0.0, 97.43], "audiomae_on_audioset": [null, null, null, null, [["noise", 13.4], ["groan", 9.5], ["sound effect", 8.07]], [["gong", 42.12], ["music", 14.76], ["chirp tone", 9.12]], null, null, null, null, null, null], "duration": [1.77, 2.1, 0.59, 0.37, 4.96, 4.27, 0.12, 1.3, 3.85, 1.45, 0.03, 4.27]} \ No newline at end of file diff --git a/annotations_filtered/sC78ImgOLQI_filtered.json b/annotations_filtered/sC78ImgOLQI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d0162137acdf68374897c1e991f85912f54531a4 --- /dev/null +++ b/annotations_filtered/sC78ImgOLQI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.23], [4.0, 5.36], [14.0, 13.91], [17.0, 17.14], [18.0, 18.27], [19.0, 50.58], [54.0, 56.03], [57.0, 58.99], [60.0, 60.69], [62.0, 65.8], [67.0, 68.37], [69.0, 70.75], [72.0, 72.47], [73.0, 74.28], [75.0, 82.43], [83.0, 98.1], [98.0, 98.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.46, 0.0, 0.0, 67.25, 0.0, 0.0, 0.0, 0.0, 34.06, 32.06, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 19.53], ["music", 15.96], ["synthesizer", 9.49]], [["music", 25.2], ["synthesizer", 11.78], ["speech", 11.25]], null], "duration": [0.23, 1.36, -0.09, 0.14, 0.27, 31.58, 2.03, 1.99, 0.69, 3.8, 1.37, 1.75, 0.47, 1.28, 7.43, 15.1, 0.9]} \ No newline at end of file diff --git a/annotations_filtered/sCG88QHentc_filtered.json b/annotations_filtered/sCG88QHentc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..74421b5097ff59d1e927c3540caf34c2796b2a3a --- /dev/null +++ b/annotations_filtered/sCG88QHentc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.99], [15.0, 15.77], [24.0, 25.42], [32.0, 32.36], [33.0, 33.84], [35.0, 35.68], [38.0, 38.77], [41.0, 42.74], [44.0, 43.98], [70.0, 70.31], [71.0, 71.36], [73.0, 81.21], [84.0, 84.65], [91.0, 91.91], [94.0, 93.9], [100.0, 101.06], [115.0, 115.75], [122.0, 122.91], [124.0, 125.02], [126.0, 127.97], [129.0, 128.71], [134.0, 134.03], [136.0, 135.97], [153.0, 152.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.99, 0.77, 1.42, 0.36, 0.84, 0.68, 0.77, 1.74, -0.02, 0.31, 0.36, 8.21, 0.65, 0.91, -0.1, 1.06, 0.75, 0.91, 1.02, 1.97, -0.29, 0.03, -0.03, -0.34]} \ No newline at end of file diff --git a/annotations_filtered/sCJ_SlkCT_o_filtered.json b/annotations_filtered/sCJ_SlkCT_o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0b00a6aef8ce20cc0e7a0e78d31eb515445dbbbb --- /dev/null +++ b/annotations_filtered/sCJ_SlkCT_o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.93], [3.0, 4.46], [7.0, 25.3], [26.0, 34.97], [36.0, 37.52], [38.0, 38.43], [40.0, 61.64], [66.0, 66.41], [71.0, 70.78], [71.0, 71.95], [73.0, 75.49], [76.0, 83.74], [85.0, 85.26], [86.0, 85.78], [92.0, 92.48], [97.0, 99.32], [116.0, 118.47], [121.0, 136.75], [138.0, 137.84]], "keep_status": [false, false, true, true, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 37.27, 31.83, 0.0, 0.0, 37.19, 0.0, 0.0, 0.0, 37.99, 38.72, 0.0, 0.0, 0.0, 83.7, 38.16, 38.78, 0.0], "audiomae_on_audioset": [null, null, [["music", 24.96], ["speech", 19.22], ["cattle, bovinae", 7.63]], [["music", 32.54], ["didgeridoo", 16.44], ["boing", 14.59]], null, null, [["moo", 28.02], ["cattle, bovinae", 22.96], ["livestock, farm animals, working animals", 15.92]], null, null, null, [["cattle, bovinae", 44.99], ["moo", 27.31], ["livestock, farm animals, working animals", 23.35]], [["moo", 32.73], ["cattle, bovinae", 32.13], ["livestock, farm animals, working animals", 31.91]], null, null, null, null, [["groan", 29.55], ["speech", 21.77], ["livestock, farm animals, working animals", 13.47]], [["music", 56.97], ["didgeridoo", 25.97], ["musical instrument", 4.01]], null], "duration": [0.93, 1.46, 18.3, 8.97, 1.52, 0.43, 21.64, 0.41, -0.22, 0.95, 2.49, 7.74, 0.26, -0.22, 0.48, 2.32, 2.47, 15.75, -0.16]} \ No newline at end of file diff --git a/annotations_filtered/sCSTQpBwqqs_filtered.json b/annotations_filtered/sCSTQpBwqqs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e41add6143718548ec81e38aafe7e5b849449bf3 --- /dev/null +++ b/annotations_filtered/sCSTQpBwqqs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 42.23], [43.0, 43.95], [44.0, 51.26], [52.0, 53.92], [55.0, 56.34], [57.0, 62.78], [64.0, 79.54], [80.0, 81.67], [82.0, 92.33], [93.0, 96.52], [98.0, 103.44], [104.0, 108.48], [119.0, 119.35], [122.0, 124.75], [125.0, 127.87]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, true, false, false, false], "silence_prob": [67.38, 0.0, 88.1, 0.0, 0.0, 71.14, 34.48, 0.0, 46.68, 53.65, 49.5, 37.85, 0.0, 55.6, 47.54], "audiomae_on_audioset": [null, null, null, null, null, null, [["hum", 47.87], ["mains hum", 19.15], ["music", 5.57]], null, [["insect", 40.43], ["animal", 7.48], ["fly, housefly", 6.62]], null, [["fly, housefly", 12.96], ["fireworks", 12.49], ["insect", 11.83]], [["speech", 39.45], ["explosion", 9.48], ["whack, thwack", 4.39]], null, null, [["fly, housefly", 34.31], ["insect", 29.96], ["speech", 10.47]]], "duration": [26.23, 0.95, 7.26, 1.92, 1.34, 5.78, 15.54, 1.67, 10.33, 3.52, 5.44, 4.48, 0.35, 2.75, 2.87]} \ No newline at end of file diff --git a/annotations_filtered/sCiErOySQtA_filtered.json b/annotations_filtered/sCiErOySQtA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f75622c82aec085bc5b22ad1dc7b9a3bf6c7109 --- /dev/null +++ b/annotations_filtered/sCiErOySQtA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.73], [10.0, 10.4], [12.0, 12.16], [13.0, 29.81], [31.0, 32.75], [34.0, 38.82], [44.0, 43.98], [46.0, 46.2], [46.0, 46.57], [51.0, 54.28], [56.0, 60.62], [63.0, 67.86], [69.0, 76.57], [79.0, 84.35], [86.0, 108.01], [111.0, 122.91]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 40.11, 0.0, 73.82, 0.0, 0.0, 0.0, 43.58, 37.03, 55.11, 41.72, 83.88, 46.83, 95.91], "audiomae_on_audioset": [null, null, null, [["mains hum", 53.62], ["hum", 29.38], ["sidetone", 4.54]], null, null, null, null, null, [["dog", 16.06], ["bow-wow", 10.78], ["domestic animals, pets", 8.75]], [["speech", 44.01], ["hum", 7.69], ["fly, housefly", 7.56]], null, [["hum", 29.18], ["speech", 23.12], ["mains hum", 9.82]], null, [["hum", 34.61], ["mains hum", 18.08], ["fart", 7.56]], null], "duration": [0.73, 0.4, 0.16, 16.81, 1.75, 4.82, -0.02, 0.2, 0.57, 3.28, 4.62, 4.86, 7.57, 5.35, 22.01, 11.91]} \ No newline at end of file diff --git a/annotations_filtered/sCr9YZRDsJA_filtered.json b/annotations_filtered/sCr9YZRDsJA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad652c67a4e6e37c9333b62603c656dbad018c7e --- /dev/null +++ b/annotations_filtered/sCr9YZRDsJA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.45], [8.0, 8.92], [17.0, 17.98], [24.0, 25.69], [30.0, 30.0], [39.0, 39.39], [50.0, 50.55], [54.0, 54.36], [67.0, 74.36], [77.0, 77.7], [78.0, 79.62], [104.0, 104.8], [106.0, 106.1], [111.0, 115.48], [126.0, 127.31], [130.0, 131.14], [133.0, 133.76], [134.0, 135.72], [137.0, 146.38], [147.0, 148.09], [153.0, 155.01], [157.0, 160.3], [164.0, 164.73], [165.0, 174.8], [182.0, 182.63], [184.0, 208.94], [210.0, 213.17], [213.0, 213.34], [213.0, 213.44], [213.0, 213.61], [214.0, 224.34], [231.0, 232.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.51, 0.0, 0.0, 0.0, 0.0, 50.02, 0.0, 0.0, 0.0, 0.0, 29.31, 0.0, 30.96, 29.03, 0.0, 29.16, 0.0, 30.16, 29.08, 0.0, 0.0, 0.0, 29.48, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 71.84], ["scratching (performance technique)", 7.11], ["electronic music", 3.47]], null, null, null, null, null, null, null, null, null, [["music", 45.33], ["speech", 39.53], ["didgeridoo", 1.94]], null, [["speech", 62.65], ["vehicle", 6.68], ["boat, water vehicle", 3.47]], [["speech", 61.0], ["music", 9.7], ["vehicle", 3.78]], null, [["speech", 18.11], ["livestock, farm animals, working animals", 10.29], ["cattle, bovinae", 5.84]], null, [["speech", 19.36], ["cattle, bovinae", 12.05], ["music", 11.99]], [["music", 47.37], ["whoosh, swoosh, swish", 4.11], ["whack, thwack", 3.61]], null, null, null, [["sidetone", 21.84], ["throbbing", 20.94], ["music", 20.1]], null], "duration": [0.45, 0.92, 0.98, 1.69, 0.0, 0.39, 0.55, 0.36, 7.36, 0.7, 1.62, 0.8, 0.1, 4.48, 1.31, 1.14, 0.76, 1.72, 9.38, 1.09, 2.01, 3.3, 0.73, 9.8, 0.63, 24.94, 3.17, 0.34, 0.44, 0.61, 10.34, 1.36]} \ No newline at end of file diff --git a/annotations_filtered/sCsMjWjftZs_filtered.json b/annotations_filtered/sCsMjWjftZs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b59c66a6a1aa76ac969f47d244fb83b090e39f60 --- /dev/null +++ b/annotations_filtered/sCsMjWjftZs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.5], [11.0, 11.03], [13.0, 13.95], [18.0, 44.76], [48.0, 52.35], [55.0, 62.65], [63.0, 64.96], [71.0, 79.35], [86.0, 87.52], [88.0, 93.38], [94.0, 95.4], [99.0, 101.56], [103.0, 103.89], [106.0, 107.08], [108.0, 136.7], [137.0, 137.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.27, 64.86, 31.58, 0.0, 33.34, 0.0, 35.67, 0.0, 39.69, 0.0, 0.0, 31.65, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 81.98], ["speech", 1.34], ["musical instrument", 0.95]], null, [["music", 77.15], ["theremin", 5.36], ["musical instrument", 3.72]], null, [["music", 75.62], ["throbbing", 11.71], ["hum", 1.78]], null, [["hum", 36.38], ["music", 22.69], ["mains hum", 15.16]], null, [["music", 42.07], ["foghorn", 14.28], ["speech", 2.25]], null, null, [["music", 70.3], ["scary music", 2.9], ["mains hum", 2.65]], null], "duration": [0.5, 0.03, 0.95, 26.76, 4.35, 7.65, 1.96, 8.35, 1.52, 5.38, 1.4, 2.56, 0.89, 1.08, 28.7, 0.94]} \ No newline at end of file diff --git a/annotations_filtered/sDEWZnPJGRU_filtered.json b/annotations_filtered/sDEWZnPJGRU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef31538318e9f36825d191c5f1d733aa24eeaf40 --- /dev/null +++ b/annotations_filtered/sDEWZnPJGRU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.01], [30.0, 31.51], [33.0, 34.26], [37.0, 45.45], [48.0, 49.23], [49.0, 50.16], [51.0, 56.81], [59.0, 62.26], [71.0, 72.4], [81.0, 83.67], [92.0, 92.97], [94.0, 95.34], [113.0, 115.18], [127.0, 128.14], [131.0, 143.4], [148.0, 155.55], [169.0, 170.26], [171.0, 172.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [51.02, 0.0, 0.0, 33.05, 0.0, 0.0, 32.92, 32.64, 0.0, 31.63, 0.0, 0.0, 36.39, 0.0, 32.3, 31.58, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["fly, housefly", 30.36], ["mosquito", 27.39], ["insect", 16.12]], null, null, [["music", 67.9], ["didgeridoo", 6.38], ["throbbing", 2.29]], [["music", 66.85], ["didgeridoo", 3.94], ["musical instrument", 1.33]], null, [["music", 67.86], ["carnatic music", 5.67], ["chant", 1.92]], null, null, [["music", 83.32], ["electronic music", 1.61], ["throbbing", 1.38]], null, [["music", 65.81], ["musical instrument", 4.78], ["didgeridoo", 3.08]], [["music", 71.31], ["buzz", 4.0], ["mosquito", 2.6]], null, null], "duration": [2.01, 1.51, 1.26, 8.45, 1.23, 1.16, 5.81, 3.26, 1.4, 2.67, 0.97, 1.34, 2.18, 1.14, 12.4, 7.55, 1.26, 1.42]} \ No newline at end of file diff --git a/annotations_filtered/sDsoiCkKuZY_filtered.json b/annotations_filtered/sDsoiCkKuZY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1eec3f8200563276a1600adf3caf49bd39c40687 --- /dev/null +++ b/annotations_filtered/sDsoiCkKuZY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.51], [10.0, 11.18], [33.0, 57.81], [61.0, 61.92], [64.0, 65.15], [66.0, 76.89], [87.0, 95.66], [96.0, 96.8], [99.0, 102.19], [104.0, 104.3], [105.0, 104.99]], "keep_status": [false, false, true, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 32.77, 0.0, 0.0, 38.08, 37.58, 0.0, 42.3, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 25.49], ["didgeridoo", 14.55], ["mosquito", 8.42]], null, null, [["music", 45.5], ["throbbing", 10.0], ["hum", 9.55]], [["music", 59.24], ["theremin", 14.08], ["synthesizer", 3.14]], null, [["music", 50.5], ["speech", 20.11], ["didgeridoo", 12.1]], null, null], "duration": [1.51, 1.18, 24.81, 0.92, 1.15, 10.89, 8.66, 0.8, 3.19, 0.3, -0.01]} \ No newline at end of file diff --git a/annotations_filtered/sEWuVNk2TKA_filtered.json b/annotations_filtered/sEWuVNk2TKA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..717c86dd070877adcfc4bcb9b8f30e732cf5039a --- /dev/null +++ b/annotations_filtered/sEWuVNk2TKA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.76], [12.0, 14.52], [15.0, 15.53], [17.0, 17.61], [19.0, 19.99], [20.0, 20.66], [23.0, 24.44], [27.0, 28.11], [31.0, 32.32], [34.0, 34.47], [36.0, 36.53], [39.0, 39.68], [46.0, 50.99], [52.0, 52.73], [57.0, 57.77], [60.0, 61.35], [66.0, 65.94], [68.0, 68.66], [71.0, 70.93], [75.0, 75.12], [76.0, 76.81], [78.0, 79.02], [83.0, 84.62], [86.0, 87.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [57.56, 82.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.76, 2.52, 0.53, 0.61, 0.99, 0.66, 1.44, 1.11, 1.32, 0.47, 0.53, 0.68, 4.99, 0.73, 0.77, 1.35, -0.06, 0.66, -0.07, 0.12, 0.81, 1.02, 1.62, 1.17]} \ No newline at end of file diff --git a/annotations_filtered/sEXIC0OaQSU_filtered.json b/annotations_filtered/sEXIC0OaQSU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c35909523ee6041946c8e37cff48c909713cfecd --- /dev/null +++ b/annotations_filtered/sEXIC0OaQSU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.11], [5.0, 8.67], [53.0, 53.1]], "keep_status": [false, true, false], "silence_prob": [0.0, 44.75, 0.0], "audiomae_on_audioset": [null, [["speech", 22.32], ["noise", 15.86], ["music", 10.36]], null], "duration": [1.11, 3.67, 0.1]} \ No newline at end of file diff --git a/annotations_filtered/sEnFt6neTu0_filtered.json b/annotations_filtered/sEnFt6neTu0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45d13f518c93cb3999b5fcf3e0b62d863ac0d16e --- /dev/null +++ b/annotations_filtered/sEnFt6neTu0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.07], [7.0, 8.58], [12.0, 13.56], [14.0, 14.96], [20.0, 21.52], [25.0, 25.69], [28.0, 27.77], [29.0, 30.43], [31.0, 33.47], [38.0, 39.77], [48.0, 49.94], [54.0, 55.9], [60.0, 64.18], [66.0, 66.45], [68.0, 68.5], [70.0, 70.53], [72.0, 72.76], [74.0, 76.17], [78.0, 78.48], [80.0, 82.24], [83.0, 86.17], [93.0, 95.37], [98.0, 105.68], [106.0, 106.07], [110.0, 111.35], [114.0, 114.49], [116.0, 116.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false], "silence_prob": [55.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.92, 0.0, 0.0, 0.0, 47.01, 0.0, 0.0, 0.0, 0.0, 59.33, 0.0, 40.57, 40.22, 34.62, 32.26, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["sidetone", 28.9], ["music", 23.99], ["speech", 20.5]], null, null, null, [["music", 52.91], ["speech", 15.02], ["animal", 2.21]], null, null, null, null, null, null, [["music", 37.37], ["speech", 31.11], ["musical instrument", 3.18]], [["music", 67.14], ["speech", 9.58], ["didgeridoo", 2.27]], [["music", 34.57], ["speech", 31.34], ["beatboxing", 3.28]], [["speech", 48.5], ["music", 14.14], ["groan", 6.36]], null, null, null, null], "duration": [3.07, 1.58, 1.56, 0.96, 1.52, 0.69, -0.23, 1.43, 2.47, 1.77, 1.94, 1.9, 4.18, 0.45, 0.5, 0.53, 0.76, 2.17, 0.48, 2.24, 3.17, 2.37, 7.68, 0.07, 1.35, 0.49, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/sF-j-GhV6xw_filtered.json b/annotations_filtered/sF-j-GhV6xw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b72e0c970b91bec56f38827b4648e1bc5ccf636 --- /dev/null +++ b/annotations_filtered/sF-j-GhV6xw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.61], [10.0, 14.62], [17.0, 16.78], [22.0, 23.9], [28.0, 30.52], [32.0, 32.43], [40.0, 40.36], [45.0, 45.54], [51.0, 51.73], [53.0, 54.23], [59.0, 58.77], [62.0, 62.02], [70.0, 70.9], [74.0, 74.53], [75.0, 75.74], [78.0, 79.12], [88.0, 87.98], [91.0, 92.37], [100.0, 102.66], [107.0, 107.15], [112.0, 114.98], [116.0, 116.18], [117.0, 117.96], [132.0, 132.43], [148.0, 149.81], [167.0, 169.69], [172.0, 173.57], [179.0, 187.78], [190.0, 190.56], [191.0, 192.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 36.98, 0.0, 0.0, 81.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.77, 0.0, 53.4, 0.0, 0.0, 0.0, 0.0, 28.85, 0.0, 47.98, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 43.65], ["throbbing", 18.5], ["hum", 8.28]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 30.28], ["hum", 20.33], ["static", 7.34]], null, [["music", 43.74], ["breaking", 15.76], ["buzz", 6.2]], null, null], "duration": [0.61, 4.62, -0.22, 1.9, 2.52, 0.43, 0.36, 0.54, 0.73, 1.23, -0.23, 0.02, 0.9, 0.53, 0.74, 1.12, -0.02, 1.37, 2.66, 0.15, 2.98, 0.18, 0.96, 0.43, 1.81, 2.69, 1.57, 8.78, 0.56, 1.01]} \ No newline at end of file diff --git a/annotations_filtered/sFJmNKLW-2A_filtered.json b/annotations_filtered/sFJmNKLW-2A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48ddf8cac2743907fd1439bffa05f18cc4a08048 --- /dev/null +++ b/annotations_filtered/sFJmNKLW-2A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [4.0, 5.53], [6.0, 6.81], [11.0, 11.08], [12.0, 17.2], [22.0, 22.96], [24.0, 26.91], [29.0, 31.14], [36.0, 41.08], [42.0, 42.65], [50.0, 50.52], [53.0, 53.97], [55.0, 57.43], [59.0, 59.93], [64.0, 65.84], [66.0, 69.97], [72.0, 72.42], [74.0, 75.98], [77.0, 78.61], [82.0, 82.16], [85.0, 86.05], [87.0, 87.93], [90.0, 93.14], [94.0, 99.94], [101.0, 103.81], [105.0, 108.23], [109.0, 110.73], [112.0, 132.61], [135.0, 140.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 82.97, 0.0, 91.64, 82.07, 69.07, 0.0, 0.0, 0.0, 76.04, 0.0, 0.0, 76.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.88, 78.89, 87.19, 52.74, 0.0, 43.1, 76.2], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 54.19], ["speech", 12.14], ["hum", 5.39]], null], "duration": [0.5, 1.53, 0.81, 0.08, 5.2, 0.96, 2.91, 2.14, 5.08, 0.65, 0.52, 0.97, 2.43, 0.93, 1.84, 3.97, 0.42, 1.98, 1.61, 0.16, 1.05, 0.93, 3.14, 5.94, 2.81, 3.23, 1.73, 20.61, 5.61]} \ No newline at end of file diff --git a/annotations_filtered/sFW-yxe13lo_filtered.json b/annotations_filtered/sFW-yxe13lo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b61f474b5fe32fbdd6846034d03dc60f4cd3301 --- /dev/null +++ b/annotations_filtered/sFW-yxe13lo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.64], [4.0, 4.82], [8.0, 8.41], [27.0, 27.45], [28.0, 30.38], [31.0, 33.83], [34.0, 35.36], [36.0, 37.1], [38.0, 39.38], [40.0, 40.86], [43.0, 44.12], [44.0, 45.74], [47.0, 47.24], [48.0, 50.03], [51.0, 52.66], [55.0, 55.81], [60.0, 62.92], [63.0, 64.15], [64.0, 65.58], [67.0, 66.7], [68.0, 68.32], [70.0, 73.85], [76.0, 76.79], [78.0, 78.81], [80.0, 83.98], [85.0, 86.54], [87.0, 97.66], [106.0, 109.16], [110.0, 123.6]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 40.62, 95.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.91, 0.0, 0.0, 78.21, 0.0, 0.0, 0.0, 0.0, 98.93, 0.0, 0.0, 49.0, 0.0, 34.47, 37.02, 31.82], "audiomae_on_audioset": [null, null, null, null, [["moo", 24.55], ["cattle, bovinae", 23.19], ["speech", 12.62]], null, null, null, null, null, null, null, null, [["honk", 33.37], ["goose", 31.17], ["fowl", 6.13]], null, null, null, null, null, null, null, null, null, null, [["speech", 52.71], ["fly, housefly", 2.83], ["whale vocalization", 2.18]], null, [["music", 26.2], ["didgeridoo", 24.86], ["speech", 10.26]], [["sidetone", 23.03], ["speech", 13.08], ["music", 10.14]], [["hum", 33.3], ["throbbing", 13.06], ["buzz", 11.25]]], "duration": [0.64, 0.82, 0.41, 0.45, 2.38, 2.83, 1.36, 1.1, 1.38, 0.86, 1.12, 1.74, 0.24, 2.03, 1.66, 0.81, 2.92, 1.15, 1.58, -0.3, 0.32, 3.85, 0.79, 0.81, 3.98, 1.54, 10.66, 3.16, 13.6]} \ No newline at end of file diff --git a/annotations_filtered/sFW15hEqZQk_filtered.json b/annotations_filtered/sFW15hEqZQk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b4e9ad99e02c28b029bc8a8aa81744c24abae442 --- /dev/null +++ b/annotations_filtered/sFW15hEqZQk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.66], [8.0, 10.32], [12.0, 13.04], [14.0, 15.77], [16.0, 17.96], [22.0, 22.55], [26.0, 27.08], [28.0, 30.3], [37.0, 38.11], [39.0, 40.59], [43.0, 43.73], [45.0, 46.23], [49.0, 50.84], [56.0, 56.39], [59.0, 59.22], [61.0, 62.34], [64.0, 63.75], [64.0, 65.72], [67.0, 71.76], [73.0, 74.9], [78.0, 79.14], [79.0, 80.84], [82.0, 85.6], [86.0, 87.72], [88.0, 89.26], [90.0, 92.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [57.97, 89.54, 0.0, 0.0, 0.0, 0.0, 0.0, 78.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.45, 0.0, 0.0, 0.0, 84.07, 0.0, 0.0, 44.34], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 47.39], ["sine wave", 14.16], ["sidetone", 11.72]]], "duration": [2.66, 2.32, 1.04, 1.77, 1.96, 0.55, 1.08, 2.3, 1.11, 1.59, 0.73, 1.23, 1.84, 0.39, 0.22, 1.34, -0.25, 1.72, 4.76, 1.9, 1.14, 1.84, 3.6, 1.72, 1.26, 2.79]} \ No newline at end of file diff --git a/annotations_filtered/sFjraGFeU-A_filtered.json b/annotations_filtered/sFjraGFeU-A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..91c5b563cfdfd0a249a61b6953e9042a3e12b9c2 --- /dev/null +++ b/annotations_filtered/sFjraGFeU-A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 5.88], [9.0, 9.69], [11.0, 13.41], [19.0, 23.89], [25.0, 27.26], [31.0, 35.33], [39.0, 43.7]], "keep_status": [false, false, false, false, false, true, true], "silence_prob": [36.87, 0.0, 91.13, 36.9, 100.0, 32.38, 40.28], "audiomae_on_audioset": [[["speech", 34.8], ["sidetone", 33.21], ["mains hum", 6.71]], null, null, [["thunk", 62.04], ["mains hum", 10.31], ["hum", 10.17]], null, [["hum", 27.11], ["mains hum", 19.35], ["thunk", 7.0]], [["speech", 21.29], ["insect", 17.98], ["fly, housefly", 10.9]]], "duration": [4.88, 0.69, 2.41, 4.89, 2.26, 4.33, 4.7]} \ No newline at end of file diff --git a/annotations_filtered/sGLXpKnQfSs_filtered.json b/annotations_filtered/sGLXpKnQfSs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e80b84603aa6db98d67d5e16f1bc3671915b3c2c --- /dev/null +++ b/annotations_filtered/sGLXpKnQfSs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 39.09], [40.0, 40.95], [41.0, 41.88], [43.0, 45.59], [55.0, 60.74], [64.0, 84.48], [87.0, 88.84], [92.0, 92.82], [94.0, 122.5], [124.0, 124.46], [125.0, 125.49], [126.0, 126.49], [128.0, 150.3], [151.0, 152.31], [155.0, 155.41], [160.0, 161.65], [163.0, 163.71]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [43.66, 0.0, 0.0, 35.54, 38.58, 33.8, 0.0, 0.0, 33.7, 0.0, 0.0, 0.0, 31.08, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 76.45], ["electronic music", 3.81], ["telephone bell ringing", 3.3]], null, null, [["music", 77.38], ["hum", 2.95], ["throbbing", 2.87]], [["music", 31.4], ["speech", 13.33], ["throbbing", 10.14]], [["music", 45.66], ["speech", 19.73], ["throbbing", 10.39]], null, null, [["music", 69.48], ["didgeridoo", 6.44], ["theremin", 2.3]], null, null, null, [["music", 49.68], ["hum", 9.56], ["cacophony", 6.65]], null, null, null, null], "duration": [28.09, 0.95, 0.88, 2.59, 5.74, 20.48, 1.84, 0.82, 28.5, 0.46, 0.49, 0.49, 22.3, 1.31, 0.41, 1.65, 0.71]} \ No newline at end of file diff --git a/annotations_filtered/sGPeVmnAFAI_filtered.json b/annotations_filtered/sGPeVmnAFAI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..463d84d235352428f15f327c082c6666da0f45af --- /dev/null +++ b/annotations_filtered/sGPeVmnAFAI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.0], [5.0, 6.89], [8.0, 9.63], [13.0, 12.7], [16.0, 16.53], [21.0, 21.88], [23.0, 23.9], [26.0, 26.89], [29.0, 29.78], [33.0, 33.18], [34.0, 35.75], [36.0, 36.07], [38.0, 39.24], [40.0, 39.9], [51.0, 51.8], [53.0, 53.49], [57.0, 57.84], [59.0, 59.54], [61.0, 64.74], [65.0, 66.34], [69.0, 70.44], [71.0, 73.09], [74.0, 77.62], [81.0, 82.29], [83.0, 84.08], [86.0, 87.93], [89.0, 91.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.17, 0.0, 0.0, 53.28, 92.31, 0.0, 0.0, 0.0, 99.62], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.0, 1.89, 1.63, -0.3, 0.53, 0.88, 0.9, 0.89, 0.78, 0.18, 1.75, 0.07, 1.24, -0.1, 0.8, 0.49, 0.84, 0.54, 3.74, 1.34, 1.44, 2.09, 3.62, 1.29, 1.08, 1.93, 2.03]} \ No newline at end of file diff --git a/annotations_filtered/sGuNGXmQZSE_filtered.json b/annotations_filtered/sGuNGXmQZSE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ff3d7fb23c5c0a1de35d0d7534084abeaa736dc3 --- /dev/null +++ b/annotations_filtered/sGuNGXmQZSE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.4], [8.0, 11.35], [13.0, 19.58], [21.0, 21.24], [22.0, 25.61], [28.0, 28.27], [32.0, 33.08], [34.0, 34.05], [41.0, 40.9], [43.0, 45.67], [47.0, 47.97], [50.0, 51.22], [54.0, 54.48], [57.0, 57.91], [58.0, 58.63], [60.0, 60.94], [63.0, 63.81], [65.0, 65.06], [66.0, 65.99], [72.0, 72.71], [81.0, 84.82], [85.0, 86.93], [90.0, 90.41], [91.0, 92.77], [96.0, 97.55], [101.0, 101.07], [104.0, 105.7], [107.0, 107.33], [109.0, 112.46], [115.0, 117.91], [121.0, 131.84], [133.0, 142.62], [143.0, 143.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 84.25, 53.72, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.79, 95.37, 40.34, 58.47, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 64.02], ["theremin", 12.18], ["brass instrument", 4.38]], null, null], "duration": [0.4, 3.35, 6.58, 0.24, 3.61, 0.27, 1.08, 0.05, -0.1, 2.67, 0.97, 1.22, 0.48, 0.91, 0.63, 0.94, 0.81, 0.06, -0.01, 0.71, 3.82, 1.93, 0.41, 1.77, 1.55, 0.07, 1.7, 0.33, 3.46, 2.91, 10.84, 9.62, 0.8]} \ No newline at end of file diff --git a/annotations_filtered/sH8nzHarprc_filtered.json b/annotations_filtered/sH8nzHarprc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..59960ebf078d57878ac674415bbf65104e13c7cd --- /dev/null +++ b/annotations_filtered/sH8nzHarprc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.02], [15.0, 21.84], [27.0, 30.01], [34.0, 34.65], [40.0, 41.59], [43.0, 43.48], [51.0, 51.43], [53.0, 54.16], [61.0, 60.94], [68.0, 70.53], [74.0, 98.68], [102.0, 104.41], [108.0, 111.3], [112.0, 137.59], [140.0, 141.59], [144.0, 145.71], [148.0, 149.05]], "keep_status": [true, false, true, false, false, false, false, false, false, true, true, false, true, false, false, false, false], "silence_prob": [34.44, 33.64, 34.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.4, 28.88, 29.9, 29.07, 28.47, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 28.47], ["hum", 25.11], ["mains hum", 11.25]], [["music", 39.76], ["hum", 25.16], ["throbbing", 13.23]], [["speech", 37.25], ["music", 13.64], ["hum", 4.23]], null, null, null, null, null, null, [["music", 27.06], ["tabla", 11.49], ["carnatic music", 6.39]], [["music", 61.47], ["sound effect", 2.86], ["buzz", 2.78]], [["music", 51.73], ["speech", 23.96], ["buzz", 5.44]], [["music", 46.21], ["speech", 15.24], ["boing", 6.85]], [["music", 49.72], ["speech", 19.7], ["boing", 2.75]], null, null, null], "duration": [4.02, 6.84, 3.01, 0.65, 1.59, 0.48, 0.43, 1.16, -0.06, 2.53, 24.68, 2.41, 3.3, 25.59, 1.59, 1.71, 1.05]} \ No newline at end of file diff --git a/annotations_filtered/sHFXRjwKOG8_filtered.json b/annotations_filtered/sHFXRjwKOG8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3ff767ae84ae32e3653c9c6cab2d2803a259fe1 --- /dev/null +++ b/annotations_filtered/sHFXRjwKOG8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.11], [9.0, 12.26], [15.0, 16.43], [18.0, 21.14], [23.0, 24.66], [25.0, 28.63], [31.0, 31.95], [33.0, 33.18], [50.0, 69.04], [73.0, 81.45], [81.0, 81.48], [81.0, 97.88], [98.0, 103.13], [104.0, 129.93], [132.0, 138.1], [140.0, 149.54], [152.0, 156.44], [157.0, 157.45], [157.0, 159.9]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, true, false, true, false, true, true, false, true], "silence_prob": [65.79, 58.55, 0.0, 81.53, 0.0, 72.31, 0.0, 0.0, 28.45, 27.85, 0.0, 31.63, 49.45, 37.82, 44.07, 28.17, 39.09, 0.0, 49.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["vehicle", 35.45], ["speech", 20.67], ["car", 10.53]], [["vehicle", 42.59], ["car", 23.78], ["skidding", 8.21]], null, [["hum", 26.85], ["music", 22.18], ["mains hum", 15.97]], [["hum", 66.37], ["mains hum", 11.02], ["throbbing", 6.25]], [["music", 37.53], ["hum", 15.04], ["throbbing", 10.88]], [["music", 27.97], ["throbbing", 26.99], ["hum", 17.09]], [["speech", 38.51], ["music", 14.59], ["groan", 4.01]], [["music", 29.5], ["glass", 12.1], ["mains hum", 7.87]], null, [["glass", 15.04], ["cowbell", 11.7], ["breaking", 8.63]]], "duration": [2.11, 3.26, 1.43, 3.14, 1.66, 3.63, 0.95, 0.18, 19.04, 8.45, 0.48, 16.88, 5.13, 25.93, 6.1, 9.54, 4.44, 0.45, 2.9]} \ No newline at end of file diff --git a/annotations_filtered/sHTeguzrPto_filtered.json b/annotations_filtered/sHTeguzrPto_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a04e63c1232743529d3f74fd262ca0e5a330e53e --- /dev/null +++ b/annotations_filtered/sHTeguzrPto_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 47.01], [49.0, 49.27], [49.0, 49.84], [50.0, 50.08], [50.0, 51.19], [52.0, 60.79]], "keep_status": [false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 46.83], "audiomae_on_audioset": [null, null, null, null, null, [["music", 16.84], ["crack", 10.83], ["speech", 9.61]]], "duration": [40.01, 0.27, 0.84, 0.08, 1.19, 8.79]} \ No newline at end of file diff --git a/annotations_filtered/sHt3TElCugg_filtered.json b/annotations_filtered/sHt3TElCugg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e65df76af16fd6ca887e9c5913c93c0c6eb3b7b1 --- /dev/null +++ b/annotations_filtered/sHt3TElCugg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.31], [8.0, 15.38], [19.0, 23.23], [26.0, 25.62], [26.0, 27.13], [28.0, 27.97], [32.0, 46.31], [46.0, 47.26], [48.0, 48.88], [49.0, 71.32], [72.0, 76.3], [80.0, 81.38], [84.0, 89.01], [112.0, 112.45], [113.0, 113.98], [120.0, 119.53], [125.0, 125.71], [132.0, 134.11], [135.0, 135.16], [148.0, 153.96], [156.0, 163.11], [167.0, 166.94], [167.0, 168.0], [175.0, 175.47], [181.0, 181.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, true, false, false, false, false], "silence_prob": [35.41, 32.53, 33.08, 0.0, 0.0, 0.0, 32.86, 0.0, 0.0, 32.71, 36.37, 0.0, 34.22, 0.0, 0.0, 0.0, 0.0, 94.22, 0.0, 32.93, 33.15, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 66.96], ["throbbing", 8.53], ["sampler", 3.94]], [["music", 59.36], ["throbbing", 21.83], ["hum", 2.25]], [["music", 56.97], ["throbbing", 15.5], ["hum", 7.79]], null, null, null, [["music", 67.75], ["throbbing", 11.21], ["electronic music", 5.16]], null, null, [["music", 78.06], ["drum machine", 3.94], ["electronic music", 3.79]], [["music", 71.42], ["electronic music", 6.32], ["drum machine", 4.82]], null, [["music", 56.79], ["throbbing", 5.43], ["electronic music", 3.92]], null, null, null, null, null, null, [["music", 45.62], ["throbbing", 10.06], ["whack, thwack", 4.62]], [["music", 51.33], ["speech", 9.73], ["throbbing", 7.14]], null, null, null, null], "duration": [3.31, 7.38, 4.23, -0.38, 1.13, -0.03, 14.31, 1.26, 0.88, 22.32, 4.3, 1.38, 5.01, 0.45, 0.98, -0.47, 0.71, 2.11, 0.16, 5.96, 7.11, -0.06, 1.0, 0.47, 0.43]} \ No newline at end of file diff --git a/annotations_filtered/sIB8AdUqEqg_filtered.json b/annotations_filtered/sIB8AdUqEqg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1833e864fb150c30b670307b735aa3c7cf3aa7c4 --- /dev/null +++ b/annotations_filtered/sIB8AdUqEqg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 79.49]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [42.49]} \ No newline at end of file diff --git a/annotations_filtered/sIDHrcDf-N0_filtered.json b/annotations_filtered/sIDHrcDf-N0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d680cd37e3df33519a49135b9665e2830a0b319 --- /dev/null +++ b/annotations_filtered/sIDHrcDf-N0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 21.32], [28.0, 33.62], [34.0, 34.45], [35.0, 34.86], [36.0, 37.03], [41.0, 42.06], [43.0, 43.41], [44.0, 45.12], [48.0, 49.22], [50.0, 61.94], [62.0, 62.58], [63.0, 74.28], [77.0, 78.49], [83.0, 83.61], [87.0, 88.59], [90.0, 107.94], [120.0, 121.39], [123.0, 122.91], [126.0, 128.31], [129.0, 130.52], [132.0, 134.96], [138.0, 137.89], [140.0, 182.19]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [28.49, 28.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.26, 0.0, 28.85, 0.0, 0.0, 0.0, 29.03, 0.0, 0.0, 31.23, 0.0, 29.45, 0.0, 0.0], "audiomae_on_audioset": [[["music", 17.49], ["vehicle", 13.44], ["aircraft", 7.85]], [["speech", 34.39], ["music", 23.27], ["vehicle", 6.43]], null, null, null, null, null, null, null, [["music", 47.01], ["throbbing", 30.9], ["hum", 4.46]], null, [["speech", 56.71], ["vehicle", 8.13], ["music", 5.86]], null, null, null, [["music", 68.48], ["speech", 11.66], ["musical instrument", 2.08]], null, null, [["throbbing", 27.21], ["music", 23.48], ["hum", 16.83]], null, [["music", 45.94], ["tuning fork", 10.24], ["ping", 4.57]], null, null], "duration": [19.32, 5.62, 0.45, -0.14, 1.03, 1.06, 0.41, 1.12, 1.22, 11.94, 0.58, 11.28, 1.49, 0.61, 1.59, 17.94, 1.39, -0.09, 2.31, 1.52, 2.96, -0.11, 42.19]} \ No newline at end of file diff --git a/annotations_filtered/sILyPxN_1Dc_filtered.json b/annotations_filtered/sILyPxN_1Dc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..35ffc236df44acbf8e73da9356a86502dd20dd1b --- /dev/null +++ b/annotations_filtered/sILyPxN_1Dc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.73], [16.0, 16.44], [19.0, 20.06], [22.0, 22.67], [47.0, 47.41], [51.0, 50.99], [53.0, 56.24], [58.0, 57.96], [69.0, 71.17], [72.0, 72.59]], "keep_status": [false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.6, 0.0, 73.06, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 46.53], ["animal", 10.62], ["domestic animals, pets", 5.5]], null, null, null], "duration": [0.73, 0.44, 1.06, 0.67, 0.41, -0.01, 3.24, -0.04, 2.17, 0.59]} \ No newline at end of file diff --git a/annotations_filtered/sISJ7r3kERg_filtered.json b/annotations_filtered/sISJ7r3kERg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9150d2c356b09690712d06b7446cbdaa92e4d8bf --- /dev/null +++ b/annotations_filtered/sISJ7r3kERg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 8.13], [8.0, 8.67], [10.0, 20.8], [21.0, 23.8], [25.0, 26.11], [28.0, 28.27], [28.0, 29.76], [30.0, 30.55], [32.0, 32.26], [33.0, 33.12], [33.0, 34.97], [36.0, 36.91], [38.0, 38.53], [42.0, 43.26], [44.0, 45.79], [47.0, 47.8], [48.0, 48.95], [50.0, 49.92], [51.0, 51.58], [54.0, 57.37], [58.0, 58.82], [59.0, 59.58], [60.0, 61.37], [62.0, 63.98], [65.0, 68.67], [70.0, 69.79], [71.0, 71.95], [73.0, 74.6], [75.0, 75.78], [76.0, 76.96], [78.0, 78.56], [79.0, 79.89], [81.0, 82.21], [82.0, 90.98], [96.0, 96.35], [99.0, 99.25], [101.0, 101.46], [102.0, 107.43], [108.0, 108.01], [108.0, 108.46], [109.0, 114.45], [117.0, 117.27], [118.0, 118.44], [121.0, 127.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false], "silence_prob": [92.8, 0.0, 50.31, 98.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.44, 0.0, 0.0, 0.0, 0.0, 51.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.78, 0.0, 0.0, 0.0, 57.56, 0.0, 0.0, 29.87, 0.0, 0.0, 46.61], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 32.18], ["wild animals", 15.1], ["animal", 11.72]], null, null, null, null, null, null, [["livestock, farm animals, working animals", 23.86], ["cattle, bovinae", 20.49], ["moo", 18.08]], null, null, [["theremin", 46.15], ["speech", 20.17], ["music", 4.15]]], "duration": [6.13, 0.67, 10.8, 2.8, 1.11, 0.27, 1.76, 0.55, 0.26, 0.12, 1.97, 0.91, 0.53, 1.26, 1.79, 0.8, 0.95, -0.08, 0.58, 3.37, 0.82, 0.58, 1.37, 1.98, 3.67, -0.21, 0.95, 1.6, 0.78, 0.96, 0.56, 0.89, 1.21, 8.98, 0.35, 0.25, 0.46, 5.43, 0.01, 0.46, 5.45, 0.27, 0.44, 6.23]} \ No newline at end of file diff --git a/annotations_filtered/sIY7BQkbIT8_filtered.json b/annotations_filtered/sIY7BQkbIT8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a784adb5a939532e36570a0ebbb87612e73e93e --- /dev/null +++ b/annotations_filtered/sIY7BQkbIT8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[170.0, 170.87], [171.0, 217.11]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [0.87, 46.11]} \ No newline at end of file diff --git a/annotations_filtered/sIwsArbH5ck_filtered.json b/annotations_filtered/sIwsArbH5ck_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..98f43d29d5ee264972bdba2845891f98a9deeab1 --- /dev/null +++ b/annotations_filtered/sIwsArbH5ck_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.08], [16.0, 15.99], [29.0, 29.83], [30.0, 30.67], [39.0, 42.89], [56.0, 56.13], [57.0, 57.06], [58.0, 58.13], [66.0, 68.76], [69.0, 70.06], [76.0, 77.23], [79.0, 78.98], [81.0, 82.65], [94.0, 95.23], [104.0, 105.11], [106.0, 108.53], [112.0, 114.05], [117.0, 131.19], [134.0, 138.5], [144.0, 144.0], [144.0, 144.48], [154.0, 155.41], [161.0, 168.32]], "keep_status": [false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 36.37, 0.0, 0.0, 0.0, 39.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.49, 36.42, 50.71, 51.77, 0.0, 0.0, 0.0, 53.16], "audiomae_on_audioset": [null, null, null, null, [["hum", 14.7], ["mains hum", 9.27], ["music", 8.79]], null, null, null, [["hum", 13.78], ["throbbing", 10.17], ["music", 9.21]], null, null, null, null, null, null, [["music", 35.43], ["speech", 19.17], ["mains hum", 8.46]], [["speech", 39.01], ["music", 4.02], ["hum", 3.57]], null, null, null, null, null, null], "duration": [1.08, -0.01, 0.83, 0.67, 3.89, 0.13, 0.06, 0.13, 2.76, 1.06, 1.23, -0.02, 1.65, 1.23, 1.11, 2.53, 2.05, 14.19, 4.5, 0.0, 0.48, 1.41, 7.32]} \ No newline at end of file diff --git a/annotations_filtered/sJ9nOmRn6fg_filtered.json b/annotations_filtered/sJ9nOmRn6fg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1db5541670f7f67e8aadb9a894b1bc5d35f11161 --- /dev/null +++ b/annotations_filtered/sJ9nOmRn6fg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.36], [4.0, 6.35], [7.0, 22.91], [24.0, 26.92], [31.0, 40.37], [42.0, 44.9]], "keep_status": [false, false, false, true, false, false], "silence_prob": [0.0, 81.0, 72.01, 49.68, 60.05, 52.68], "audiomae_on_audioset": [null, null, null, [["music", 25.04], ["speech", 7.15], ["musical instrument", 4.74]], null, null], "duration": [0.36, 2.35, 15.91, 2.92, 9.37, 2.9]} \ No newline at end of file diff --git a/annotations_filtered/sJGWczuXzT8_filtered.json b/annotations_filtered/sJGWczuXzT8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7fc0eb91d52d84b3dba263c8f8eac673da7fd17d --- /dev/null +++ b/annotations_filtered/sJGWczuXzT8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.0], [16.0, 19.47], [21.0, 22.72], [24.0, 32.22], [33.0, 34.45], [36.0, 40.0], [46.0, 46.7], [49.0, 51.54], [53.0, 54.19], [56.0, 56.73], [57.0, 56.98], [57.0, 59.41], [59.0, 59.49], [60.0, 61.33], [65.0, 72.03], [74.0, 75.56], [78.0, 91.18], [96.0, 104.41], [110.0, 110.4], [111.0, 114.74], [115.0, 117.49], [126.0, 127.41]], "keep_status": [false, true, false, true, false, true, false, true, false, false, false, false, false, false, true, false, false, false, false, true, true, false], "silence_prob": [31.14, 32.76, 0.0, 30.63, 0.0, 31.94, 0.0, 29.91, 0.0, 0.0, 0.0, 30.17, 0.0, 0.0, 29.32, 0.0, 30.84, 32.44, 0.0, 48.69, 38.45, 0.0], "audiomae_on_audioset": [[["music", 32.83], ["didgeridoo", 26.95], ["speech", 15.39]], [["music", 23.55], ["mains hum", 18.72], ["hum", 16.4]], null, [["speech", 37.73], ["music", 15.94], ["hum", 9.67]], null, [["music", 25.29], ["speech", 15.64], ["fart", 8.08]], null, [["music", 47.79], ["throbbing", 11.36], ["speech", 10.27]], null, null, null, [["speech", 57.16], ["music", 8.88], ["sidetone", 7.79]], null, null, [["speech", 32.39], ["music", 19.95], ["buzz", 11.92]], null, [["music", 67.01], ["throbbing", 10.55], ["hum", 4.89]], [["fly, housefly", 49.78], ["insect", 13.95], ["mosquito", 8.09]], null, [["speech", 29.24], ["music", 21.86], ["whale vocalization", 7.78]], [["speech", 33.12], ["fly, housefly", 12.36], ["sidetone", 11.53]], null], "duration": [5.0, 3.47, 1.72, 8.22, 1.45, 4.0, 0.7, 2.54, 1.19, 0.73, -0.02, 2.41, 0.49, 1.33, 7.03, 1.56, 13.18, 8.41, 0.4, 3.74, 2.49, 1.41]} \ No newline at end of file diff --git a/annotations_filtered/sJU2cz9ytPQ_filtered.json b/annotations_filtered/sJU2cz9ytPQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/sJU2cz9ytPQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/sJsCKwZLztk_filtered.json b/annotations_filtered/sJsCKwZLztk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6273f2e332cff5626340acbc65b67dc45429f85c --- /dev/null +++ b/annotations_filtered/sJsCKwZLztk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.67], [3.0, 3.77], [5.0, 5.78], [9.0, 10.34], [15.0, 14.98], [18.0, 17.74], [18.0, 18.33], [20.0, 21.37], [25.0, 38.67], [42.0, 42.99], [46.0, 47.76], [49.0, 61.62], [63.0, 64.05], [66.0, 68.3], [69.0, 69.63], [73.0, 81.19], [84.0, 84.3], [85.0, 85.7], [103.0, 103.3], [105.0, 106.02], [116.0, 117.39], [122.0, 125.19], [128.0, 129.56], [131.0, 130.77], [131.0, 131.23], [133.0, 134.54], [136.0, 136.93], [140.0, 140.36], [147.0, 147.24], [150.0, 157.99], [158.0, 158.31], [160.0, 161.1], [162.0, 162.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.35, 0.0, 0.0, 78.21, 0.0, 41.48, 0.0, 33.12, 0.0, 0.0, 0.0, 0.0, 0.0, 61.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.52, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 32.17], ["speech", 29.08], ["theremin", 7.56]], null, [["music", 41.97], ["speech", 17.37], ["carnatic music", 12.38]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.33, 0.77, 0.78, 1.34, -0.02, -0.26, 0.33, 1.37, 13.67, 0.99, 1.76, 12.62, 1.05, 2.3, 0.63, 8.19, 0.3, 0.7, 0.3, 1.02, 1.39, 3.19, 1.56, -0.23, 0.23, 1.54, 0.93, 0.36, 0.24, 7.99, 0.31, 1.1, 0.35]} \ No newline at end of file diff --git a/annotations_filtered/sJsHcwZsNnI_filtered.json b/annotations_filtered/sJsHcwZsNnI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f32a7fcd1cfa342a688ff5b2f306b1ebee21869 --- /dev/null +++ b/annotations_filtered/sJsHcwZsNnI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[43.0, 48.17], [54.0, 56.12], [57.0, 61.28], [67.0, 73.55], [74.0, 74.33], [85.0, 85.51], [87.0, 87.91], [90.0, 90.46], [92.0, 96.96], [98.0, 99.08], [107.0, 107.45], [110.0, 134.4], [136.0, 136.14], [137.0, 139.95], [142.0, 151.68]], "keep_status": [false, false, true, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.39, 34.01, 32.56, 30.12, 0.0, 0.0, 0.0, 0.0, 32.25, 0.0, 0.0, 29.92, 0.0, 34.26, 28.82], "audiomae_on_audioset": [[["music", 41.46], ["telephone bell ringing", 23.05], ["telephone", 11.52]], [["music", 68.83], ["throbbing", 7.12], ["hum", 4.33]], [["music", 62.03], ["livestock, farm animals, working animals", 3.53], ["reggae", 3.16]], [["music", 52.1], ["speech", 5.2], ["musical instrument", 4.98]], null, null, null, null, [["music", 70.14], ["theremin", 4.43], ["throbbing", 3.69]], null, null, [["music", 40.71], ["speech", 29.93], ["throbbing", 6.15]], null, [["fly, housefly", 54.67], ["mosquito", 26.49], ["insect", 17.41]], [["music", 46.24], ["speech", 25.16], ["throbbing", 11.91]]], "duration": [5.17, 2.12, 4.28, 6.55, 0.33, 0.51, 0.91, 0.46, 4.96, 1.08, 0.45, 24.4, 0.14, 2.95, 9.68]} \ No newline at end of file diff --git a/annotations_filtered/sJusqH8NxP4_filtered.json b/annotations_filtered/sJusqH8NxP4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..549837242ac66cc5e774758cded3cc028e625fe8 --- /dev/null +++ b/annotations_filtered/sJusqH8NxP4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 26.72], [29.0, 42.45], [46.0, 95.82], [98.0, 97.83], [98.0, 117.76]], "keep_status": [true, false, false, false, false], "silence_prob": [31.62, 30.22, 0.0, 0.0, 31.04], "audiomae_on_audioset": [[["music", 36.76], ["throbbing", 9.2], ["hum", 9.03]], [["mains hum", 42.59], ["hum", 19.27], ["music", 14.92]], null, null, [["music", 61.92], ["throbbing", 10.41], ["hum", 5.77]]], "duration": [13.72, 13.45, 49.82, -0.17, 19.76]} \ No newline at end of file diff --git a/annotations_filtered/sJwgNs3BWYY_filtered.json b/annotations_filtered/sJwgNs3BWYY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8cbeb6e41065bd4558684aa27b6aaaae0a7c9b4c --- /dev/null +++ b/annotations_filtered/sJwgNs3BWYY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.45], [16.0, 16.73], [20.0, 20.56], [25.0, 24.93], [28.0, 28.27], [29.0, 33.22], [34.0, 34.55], [35.0, 36.1], [43.0, 50.19]], "keep_status": [false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 37.66, 0.0, 0.0, 30.07], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 35.06], ["sidetone", 14.04], ["music", 12.7]], null, null, [["music", 31.83], ["animal", 14.56], ["speech", 10.55]]], "duration": [1.45, 0.73, 0.56, -0.07, 0.27, 4.22, 0.55, 1.1, 7.19]} \ No newline at end of file diff --git a/annotations_filtered/sKFlL_G9S0c_filtered.json b/annotations_filtered/sKFlL_G9S0c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a7d672c1c29f3f29fec34bd84f5e493a17293592 --- /dev/null +++ b/annotations_filtered/sKFlL_G9S0c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.29], [7.0, 8.14], [8.0, 23.94], [26.0, 26.76], [31.0, 38.82], [41.0, 45.69], [48.0, 65.08], [81.0, 81.77], [97.0, 97.75], [100.0, 101.06], [104.0, 115.42], [116.0, 124.36]], "keep_status": [false, false, false, false, false, true, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 44.4, 0.0, 32.13, 31.08, 32.37, 0.0, 0.0, 0.0, 31.11, 30.97], "audiomae_on_audioset": [null, null, [["music", 77.14], ["speech", 4.48], ["ambient music", 2.41]], null, [["music", 55.69], ["speech", 15.86], ["synthesizer", 7.08]], [["moo", 25.86], ["cattle, bovinae", 25.13], ["sidetone", 14.1]], [["music", 80.3], ["didgeridoo", 4.8], ["musical instrument", 1.89]], null, null, null, [["music", 26.6], ["buzz", 17.83], ["fly, housefly", 11.73]], [["music", 37.59], ["livestock, farm animals, working animals", 6.5], ["boing", 3.61]]], "duration": [1.29, 1.14, 15.94, 0.76, 7.82, 4.69, 17.08, 0.77, 0.75, 1.06, 11.42, 8.36]} \ No newline at end of file diff --git a/annotations_filtered/sKNAfihSpnk_filtered.json b/annotations_filtered/sKNAfihSpnk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b8c7165dde48fb4f4feb21e2dcb32a23a832c83b --- /dev/null +++ b/annotations_filtered/sKNAfihSpnk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.99], [12.0, 12.06], [13.0, 18.18], [20.0, 21.61], [23.0, 27.95], [29.0, 29.27], [31.0, 32.66], [33.0, 34.05], [35.0, 35.88], [37.0, 37.91], [39.0, 40.46], [44.0, 45.72], [51.0, 52.47], [54.0, 55.02], [57.0, 57.64], [58.0, 58.58], [60.0, 60.57], [69.0, 69.08], [72.0, 75.68], [77.0, 77.38], [78.0, 78.83], [81.0, 95.71], [97.0, 97.44], [101.0, 100.97], [102.0, 106.57], [108.0, 108.6], [109.0, 110.2], [112.0, 113.63], [116.0, 116.09], [118.0, 118.88], [121.0, 122.12], [123.0, 123.74], [127.0, 127.85], [129.0, 129.63]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 55.04, 0.0, 48.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.29, 0.0, 0.0, 91.47, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["telephone", 20.09], ["speech", 16.12], ["fart", 9.88]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.99, 0.06, 5.18, 1.61, 4.95, 0.27, 1.66, 1.05, 0.88, 0.91, 1.46, 1.72, 1.47, 1.02, 0.64, 0.58, 0.57, 0.08, 3.68, 0.38, 0.83, 14.71, 0.44, -0.03, 4.57, 0.6, 1.2, 1.63, 0.09, 0.88, 1.12, 0.74, 0.85, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/sKfQGRwlm9Q_filtered.json b/annotations_filtered/sKfQGRwlm9Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..165e168cab53f1b49e76fa6101c92d5fc03d1b4e --- /dev/null +++ b/annotations_filtered/sKfQGRwlm9Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.62], [8.0, 8.41], [9.0, 9.96], [12.0, 12.56], [13.0, 13.22], [21.0, 22.65], [26.0, 29.86], [31.0, 33.03], [34.0, 34.65], [36.0, 37.15], [38.0, 38.89], [43.0, 43.23], [46.0, 46.5], [47.0, 47.28], [58.0, 58.5], [60.0, 60.67], [62.0, 86.31], [92.0, 93.63], [95.0, 95.18], [97.0, 98.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.73, 99.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.62, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 63.3], ["speech", 17.89], ["musical instrument", 7.2]], null, null, null], "duration": [1.62, 0.41, 0.96, 0.56, 0.22, 1.65, 3.86, 2.03, 0.65, 1.15, 0.89, 0.23, 0.5, 0.28, 0.5, 0.67, 24.31, 1.63, 0.18, 1.46]} \ No newline at end of file diff --git a/annotations_filtered/sKrpl-KBTzQ_filtered.json b/annotations_filtered/sKrpl-KBTzQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..406dcb3a00210846c8bf5ead0bff0eae2c70c641 --- /dev/null +++ b/annotations_filtered/sKrpl-KBTzQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[70.0, 74.51], [76.0, 77.06], [77.0, 77.55], [80.0, 80.4]], "keep_status": [true, false, false, false], "silence_prob": [32.62, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 17.65], ["sidetone", 17.29], ["moo", 10.21]], null, null, null], "duration": [4.51, 1.06, 0.55, 0.4]} \ No newline at end of file diff --git a/annotations_filtered/sKrqOTg_FJY_filtered.json b/annotations_filtered/sKrqOTg_FJY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ecf285ca5e4a603ab92536542cdeac75b082a9a --- /dev/null +++ b/annotations_filtered/sKrqOTg_FJY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 20.58], [23.0, 29.44], [30.0, 31.92], [33.0, 34.37], [36.0, 36.56], [39.0, 40.42], [43.0, 49.11], [51.0, 51.07], [56.0, 67.66], [81.0, 81.94], [85.0, 89.43], [91.0, 91.4], [93.0, 98.15]], "keep_status": [true, false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [31.6, 34.43, 0.0, 0.0, 0.0, 0.0, 31.54, 0.0, 31.96, 0.0, 44.84, 0.0, 87.74], "audiomae_on_audioset": [[["music", 36.39], ["buzz", 11.3], ["fly, housefly", 7.44]], [["fly, housefly", 48.73], ["insect", 32.71], ["mosquito", 7.69]], null, null, null, null, [["music", 67.42], ["speech", 10.27], ["didgeridoo", 1.66]], null, [["music", 19.14], ["cattle, bovinae", 14.26], ["vehicle", 13.42]], null, [["music", 23.43], ["speech", 13.46], ["synthesizer", 9.06]], null, null], "duration": [19.58, 6.44, 1.92, 1.37, 0.56, 1.42, 6.11, 0.07, 11.66, 0.94, 4.43, 0.4, 5.15]} \ No newline at end of file diff --git a/annotations_filtered/sL1b7ZnItoI_filtered.json b/annotations_filtered/sL1b7ZnItoI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..baf5d8c6c6e49e1852ca5d9fde25a815964ecf68 --- /dev/null +++ b/annotations_filtered/sL1b7ZnItoI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 32.59], [33.0, 33.52], [55.0, 57.23], [57.0, 57.35], [57.0, 60.52], [62.0, 63.31], [71.0, 71.83], [73.0, 74.21], [77.0, 78.38], [79.0, 79.59], [80.0, 83.1]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [35.75, 0.0, 51.71, 0.0, 47.08, 0.0, 0.0, 0.0, 0.0, 0.0, 44.09], "audiomae_on_audioset": [[["music", 33.01], ["speech", 22.17], ["boing", 20.18]], null, null, null, [["sidetone", 31.21], ["music", 19.26], ["speech", 14.23]], null, null, null, null, null, [["music", 47.33], ["speech", 19.31], ["throbbing", 6.48]]], "duration": [6.59, 0.52, 2.23, 0.35, 3.52, 1.31, 0.83, 1.21, 1.38, 0.59, 3.1]} \ No newline at end of file diff --git a/annotations_filtered/sL6QJSdqlt0_filtered.json b/annotations_filtered/sL6QJSdqlt0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e72e72c3c28f098c5eea4fbb3347bdc266b817d7 --- /dev/null +++ b/annotations_filtered/sL6QJSdqlt0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 10.25], [11.0, 19.48], [21.0, 26.37], [29.0, 36.14], [38.0, 40.44], [43.0, 50.82], [52.0, 56.0], [58.0, 64.96], [67.0, 68.54], [70.0, 84.6], [87.0, 87.71], [88.0, 89.99], [91.0, 91.57], [92.0, 97.39], [99.0, 103.22], [104.0, 104.94], [106.0, 132.78]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true], "silence_prob": [59.77, 70.86, 58.22, 73.67, 58.22, 51.28, 43.9, 54.83, 0.0, 52.51, 0.0, 0.0, 0.0, 56.4, 44.6, 0.0, 34.19], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 34.46], ["music", 20.24], ["electronic music", 10.8]], null, null, null, null, null, null, null, [["music", 28.21], ["gong", 27.27], ["electronic music", 22.63]], null, [["music", 19.53], ["sine wave", 13.46], ["hum", 12.27]]], "duration": [8.25, 8.48, 5.37, 7.14, 2.44, 7.82, 4.0, 6.96, 1.54, 14.6, 0.71, 1.99, 0.57, 5.39, 4.22, 0.94, 26.78]} \ No newline at end of file diff --git a/annotations_filtered/sL6gDhH7FpE_filtered.json b/annotations_filtered/sL6gDhH7FpE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4dcb7954492e5e3c5065d3ce299c8310a02df9b0 --- /dev/null +++ b/annotations_filtered/sL6gDhH7FpE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.49], [12.0, 15.15], [18.0, 19.94], [28.0, 28.75], [30.0, 30.57], [34.0, 34.28], [36.0, 36.46], [37.0, 37.27], [40.0, 41.64], [43.0, 43.71], [46.0, 47.09], [51.0, 51.26], [54.0, 54.46], [55.0, 55.59], [57.0, 58.6], [87.0, 88.43], [89.0, 90.56], [92.0, 91.79], [94.0, 96.43], [105.0, 105.22], [109.0, 110.42], [113.0, 113.22], [117.0, 117.12], [122.0, 123.65], [134.0, 133.89], [135.0, 135.53], [138.0, 138.75], [139.0, 141.42], [143.0, 146.42], [149.0, 149.82], [151.0, 151.56], [153.0, 154.62], [156.0, 156.91], [159.0, 159.63], [161.0, 161.91], [172.0, 172.23], [174.0, 174.87], [177.0, 177.96], [180.0, 180.89], [190.0, 190.73], [193.0, 193.35], [193.0, 193.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 90.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.39, 47.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 15.62], ["hum", 3.95], ["musical instrument", 3.9]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.49, 3.15, 1.94, 0.75, 0.57, 0.28, 0.46, 0.27, 1.64, 0.71, 1.09, 0.26, 0.46, 0.59, 1.6, 1.43, 1.56, -0.21, 2.43, 0.22, 1.42, 0.22, 0.12, 1.65, -0.11, 0.53, 0.75, 2.42, 3.42, 0.82, 0.56, 1.62, 0.91, 0.63, 0.91, 0.23, 0.87, 0.96, 0.89, 0.73, 0.35, 0.48]} \ No newline at end of file diff --git a/annotations_filtered/sLAan2iZs_Y_filtered.json b/annotations_filtered/sLAan2iZs_Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1dcaf2fbf0c703ad0306aff494a8681de1be9933 --- /dev/null +++ b/annotations_filtered/sLAan2iZs_Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.59], [18.0, 18.76], [19.0, 20.39], [23.0, 23.8], [26.0, 26.13], [33.0, 33.12], [35.0, 36.26], [43.0, 45.71], [49.0, 50.33], [58.0, 58.82], [60.0, 61.57], [64.0, 66.43], [68.0, 68.74], [70.0, 71.74], [73.0, 77.82], [81.0, 82.21], [84.0, 92.55], [93.0, 94.22], [96.0, 97.8]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.01, 0.0, 0.0, 0.0, 94.95, 0.0, 0.0, 97.64, 0.0, 59.33, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["eruption", 16.02], ["noise", 14.39], ["white noise", 9.48]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.59, 0.76, 1.39, 0.8, 0.13, 0.12, 1.26, 2.71, 1.33, 0.82, 1.57, 2.43, 0.74, 1.74, 4.82, 1.21, 8.55, 1.22, 1.8]} \ No newline at end of file diff --git a/annotations_filtered/sLKnt2jBax4_filtered.json b/annotations_filtered/sLKnt2jBax4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aba0825d1a0e8ee11d8a1915ad861715682b20c3 --- /dev/null +++ b/annotations_filtered/sLKnt2jBax4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.18], [14.0, 14.27], [15.0, 15.15], [18.0, 20.51], [24.0, 43.9], [51.0, 51.48], [59.0, 81.18], [82.0, 82.63]], "keep_status": [false, false, false, true, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 33.6, 30.53, 0.0, 32.34, 0.0], "audiomae_on_audioset": [null, null, null, [["cattle, bovinae", 34.2], ["moo", 19.86], ["livestock, farm animals, working animals", 14.82]], [["music", 43.27], ["livestock, farm animals, working animals", 7.78], ["groan", 6.69]], null, [["music", 47.01], ["speech", 7.42], ["livestock, farm animals, working animals", 5.96]], null], "duration": [0.18, 0.27, 0.15, 2.51, 19.9, 0.48, 22.18, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/sLLp4bO6dDI_filtered.json b/annotations_filtered/sLLp4bO6dDI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b27fc2943ac84c7fafba4eaeab1fec903a4f354 --- /dev/null +++ b/annotations_filtered/sLLp4bO6dDI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 22.62], [25.0, 30.91], [31.0, 33.91], [35.0, 44.27], [46.0, 84.05], [84.0, 85.5], [86.0, 87.52], [90.0, 102.88], [103.0, 140.58], [142.0, 155.34], [156.0, 162.63], [166.0, 167.0], [168.0, 169.2], [170.0, 173.38], [175.0, 175.51]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 44.52, 40.71, 42.0, 0.0, 0.0, 0.0, 36.11, 0.0, 46.43, 47.86, 0.0, 0.0, 47.12, 0.0], "audiomae_on_audioset": [null, [["music", 25.09], ["speech", 17.46], ["hum", 8.88]], [["speech", 23.16], ["hum", 21.89], ["mains hum", 15.98]], [["hum", 46.3], ["mains hum", 32.32], ["throbbing", 6.88]], null, null, null, [["frog", 78.91], ["owl", 6.66], ["hum", 1.91]], null, [["hum", 61.81], ["mains hum", 16.37], ["throbbing", 11.67]], [["rumble", 32.55], ["hum", 27.28], ["mains hum", 12.8]], null, null, [["hum", 32.45], ["music", 9.28], ["throbbing", 8.92]], null], "duration": [1.62, 5.91, 2.91, 9.27, 38.05, 1.5, 1.52, 12.88, 37.58, 13.34, 6.63, 1.0, 1.2, 3.38, 0.51]} \ No newline at end of file diff --git a/annotations_filtered/sLWhxB6QNrw_filtered.json b/annotations_filtered/sLWhxB6QNrw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c295c01cb0c201a947058d585ae6c55f721476a6 --- /dev/null +++ b/annotations_filtered/sLWhxB6QNrw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.92], [12.0, 12.93], [17.0, 20.46], [24.0, 44.95]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 37.93, 30.45], "audiomae_on_audioset": [null, null, [["throbbing", 42.05], ["hum", 38.31], ["mains hum", 11.07]], [["speech", 68.1], ["music", 10.2], ["hum", 5.35]]], "duration": [0.92, 0.93, 3.46, 20.95]} \ No newline at end of file diff --git a/annotations_filtered/sLlQvz0y7QM_filtered.json b/annotations_filtered/sLlQvz0y7QM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f12cc9ac2b9bee77a059dfb3736f9bc673f80b16 --- /dev/null +++ b/annotations_filtered/sLlQvz0y7QM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 38.3], [39.0, 45.98], [47.0, 54.73], [58.0, 62.33], [91.0, 90.96], [94.0, 100.48]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 99.98, 99.78, 98.86, 0.0, 73.06], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.3, 6.98, 7.73, 4.33, -0.04, 6.48]} \ No newline at end of file diff --git a/annotations_filtered/sM1I11qUM44_filtered.json b/annotations_filtered/sM1I11qUM44_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..448c222fb02bf62f335d87484dd4203c5e290b23 --- /dev/null +++ b/annotations_filtered/sM1I11qUM44_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.89], [24.0, 28.51], [34.0, 37.08], [42.0, 43.07], [44.0, 69.06], [73.0, 98.91], [103.0, 106.1], [110.0, 133.19], [134.0, 134.47], [138.0, 140.19], [143.0, 143.18], [144.0, 164.39], [170.0, 188.32], [197.0, 199.0]], "keep_status": [false, true, true, false, true, true, true, true, false, true, false, true, true, false], "silence_prob": [0.0, 33.01, 32.39, 0.0, 32.33, 32.39, 37.84, 32.37, 0.0, 45.27, 0.0, 31.41, 30.34, 33.13], "audiomae_on_audioset": [null, [["speech", 30.62], ["explosion", 17.45], ["burst, pop", 12.96]], [["music", 23.21], ["throbbing", 9.3], ["didgeridoo", 7.95]], null, [["music", 32.27], ["speech", 27.89], ["whack, thwack", 3.38]], [["music", 20.83], ["buzz", 16.84], ["fly, housefly", 10.99]], [["thunk", 44.28], ["music", 13.57], ["creak", 10.15]], [["speech", 35.9], ["whack, thwack", 19.88], ["music", 13.22]], null, [["sine wave", 37.96], ["speech", 14.84], ["music", 9.94]], null, [["music", 57.44], ["speech", 6.72], ["whack, thwack", 4.43]], [["music", 18.88], ["throbbing", 11.2], ["whack, thwack", 7.88]], [["fly, housefly", 46.17], ["insect", 30.73], ["mosquito", 12.25]]], "duration": [0.89, 4.51, 3.08, 1.07, 25.06, 25.91, 3.1, 23.19, 0.47, 2.19, 0.18, 20.39, 18.32, 2.0]} \ No newline at end of file diff --git a/annotations_filtered/sMLop6XZBEw_filtered.json b/annotations_filtered/sMLop6XZBEw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5696b287d203fa24ed639bcdede2eab33827b1a7 --- /dev/null +++ b/annotations_filtered/sMLop6XZBEw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.95], [15.0, 25.05], [30.0, 34.86], [38.0, 38.62], [47.0, 47.21], [49.0, 51.63], [55.0, 54.94], [56.0, 56.73], [58.0, 58.38], [59.0, 60.05], [61.0, 61.55], [63.0, 63.44], [65.0, 72.28], [74.0, 77.3], [83.0, 85.02], [87.0, 87.44], [87.0, 88.82], [97.0, 98.37], [101.0, 105.02], [107.0, 107.42], [111.0, 111.08], [113.0, 113.97], [115.0, 115.89], [116.0, 158.25]], "keep_status": [false, true, true, false, false, true, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 28.76, 28.88, 0.0, 0.0, 35.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.42, 38.2, 34.39, 0.0, 0.0, 0.0, 34.57, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 54.52], ["vehicle", 4.41], ["speech", 4.33]], [["music", 34.24], ["speech", 19.15], ["moo", 13.86]], null, null, [["music", 47.88], ["electronic music", 6.42], ["synthesizer", 4.2]], null, null, null, null, null, null, [["music", 65.1], ["speech", 11.73], ["throbbing", 4.79]], [["music", 49.03], ["synthesizer", 11.17], ["musical instrument", 4.33]], [["music", 28.36], ["theremin", 20.39], ["foghorn", 15.74]], null, null, null, [["didgeridoo", 36.5], ["music", 34.42], ["throbbing", 4.26]], null, null, null, null, null], "duration": [1.95, 10.05, 4.86, 0.62, 0.21, 2.63, -0.06, 0.73, 0.38, 1.05, 0.55, 0.44, 7.28, 3.3, 2.02, 0.44, 1.82, 1.37, 4.02, 0.42, 0.08, 0.97, 0.89, 42.25]} \ No newline at end of file diff --git a/annotations_filtered/sMWnN_9GiX0_filtered.json b/annotations_filtered/sMWnN_9GiX0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..94a43002c9da23f19378da60ba4d89209f138271 --- /dev/null +++ b/annotations_filtered/sMWnN_9GiX0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.37], [17.0, 17.71], [19.0, 20.61], [22.0, 22.18], [43.0, 45.05], [61.0, 62.45], [64.0, 73.99], [75.0, 86.95], [92.0, 92.89], [95.0, 95.79], [102.0, 103.84], [104.0, 104.95], [106.0, 106.93], [109.0, 111.6], [122.0, 123.33]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [72.46, 0.0, 0.0, 0.0, 80.82, 0.0, 32.71, 47.66, 0.0, 0.0, 0.0, 0.0, 0.0, 79.94, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 53.67], ["carnatic music", 9.66], ["vocal music", 7.31]], [["speech", 40.49], ["music", 7.84], ["buzz", 5.54]], null, null, null, null, null, null, null], "duration": [2.37, 0.71, 1.61, 0.18, 2.05, 1.45, 9.99, 11.95, 0.89, 0.79, 1.84, 0.95, 0.93, 2.6, 1.33]} \ No newline at end of file diff --git a/annotations_filtered/sMjmQzP9D6o_filtered.json b/annotations_filtered/sMjmQzP9D6o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1ee360f5bdd10eb8bd8a132a5d32562ce3d0def7 --- /dev/null +++ b/annotations_filtered/sMjmQzP9D6o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.51], [10.0, 14.45], [16.0, 17.91], [19.0, 31.68], [32.0, 34.87], [36.0, 45.03], [45.0, 59.05], [62.0, 66.36], [68.0, 73.57], [74.0, 74.61], [75.0, 81.75], [83.0, 85.13], [89.0, 97.07], [103.0, 116.78], [118.0, 131.82], [135.0, 134.94], [137.0, 148.76], [149.0, 149.44], [153.0, 160.27], [161.0, 177.47]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 66.03, 0.0, 59.86, 41.24, 55.6, 47.43, 46.83, 53.04, 0.0, 52.92, 53.04, 36.78, 55.67, 41.89, 0.0, 43.03, 0.0, 37.98, 55.81], "audiomae_on_audioset": [null, null, null, null, [["music", 34.76], ["whale vocalization", 18.04], ["electronic music", 7.47]], null, [["music", 56.6], ["speech", 17.08], ["electronic music", 5.87]], [["music", 50.44], ["didgeridoo", 15.91], ["theremin", 8.77]], null, null, null, null, [["music", 29.04], ["speech", 15.95], ["foghorn", 4.86]], null, [["theremin", 46.08], ["music", 42.29], ["ambient music", 1.56]], null, [["music", 66.95], ["theremin", 10.43], ["ambient music", 2.05]], null, [["music", 56.6], ["carnatic music", 14.43], ["theremin", 9.19]], null], "duration": [0.51, 4.45, 1.91, 12.68, 2.87, 9.03, 14.05, 4.36, 5.57, 0.61, 6.75, 2.13, 8.07, 13.78, 13.82, -0.06, 11.76, 0.44, 7.27, 16.47]} \ No newline at end of file diff --git a/annotations_filtered/sMrjeejmCpI_filtered.json b/annotations_filtered/sMrjeejmCpI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6bd7f14d07abaa4f323bd7e48a43073221c4aeb --- /dev/null +++ b/annotations_filtered/sMrjeejmCpI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.75], [10.0, 14.12], [26.0, 30.05], [32.0, 33.15], [37.0, 41.49], [51.0, 53.11], [67.0, 68.62], [70.0, 70.51], [75.0, 75.57], [87.0, 91.15], [96.0, 96.74], [100.0, 100.23], [102.0, 102.44], [104.0, 104.11], [124.0, 125.44], [154.0, 155.73], [169.0, 170.73], [173.0, 172.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 31.94, 32.31, 0.0, 32.06, 31.91, 0.0, 0.0, 0.0, 30.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 76.26], ["musical instrument", 3.96], ["synthesizer", 2.9]], [["music", 76.01], ["musical instrument", 2.97], ["funny music", 2.52]], null, [["music", 44.44], ["speech", 18.31], ["sidetone", 7.62]], [["music", 38.14], ["boing", 21.02], ["didgeridoo", 13.02]], null, null, null, [["music", 74.91], ["musical instrument", 7.39], ["didgeridoo", 3.54]], null, null, null, null, null, null, null, null], "duration": [0.75, 4.12, 4.05, 1.15, 4.49, 2.11, 1.62, 0.51, 0.57, 4.15, 0.74, 0.23, 0.44, 0.11, 1.44, 1.73, 1.73, -0.02]} \ No newline at end of file diff --git a/annotations_filtered/sMt3SzAH_i0_filtered.json b/annotations_filtered/sMt3SzAH_i0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6880bc7d36ee26211651ffed739a09fd86e2892f --- /dev/null +++ b/annotations_filtered/sMt3SzAH_i0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.07], [6.0, 6.52], [8.0, 8.26], [9.0, 10.42], [12.0, 13.04], [15.0, 21.88], [25.0, 25.76], [27.0, 42.31], [43.0, 46.63], [47.0, 49.79], [51.0, 50.99], [53.0, 53.81], [56.0, 56.69], [58.0, 58.43], [60.0, 60.84], [64.0, 64.03], [65.0, 68.12], [70.0, 72.1], [75.0, 75.49], [77.0, 78.65], [82.0, 82.48], [84.0, 84.65], [87.0, 87.96], [89.0, 89.51], [95.0, 96.04], [97.0, 97.8], [99.0, 99.99], [101.0, 101.93], [108.0, 109.97], [111.0, 111.96], [117.0, 117.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [60.51, 0.0, 0.0, 0.0, 0.0, 60.89, 0.0, 63.85, 85.9, 90.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.45, 89.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.07, 0.52, 0.26, 1.42, 1.04, 6.88, 0.76, 15.31, 3.63, 2.79, -0.01, 0.81, 0.69, 0.43, 0.84, 0.03, 3.12, 2.1, 0.49, 1.65, 0.48, 0.65, 0.96, 0.51, 1.04, 0.8, 0.99, 0.93, 1.97, 0.96, 0.83]} \ No newline at end of file diff --git a/annotations_filtered/sNGlmsj6C-E_filtered.json b/annotations_filtered/sNGlmsj6C-E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..002296a666d1017a76a0f2b0d80201f64057701b --- /dev/null +++ b/annotations_filtered/sNGlmsj6C-E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 45.0], [46.0, 46.21], [50.0, 51.97], [53.0, 53.3], [55.0, 55.11], [60.0, 60.69], [62.0, 62.06], [63.0, 63.02]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [44.0, 0.21, 1.97, 0.3, 0.11, 0.69, 0.06, 0.02]} \ No newline at end of file diff --git a/annotations_filtered/sNJmfuEWR8w_filtered.json b/annotations_filtered/sNJmfuEWR8w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c90936957b10d2ca4e8db316e82a5348b569cb34 --- /dev/null +++ b/annotations_filtered/sNJmfuEWR8w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[72.0, 72.54], [75.0, 74.98], [78.0, 81.04]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 33.87], "audiomae_on_audioset": [null, null, [["music", 48.27], ["boing", 34.72], ["speech", 2.25]]], "duration": [0.54, -0.02, 3.04]} \ No newline at end of file diff --git a/annotations_filtered/sNcBUOlGBcg_filtered.json b/annotations_filtered/sNcBUOlGBcg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..06b804f64955ef79418becc110e76607c53cf654 --- /dev/null +++ b/annotations_filtered/sNcBUOlGBcg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.12], [17.0, 17.81], [27.0, 28.71], [33.0, 33.42], [34.0, 34.67], [40.0, 41.23], [54.0, 56.19], [59.0, 60.54], [66.0, 70.88], [74.0, 73.8], [76.0, 76.37], [77.0, 77.65], [79.0, 79.41], [85.0, 88.18], [95.0, 96.04], [110.0, 110.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.12, 0.81, 1.71, 0.42, 0.67, 1.23, 2.19, 1.54, 4.88, -0.2, 0.37, 0.65, 0.41, 3.18, 1.04, 0.37]} \ No newline at end of file diff --git a/annotations_filtered/sNi3hwriXyE_filtered.json b/annotations_filtered/sNi3hwriXyE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..701a63947af65450bdefc22bd687003526bfc0e2 --- /dev/null +++ b/annotations_filtered/sNi3hwriXyE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 43.24], [44.0, 62.7], [64.0, 64.79], [67.0, 89.36], [92.0, 96.43], [97.0, 98.12], [99.0, 110.47], [112.0, 113.53], [115.0, 135.04]], "keep_status": [false, false, false, true, true, false, true, false, false], "silence_prob": [33.82, 34.05, 0.0, 31.81, 36.56, 0.0, 38.94, 0.0, 36.64], "audiomae_on_audioset": [[["music", 56.97], ["throbbing", 7.15], ["whack, thwack", 7.02]], [["music", 64.27], ["throbbing", 3.13], ["whip", 2.66]], null, [["fart", 29.23], ["fly, housefly", 19.65], ["mosquito", 8.6]], [["music", 22.36], ["mains hum", 17.27], ["hum", 13.03]], null, [["music", 48.42], ["musical instrument", 4.5], ["didgeridoo", 4.3]], null, [["speech", 36.76], ["music", 34.23], ["whack, thwack", 4.22]]], "duration": [7.24, 18.7, 0.79, 22.36, 4.43, 1.12, 11.47, 1.53, 20.04]} \ No newline at end of file diff --git a/annotations_filtered/sNom4k5Pwb8_filtered.json b/annotations_filtered/sNom4k5Pwb8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8283fc49af7a2935a351657aa38b79053085b42c --- /dev/null +++ b/annotations_filtered/sNom4k5Pwb8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 43.82], [61.0, 61.33], [67.0, 68.12]], "keep_status": [true, false, false], "silence_prob": [32.62, 0.0, 0.0], "audiomae_on_audioset": [[["music", 37.99], ["speech", 25.82], ["fart", 4.74]], null, null], "duration": [8.82, 0.33, 1.12]} \ No newline at end of file diff --git a/annotations_filtered/sNrOsj0xDPs_filtered.json b/annotations_filtered/sNrOsj0xDPs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0c60d7c7fa9c2bb2b2492eab0d41cbd00678784f --- /dev/null +++ b/annotations_filtered/sNrOsj0xDPs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 15.77], [18.0, 18.86], [19.0, 20.04], [21.0, 21.76], [23.0, 23.97], [25.0, 25.35], [35.0, 35.72], [38.0, 46.06], [50.0, 66.19], [66.0, 77.89], [79.0, 80.18], [82.0, 83.42], [87.0, 91.67], [92.0, 91.71], [92.0, 91.74], [104.0, 105.63], [107.0, 108.73], [112.0, 114.93], [119.0, 119.89], [121.0, 121.41], [128.0, 128.01], [131.0, 131.09], [134.0, 134.42], [141.0, 145.66], [150.0, 152.71], [165.0, 165.45], [172.0, 172.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.19, 53.4, 89.72, 0.0, 0.0, 31.69, 0.0, 0.0, 0.0, 0.0, 30.95, 0.0, 0.0, 0.0, 0.0, 0.0, 31.05, 33.74, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 66.04], ["theremin", 11.31], ["synthetic singing", 3.42]], null, null, null, null, [["moo", 32.06], ["cattle, bovinae", 19.18], ["livestock, farm animals, working animals", 6.92]], null, null, null, null, null, [["theremin", 36.08], ["music", 27.25], ["musical instrument", 2.57]], [["music", 28.08], ["theremin", 15.44], ["cello", 7.93]], null, null], "duration": [-0.23, 0.86, 1.04, 0.76, 0.97, 0.35, 0.72, 8.06, 16.19, 11.89, 1.18, 1.42, 4.67, -0.29, -0.26, 1.63, 1.73, 2.93, 0.89, 0.41, 0.01, 0.09, 0.42, 4.66, 2.71, 0.45, 0.47]} \ No newline at end of file diff --git a/annotations_filtered/sO2RBLeWYyg_filtered.json b/annotations_filtered/sO2RBLeWYyg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2e6079a40d35b1b6436174091b9ccbec3b931675 --- /dev/null +++ b/annotations_filtered/sO2RBLeWYyg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 11.65], [13.0, 14.23], [15.0, 17.98], [18.0, 26.25], [28.0, 28.48], [30.0, 31.65], [34.0, 36.29], [38.0, 42.31], [44.0, 45.5], [49.0, 56.59], [58.0, 68.82], [70.0, 72.91], [73.0, 77.65], [79.0, 82.32], [84.0, 85.48], [87.0, 90.51], [92.0, 95.44], [96.0, 99.23], [101.0, 107.45], [108.0, 113.51], [114.0, 116.99], [118.0, 119.52], [123.0, 128.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.88, 0.0, 100.0, 99.92, 0.0, 0.0, 99.98, 100.0, 0.0, 100.0, 100.0, 100.0, 99.85, 100.0, 0.0, 100.0, 100.0, 100.0, 100.0, 100.0, 100.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [9.65, 1.23, 2.98, 8.25, 0.48, 1.65, 2.29, 4.31, 1.5, 7.59, 10.82, 2.91, 4.65, 3.32, 1.48, 3.51, 3.44, 3.23, 6.45, 5.51, 2.99, 1.52, 5.31]} \ No newline at end of file diff --git a/annotations_filtered/sOA84te9mAw_filtered.json b/annotations_filtered/sOA84te9mAw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..742e54f6f1ca30f4c2647d108699cea57dc81259 --- /dev/null +++ b/annotations_filtered/sOA84te9mAw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.92], [11.0, 20.26], [22.0, 27.03], [28.0, 28.76], [31.0, 31.7], [40.0, 40.24], [41.0, 42.25], [43.0, 44.68], [50.0, 51.65], [63.0, 65.74], [67.0, 69.67], [71.0, 73.33], [74.0, 77.45], [77.0, 77.5], [78.0, 83.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 39.14, 45.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.6, 82.79, 66.76, 59.77, 0.0, 43.25], "audiomae_on_audioset": [null, [["hum", 47.42], ["throbbing", 18.12], ["speech", 6.03]], [["speech", 49.49], ["hum", 13.61], ["music", 7.66]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 21.49], ["hum", 21.37], ["mains hum", 12.85]]], "duration": [0.92, 9.26, 5.03, 0.76, 0.7, 0.24, 1.25, 1.68, 1.65, 2.74, 2.67, 2.33, 3.45, 0.5, 5.86]} \ No newline at end of file diff --git a/annotations_filtered/sOBIrjgDZr4_filtered.json b/annotations_filtered/sOBIrjgDZr4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..51772936c4059c14d23e20bebb516ec9576ee67c --- /dev/null +++ b/annotations_filtered/sOBIrjgDZr4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.89], [5.0, 6.35], [8.0, 10.25], [11.0, 13.58], [17.0, 17.14], [20.0, 19.74], [33.0, 35.28], [37.0, 37.71], [41.0, 42.18], [43.0, 45.12], [50.0, 52.37], [56.0, 56.22], [57.0, 61.3], [65.0, 66.02], [67.0, 67.34], [69.0, 70.01], [72.0, 71.93], [72.0, 72.96], [74.0, 75.69], [77.0, 78.43], [79.0, 80.76], [81.0, 81.77], [82.0, 91.54], [96.0, 101.11], [103.0, 106.37], [110.0, 109.92], [112.0, 162.16], [163.0, 163.58], [166.0, 170.56], [173.0, 173.16], [174.0, 174.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [91.3, 0.0, 76.04, 97.54, 0.0, 0.0, 93.13, 0.0, 0.0, 96.54, 98.44, 0.0, 58.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.36, 98.86, 94.37, 0.0, 0.0, 0.0, 79.59, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.89, 1.35, 2.25, 2.58, 0.14, -0.26, 2.28, 0.71, 1.18, 2.12, 2.37, 0.22, 4.3, 1.02, 0.34, 1.01, -0.07, 0.96, 1.69, 1.43, 1.76, 0.77, 9.54, 5.11, 3.37, -0.08, 50.16, 0.58, 4.56, 0.16, 0.33]} \ No newline at end of file diff --git a/annotations_filtered/sOGhuhC4AF0_filtered.json b/annotations_filtered/sOGhuhC4AF0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..05d8b7331b982bb6932996b88853d9378b1d8a6a --- /dev/null +++ b/annotations_filtered/sOGhuhC4AF0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.26], [14.0, 15.31], [18.0, 19.52], [21.0, 23.72], [24.0, 28.38], [34.0, 34.89], [35.0, 35.8], [37.0, 41.59], [47.0, 47.95], [52.0, 58.53], [61.0, 97.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 33.3, 32.48, 0.0, 0.0, 33.67, 0.0, 32.56, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 87.09], ["mantra", 0.95], ["synthetic singing", 0.8]], [["music", 71.35], ["musical instrument", 4.52], ["maraca", 4.24]], null, null, [["music", 70.3], ["speech", 4.82], ["didgeridoo", 4.43]], null, [["music", 62.06], ["speech", 7.12], ["electronic music", 6.37]], null], "duration": [0.26, 1.31, 1.52, 2.72, 4.38, 0.89, 0.8, 4.59, 0.95, 6.53, 36.68]} \ No newline at end of file diff --git a/annotations_filtered/sOHoeZYeAeM_filtered.json b/annotations_filtered/sOHoeZYeAeM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ebd23c130d77e7d7c19b2b6db934c8a027600bd --- /dev/null +++ b/annotations_filtered/sOHoeZYeAeM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.28], [5.0, 5.75], [7.0, 9.59], [10.0, 15.75], [19.0, 29.12], [30.0, 34.43], [36.0, 61.97], [63.0, 78.0], [79.0, 80.82], [82.0, 84.13], [89.0, 89.16], [91.0, 93.43], [94.0, 97.77], [99.0, 99.33], [102.0, 102.88], [106.0, 107.11], [110.0, 112.26], [115.0, 120.21], [122.0, 123.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.62, 88.83, 99.31, 99.21, 73.97, 30.84, 0.0, 83.16, 0.0, 39.46, 51.88, 0.0, 0.0, 0.0, 66.63, 74.76, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 31.84], ["electric shaver, electric razor", 27.69], ["thunk", 19.01]], null, null, null, [["speech", 16.38], ["fly, housefly", 13.7], ["bee, wasp, etc.", 5.74]], null, null, null, null, null, null, null], "duration": [1.28, 0.75, 2.59, 5.75, 10.12, 4.43, 25.97, 15.0, 1.82, 2.13, 0.16, 2.43, 3.77, 0.33, 0.88, 1.11, 2.26, 5.21, 1.35]} \ No newline at end of file diff --git a/annotations_filtered/sOLnb7BrMC8_filtered.json b/annotations_filtered/sOLnb7BrMC8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..08c771edda216ebb681f46eca0b4efba4f592b59 --- /dev/null +++ b/annotations_filtered/sOLnb7BrMC8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.71], [22.0, 42.92], [48.0, 48.56], [51.0, 132.02], [133.0, 146.92]], "keep_status": [false, true, false, false, true], "silence_prob": [0.0, 30.75, 0.0, 0.0, 30.82], "audiomae_on_audioset": [null, [["music", 51.54], ["mains hum", 9.41], ["hum", 6.41]], null, null, [["explosion", 42.9], ["burst, pop", 14.91], ["eruption", 8.78]]], "duration": [0.71, 20.92, 0.56, 81.02, 13.92]} \ No newline at end of file diff --git a/annotations_filtered/sOPwbePhOXs_filtered.json b/annotations_filtered/sOPwbePhOXs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c36a7c0277ed24abfcd6fecfd54b2cd53d39ba84 --- /dev/null +++ b/annotations_filtered/sOPwbePhOXs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.73], [4.0, 4.29], [9.0, 10.15], [11.0, 13.2], [13.0, 13.76], [18.0, 21.36], [23.0, 24.49], [27.0, 27.28], [28.0, 32.16], [34.0, 33.74], [34.0, 34.57], [36.0, 39.29], [40.0, 41.61], [44.0, 45.22], [48.0, 55.97], [57.0, 60.93], [64.0, 69.23], [70.0, 71.95], [73.0, 82.17], [84.0, 84.97], [89.0, 90.85], [99.0, 100.21], [106.0, 106.03], [109.0, 109.81], [110.0, 116.29], [119.0, 120.01], [124.0, 124.88], [127.0, 127.75], [128.0, 129.68], [144.0, 148.9], [150.0, 151.38], [156.0, 167.24], [173.0, 173.67], [175.0, 178.33], [179.0, 181.2], [181.0, 181.79], [184.0, 184.92], [185.0, 185.21]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 82.61, 0.0, 73.82, 0.0, 0.0, 41.42, 0.0, 0.0, 87.19, 0.0, 0.0, 53.34, 51.66, 56.1, 0.0, 65.2, 0.0, 0.0, 0.0, 0.0, 0.0, 72.6, 0.0, 0.0, 0.0, 0.0, 39.86, 0.0, 57.56, 0.0, 80.46, 39.35, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["wail, moan", 18.35], ["sneeze", 9.23], ["speech", 7.13]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 72.59], ["sidetone", 3.56], ["music", 3.41]], null, null, null, null, [["whale vocalization", 19.77], ["livestock, farm animals, working animals", 19.17], ["moo", 15.71]], null, null, null], "duration": [0.73, 0.29, 1.15, 2.2, 0.76, 3.36, 1.49, 0.28, 4.16, -0.26, 0.57, 3.29, 1.61, 1.22, 7.97, 3.93, 5.23, 1.95, 9.17, 0.97, 1.85, 1.21, 0.03, 0.81, 6.29, 1.01, 0.88, 0.75, 1.68, 4.9, 1.38, 11.24, 0.67, 3.33, 2.2, 0.79, 0.92, 0.21]} \ No newline at end of file diff --git a/annotations_filtered/sOesH75ggbQ_filtered.json b/annotations_filtered/sOesH75ggbQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c2991ce3a7aa586f11ee5d46d758467a11a21b56 --- /dev/null +++ b/annotations_filtered/sOesH75ggbQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.1], [6.0, 14.42], [18.0, 22.11], [22.0, 22.5], [23.0, 25.51], [27.0, 27.65], [28.0, 30.59], [31.0, 36.39], [37.0, 36.98], [37.0, 38.06], [38.0, 40.26], [44.0, 46.41], [48.0, 48.56], [52.0, 54.13], [56.0, 56.34], [56.0, 56.61], [59.0, 60.13], [60.0, 60.32], [61.0, 61.45], [64.0, 64.39], [66.0, 67.05], [68.0, 68.17], [69.0, 71.22], [82.0, 82.36], [86.0, 87.02], [93.0, 95.17], [100.0, 100.92], [106.0, 107.2], [109.0, 109.71], [111.0, 111.16], [113.0, 114.52], [117.0, 118.59], [121.0, 121.07], [125.0, 129.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 87.37, 82.97, 0.0, 46.12, 0.0, 55.39, 95.64, 0.0, 0.0, 45.82, 40.68, 0.0, 43.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.36, 0.0, 0.0, 63.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.7], "audiomae_on_audioset": [null, null, null, null, [["music", 64.64], ["guitar", 5.65], ["musical instrument", 5.31]], null, null, null, null, null, [["music", 66.54], ["musical instrument", 4.91], ["singing", 2.72]], [["music", 37.48], ["brass instrument", 15.44], ["trombone", 14.35]], null, [["music", 28.17], ["pizzicato", 9.2], ["double bass", 8.87]], null, null, null, null, null, null, null, null, [["music", 71.28], ["humming", 5.01], ["musical instrument", 2.35]], null, null, null, null, null, null, null, null, null, null, [["music", 44.11], ["didgeridoo", 18.7], ["musical instrument", 8.83]]], "duration": [1.1, 8.42, 4.11, 0.5, 2.51, 0.65, 2.59, 5.39, -0.02, 1.06, 2.26, 2.41, 0.56, 2.13, 0.34, 0.61, 1.13, 0.32, 0.45, 0.39, 1.05, 0.17, 2.22, 0.36, 1.02, 2.17, 0.92, 1.2, 0.71, 0.16, 1.52, 1.59, 0.07, 4.86]} \ No newline at end of file diff --git a/annotations_filtered/sOqvTLXZsMs_filtered.json b/annotations_filtered/sOqvTLXZsMs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e1a20d29dacf3f2805c7d466bd2c070e15d10f3d --- /dev/null +++ b/annotations_filtered/sOqvTLXZsMs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 28.26], [30.0, 31.18], [32.0, 62.68], [65.0, 88.16], [89.0, 90.49], [96.0, 106.69], [109.0, 109.49]], "keep_status": [false, false, false, true, false, false, false], "silence_prob": [97.83, 0.0, 0.0, 40.38, 0.0, 36.9, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 26.72], ["animal", 9.85], ["domestic animals, pets", 8.44]], null, [["hum", 35.87], ["mains hum", 21.38], ["music", 19.7]], null], "duration": [5.26, 1.18, 30.68, 23.16, 1.49, 10.69, 0.49]} \ No newline at end of file diff --git a/annotations_filtered/sP9ufyH-Pdg_filtered.json b/annotations_filtered/sP9ufyH-Pdg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f80a36e90a50d8ce2f906e1c589e37a30c4e573c --- /dev/null +++ b/annotations_filtered/sP9ufyH-Pdg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.79], [9.0, 10.23], [11.0, 12.04], [13.0, 13.36], [16.0, 19.13], [21.0, 21.12], [22.0, 28.11], [29.0, 29.42], [30.0, 40.1], [41.0, 42.3], [44.0, 56.62], [58.0, 60.64], [61.0, 62.85], [63.0, 63.73], [66.0, 66.58], [69.0, 69.21], [71.0, 71.9], [75.0, 77.46], [79.0, 80.45], [81.0, 84.06], [86.0, 87.42], [88.0, 89.92], [90.0, 91.64], [93.0, 92.84], [94.0, 98.51], [100.0, 100.85], [102.0, 102.0], [104.0, 104.53], [107.0, 108.01], [109.0, 108.94], [110.0, 110.52], [114.0, 114.22], [122.0, 122.45], [124.0, 124.63]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [76.37, 0.0, 0.0, 0.0, 45.08, 0.0, 82.79, 0.0, 85.72, 0.0, 52.05, 98.8, 0.0, 0.0, 0.0, 0.0, 0.0, 52.98, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 40.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["hum", 6.47], ["explosion", 5.9], ["stomach rumble", 3.72]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["radio", 17.61], ["noise", 10.62], ["frog", 8.54]], null, null, null, null, null, null, null, null, null], "duration": [2.79, 1.23, 1.04, 0.36, 3.13, 0.12, 6.11, 0.42, 10.1, 1.3, 12.62, 2.64, 1.85, 0.73, 0.58, 0.21, 0.9, 2.46, 1.45, 3.06, 1.42, 1.92, 1.64, -0.16, 4.51, 0.85, 0.0, 0.53, 1.01, -0.06, 0.52, 0.22, 0.45, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/sPHeq8OM-dU_filtered.json b/annotations_filtered/sPHeq8OM-dU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..101cfc8c09432274a86510eb40be3a6a03d15ad4 --- /dev/null +++ b/annotations_filtered/sPHeq8OM-dU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.51], [5.0, 6.35], [7.0, 8.01], [9.0, 13.69], [14.0, 14.88], [15.0, 16.02], [17.0, 16.98], [18.0, 18.42], [19.0, 19.72], [20.0, 20.95], [23.0, 23.26], [24.0, 24.7], [25.0, 25.96], [30.0, 33.44], [34.0, 36.59], [37.0, 37.44], [40.0, 42.45], [47.0, 49.01], [53.0, 58.87], [61.0, 63.12], [65.0, 65.06], [79.0, 79.07], [80.0, 80.64], [92.0, 91.89], [99.0, 100.45], [105.0, 105.12], [107.0, 108.19], [118.0, 118.84], [119.0, 119.62], [123.0, 127.13], [136.0, 136.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 58.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.26, 73.36, 0.0, 47.5, 38.21, 32.08, 72.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.25, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 46.61], ["didgeridoo", 7.34], ["music", 6.81]], null, null, [["music", 86.06], ["carnatic music", 4.41], ["theremin", 1.43]], [["music", 81.46], ["carnatic music", 6.34], ["singing", 3.23]], [["music", 70.37], ["whimper", 4.01], ["speech", 3.41]], null, null, null, null, null, null, null, null, null, null, [["speech", 37.64], ["music", 17.77], ["vehicle", 6.75]], null], "duration": [1.51, 1.35, 1.01, 4.69, 0.88, 1.02, -0.02, 0.42, 0.72, 0.95, 0.26, 0.7, 0.96, 3.44, 2.59, 0.44, 2.45, 2.01, 5.87, 2.12, 0.06, 0.07, 0.64, -0.11, 1.45, 0.12, 1.19, 0.84, 0.62, 4.13, 0.63]} \ No newline at end of file diff --git a/annotations_filtered/sPQLY7niQC4_filtered.json b/annotations_filtered/sPQLY7niQC4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4ab03be68f293aa4e4568e1f73eff8c6f7d69338 --- /dev/null +++ b/annotations_filtered/sPQLY7niQC4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.31], [6.0, 7.48], [11.0, 13.1], [14.0, 15.55], [16.0, 17.09], [24.0, 24.24], [31.0, 31.9], [34.0, 35.38], [36.0, 40.59], [45.0, 45.79], [52.0, 52.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 83.16, 0.0, 0.0, 0.0, 0.0, 0.0, 37.89, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 61.5], ["guitar", 7.56], ["musical instrument", 5.09]], null, null], "duration": [1.31, 1.48, 2.1, 1.55, 1.09, 0.24, 0.9, 1.38, 4.59, 0.79, 0.19]} \ No newline at end of file diff --git a/annotations_filtered/sPS0cKOGZO0_filtered.json b/annotations_filtered/sPS0cKOGZO0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..282e93bf6ac2b075f23d29994f7581c969dac858 --- /dev/null +++ b/annotations_filtered/sPS0cKOGZO0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.09], [11.0, 11.42], [14.0, 14.22], [23.0, 23.62], [31.0, 33.62], [36.0, 36.05], [37.0, 39.04], [47.0, 46.85], [49.0, 49.49], [54.0, 54.67], [56.0, 56.83], [64.0, 64.34], [70.0, 72.96], [74.0, 75.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 61.18, 0.0, 58.47, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.09, 0.42, 0.22, 0.62, 2.62, 0.05, 2.04, -0.15, 0.49, 0.67, 0.83, 0.34, 2.96, 1.86]} \ No newline at end of file diff --git a/annotations_filtered/sPZUh1YRnDg_filtered.json b/annotations_filtered/sPZUh1YRnDg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..798ac053d8f90fd6404eba3c346b27924eac4632 --- /dev/null +++ b/annotations_filtered/sPZUh1YRnDg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.04], [14.0, 16.16], [17.0, 18.77], [19.0, 19.8], [21.0, 22.71], [29.0, 31.56], [37.0, 38.57], [45.0, 45.62], [46.0, 47.95], [51.0, 56.54], [60.0, 82.54], [85.0, 121.34]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [72.6, 95.64, 0.0, 0.0, 0.0, 66.39, 0.0, 0.0, 0.0, 32.0, 31.89, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 35.02], ["mains hum", 16.6], ["hum", 15.71]], [["vehicle", 37.19], ["skidding", 20.11], ["car", 18.15]], null], "duration": [2.04, 2.16, 1.77, 0.8, 1.71, 2.56, 1.57, 0.62, 1.95, 5.54, 22.54, 36.34]} \ No newline at end of file diff --git a/annotations_filtered/sPgl1DyIn3U_filtered.json b/annotations_filtered/sPgl1DyIn3U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ee01a05f46cb8bb113686192154e639887b71b8b --- /dev/null +++ b/annotations_filtered/sPgl1DyIn3U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 19.35], [26.0, 28.8], [32.0, 35.28], [36.0, 37.02], [39.0, 42.01], [44.0, 55.09], [58.0, 62.56], [69.0, 95.54], [102.0, 102.98]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 96.66, 93.29, 0.0, 99.26, 80.11, 93.91, 68.15, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [1.35, 2.8, 3.28, 1.02, 3.01, 11.09, 4.56, 26.54, 0.98]} \ No newline at end of file diff --git a/annotations_filtered/sPlsA3_6hB8_filtered.json b/annotations_filtered/sPlsA3_6hB8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ebcc161bc050b93318cd7b5d0166cb648d5086f9 --- /dev/null +++ b/annotations_filtered/sPlsA3_6hB8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 137.0], [138.0, 140.04]], "keep_status": [false, false], "silence_prob": [0.0, 51.71], "audiomae_on_audioset": [null, null], "duration": [129.0, 2.04]} \ No newline at end of file diff --git a/annotations_filtered/sQA199D8U2g_filtered.json b/annotations_filtered/sQA199D8U2g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18bf8234039bc859137890d9795a4778f046eca3 --- /dev/null +++ b/annotations_filtered/sQA199D8U2g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.33], [6.0, 7.64], [14.0, 14.67], [19.0, 20.06], [22.0, 23.58], [25.0, 25.93], [28.0, 33.22], [37.0, 81.41], [85.0, 87.05], [92.0, 91.98], [92.0, 95.34], [97.0, 117.95]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [33.84, 0.0, 0.0, 0.0, 0.0, 0.0, 31.83, 0.0, 71.72, 0.0, 39.93, 29.31], "audiomae_on_audioset": [[["music", 36.66], ["mains hum", 15.14], ["didgeridoo", 13.7]], null, null, null, null, null, [["music", 60.7], ["electronic music", 5.62], ["didgeridoo", 5.58]], null, null, null, [["speech", 46.79], ["music", 11.91], ["hum", 9.86]], [["speech", 51.4], ["music", 18.44], ["sonar", 7.38]]], "duration": [2.33, 1.64, 0.67, 1.06, 1.58, 0.93, 5.22, 44.41, 2.05, -0.02, 3.34, 20.95]} \ No newline at end of file diff --git a/annotations_filtered/sQC7OzU_d18_filtered.json b/annotations_filtered/sQC7OzU_d18_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3606b99a6a146b916c3f2f8bbb612b289837d3f3 --- /dev/null +++ b/annotations_filtered/sQC7OzU_d18_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.65], [5.0, 5.22], [12.0, 17.68], [19.0, 21.56], [22.0, 24.98], [27.0, 28.83], [29.0, 34.96], [35.0, 35.72], [37.0, 56.91], [58.0, 67.12], [68.0, 67.88], [72.0, 72.49], [74.0, 74.61], [75.0, 76.62], [83.0, 83.98], [93.0, 92.97], [93.0, 97.36], [100.0, 100.75], [104.0, 112.68], [114.0, 115.11], [115.0, 121.73]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 53.78, 51.28, 59.33, 0.0, 33.0, 0.0, 33.87, 31.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.02, 0.0, 40.77, 0.0, 44.46], "audiomae_on_audioset": [null, null, null, null, null, null, [["mains hum", 30.95], ["hum", 13.25], ["music", 10.37]], null, [["buzz", 32.14], ["hum", 25.46], ["mains hum", 15.45]], [["mains hum", 30.41], ["hum", 28.02], ["music", 17.64]], null, null, null, null, null, null, [["speech", 47.39], ["music", 16.02], ["radio", 8.29]], null, [["hum", 47.0], ["mains hum", 19.76], ["music", 11.28]], null, [["hum", 22.44], ["speech", 10.78], ["mains hum", 9.58]]], "duration": [0.65, 0.22, 5.68, 2.56, 2.98, 1.83, 5.96, 0.72, 19.91, 9.12, -0.12, 0.49, 0.61, 1.62, 0.98, -0.03, 4.36, 0.75, 8.68, 1.11, 6.73]} \ No newline at end of file diff --git a/annotations_filtered/sQFqzFD78Ck_filtered.json b/annotations_filtered/sQFqzFD78Ck_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..069932d3e436a03974f41c2b3c386b5883fed27e --- /dev/null +++ b/annotations_filtered/sQFqzFD78Ck_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.76], [17.0, 19.33], [22.0, 22.42], [32.0, 32.17], [35.0, 35.94], [36.0, 36.66], [44.0, 45.94], [46.0, 48.07], [49.0, 54.94], [56.0, 56.54], [68.0, 67.93], [82.0, 82.86], [84.0, 84.99], [86.0, 87.79], [88.0, 88.67], [93.0, 93.8], [94.0, 96.38], [100.0, 101.02], [104.0, 104.65], [109.0, 109.61], [110.0, 110.56], [113.0, 116.06], [125.0, 126.45], [128.0, 129.1], [130.0, 130.52], [131.0, 131.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.74, 74.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.42, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.76, 2.33, 0.42, 0.17, 0.94, 0.66, 1.94, 2.07, 5.94, 0.54, -0.07, 0.86, 0.99, 1.79, 0.67, 0.8, 2.38, 1.02, 0.65, 0.61, 0.56, 3.06, 1.45, 1.1, 0.52, 0.33]} \ No newline at end of file diff --git a/annotations_filtered/sQPrjgzEcAc_filtered.json b/annotations_filtered/sQPrjgzEcAc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..51db418aa4112b37f40c23d4689ea457b4af2354 --- /dev/null +++ b/annotations_filtered/sQPrjgzEcAc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.45], [7.0, 7.57], [14.0, 14.99], [19.0, 19.82], [21.0, 22.22], [24.0, 25.29], [28.0, 28.85], [36.0, 40.0], [42.0, 45.98], [48.0, 49.44], [51.0, 53.6], [57.0, 57.74], [59.0, 62.18], [63.0, 64.77], [66.0, 66.43], [67.0, 67.58], [68.0, 71.22], [76.0, 81.09], [83.0, 86.48], [88.0, 90.81], [92.0, 121.81], [122.0, 124.26], [126.0, 129.88], [130.0, 148.42], [149.0, 152.14], [153.0, 158.01], [163.0, 163.65], [165.0, 170.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [98.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.09, 56.78, 0.0, 60.7, 0.0, 45.11, 0.0, 0.0, 0.0, 61.87, 60.7, 72.01, 60.89, 58.72, 65.09, 61.27, 45.69, 42.65, 39.09, 0.0, 41.76], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 37.06], ["music", 17.53], ["musical instrument", 1.79]], null, null, null, null, null, null, null, null, null, null, [["music", 51.95], ["speech", 19.59], ["synthesizer", 3.06]], [["music", 41.18], ["singing bowl", 15.06], ["harmonic", 5.28]], [["music", 45.16], ["singing bowl", 14.74], ["synthesizer", 7.37]], null, [["speech", 33.98], ["music", 29.95], ["synthesizer", 8.94]]], "duration": [2.45, 0.57, 0.99, 0.82, 1.22, 1.29, 0.85, 4.0, 3.98, 1.44, 2.6, 0.74, 3.18, 1.77, 0.43, 0.58, 3.22, 5.09, 3.48, 2.81, 29.81, 2.26, 3.88, 18.42, 3.14, 5.01, 0.65, 5.55]} \ No newline at end of file diff --git a/annotations_filtered/sQ_4m2ocxhI_filtered.json b/annotations_filtered/sQ_4m2ocxhI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..64b4c4c9074446abf2191c028033ac7375e9e051 --- /dev/null +++ b/annotations_filtered/sQ_4m2ocxhI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.81], [15.0, 15.63], [20.0, 21.2], [50.0, 50.82], [101.0, 101.43], [105.0, 106.41], [148.0, 148.49], [150.0, 153.45], [155.0, 155.7], [168.0, 174.23]], "keep_status": [false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.8, 0.0, 62.47], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["breaking", 19.08], ["speech", 14.19], ["ding", 14.11]], null, null], "duration": [1.81, 0.63, 1.2, 0.82, 0.43, 1.41, 0.49, 3.45, 0.7, 6.23]} \ No newline at end of file diff --git a/annotations_filtered/sQolThygoGk_filtered.json b/annotations_filtered/sQolThygoGk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6068e05e30ebfee99b3c8765ddf9fcd5c20c4597 --- /dev/null +++ b/annotations_filtered/sQolThygoGk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.87], [7.0, 9.09], [11.0, 13.86], [15.0, 15.77], [20.0, 21.54], [22.0, 30.06], [41.0, 41.84], [46.0, 46.72], [47.0, 50.04], [60.0, 61.77], [65.0, 66.95], [74.0, 78.95], [80.0, 81.06], [81.0, 81.51], [82.0, 90.98], [91.0, 91.02], [94.0, 99.5], [100.0, 102.81]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, true, false, false, true, false, false, true], "silence_prob": [0.0, 77.53, 71.29, 0.0, 0.0, 48.52, 0.0, 0.0, 81.53, 0.0, 0.0, 47.46, 0.0, 0.0, 31.29, 0.0, 38.87, 37.96], "audiomae_on_audioset": [null, null, null, null, null, [["moo", 26.35], ["livestock, farm animals, working animals", 25.08], ["cattle, bovinae", 17.12]], null, null, null, null, null, [["speech", 28.78], ["music", 16.54], ["throbbing", 13.48]], null, null, [["music", 10.09], ["explosion", 9.89], ["vehicle", 8.02]], null, [["cattle, bovinae", 35.27], ["livestock, farm animals, working animals", 33.99], ["moo", 29.02]], [["cattle, bovinae", 29.15], ["moo", 22.28], ["livestock, farm animals, working animals", 10.15]]], "duration": [0.87, 2.09, 2.86, 0.77, 1.54, 8.06, 0.84, 0.72, 3.04, 1.77, 1.95, 4.95, 1.06, 0.51, 8.98, 0.02, 5.5, 2.81]} \ No newline at end of file diff --git a/annotations_filtered/sR0wCC271s4_filtered.json b/annotations_filtered/sR0wCC271s4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e9965205060d55a79c0093c48e0b74d5b907048 --- /dev/null +++ b/annotations_filtered/sR0wCC271s4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.87], [16.0, 16.61], [26.0, 27.04], [52.0, 54.03], [70.0, 71.85], [73.0, 78.95], [80.0, 89.01], [94.0, 95.88], [96.0, 97.95], [99.0, 105.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 63.21, 0.0, 86.64, 51.66, 0.0, 0.0, 98.8], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.87, 0.61, 1.04, 2.03, 1.85, 5.95, 9.01, 1.88, 1.95, 6.68]} \ No newline at end of file diff --git a/annotations_filtered/sR176VaCLXg_filtered.json b/annotations_filtered/sR176VaCLXg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..263797897fe43014ad8d02503c6e427e0f2d946f --- /dev/null +++ b/annotations_filtered/sR176VaCLXg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.05], [8.0, 9.59], [10.0, 13.95], [14.0, 15.28], [16.0, 17.15], [19.0, 21.42], [22.0, 22.37], [24.0, 23.94], [24.0, 24.95], [26.0, 26.96], [35.0, 46.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 44.43, 0.0, 0.0, 63.74, 0.0, 0.0, 0.0, 0.0, 37.38], "audiomae_on_audioset": [null, null, [["music", 57.16], ["guitar", 9.96], ["musical instrument", 7.0]], null, null, null, null, null, null, null, [["music", 30.99], ["hum", 6.99], ["musical instrument", 6.78]]], "duration": [1.05, 1.59, 3.95, 1.28, 1.15, 2.42, 0.37, -0.06, 0.95, 0.96, 11.26]} \ No newline at end of file diff --git a/annotations_filtered/sR4iKRfUwOs_filtered.json b/annotations_filtered/sR4iKRfUwOs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7044a0a3ac298c079c2ab7efa0a384a08a81076 --- /dev/null +++ b/annotations_filtered/sR4iKRfUwOs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.0], [24.0, 26.2], [34.0, 36.17], [41.0, 42.31], [50.0, 54.28], [61.0, 67.76], [76.0, 76.17], [76.0, 80.69], [81.0, 83.3], [87.0, 106.93], [108.0, 108.5], [110.0, 110.79], [111.0, 113.14], [119.0, 121.02], [122.0, 123.36], [125.0, 128.02], [129.0, 131.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 57.4, 59.59, 0.0, 51.94, 44.29, 0.0, 53.78, 52.16, 37.14, 0.0, 0.0, 65.2, 50.02, 0.0, 82.07, 53.22], "audiomae_on_audioset": [null, null, null, null, null, [["music", 45.02], ["speech", 14.1], ["didgeridoo", 13.4]], null, null, null, [["music", 74.78], ["musical instrument", 3.82], ["didgeridoo", 2.33]], null, null, null, null, null, null, null], "duration": [0.0, 2.2, 2.17, 1.31, 4.28, 6.76, 0.17, 4.69, 2.3, 19.93, 0.5, 0.79, 2.14, 2.02, 1.36, 3.02, 2.82]} \ No newline at end of file diff --git a/annotations_filtered/sR528E5_8yI_filtered.json b/annotations_filtered/sR528E5_8yI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9eedfa88752708e8c33c88bff586858f38ad695 --- /dev/null +++ b/annotations_filtered/sR528E5_8yI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.04], [5.0, 5.34], [16.0, 20.95], [22.0, 22.69], [26.0, 26.86], [32.0, 37.5], [39.0, 39.28], [45.0, 46.21], [48.0, 53.42], [57.0, 61.74], [74.0, 75.71], [81.0, 82.27], [83.0, 87.18], [89.0, 89.02], [91.0, 90.83], [94.0, 94.07], [96.0, 101.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 99.76, 0.0, 0.0, 50.11, 0.0, 0.0, 45.24, 36.2, 0.0, 0.0, 56.78, 0.0, 0.0, 0.0, 31.77], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["theremin", 66.07], ["music", 19.96], ["speech", 4.53]], [["theremin", 59.47], ["music", 15.06], ["speech", 7.98]], null, null, null, null, null, null, [["explosion", 49.3], ["burst, pop", 10.35], ["speech", 6.29]]], "duration": [1.04, 0.34, 4.95, 0.69, 0.86, 5.5, 0.28, 1.21, 5.42, 4.74, 1.71, 1.27, 4.18, 0.02, -0.17, 0.07, 5.55]} \ No newline at end of file diff --git a/annotations_filtered/sRKtU9FF-8w_filtered.json b/annotations_filtered/sRKtU9FF-8w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ad7a427330804e8e60a16d177d0b7c74edfe6e5 --- /dev/null +++ b/annotations_filtered/sRKtU9FF-8w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 27.35], [28.0, 30.55], [33.0, 36.98], [39.0, 39.01], [41.0, 41.39], [44.0, 49.65], [51.0, 52.05], [53.0, 55.14], [57.0, 66.99], [70.0, 70.65], [71.0, 72.35], [83.0, 82.88], [86.0, 86.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.21, 78.89, 0.0, 0.0, 77.36, 0.0, 99.98, 81.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.35, 2.55, 3.98, 0.01, 0.39, 5.65, 1.05, 2.14, 9.99, 0.65, 1.35, -0.12, 0.17]} \ No newline at end of file diff --git a/annotations_filtered/sRPTqsO_SoM_filtered.json b/annotations_filtered/sRPTqsO_SoM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..601bc7e4cd638ce9efcca6adf2856c6be1f6bdd1 --- /dev/null +++ b/annotations_filtered/sRPTqsO_SoM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.8], [5.0, 5.76], [7.0, 11.64], [14.0, 15.15], [16.0, 17.2], [31.0, 31.23], [32.0, 32.81], [41.0, 42.15], [46.0, 46.85], [49.0, 49.79], [52.0, 54.24], [58.0, 69.53], [71.0, 70.9], [80.0, 82.7], [86.0, 85.68], [87.0, 88.55], [95.0, 95.35], [97.0, 96.72], [97.0, 98.47], [110.0, 112.38], [127.0, 127.52], [133.0, 134.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 100.0, 0.0, 91.3, 0.0, 0.0, 0.0, 0.0, 0.0, 62.68, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.8, 0.76, 4.64, 1.15, 1.2, 0.23, 0.81, 1.15, 0.85, 0.79, 2.24, 11.53, -0.1, 2.7, -0.32, 1.55, 0.35, -0.28, 1.47, 2.38, 0.52, 1.82]} \ No newline at end of file diff --git a/annotations_filtered/sRR3ukzqiGs_filtered.json b/annotations_filtered/sRR3ukzqiGs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e93b4dd3bd47661dbf66ba40bd43fa5a3a7bed04 --- /dev/null +++ b/annotations_filtered/sRR3ukzqiGs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.55], [14.0, 17.69], [23.0, 22.86], [27.0, 28.11], [30.0, 31.95], [35.0, 35.9], [38.0, 40.27], [41.0, 40.68], [42.0, 46.45], [61.0, 61.25], [62.0, 62.68], [69.0, 69.25], [73.0, 82.36], [83.0, 83.73], [90.0, 90.58], [94.0, 96.03], [116.0, 119.4], [121.0, 124.68], [128.0, 130.5], [139.0, 139.23]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 31.06, 0.0, 0.0, 0.0, 0.0, 84.62, 0.0, 45.78, 0.0, 0.0, 0.0, 39.31, 0.0, 0.0, 38.49, 64.29, 66.39, 63.74, 0.0], "audiomae_on_audioset": [null, [["music", 41.93], ["didgeridoo", 5.08], ["fly, housefly", 4.47]], null, null, null, null, null, null, [["music", 69.95], ["musical instrument", 2.66], ["electronic music", 2.34]], null, null, null, [["speech", 38.47], ["music", 27.29], ["fart", 3.74]], null, null, [["music", 75.83], ["musical instrument", 2.93], ["laughter", 2.86]], null, null, null, null], "duration": [0.55, 3.69, -0.14, 1.11, 1.95, 0.9, 2.27, -0.32, 4.45, 0.25, 0.68, 0.25, 9.36, 0.73, 0.58, 2.03, 3.4, 3.68, 2.5, 0.23]} \ No newline at end of file diff --git a/annotations_filtered/sRUb0GR0ZiE_filtered.json b/annotations_filtered/sRUb0GR0ZiE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8a12f7e7c72a856a6f370aecf551bdce00cdd424 --- /dev/null +++ b/annotations_filtered/sRUb0GR0ZiE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 43.38], [46.0, 47.22], [47.0, 49.54], [50.0, 101.76], [103.0, 110.84], [121.0, 122.96], [127.0, 128.38], [129.0, 131.16], [132.0, 136.17], [137.0, 139.62], [142.0, 144.36], [146.0, 148.71], [150.0, 149.93], [151.0, 153.28], [155.0, 158.06], [159.0, 160.42], [161.0, 167.36], [169.0, 170.13], [172.0, 174.68]], "keep_status": [true, false, false, false, false, false, false, false, true, true, true, false, false, true, true, false, false, false, true], "silence_prob": [34.71, 0.0, 29.71, 0.0, 32.02, 0.0, 0.0, 43.64, 49.78, 49.31, 41.93, 50.41, 0.0, 46.12, 47.58, 0.0, 43.82, 0.0, 47.62], "audiomae_on_audioset": [[["music", 30.98], ["speech", 15.78], ["throbbing", 15.16]], null, [["speech", 60.29], ["music", 12.03], ["crowd", 5.21]], null, [["music", 41.6], ["throbbing", 20.71], ["electronic music", 12.31]], null, null, [["speech", 64.43], ["rumble", 5.63], ["vehicle", 4.37]], [["rumble", 29.07], ["vehicle", 11.94], ["buzz", 8.68]], [["rumble", 18.23], ["hum", 13.6], ["buzz", 5.49]], [["speech", 10.29], ["sidetone", 10.11], ["bee, wasp, etc.", 9.36]], null, null, [["rumble", 32.36], ["vehicle", 6.93], ["car", 5.23]], [["rumble", 24.83], ["vehicle", 15.1], ["car", 6.86]], null, [["speech", 57.7], ["rumble", 20.01], ["hum", 4.54]], null, [["rumble", 20.6], ["cat", 6.93], ["vehicle", 6.24]]], "duration": [6.38, 1.22, 2.54, 51.76, 7.84, 1.96, 1.38, 2.16, 4.17, 2.62, 2.36, 2.71, -0.07, 2.28, 3.06, 1.42, 6.36, 1.13, 2.68]} \ No newline at end of file diff --git a/annotations_filtered/sR_tidD4M_8_filtered.json b/annotations_filtered/sR_tidD4M_8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..adaa80e0c3fb4658fbda04d201cfc9330d0cde3e --- /dev/null +++ b/annotations_filtered/sR_tidD4M_8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.1], [10.0, 16.56], [17.0, 20.31], [21.0, 29.1], [34.0, 39.93], [43.0, 74.06], [74.0, 104.87], [105.0, 106.41], [108.0, 116.31], [118.0, 117.88], [119.0, 132.63], [134.0, 158.6], [160.0, 177.01]], "keep_status": [false, true, true, true, true, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 41.83, 39.66, 28.69, 29.61, 0.0, 0.0, 0.0, 29.31, 0.0, 28.97, 30.94, 40.61], "audiomae_on_audioset": [null, [["sonar", 23.85], ["sine wave", 11.24], ["chirp tone", 8.52]], [["music", 36.92], ["chirp tone", 14.68], ["sine wave", 10.86]], [["sidetone", 30.28], ["speech", 15.49], ["music", 14.38]], [["speech", 27.73], ["vehicle", 8.32], ["hum", 7.79]], null, null, null, [["vehicle", 26.53], ["car", 16.34], ["motorcycle", 14.48]], null, [["speech", 32.22], ["vehicle", 28.36], ["car", 11.11]], [["music", 22.45], ["speech", 13.15], ["fly, housefly", 12.61]], [["music", 49.77], ["hum", 16.3], ["throbbing", 6.75]]], "duration": [0.1, 6.56, 3.31, 8.1, 5.93, 31.06, 30.87, 1.41, 8.31, -0.12, 13.63, 24.6, 17.01]} \ No newline at end of file diff --git a/annotations_filtered/sR_xG8DNCSI_filtered.json b/annotations_filtered/sR_xG8DNCSI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..44c0aa4b1e5c9a014c54adfda62d75b7e5f713d8 --- /dev/null +++ b/annotations_filtered/sR_xG8DNCSI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 29.25], [30.0, 30.87], [35.0, 39.7], [45.0, 59.04], [63.0, 72.82], [75.0, 82.63], [85.0, 85.56], [86.0, 90.17], [96.0, 104.38], [108.0, 108.08], [109.0, 109.26], [111.0, 110.78], [115.0, 118.64], [122.0, 127.52], [129.0, 131.45]], "keep_status": [false, false, true, true, false, false, false, true, true, false, false, false, false, true, true], "silence_prob": [29.09, 0.0, 29.21, 29.49, 30.46, 29.52, 0.0, 29.82, 29.22, 0.0, 0.0, 0.0, 33.38, 31.03, 33.97], "audiomae_on_audioset": [[["music", 54.03], ["theremin", 15.24], ["musical instrument", 11.67]], null, [["music", 29.69], ["speech", 9.62], ["livestock, farm animals, working animals", 6.5]], [["music", 17.77], ["speech", 10.06], ["buzz", 8.82]], [["music", 52.24], ["speech", 22.46], ["didgeridoo", 2.78]], [["music", 51.91], ["speech", 26.22], ["grunt", 1.44]], null, [["speech", 32.12], ["music", 13.55], ["vehicle", 10.65]], [["cattle, bovinae", 17.06], ["moo", 16.23], ["livestock, farm animals, working animals", 10.64]], null, null, null, [["speech", 31.88], ["radio", 26.33], ["sidetone", 24.89]], [["speech", 49.09], ["vehicle", 14.6], ["mains hum", 4.28]], [["speech", 41.4], ["music", 17.35], ["hum", 6.57]]], "duration": [5.25, 0.87, 4.7, 14.04, 9.82, 7.63, 0.56, 4.17, 8.38, 0.08, 0.26, -0.22, 3.64, 5.52, 2.45]} \ No newline at end of file diff --git a/annotations_filtered/sRqeX6qMlak_filtered.json b/annotations_filtered/sRqeX6qMlak_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..908681c00f3464d1a0b3644eed4282a67da055d1 --- /dev/null +++ b/annotations_filtered/sRqeX6qMlak_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.17], [3.0, 3.03], [5.0, 5.27], [7.0, 6.67], [16.0, 23.03], [26.0, 40.9], [41.0, 73.23], [77.0, 84.6]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 40.29, 31.95, 0.0, 70.16], "audiomae_on_audioset": [null, null, null, null, [["music", 40.55], ["theremin", 20.22], ["scary music", 10.09]], [["didgeridoo", 38.17], ["music", 28.15], ["speech", 20.06]], null, null], "duration": [1.17, 0.03, 0.27, -0.33, 7.03, 14.9, 32.23, 7.6]} \ No newline at end of file diff --git a/annotations_filtered/sRwqd3eCNUY_filtered.json b/annotations_filtered/sRwqd3eCNUY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..37c6fc186582dd8b1dda6301da9894b75624444e --- /dev/null +++ b/annotations_filtered/sRwqd3eCNUY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.42], [17.0, 19.01], [20.0, 21.76], [27.0, 28.34], [34.0, 35.53], [38.0, 40.64], [47.0, 48.64], [51.0, 52.03], [54.0, 53.99], [69.0, 71.81], [79.0, 80.08], [83.0, 83.07], [85.0, 85.41], [87.0, 89.36], [94.0, 95.55], [104.0, 107.62], [110.0, 119.99], [121.0, 123.62], [125.0, 129.27], [130.0, 132.14], [133.0, 134.86], [137.0, 138.62], [140.0, 143.55], [144.0, 145.89], [147.0, 148.63], [150.0, 151.75], [153.0, 152.91], [155.0, 155.48], [156.0, 156.32], [159.0, 160.19], [161.0, 163.05], [168.0, 172.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 0.0, 0.0, 99.93, 0.0, 0.0, 0.0, 98.01, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 99.59, 100.0, 100.0, 99.1, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.42, 2.01, 1.76, 1.34, 1.53, 2.64, 1.64, 1.03, -0.01, 2.81, 1.08, 0.07, 0.41, 2.36, 1.55, 3.62, 9.99, 2.62, 4.27, 2.14, 1.86, 1.62, 3.55, 1.89, 1.63, 1.75, -0.09, 0.48, 0.32, 1.19, 2.05, 4.4]} \ No newline at end of file diff --git a/annotations_filtered/sSRmhI94MUs_filtered.json b/annotations_filtered/sSRmhI94MUs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..72f1b41a5c38b2943356d2e6ef764347e636eb32 --- /dev/null +++ b/annotations_filtered/sSRmhI94MUs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.3], [26.0, 27.21], [29.0, 29.52], [31.0, 31.28], [33.0, 41.23], [42.0, 42.2], [44.0, 55.0], [57.0, 57.32], [59.0, 62.5], [66.0, 66.31], [68.0, 68.99], [72.0, 108.9], [112.0, 125.47], [126.0, 128.33], [130.0, 130.87], [132.0, 132.68], [133.0, 134.72], [136.0, 136.38], [137.0, 137.83], [139.0, 142.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 98.51, 0.0, 96.17, 0.0, 36.28, 0.0, 0.0, 0.0, 31.1, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 32.18], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 56.39], ["radio", 34.81], ["sidetone", 2.25]], null, null, null, [["speech", 70.66], ["radio", 4.73], ["creak", 4.7]], null, null, null, null, null, null, [["hum", 23.64], ["bouncing", 8.19], ["noise", 7.73]]], "duration": [0.3, 1.21, 0.52, 0.28, 8.23, 0.2, 11.0, 0.32, 3.5, 0.31, 0.99, 36.9, 13.47, 2.33, 0.87, 0.68, 1.72, 0.38, 0.83, 3.53]} \ No newline at end of file diff --git a/annotations_filtered/sSc4Y4Z9lsk_filtered.json b/annotations_filtered/sSc4Y4Z9lsk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..27a9eb6abe4e82741e729fd18a133687f6e8ac4f --- /dev/null +++ b/annotations_filtered/sSc4Y4Z9lsk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.62], [8.0, 12.23], [13.0, 14.69], [16.0, 19.67], [21.0, 23.41], [24.0, 25.49], [39.0, 38.74], [45.0, 45.1], [50.0, 52.08], [54.0, 57.32], [58.0, 60.98], [62.0, 63.96], [65.0, 67.04], [68.0, 69.75], [71.0, 73.35], [79.0, 79.68], [88.0, 88.8], [96.0, 96.7], [110.0, 110.98], [111.0, 112.23], [113.0, 115.43], [116.0, 122.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [64.18, 52.92, 0.0, 87.37, 100.0, 0.0, 0.0, 0.0, 85.72, 94.07, 93.45, 0.0, 82.43, 0.0, 92.8, 0.0, 0.0, 0.0, 0.0, 0.0, 97.73, 82.25], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.62, 4.23, 1.69, 3.67, 2.41, 1.49, -0.26, 0.1, 2.08, 3.32, 2.98, 1.96, 2.04, 1.75, 2.35, 0.68, 0.8, 0.7, 0.98, 1.23, 2.43, 6.54]} \ No newline at end of file diff --git a/annotations_filtered/sSk2SvdopGY_filtered.json b/annotations_filtered/sSk2SvdopGY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..180c91acd3a046e46daeb85df44d9012df586aea --- /dev/null +++ b/annotations_filtered/sSk2SvdopGY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [16.0, 17.32], [44.0, 45.49], [47.0, 47.9], [48.0, 50.73]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 44.6], "audiomae_on_audioset": [null, null, null, null, [["speech", 55.99], ["sidetone", 19.99], ["animal", 3.39]]], "duration": [0.5, 1.32, 1.49, 0.9, 2.73]} \ No newline at end of file diff --git a/annotations_filtered/sSvxvpY7PZM_filtered.json b/annotations_filtered/sSvxvpY7PZM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..79f81af0a8d877e4117f30bde0bdc0845d29e193 --- /dev/null +++ b/annotations_filtered/sSvxvpY7PZM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 15.87], [19.0, 19.3], [22.0, 24.33], [30.0, 30.13], [31.0, 33.0], [34.0, 36.12], [37.0, 40.61], [41.0, 40.91], [45.0, 46.6], [50.0, 50.95], [60.0, 61.48], [64.0, 64.49], [73.0, 73.87], [77.0, 77.48], [83.0, 85.01], [89.0, 89.55], [94.0, 95.3], [99.0, 99.96], [103.0, 103.65], [107.0, 107.16], [109.0, 115.16], [116.0, 116.14], [117.0, 117.42], [119.0, 119.85], [120.0, 122.37], [123.0, 123.5], [125.0, 125.17]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.97, 0.0, 61.18, 0.0, 47.5, 95.91, 87.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.83, 0.0, 0.0, 0.0, 0.0, 0.0, 99.87, 0.0, 0.0, 0.0, 91.3, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["stomach rumble", 29.53], ["whale vocalization", 13.57], ["radio", 4.38]], null, null, null, null, null, null, null, null, null, [["music", 60.48], ["throbbing", 6.95], ["hum", 6.76]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.87, 0.3, 2.33, 0.13, 2.0, 2.12, 3.61, -0.09, 1.6, 0.95, 1.48, 0.49, 0.87, 0.48, 2.01, 0.55, 1.3, 0.96, 0.65, 0.16, 6.16, 0.14, 0.42, 0.85, 2.37, 0.5, 0.17]} \ No newline at end of file diff --git a/annotations_filtered/sT-wJhtlMGs_filtered.json b/annotations_filtered/sT-wJhtlMGs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..252bb6115efb0cca17dcfb34eb210d9eb19f447c --- /dev/null +++ b/annotations_filtered/sT-wJhtlMGs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.78], [8.0, 9.05], [16.0, 16.33], [18.0, 20.55], [24.0, 24.58], [34.0, 34.3], [35.0, 88.37], [93.0, 102.88], [105.0, 105.33], [106.0, 113.0]], "keep_status": [false, false, false, true, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 41.03, 0.0, 0.0, 0.0, 30.99, 0.0, 32.48], "audiomae_on_audioset": [null, null, null, [["hum", 22.76], ["mains hum", 13.9], ["music", 8.49]], null, null, null, [["speech", 36.4], ["hum", 15.41], ["vehicle", 8.03]], null, [["music", 24.76], ["vehicle", 22.69], ["car", 10.0]]], "duration": [0.78, 1.05, 0.33, 2.55, 0.58, 0.3, 53.37, 9.88, 0.33, 7.0]} \ No newline at end of file diff --git a/annotations_filtered/sT47KfDlwI8_filtered.json b/annotations_filtered/sT47KfDlwI8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7f1f95eef6ab92a68a844e45ac2058c995ae68f --- /dev/null +++ b/annotations_filtered/sT47KfDlwI8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.83], [12.0, 12.01], [13.0, 18.39], [34.0, 34.13], [35.0, 36.88], [47.0, 47.48], [118.0, 119.57]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 89.01, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [0.83, 0.01, 5.39, 0.13, 1.88, 0.48, 1.57]} \ No newline at end of file diff --git a/annotations_filtered/sT7Xef0oYLU_filtered.json b/annotations_filtered/sT7Xef0oYLU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..90eaa0994fe99d2047bc7c4de40aeb2ab36bb583 --- /dev/null +++ b/annotations_filtered/sT7Xef0oYLU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.34], [20.0, 20.19], [23.0, 24.85], [26.0, 28.16], [30.0, 31.8], [33.0, 35.09], [40.0, 40.54], [42.0, 44.17], [47.0, 48.76], [49.0, 53.97], [55.0, 54.95], [66.0, 67.56], [78.0, 79.1], [83.0, 83.13], [84.0, 90.36], [92.0, 93.75], [100.0, 100.43], [104.0, 104.82], [106.0, 107.42], [109.0, 110.34], [111.0, 122.91], [125.0, 127.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [94.37, 0.0, 0.0, 49.04, 0.0, 99.99, 0.0, 99.36, 0.0, 37.99, 0.0, 0.0, 0.0, 0.0, 73.21, 0.0, 0.0, 0.0, 0.0, 0.0, 45.56, 87.74], "audiomae_on_audioset": [null, null, null, [["speech", 64.49], ["mains hum", 5.75], ["hum", 4.89]], null, null, null, null, null, [["thunk", 51.05], ["speech", 28.98], ["creak", 3.94]], null, null, null, null, null, null, null, null, null, null, [["speech", 40.58], ["thunk", 38.19], ["music", 11.83]], null], "duration": [3.34, 0.19, 1.85, 2.16, 1.8, 2.09, 0.54, 2.17, 1.76, 4.97, -0.05, 1.56, 1.1, 0.13, 6.36, 1.75, 0.43, 0.82, 1.42, 1.34, 11.91, 2.47]} \ No newline at end of file diff --git a/annotations_filtered/sT7nVSNlpTE_filtered.json b/annotations_filtered/sT7nVSNlpTE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a4db8fd7daeb1f0cd12c4d17720f2177e962fd5 --- /dev/null +++ b/annotations_filtered/sT7nVSNlpTE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.81], [2.0, 2.79], [3.0, 3.37], [4.0, 5.22], [6.0, 6.37], [9.0, 19.87], [30.0, 43.48], [46.0, 51.95], [57.0, 64.56], [66.0, 80.94], [83.0, 85.7], [87.0, 87.22], [89.0, 100.04], [102.0, 102.95], [104.0, 103.81], [105.0, 105.12], [107.0, 107.74], [109.0, 108.75], [110.0, 111.01], [116.0, 117.12], [118.0, 118.42], [119.0, 121.14]], "keep_status": [false, false, false, false, false, false, false, true, true, false, true, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 79.07, 33.59, 32.36, 35.5, 33.67, 33.38, 0.0, 35.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.42], "audiomae_on_audioset": [null, null, null, null, null, null, [["wild animals", 35.72], ["roaring cats (lions, tigers)", 28.62], ["animal", 21.6]], [["music", 25.24], ["mosquito", 12.33], ["fly, housefly", 8.74]], [["speech", 34.49], ["music", 17.67], ["hum", 6.11]], [["speech", 52.25], ["music", 25.27], ["fart", 3.92]], [["music", 57.59], ["musical instrument", 6.99], ["clarinet", 3.32]], null, [["music", 31.92], ["hum", 9.31], ["whimper", 4.76]], null, null, null, null, null, null, null, null, null], "duration": [-0.19, 0.79, 0.37, 1.22, 0.37, 10.87, 13.48, 5.95, 7.56, 14.94, 2.7, 0.22, 11.04, 0.95, -0.19, 0.12, 0.74, -0.25, 1.01, 1.12, 0.42, 2.14]} \ No newline at end of file diff --git a/annotations_filtered/sT8wMBeVffk_filtered.json b/annotations_filtered/sT8wMBeVffk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84d86608f4a9d74d7c73def2a69300cd4f2c27e8 --- /dev/null +++ b/annotations_filtered/sT8wMBeVffk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[67.0, 68.44], [71.0, 74.01]], "keep_status": [false, false], "silence_prob": [0.0, 32.54], "audiomae_on_audioset": [null, [["hum", 38.9], ["throbbing", 29.0], ["mains hum", 11.76]]], "duration": [1.44, 3.01]} \ No newline at end of file diff --git a/annotations_filtered/sTDhNLLglf8_filtered.json b/annotations_filtered/sTDhNLLglf8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0cb26914954b8d5ed952734028a89bdcb4cf150b --- /dev/null +++ b/annotations_filtered/sTDhNLLglf8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.61], [12.0, 12.56], [15.0, 14.74], [16.0, 17.14], [19.0, 20.06], [21.0, 22.72], [24.0, 25.22], [26.0, 27.78], [28.0, 29.22], [30.0, 30.91], [33.0, 34.28], [39.0, 40.24], [44.0, 44.88], [48.0, 48.64], [56.0, 55.95], [58.0, 58.67], [69.0, 71.66], [80.0, 81.26], [82.0, 82.21], [85.0, 84.86], [86.0, 86.97], [88.0, 88.89], [93.0, 93.77], [95.0, 95.62], [97.0, 98.07], [100.0, 101.07], [102.0, 103.71], [111.0, 111.92], [113.0, 114.22], [115.0, 115.67], [116.0, 118.29], [121.0, 122.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.12, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 74.39], ["sidetone", 3.47], ["explosion", 3.07]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.61, 0.56, -0.26, 1.14, 1.06, 1.72, 1.22, 1.78, 1.22, 0.91, 1.28, 1.24, 0.88, 0.64, -0.05, 0.67, 2.66, 1.26, 0.21, -0.14, 0.97, 0.89, 0.77, 0.62, 1.07, 1.07, 1.71, 0.92, 1.22, 0.67, 2.29, 1.45]} \ No newline at end of file diff --git a/annotations_filtered/sTYIlyRGrA4_filtered.json b/annotations_filtered/sTYIlyRGrA4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..afc6af45a58b79ac7703fdc7187df3f0437a3cee --- /dev/null +++ b/annotations_filtered/sTYIlyRGrA4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 14.82], [16.0, 17.32], [17.0, 17.76], [19.0, 20.39], [22.0, 22.77], [27.0, 28.56], [30.0, 50.68], [56.0, 68.86]], "keep_status": [false, false, false, false, false, false, true, true], "silence_prob": [30.28, 0.0, 0.0, 0.0, 0.0, 0.0, 30.89, 34.65], "audiomae_on_audioset": [[["music", 62.68], ["didgeridoo", 4.53], ["drum", 3.94]], null, null, null, null, null, [["music", 35.17], ["buzz", 16.52], ["crowd", 7.06]], [["frog", 35.83], ["speech", 22.2], ["animal", 10.54]]], "duration": [10.82, 1.32, 0.76, 1.39, 0.77, 1.56, 20.68, 12.86]} \ No newline at end of file diff --git a/annotations_filtered/sTbJQwezQZY_filtered.json b/annotations_filtered/sTbJQwezQZY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e1fb02449ad50f654c32b5b339081d517e9ecd36 --- /dev/null +++ b/annotations_filtered/sTbJQwezQZY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.31], [11.0, 11.04], [13.0, 15.08], [20.0, 22.87], [31.0, 31.18], [50.0, 51.09], [56.0, 73.5], [75.0, 77.65], [81.0, 91.69], [93.0, 93.56], [95.0, 96.18], [97.0, 97.6], [100.0, 100.89], [102.0, 102.73], [104.0, 107.05], [107.0, 107.11], [108.0, 108.65]], "keep_status": [false, false, true, false, false, false, true, true, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 30.38, 31.48, 0.0, 0.0, 29.36, 28.11, 29.18, 0.0, 0.0, 0.0, 0.0, 0.0, 29.41, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 26.7], ["hum", 22.23], ["throbbing", 13.64]], [["music", 68.0], ["musical instrument", 8.26], ["guitar", 4.4]], null, null, [["music", 27.82], ["speech", 26.69], ["burst, pop", 7.39]], [["sound effect", 14.94], ["music", 11.71], ["whack, thwack", 5.86]], [["music", 51.4], ["throbbing", 27.12], ["hum", 7.97]], null, null, null, null, null, [["sidetone", 29.7], ["music", 26.23], ["speech", 10.65]], null, null], "duration": [1.31, 0.04, 2.08, 2.87, 0.18, 1.09, 17.5, 2.65, 10.69, 0.56, 1.18, 0.6, 0.89, 0.73, 3.05, 0.11, 0.65]} \ No newline at end of file diff --git a/annotations_filtered/sTcofHd5IlE_filtered.json b/annotations_filtered/sTcofHd5IlE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0c21eea0c3b995322e8544267996135441fd9086 --- /dev/null +++ b/annotations_filtered/sTcofHd5IlE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 27.43], [28.0, 32.27], [34.0, 34.06], [34.0, 44.9], [45.0, 75.86], [76.0, 78.26], [80.0, 89.87], [90.0, 90.73], [95.0, 95.66], [96.0, 96.38], [100.0, 100.55]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 31.19, 0.0, 30.88, 0.0, 51.66, 30.45, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 26.32], ["throbbing", 16.48], ["sidetone", 13.04]], null, [["whack, thwack", 27.32], ["speech", 17.13], ["burst, pop", 16.48]], null, null, [["beatboxing", 29.52], ["whack, thwack", 22.2], ["speech", 20.4]], null, null, null, null], "duration": [0.43, 4.27, 0.06, 10.9, 30.86, 2.26, 9.87, 0.73, 0.66, 0.38, 0.55]} \ No newline at end of file diff --git a/annotations_filtered/sUQ9cisQpaY_filtered.json b/annotations_filtered/sUQ9cisQpaY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..74eedd5bf324c07cb5a341c5d71d2501e646a861 --- /dev/null +++ b/annotations_filtered/sUQ9cisQpaY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.02], [15.0, 15.5], [24.0, 24.48], [25.0, 25.62], [26.0, 30.79], [32.0, 32.9], [39.0, 40.76], [44.0, 47.41], [62.0, 62.28], [65.0, 65.18], [106.0, 105.7], [116.0, 122.44], [136.0, 136.39], [140.0, 140.02], [141.0, 141.44], [144.0, 144.34], [146.0, 146.18], [148.0, 149.1], [150.0, 150.9], [158.0, 160.62], [162.0, 163.36], [164.0, 164.34]], "keep_status": [true, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [43.3, 0.0, 0.0, 0.0, 45.49, 0.0, 0.0, 38.17, 0.0, 0.0, 0.0, 33.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.43, 0.0, 0.0], "audiomae_on_audioset": [[["music", 59.14], ["mosquito", 3.78], ["fly, housefly", 3.31]], null, null, null, [["music", 48.53], ["theremin", 10.46], ["musical instrument", 3.13]], null, null, [["music", 23.58], ["mains hum", 16.54], ["hum", 14.8]], null, null, null, [["music", 51.15], ["theremin", 19.63], ["musical instrument", 4.47]], null, null, null, null, null, null, null, [["music", 62.83], ["musical instrument", 8.37], ["piano", 5.98]], null, null], "duration": [2.02, 0.5, 0.48, 0.62, 4.79, 0.9, 1.76, 3.41, 0.28, 0.18, -0.3, 6.44, 0.39, 0.02, 0.44, 0.34, 0.18, 1.1, 0.9, 2.62, 1.36, 0.34]} \ No newline at end of file diff --git a/annotations_filtered/sUa29Kqpdn0_filtered.json b/annotations_filtered/sUa29Kqpdn0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0c9e05966434a908db62dd877142c11760407423 --- /dev/null +++ b/annotations_filtered/sUa29Kqpdn0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.86], [5.0, 6.1], [7.0, 8.6], [9.0, 10.93], [12.0, 14.35], [16.0, 18.33], [20.0, 21.66], [23.0, 30.15], [32.0, 33.32], [35.0, 36.85], [39.0, 40.73], [41.0, 43.68], [45.0, 45.55], [48.0, 50.41], [52.0, 53.52], [54.0, 63.83], [67.0, 69.63], [72.0, 77.45], [77.0, 79.89], [81.0, 85.06], [85.0, 85.35], [88.0, 88.37], [89.0, 90.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [37.89, 0.0, 0.0, 0.0, 52.98, 34.22, 0.0, 35.4, 0.0, 0.0, 0.0, 36.41, 0.0, 76.7, 0.0, 38.23, 59.24, 31.09, 31.64, 30.75, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 57.22], ["didgeridoo", 9.82], ["musical instrument", 6.84]], null, null, null, null, [["music", 47.62], ["synthesizer", 17.28], ["musical instrument", 8.63]], null, [["speech", 40.75], ["music", 19.92], ["synthesizer", 10.64]], null, null, null, [["didgeridoo", 49.26], ["music", 23.66], ["cattle, bovinae", 2.66]], null, null, null, [["didgeridoo", 42.59], ["music", 36.34], ["throbbing", 3.13]], null, [["music", 50.16], ["didgeridoo", 12.24], ["speech", 10.64]], [["whale vocalization", 18.08], ["music", 16.71], ["hum", 15.05]], [["speech", 45.3], ["music", 43.37], ["effects unit", 1.98]], null, null, null], "duration": [2.86, 1.1, 1.6, 1.93, 2.35, 2.33, 1.66, 7.15, 1.32, 1.85, 1.73, 2.68, 0.55, 2.41, 1.52, 9.83, 2.63, 5.45, 2.89, 4.06, 0.35, 0.37, 1.27]} \ No newline at end of file diff --git a/annotations_filtered/sUa9WglkKCI_filtered.json b/annotations_filtered/sUa9WglkKCI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1301846aa8ef5874bedb57284d875deedf5b9f51 --- /dev/null +++ b/annotations_filtered/sUa9WglkKCI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.93], [16.0, 17.44], [20.0, 20.09]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [0.93, 1.44, 0.09]} \ No newline at end of file diff --git a/annotations_filtered/sUhg39GEqGA_filtered.json b/annotations_filtered/sUhg39GEqGA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..460b1f58cc9eedd21baa9d3642b752e20e6a939a --- /dev/null +++ b/annotations_filtered/sUhg39GEqGA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.08], [4.0, 3.67], [12.0, 13.12], [15.0, 15.94], [19.0, 19.01], [20.0, 20.58], [25.0, 31.06], [52.0, 52.0], [53.0, 53.92]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.54, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 79.5], ["thunk", 7.48], ["creak", 1.52]], null, null], "duration": [0.08, -0.33, 1.12, 0.94, 0.01, 0.58, 6.06, 0.0, 0.92]} \ No newline at end of file diff --git a/annotations_filtered/sUv04cGjaDI_filtered.json b/annotations_filtered/sUv04cGjaDI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1510dbfcc9e65d144935c65a1db4ccb7fc6c1ed3 --- /dev/null +++ b/annotations_filtered/sUv04cGjaDI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.35], [5.0, 6.78], [8.0, 8.73], [13.0, 15.74], [19.0, 20.92], [24.0, 26.86], [31.0, 33.98], [35.0, 36.49], [38.0, 41.64], [44.0, 46.99], [50.0, 52.78]], "keep_status": [true, false, false, false, false, false, false, false, true, false, false], "silence_prob": [43.85, 0.0, 0.0, 82.07, 0.0, 60.42, 68.67, 0.0, 38.68, 41.64, 38.45], "audiomae_on_audioset": [[["speech", 22.65], ["music", 21.17], ["hum", 19.52]], null, null, null, null, null, null, null, [["speech", 27.89], ["music", 22.65], ["whale vocalization", 13.41]], [["music", 74.78], ["ambient music", 5.26], ["electronic music", 4.22]], [["music", 57.49], ["ambient music", 8.94], ["electronic music", 8.02]]], "duration": [2.35, 1.78, 0.73, 2.74, 1.92, 2.86, 2.98, 1.49, 3.64, 2.99, 2.78]} \ No newline at end of file diff --git a/annotations_filtered/sVZLKLWFDYs_filtered.json b/annotations_filtered/sVZLKLWFDYs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..df544a725027448fa86fee25070937a45b0d894c --- /dev/null +++ b/annotations_filtered/sVZLKLWFDYs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.21], [10.0, 10.94], [12.0, 16.41], [19.0, 19.3], [22.0, 31.01], [33.0, 35.18], [38.0, 40.69], [42.0, 47.61], [49.0, 50.68], [52.0, 55.54], [60.0, 63.59], [65.0, 65.5], [66.0, 71.25], [76.0, 79.22], [80.0, 82.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [64.75, 0.0, 85.17, 0.0, 87.74, 86.45, 95.23, 95.09, 0.0, 96.77, 89.19, 0.0, 70.02, 80.64, 70.86], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.21, 0.94, 4.41, 0.3, 9.01, 2.18, 2.69, 5.61, 1.68, 3.54, 3.59, 0.5, 5.25, 3.22, 2.27]} \ No newline at end of file diff --git a/annotations_filtered/sVfmACBWnIY_filtered.json b/annotations_filtered/sVfmACBWnIY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7309a5f708a95f653d2c1521eeaef0e8f1c05379 --- /dev/null +++ b/annotations_filtered/sVfmACBWnIY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.83], [11.0, 11.65], [14.0, 14.96], [19.0, 19.72], [22.0, 24.02], [26.0, 26.72], [27.0, 35.51], [40.0, 40.74], [44.0, 47.17], [53.0, 54.06], [55.0, 56.94], [58.0, 60.05], [63.0, 63.96], [68.0, 68.34], [70.0, 71.64], [73.0, 74.61], [76.0, 77.48], [79.0, 80.57], [86.0, 90.49], [91.0, 91.91], [98.0, 129.79], [137.0, 141.47], [142.0, 143.04]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 95.91, 0.0, 30.82, 0.0, 36.61, 0.0, 0.0, 93.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.88, 0.0, 0.0, 31.44, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["explosion", 32.75], ["burst, pop", 11.54], ["speech", 4.78]], null, [["speech", 73.28], ["animal", 3.54], ["duck", 3.22]], null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 29.04], ["mains hum", 28.15], ["whale vocalization", 14.9]], null], "duration": [0.83, 0.65, 0.96, 0.72, 2.02, 0.72, 8.51, 0.74, 3.17, 1.06, 1.94, 2.05, 0.96, 0.34, 1.64, 1.61, 1.48, 1.57, 4.49, 0.91, 31.79, 4.47, 1.04]} \ No newline at end of file diff --git a/annotations_filtered/sVfuigRSl8g_filtered.json b/annotations_filtered/sVfuigRSl8g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bc33262e3b149ac697f5e274c576d4f0b0768080 --- /dev/null +++ b/annotations_filtered/sVfuigRSl8g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 27.63], [31.0, 33.99], [35.0, 37.23], [38.0, 42.18], [49.0, 55.34], [66.0, 67.91], [71.0, 72.55], [74.0, 74.66], [79.0, 78.8], [83.0, 102.86], [106.0, 107.42], [116.0, 116.7], [117.0, 117.49], [118.0, 119.21], [121.0, 123.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [35.5, 33.5, 35.52, 35.69, 36.43, 0.0, 0.0, 0.0, 0.0, 33.95, 0.0, 0.0, 0.0, 0.0, 80.11], "audiomae_on_audioset": [[["music", 75.32], ["boing", 15.28], ["speech", 2.58]], [["speech", 48.49], ["music", 31.78], ["crack", 2.66]], [["music", 71.8], ["speech", 8.28], ["sidetone", 2.8]], [["music", 46.58], ["boing", 28.49], ["speech", 6.41]], [["music", 70.07], ["speech", 16.06], ["throbbing", 2.22]], null, null, null, null, [["music", 35.65], ["speech", 25.52], ["sidetone", 14.86]], null, null, null, null, null], "duration": [5.63, 2.99, 2.23, 4.18, 6.34, 1.91, 1.55, 0.66, -0.2, 19.86, 1.42, 0.7, 0.49, 1.21, 2.25]} \ No newline at end of file diff --git a/annotations_filtered/sVg5_6gjzlg_filtered.json b/annotations_filtered/sVg5_6gjzlg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da32dfd61dbe04a2869099c532e8b5091262b3d9 --- /dev/null +++ b/annotations_filtered/sVg5_6gjzlg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 26.05], [27.0, 36.42], [39.0, 45.59], [46.0, 74.26], [75.0, 83.94], [88.0, 108.57], [109.0, 113.48], [114.0, 114.81], [115.0, 116.45], [117.0, 117.58], [118.0, 118.94], [120.0, 119.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [84.62, 83.34, 51.82, 77.03, 60.6, 44.93, 36.35, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 74.33], ["electronic music", 3.64], ["synthesizer", 2.6]], [["music", 67.93], ["didgeridoo", 5.32], ["electronic music", 2.76]], null, null, null, null, null], "duration": [9.05, 9.42, 6.59, 28.26, 8.94, 20.57, 4.48, 0.81, 1.45, 0.58, 0.94, -0.04]} \ No newline at end of file diff --git a/annotations_filtered/sWCQm58jJsk_filtered.json b/annotations_filtered/sWCQm58jJsk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac7c0facc7e7bb45ff692e3eec51900ee5670e75 --- /dev/null +++ b/annotations_filtered/sWCQm58jJsk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.77], [9.0, 9.44], [10.0, 11.53], [12.0, 14.34], [15.0, 17.04], [19.0, 22.64], [25.0, 26.01], [27.0, 27.99], [29.0, 30.4], [31.0, 33.96], [35.0, 38.35], [40.0, 41.57], [43.0, 45.22], [47.0, 48.84], [50.0, 50.7], [52.0, 52.59], [53.0, 55.81], [59.0, 59.71], [62.0, 63.54], [68.0, 69.36], [71.0, 71.37], [72.0, 73.16], [74.0, 75.25], [78.0, 78.46], [79.0, 80.6], [82.0, 82.46], [83.0, 88.37], [97.0, 97.71], [101.0, 102.47], [104.0, 105.51], [108.0, 114.18], [116.0, 116.24], [118.0, 118.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 98.8, 98.99, 99.99, 0.0, 0.0, 0.0, 87.55, 96.17, 0.0, 99.16, 0.0, 0.0, 0.0, 99.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.29, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.77, 0.44, 1.53, 2.34, 2.04, 3.64, 1.01, 0.99, 1.4, 2.96, 3.35, 1.57, 2.22, 1.84, 0.7, 0.59, 2.81, 0.71, 1.54, 1.36, 0.37, 1.16, 1.25, 0.46, 1.6, 0.46, 5.37, 0.71, 1.47, 1.51, 6.18, 0.24, 0.59]} \ No newline at end of file diff --git a/annotations_filtered/sWEvLBzMpYE_filtered.json b/annotations_filtered/sWEvLBzMpYE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/sWEvLBzMpYE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/sWKTV0ScR9k_filtered.json b/annotations_filtered/sWKTV0ScR9k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..807be5c6aa4132e589afeadc028483796eb3a92e --- /dev/null +++ b/annotations_filtered/sWKTV0ScR9k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.99], [7.0, 7.3], [8.0, 8.21], [10.0, 9.98], [10.0, 10.79], [11.0, 11.42], [12.0, 24.04], [25.0, 25.47], [26.0, 31.77], [32.0, 37.15], [38.0, 40.19], [45.0, 44.95], [48.0, 48.14], [53.0, 53.52], [55.0, 58.26], [60.0, 60.39], [63.0, 64.05], [66.0, 66.7], [74.0, 75.3], [82.0, 84.55], [86.0, 86.36], [88.0, 88.03], [89.0, 89.04], [90.0, 97.11], [99.0, 99.44], [102.0, 102.49], [109.0, 109.93], [117.0, 118.02], [119.0, 120.28], [122.0, 124.28], [127.0, 128.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.73, 0.0, 100.0, 100.0, 99.97, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 94.37, 0.0, 0.0, 0.0, 99.95, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.99, 0.3, 0.21, -0.02, 0.79, 0.42, 12.04, 0.47, 5.77, 5.15, 2.19, -0.05, 0.14, 0.52, 3.26, 0.39, 1.05, 0.7, 1.3, 2.55, 0.36, 0.03, 0.04, 7.11, 0.44, 0.49, 0.93, 1.02, 1.28, 2.28, 1.73]} \ No newline at end of file diff --git a/annotations_filtered/sWjVe9dMRHU_filtered.json b/annotations_filtered/sWjVe9dMRHU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0ef1c5d8afc46c9c1e79de3ebdcf173877e6d9a2 --- /dev/null +++ b/annotations_filtered/sWjVe9dMRHU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.43], [12.0, 12.68], [14.0, 15.36], [16.0, 38.74], [44.0, 47.21], [48.0, 68.79], [70.0, 69.92], [70.0, 71.81], [72.0, 72.82], [86.0, 86.44], [94.0, 94.83], [95.0, 97.01], [98.0, 97.97], [99.0, 99.71], [101.0, 109.12], [109.0, 116.72], [122.0, 122.44], [131.0, 131.72], [134.0, 134.84], [151.0, 151.24], [155.0, 155.7], [156.0, 155.73], [156.0, 155.97], [156.0, 156.0], [156.0, 156.03], [156.0, 156.27], [157.0, 159.36], [163.0, 172.25], [173.0, 174.09], [175.0, 190.49], [203.0, 204.47], [205.0, 207.67], [212.0, 224.18], [225.0, 224.9]], "keep_status": [true, false, false, false, false, true, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [34.13, 0.0, 0.0, 30.87, 42.93, 32.63, 0.0, 0.0, 0.0, 0.0, 0.0, 52.05, 0.0, 0.0, 46.19, 34.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.73, 31.46, 0.0, 30.69, 0.0, 66.88, 43.58, 0.0], "audiomae_on_audioset": [[["music", 48.13], ["sampler", 6.23], ["musical instrument", 5.11]], null, null, [["music", 60.96], ["speech", 6.85], ["hum", 5.2]], [["music", 54.92], ["speech", 9.41], ["electronic music", 8.83]], [["hum", 31.07], ["music", 19.25], ["mains hum", 14.84]], null, null, null, null, null, null, null, null, [["music", 35.23], ["speech", 26.31], ["sidetone", 4.37]], [["speech", 24.91], ["groan", 24.65], ["music", 19.18]], null, null, null, null, null, null, null, null, null, null, [["music", 29.99], ["fart", 24.96], ["speech", 5.64]], [["music", 36.78], ["speech", 20.34], ["whack, thwack", 17.86]], null, [["music", 54.71], ["speech", 16.97], ["buzz", 2.22]], null, null, [["music", 58.67], ["speech", 27.21], ["thunk", 5.78]], null], "duration": [2.43, 0.68, 1.36, 22.74, 3.21, 20.79, -0.08, 1.81, 0.82, 0.44, 0.83, 2.01, -0.03, 0.71, 8.12, 7.72, 0.44, 0.72, 0.84, 0.24, 0.7, -0.27, -0.03, 0.0, 0.03, 0.27, 2.36, 9.25, 1.09, 15.49, 1.47, 2.67, 12.18, -0.1]} \ No newline at end of file diff --git a/annotations_filtered/sWqTiz8caoM_filtered.json b/annotations_filtered/sWqTiz8caoM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e6439056605033eb3c2fb9ace0f8340bf9d4ac91 --- /dev/null +++ b/annotations_filtered/sWqTiz8caoM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.22], [7.0, 10.03], [12.0, 12.46], [27.0, 28.22], [28.0, 28.29], [36.0, 40.56], [46.0, 47.85], [48.0, 52.22], [52.0, 52.57], [53.0, 82.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 80.11, 0.0, 0.0, 0.0, 98.93, 0.0, 75.55, 0.0, 49.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 72.02], ["hum", 3.62], ["zither", 1.93]]], "duration": [0.22, 3.03, 0.46, 1.22, 0.29, 4.56, 1.85, 4.22, 0.57, 29.19]} \ No newline at end of file diff --git a/annotations_filtered/sXHsY1eoIzA_filtered.json b/annotations_filtered/sXHsY1eoIzA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/sXHsY1eoIzA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/sXatQewZKRw_filtered.json b/annotations_filtered/sXatQewZKRw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a71a3acbe474141391e66cb6649793c42e02d259 --- /dev/null +++ b/annotations_filtered/sXatQewZKRw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.24], [14.0, 14.17]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [0.24, 0.17]} \ No newline at end of file diff --git a/annotations_filtered/sXnYoBCJGwI_filtered.json b/annotations_filtered/sXnYoBCJGwI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e4fdeaf7befae8f1924cc627e494b1d93eb8ddc0 --- /dev/null +++ b/annotations_filtered/sXnYoBCJGwI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.71], [6.0, 29.0], [31.0, 31.46], [35.0, 51.54], [54.0, 77.01], [84.0, 105.93], [109.0, 113.19], [115.0, 119.33], [121.0, 123.42], [124.0, 126.96], [129.0, 145.52]], "keep_status": [false, true, false, false, true, true, false, true, false, true, true], "silence_prob": [0.0, 35.42, 0.0, 32.37, 31.52, 38.54, 96.54, 38.1, 94.66, 48.19, 36.72], "audiomae_on_audioset": [null, [["speech", 30.32], ["sidetone", 22.46], ["music", 12.76]], null, [["sidetone", 40.17], ["speech", 27.34], ["music", 20.63]], [["music", 37.79], ["speech", 26.8], ["boing", 4.77]], [["music", 48.78], ["sound effect", 6.59], ["synthesizer", 6.59]], null, [["sine wave", 33.22], ["chirp tone", 21.25], ["burping, eructation", 7.16]], null, [["fly, housefly", 25.93], ["mosquito", 16.53], ["mains hum", 14.49]], [["hum", 38.97], ["mains hum", 13.07], ["music", 11.78]]], "duration": [0.71, 23.0, 0.46, 16.54, 23.01, 21.93, 4.19, 4.33, 2.42, 2.96, 16.52]} \ No newline at end of file diff --git a/annotations_filtered/sXtlR_7l6xQ_filtered.json b/annotations_filtered/sXtlR_7l6xQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..edf2e5dee75aa6855aa64351f59910fe39b3c33f --- /dev/null +++ b/annotations_filtered/sXtlR_7l6xQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.8], [7.0, 8.01], [10.0, 10.13], [13.0, 14.28], [36.0, 36.34], [38.0, 37.79], [50.0, 51.04], [56.0, 56.67], [59.0, 60.08], [61.0, 61.45], [63.0, 63.34], [65.0, 65.89], [67.0, 67.15], [69.0, 68.98], [72.0, 72.45], [74.0, 75.12], [76.0, 77.01], [81.0, 81.6], [83.0, 84.38], [93.0, 93.61], [96.0, 96.85], [111.0, 112.43], [114.0, 114.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.8, 1.01, 0.13, 1.28, 0.34, -0.21, 1.04, 0.67, 1.08, 0.45, 0.34, 0.89, 0.15, -0.02, 0.45, 1.12, 1.01, 0.6, 1.38, 0.61, 0.85, 1.43, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/sYEGcfDCysI_filtered.json b/annotations_filtered/sYEGcfDCysI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..91327221fb48bb30cdc9b17cedd042e8b8272215 --- /dev/null +++ b/annotations_filtered/sYEGcfDCysI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.97], [3.0, 9.05], [10.0, 11.31], [14.0, 14.84], [16.0, 16.48], [17.0, 17.37], [19.0, 19.26], [21.0, 27.45], [27.0, 27.48], [27.0, 27.51], [30.0, 30.6], [31.0, 31.73], [34.0, 39.45], [40.0, 39.53], [41.0, 41.62], [42.0, 43.82], [44.0, 43.85], [44.0, 43.88], [45.0, 50.16], [52.0, 52.61], [60.0, 60.47], [61.0, 61.05], [62.0, 61.99], [65.0, 67.42], [67.0, 71.31], [73.0, 73.26], [74.0, 74.28], [74.0, 75.19], [87.0, 87.51], [88.0, 99.93], [100.0, 100.89], [103.0, 103.25], [105.0, 105.53], [107.0, 109.68], [110.0, 111.92], [115.0, 115.92], [120.0, 120.56], [124.0, 123.74], [125.0, 124.92], [127.0, 127.57], [129.0, 130.13], [135.0, 136.26], [140.0, 150.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 36.73, 0.0, 0.0, 0.0, 0.0, 0.0, 41.62, 0.0, 0.0, 0.0, 0.0, 39.49, 0.0, 0.0, 0.0, 0.0, 0.0, 49.31, 0.0, 0.0, 0.0, 0.0, 37.71, 33.91, 0.0, 0.0, 0.0, 0.0, 33.23, 0.0, 0.0, 0.0, 39.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.71], "audiomae_on_audioset": [null, [["music", 39.42], ["speech", 36.09], ["mains hum", 7.32]], null, null, null, null, null, [["speech", 42.05], ["music", 34.75], ["mains hum", 5.03]], null, null, null, null, [["speech", 25.16], ["music", 19.22], ["mains hum", 15.98]], null, null, null, null, null, [["hum", 29.23], ["music", 24.99], ["mains hum", 21.42]], null, null, null, null, [["speech", 48.5], ["music", 11.58], ["didgeridoo", 10.22]], [["music", 21.88], ["speech", 20.06], ["mains hum", 19.02]], null, null, null, null, [["music", 73.58], ["musical instrument", 7.75], ["didgeridoo", 3.19]], null, null, null, [["television", 19.12], ["speech", 18.22], ["music", 10.17]], null, null, null, null, null, null, null, null, [["music", 22.62], ["speech", 19.92], ["throbbing", 12.31]]], "duration": [-0.03, 6.05, 1.31, 0.84, 0.48, 0.37, 0.26, 6.45, 0.48, 0.51, 0.6, 0.73, 5.45, -0.47, 0.62, 1.82, -0.15, -0.12, 5.16, 0.61, 0.47, 0.05, -0.01, 2.42, 4.31, 0.26, 0.28, 1.19, 0.51, 11.93, 0.89, 0.25, 0.53, 2.68, 1.92, 0.92, 0.56, -0.26, -0.08, 0.57, 1.13, 1.26, 10.92]} \ No newline at end of file diff --git a/annotations_filtered/sYNUp5rAZJo_filtered.json b/annotations_filtered/sYNUp5rAZJo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52fe5d207b070393971ad50c83bd765761a50ecf --- /dev/null +++ b/annotations_filtered/sYNUp5rAZJo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.09], [15.0, 41.61], [44.0, 45.87], [47.0, 48.1], [50.0, 49.96], [56.0, 56.62], [69.0, 69.87], [71.0, 71.51], [75.0, 76.1], [78.0, 78.65], [80.0, 79.88], [82.0, 86.91], [89.0, 91.3], [93.0, 101.7], [102.0, 103.03], [104.0, 107.55], [108.0, 110.3], [111.0, 111.87], [113.0, 114.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 77.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.43, 92.48, 86.27, 0.0, 96.77, 60.05, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.09, 26.61, 1.87, 1.1, -0.04, 0.62, 0.87, 0.51, 1.1, 0.65, -0.12, 4.91, 2.3, 8.7, 1.03, 3.55, 2.3, 0.87, 1.03]} \ No newline at end of file diff --git a/annotations_filtered/sYWS5RSmJ-s_filtered.json b/annotations_filtered/sYWS5RSmJ-s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1eb994475fe1765744d0822f33d61fe2c37e7372 --- /dev/null +++ b/annotations_filtered/sYWS5RSmJ-s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.14], [11.0, 11.96], [14.0, 15.21], [20.0, 22.99], [24.0, 47.44], [48.0, 50.13], [52.0, 52.39], [60.0, 60.64], [63.0, 63.64], [70.0, 73.74], [74.0, 74.01], [81.0, 96.65]], "keep_status": [false, false, false, false, true, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 79.76, 47.66, 36.06, 0.0, 0.0, 0.0, 30.16, 0.0, 32.78], "audiomae_on_audioset": [null, null, null, null, [["thunk", 16.02], ["cat", 15.5], ["music", 14.6]], [["speech", 42.31], ["music", 8.63], ["throbbing", 6.81]], null, null, null, [["speech", 67.12], ["music", 10.95], ["whack, thwack", 5.04]], null, [["throbbing", 29.81], ["hum", 23.27], ["music", 9.42]]], "duration": [1.14, 0.96, 1.21, 2.99, 23.44, 2.13, 0.39, 0.64, 0.64, 3.74, 0.01, 15.65]} \ No newline at end of file diff --git a/annotations_filtered/sYdqpWTQyaI_filtered.json b/annotations_filtered/sYdqpWTQyaI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..16f8555bfc3fbd98c7283b00c9ad8dc1a6656b24 --- /dev/null +++ b/annotations_filtered/sYdqpWTQyaI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 18.35], [20.0, 19.97], [28.0, 28.21], [42.0, 47.55], [48.0, 73.08], [75.0, 82.26], [83.0, 91.13], [93.0, 95.37], [99.0, 111.15], [114.0, 114.59], [115.0, 114.84], [119.0, 119.92], [120.0, 121.37], [122.0, 134.89], [136.0, 139.82], [141.0, 147.38], [148.0, 149.89], [151.0, 162.28], [163.0, 163.9], [166.0, 166.8], [167.0, 183.73], [187.0, 191.69], [196.0, 215.82], [218.0, 219.55], [221.0, 221.49], [222.0, 225.59]], "keep_status": [false, false, false, false, true, true, true, true, true, false, false, false, false, false, true, false, false, true, false, false, true, false, true, false, false, true], "silence_prob": [31.08, 0.0, 0.0, 30.64, 31.77, 29.42, 31.07, 32.14, 28.67, 0.0, 0.0, 0.0, 0.0, 29.37, 33.0, 30.05, 0.0, 31.4, 0.0, 0.0, 29.58, 31.95, 32.03, 0.0, 0.0, 48.78], "audiomae_on_audioset": [[["fly, housefly", 42.15], ["insect", 15.94], ["speech", 12.12]], null, null, [["mains hum", 35.94], ["hum", 23.4], ["music", 21.12]], [["hum", 24.33], ["music", 22.6], ["speech", 10.9]], [["speech", 40.97], ["music", 18.72], ["whack, thwack", 4.9]], [["music", 10.12], ["didgeridoo", 8.12], ["buzz", 7.36]], [["music", 16.59], ["hum", 14.56], ["speech", 11.58]], [["speech", 57.1], ["music", 3.43], ["buzz", 2.87]], null, null, null, null, [["throbbing", 37.85], ["hum", 20.77], ["music", 13.05]], [["music", 20.41], ["foghorn", 14.03], ["animal", 10.13]], [["music", 66.62], ["throbbing", 4.09], ["hum", 3.67]], null, [["music", 35.81], ["speech", 14.4], ["groan", 4.43]], null, null, [["speech", 21.01], ["music", 19.27], ["breaking", 12.21]], [["music", 58.75], ["musical instrument", 10.26], ["didgeridoo", 6.96]], [["music", 38.79], ["speech", 15.83], ["hum", 7.05]], null, null, [["music", 28.81], ["speech", 20.87], ["hum", 18.94]]], "duration": [5.35, -0.03, 0.21, 5.55, 25.08, 7.26, 8.13, 2.37, 12.15, 0.59, -0.16, 0.92, 1.37, 12.89, 3.82, 6.38, 1.89, 11.28, 0.9, 0.8, 16.73, 4.69, 19.82, 1.55, 0.49, 3.59]} \ No newline at end of file diff --git a/annotations_filtered/sYk8M_ZTNlY_filtered.json b/annotations_filtered/sYk8M_ZTNlY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c2f2072e29609c76cbea3be5377f15d96d0615f --- /dev/null +++ b/annotations_filtered/sYk8M_ZTNlY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.72], [6.0, 7.1], [8.0, 10.59], [12.0, 18.13], [20.0, 22.42], [23.0, 25.3], [27.0, 29.98], [31.0, 41.17], [44.0, 50.55], [51.0, 56.19], [56.0, 56.57], [60.0, 60.3], [68.0, 70.5], [71.0, 70.65], [75.0, 80.72], [83.0, 89.82], [95.0, 114.47], [119.0, 127.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 71.29, 93.76, 78.89, 87.19, 84.8, 86.27, 48.39, 52.05, 0.0, 0.0, 57.48, 0.0, 49.97, 57.81, 62.78, 47.62], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 64.24], ["ambient music", 9.29], ["theremin", 4.26]], null, null, null, null, null, [["music", 77.12], ["musical instrument", 3.43], ["theremin", 2.47]], null, null, [["music", 72.05], ["ambient music", 7.08], ["theremin", 3.59]]], "duration": [-0.28, 1.1, 2.59, 6.13, 2.42, 2.3, 2.98, 10.17, 6.55, 5.19, 0.57, 0.3, 2.5, -0.35, 5.72, 6.82, 19.47, 8.7]} \ No newline at end of file diff --git a/annotations_filtered/sZ0nA_2qOWc_filtered.json b/annotations_filtered/sZ0nA_2qOWc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..65dfeec8d4affb4401aabc7c7a1119896a842455 --- /dev/null +++ b/annotations_filtered/sZ0nA_2qOWc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.8], [6.0, 14.74], [18.0, 20.33], [21.0, 21.74], [24.0, 25.1], [27.0, 29.32], [32.0, 36.66], [40.0, 42.28], [43.0, 44.2], [45.0, 58.46], [59.0, 60.96], [64.0, 64.74], [68.0, 70.78], [71.0, 72.13], [73.0, 73.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 93.76, 74.76, 0.0, 0.0, 99.36, 100.0, 100.0, 0.0, 87.55, 0.0, 0.0, 82.25, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.8, 8.74, 2.33, 0.74, 1.1, 2.32, 4.66, 2.28, 1.2, 13.46, 1.96, 0.74, 2.78, 1.13, 0.77]} \ No newline at end of file diff --git a/annotations_filtered/sZ6t_-wKImw_filtered.json b/annotations_filtered/sZ6t_-wKImw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef47b4205deb614a0e665780b17c769742eb504f --- /dev/null +++ b/annotations_filtered/sZ6t_-wKImw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 11.58], [12.0, 12.77], [14.0, 29.49], [31.0, 31.18], [33.0, 33.15], [35.0, 35.13], [36.0, 35.73], [37.0, 38.69], [42.0, 42.31], [44.0, 44.46], [47.0, 47.12], [49.0, 56.05], [57.0, 58.23], [61.0, 62.01], [63.0, 63.27], [64.0, 64.3], [66.0, 66.29], [67.0, 68.94], [70.0, 73.33], [75.0, 76.86], [78.0, 83.25], [85.0, 85.19]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [82.97, 0.0, 43.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 32.45, 0.0], "audiomae_on_audioset": [null, null, [["frog", 41.29], ["radio", 12.07], ["speech", 9.01]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 47.03], ["speech", 20.91], ["theremin", 7.48]], null], "duration": [10.58, 0.77, 15.49, 0.18, 0.15, 0.13, -0.27, 1.69, 0.31, 0.46, 0.12, 7.05, 1.23, 1.01, 0.27, 0.3, 0.29, 1.94, 3.33, 1.86, 5.25, 0.19]} \ No newline at end of file diff --git a/annotations_filtered/sZTRUAFCzF4_filtered.json b/annotations_filtered/sZTRUAFCzF4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cfc89dea4b163733517460f2cd7f34339b71130c --- /dev/null +++ b/annotations_filtered/sZTRUAFCzF4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.23], [6.0, 6.62], [9.0, 9.48], [36.0, 35.82], [36.0, 36.91], [39.0, 39.87], [40.0, 41.0], [41.0, 42.01], [49.0, 50.26], [56.0, 67.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.39], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 38.75], ["speech", 28.94], ["fly, housefly", 5.93]]], "duration": [0.23, 0.62, 0.48, -0.18, 0.91, 0.87, 1.0, 1.01, 1.26, 11.1]} \ No newline at end of file diff --git a/annotations_filtered/sZU26D42s2M_filtered.json b/annotations_filtered/sZU26D42s2M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..efa01aee308b927050725eb457e49c44bd0e65cf --- /dev/null +++ b/annotations_filtered/sZU26D42s2M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.2], [8.0, 9.12], [10.0, 10.49], [14.0, 14.05], [15.0, 16.6], [18.0, 18.03], [19.0, 19.04], [20.0, 20.76], [24.0, 24.21], [27.0, 27.84], [28.0, 30.11], [32.0, 34.05], [38.0, 39.12], [43.0, 43.65], [47.0, 48.0], [65.0, 66.46], [73.0, 73.41], [88.0, 88.89], [99.0, 98.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [53.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.8, 48.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 35.03], ["wood", 13.42], ["dial tone", 7.29]], null, null, null, null, null, null, null], "duration": [3.2, 1.12, 0.49, 0.05, 1.6, 0.03, 0.04, 0.76, 0.21, 0.84, 2.11, 2.05, 1.12, 0.65, 1.0, 1.46, 0.41, 0.89, -0.21]} \ No newline at end of file diff --git a/annotations_filtered/sZazSFEHfg8_filtered.json b/annotations_filtered/sZazSFEHfg8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d81a993f1b453c7ef0b291d66492c74da35c8b7c --- /dev/null +++ b/annotations_filtered/sZazSFEHfg8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 20.66], [23.0, 23.65], [33.0, 38.53], [40.0, 40.61], [43.0, 48.3], [49.0, 49.6], [51.0, 51.85], [52.0, 53.03], [54.0, 54.72], [55.0, 66.31], [69.0, 69.08], [71.0, 71.04]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [38.56, 0.0, 32.24, 0.0, 32.53, 0.0, 0.0, 0.0, 0.0, 30.81, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 58.57], ["screaming", 9.22], ["boing", 4.28]], null, [["speech", 41.62], ["groan", 25.91], ["clip-clop", 7.66]], null, [["cattle, bovinae", 16.42], ["animal", 15.86], ["moo", 14.57]], null, null, null, null, [["speech", 69.1], ["animal", 8.77], ["grunt", 6.56]], null, null], "duration": [5.66, 0.65, 5.53, 0.61, 5.3, 0.6, 0.85, 1.03, 0.72, 11.31, 0.08, 0.04]} \ No newline at end of file diff --git a/annotations_filtered/s_7PfocHTmc_filtered.json b/annotations_filtered/s_7PfocHTmc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d3ed1916298c4c54b54d2da264f5595444ca5ec --- /dev/null +++ b/annotations_filtered/s_7PfocHTmc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.55], [16.0, 16.46], [25.0, 29.57], [30.0, 29.61], [30.0, 34.87], [37.0, 37.12], [37.0, 38.72], [41.0, 41.99], [44.0, 46.57], [51.0, 52.03], [55.0, 59.31], [62.0, 84.18], [86.0, 94.88], [96.0, 95.93], [97.0, 122.91], [127.0, 128.04], [130.0, 157.77]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 40.88, 0.0, 39.78, 0.0, 0.0, 0.0, 48.56, 0.0, 41.66, 47.39, 37.27, 0.0, 29.76, 0.0, 30.27], "audiomae_on_audioset": [null, null, [["music", 39.74], ["theremin", 38.01], ["electronic music", 2.86]], null, [["music", 32.99], ["speech", 19.0], ["theremin", 12.89]], null, null, null, [["music", 43.63], ["theremin", 20.99], ["hum", 6.1]], null, [["music", 73.02], ["didgeridoo", 3.94], ["synthesizer", 3.61]], [["music", 33.27], ["hum", 21.05], ["throbbing", 9.1]], [["music", 65.58], ["synthesizer", 6.02], ["musical instrument", 5.88]], null, [["music", 36.94], ["speech", 23.01], ["theremin", 8.91]], null, [["music", 63.46], ["theremin", 21.23], ["shout", 1.43]]], "duration": [0.55, 0.46, 4.57, -0.39, 4.87, 0.12, 1.72, 0.99, 2.57, 1.03, 4.31, 22.18, 8.88, -0.07, 25.91, 1.04, 27.77]} \ No newline at end of file diff --git a/annotations_filtered/s_CwatXdxUA_filtered.json b/annotations_filtered/s_CwatXdxUA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e458b16c6fa8be7fb10567e2770084112240f23 --- /dev/null +++ b/annotations_filtered/s_CwatXdxUA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.01], [9.0, 11.11], [13.0, 14.13], [15.0, 15.01], [17.0, 17.59], [20.0, 20.49], [21.0, 21.79], [22.0, 23.08], [25.0, 26.16], [27.0, 28.46], [30.0, 30.91], [31.0, 34.96], [36.0, 36.83], [38.0, 43.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [80.82, 99.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.44, 0.0, 33.48], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 28.09], ["throbbing", 8.74], ["mains hum", 8.27]]], "duration": [2.01, 2.11, 1.13, 0.01, 0.59, 0.49, 0.79, 1.08, 1.16, 1.46, 0.91, 3.96, 0.83, 5.56]} \ No newline at end of file diff --git a/annotations_filtered/s_PLAOcbbzI_filtered.json b/annotations_filtered/s_PLAOcbbzI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..008597f8cab46edde7451ec51b919b7f2a7abf05 --- /dev/null +++ b/annotations_filtered/s_PLAOcbbzI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.12], [8.0, 8.38], [9.0, 12.56], [14.0, 15.63], [17.0, 17.59], [22.0, 23.11], [24.0, 25.03], [26.0, 29.39], [37.0, 37.32], [41.0, 41.84], [44.0, 45.44]], "keep_status": [true, false, true, false, false, false, false, true, false, false, false], "silence_prob": [32.71, 0.0, 32.8, 0.0, 0.0, 0.0, 0.0, 41.58, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 43.33], ["gong", 12.3], ["percussion", 7.4]], null, [["gong", 25.98], ["speech", 16.1], ["music", 14.08]], null, null, null, null, [["speech", 40.35], ["music", 13.38], ["vehicle", 10.86]], null, null, null], "duration": [2.12, 0.38, 3.56, 1.63, 0.59, 1.11, 1.03, 3.39, 0.32, 0.84, 1.44]} \ No newline at end of file diff --git a/annotations_filtered/s_SM1Hly-uw_filtered.json b/annotations_filtered/s_SM1Hly-uw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd88242063c56af6813c66ec1701c5cb5c2c8503 --- /dev/null +++ b/annotations_filtered/s_SM1Hly-uw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.82], [4.0, 6.98], [9.0, 10.17], [11.0, 14.3], [16.0, 16.97], [20.0, 22.13], [23.0, 23.31], [25.0, 25.79], [29.0, 36.51], [38.0, 39.18], [47.0, 47.85], [55.0, 56.27], [60.0, 69.33], [73.0, 74.29], [75.0, 78.21], [80.0, 83.84], [85.0, 86.49], [88.0, 90.83], [93.0, 105.39], [110.0, 112.08], [114.0, 115.91], [122.0, 123.35], [124.0, 128.02], [138.0, 139.97], [146.0, 149.17], [151.0, 154.45], [159.0, 162.57], [164.0, 165.25], [167.0, 168.79], [170.0, 171.14]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 73.51, 0.0, 55.89, 0.0, 63.53, 0.0, 0.0, 36.8, 0.0, 0.0, 0.0, 40.62, 0.0, 60.98, 56.78, 0.0, 58.3, 73.21, 92.64, 0.0, 0.0, 62.58, 0.0, 87.74, 98.01, 95.09, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 22.58], ["speech", 16.64], ["mains hum", 8.89]], null, null, null, [["didgeridoo", 23.69], ["music", 17.39], ["hum", 10.69]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.82, 2.98, 1.17, 3.3, 0.97, 2.13, 0.31, 0.79, 7.51, 1.18, 0.85, 1.27, 9.33, 1.29, 3.21, 3.84, 1.49, 2.83, 12.39, 2.08, 1.91, 1.35, 4.02, 1.97, 3.17, 3.45, 3.57, 1.25, 1.79, 1.14]} \ No newline at end of file diff --git a/annotations_filtered/s_cz5JFWpzE_filtered.json b/annotations_filtered/s_cz5JFWpzE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f12b4d601ed70d2bfa13021182aa460ad84d6d4 --- /dev/null +++ b/annotations_filtered/s_cz5JFWpzE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 26.77], [28.0, 28.97], [30.0, 32.16], [34.0, 34.33], [36.0, 36.61], [37.0, 37.88], [41.0, 41.39], [43.0, 45.77], [49.0, 49.05], [50.0, 50.8], [52.0, 53.06], [60.0, 60.12], [61.0, 62.41], [64.0, 65.01], [66.0, 66.7], [69.0, 70.41], [72.0, 72.17], [76.0, 79.02], [83.0, 84.06], [86.0, 106.74], [108.0, 108.45], [110.0, 110.42], [120.0, 120.07], [123.0, 125.63], [132.0, 133.52], [136.0, 137.57], [138.0, 139.41], [140.0, 142.47], [146.0, 148.44], [149.0, 150.13]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 44.81, 0.0, 0.0, 0.0, 0.0, 48.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.15, 0.0, 30.76, 0.0, 0.0, 0.0, 35.74, 0.0, 0.0, 0.0, 54.83, 53.78, 0.0], "audiomae_on_audioset": [null, null, [["hum", 34.61], ["music", 27.68], ["speech", 10.32]], null, null, null, null, [["hum", 30.35], ["music", 24.98], ["ambient music", 7.2]], null, null, null, null, null, null, null, null, null, [["music", 59.52], ["electronic music", 10.06], ["ambient music", 3.92]], null, [["hum", 41.91], ["music", 20.05], ["mains hum", 17.96]], null, null, null, [["hum", 31.68], ["music", 30.45], ["throbbing", 19.36]], null, null, null, null, null, null], "duration": [0.77, 0.97, 2.16, 0.33, 0.61, 0.88, 0.39, 2.77, 0.05, 0.8, 1.06, 0.12, 1.41, 1.01, 0.7, 1.41, 0.17, 3.02, 1.06, 20.74, 0.45, 0.42, 0.07, 2.63, 1.52, 1.57, 1.41, 2.47, 2.44, 1.13]} \ No newline at end of file diff --git a/annotations_filtered/sa2TE--j394_filtered.json b/annotations_filtered/sa2TE--j394_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a105916ad969a355c576de78ac38191637481138 --- /dev/null +++ b/annotations_filtered/sa2TE--j394_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.11], [35.0, 35.72], [54.0, 55.73], [68.0, 68.55], [75.0, 75.12], [76.0, 76.05], [77.0, 77.77], [81.0, 87.54], [100.0, 101.66], [123.0, 128.33], [135.0, 135.65], [136.0, 137.79]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.48, 0.0, 39.31, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 36.94], ["applause", 23.36], ["tap", 6.79]], null, [["speech", 75.14], ["applause", 11.34], ["tap", 1.52]], null, null], "duration": [0.11, 0.72, 1.73, 0.55, 0.12, 0.05, 0.77, 6.54, 1.66, 5.33, 0.65, 1.79]} \ No newline at end of file diff --git a/annotations_filtered/sa9AzlyS9h0_filtered.json b/annotations_filtered/sa9AzlyS9h0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..562ab1153c1104a94d5871c87fc3f165be47ecbc --- /dev/null +++ b/annotations_filtered/sa9AzlyS9h0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 8.19], [9.0, 9.26], [11.0, 12.01], [12.0, 12.9], [14.0, 16.34], [17.0, 47.7], [49.0, 49.5], [53.0, 55.31], [57.0, 57.65], [59.0, 65.92], [67.0, 67.66], [71.0, 72.3], [74.0, 76.32], [79.0, 79.73], [82.0, 86.37], [89.0, 88.74], [92.0, 102.91], [104.0, 104.65], [105.0, 109.21], [112.0, 113.61], [115.0, 116.33], [116.0, 120.63], [125.0, 125.41], [129.0, 129.2], [131.0, 132.07], [136.0, 139.63], [142.0, 142.28], [144.0, 157.44], [159.0, 161.1]], "keep_status": [false, false, false, false, false, false, false, true, false, true, false, false, true, false, true, false, false, false, true, false, false, true, false, false, false, false, false, true, true], "silence_prob": [29.97, 0.0, 0.0, 0.0, 29.51, 0.0, 0.0, 29.32, 0.0, 30.29, 0.0, 0.0, 37.64, 0.0, 29.14, 0.0, 30.77, 0.0, 29.09, 0.0, 0.0, 29.89, 0.0, 0.0, 0.0, 29.27, 0.0, 29.73, 43.15], "audiomae_on_audioset": [[["speech", 65.47], ["radio", 3.79], ["buzz", 3.17]], null, null, null, [["speech", 62.69], ["buzzer", 5.94], ["alarm", 3.63]], null, null, [["cacophony", 19.9], ["speech", 16.62], ["explosion", 10.9]], null, [["hum", 17.85], ["mains hum", 12.32], ["sound effect", 6.36]], null, null, [["music", 18.75], ["noise", 16.84], ["hum", 11.45]], null, [["zipper (clothing)", 17.5], ["sound effect", 11.84], ["speech", 9.27]], null, [["speech", 86.95], ["music", 2.9], ["didgeridoo", 2.3]], null, [["music", 18.86], ["speech", 12.6], ["hum", 9.21]], null, null, [["speech", 54.8], ["sound effect", 5.52], ["music", 5.34]], null, null, null, [["speech", 43.02], ["music", 26.04], ["white noise", 3.33]], null, [["hum", 14.8], ["speech", 11.11], ["mains hum", 6.34]], [["hum", 30.92], ["mains hum", 18.91], ["music", 11.85]]], "duration": [6.19, 0.26, 1.01, 0.9, 2.34, 30.7, 0.5, 2.31, 0.65, 6.92, 0.66, 1.3, 2.32, 0.73, 4.37, -0.26, 10.91, 0.65, 4.21, 1.61, 1.33, 4.63, 0.41, 0.2, 1.07, 3.63, 0.28, 13.44, 2.1]} \ No newline at end of file diff --git a/annotations_filtered/saBoM7O_imM_filtered.json b/annotations_filtered/saBoM7O_imM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7969b6f21cec943b12e7cddf84fad8c5f54e7df3 --- /dev/null +++ b/annotations_filtered/saBoM7O_imM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.4], [4.0, 5.02], [23.0, 23.46], [31.0, 32.12], [33.0, 33.56], [42.0, 42.84], [45.0, 45.87], [46.0, 46.48], [47.0, 47.31], [55.0, 56.0], [58.0, 57.74], [61.0, 64.71], [69.0, 70.95], [72.0, 73.14], [74.0, 74.93], [75.0, 77.75], [78.0, 79.69], [81.0, 81.84], [88.0, 89.21], [95.0, 96.92], [97.0, 98.09], [100.0, 106.12], [107.0, 107.49], [110.0, 110.35], [111.0, 116.95], [122.0, 124.33], [125.0, 125.93], [127.0, 128.19], [129.0, 130.92], [137.0, 137.13], [138.0, 140.86], [142.0, 143.43], [144.0, 145.96], [149.0, 150.6], [152.0, 154.16], [156.0, 156.3], [159.0, 159.73], [160.0, 161.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.91, 0.0, 0.0, 0.0, 79.07, 0.0, 0.0, 0.0, 0.0, 0.0, 31.63, 0.0, 0.0, 34.1, 58.22, 0.0, 0.0, 0.0, 0.0, 34.56, 0.0, 0.0, 0.0, 55.74, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 31.67], ["insect", 18.61], ["speech", 6.67]], null, null, [["fart", 35.52], ["fly, housefly", 26.39], ["mosquito", 14.42]], null, null, null, null, null, [["speech", 12.82], ["fart", 10.03], ["animal", 7.8]], null, null, null, null, null, null, null], "duration": [0.4, 1.02, 0.46, 1.12, 0.56, 0.84, 0.87, 0.48, 0.31, 1.0, -0.26, 3.71, 1.95, 1.14, 0.93, 2.75, 1.69, 0.84, 1.21, 1.92, 1.09, 6.12, 0.49, 0.35, 5.95, 2.33, 0.93, 1.19, 1.92, 0.13, 2.86, 1.43, 1.96, 1.6, 2.16, 0.3, 0.73, 1.94]} \ No newline at end of file diff --git a/annotations_filtered/saTBYjmhcok_filtered.json b/annotations_filtered/saTBYjmhcok_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c712c6fe07c25fa9e56f7bc040c47fbf6a274260 --- /dev/null +++ b/annotations_filtered/saTBYjmhcok_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.32], [14.0, 16.04], [17.0, 17.44], [19.0, 21.42], [22.0, 22.2], [23.0, 24.07], [25.0, 26.11], [28.0, 31.73], [33.0, 33.29], [34.0, 42.11], [43.0, 46.62], [51.0, 53.54], [54.0, 56.56], [60.0, 62.75], [64.0, 65.11], [65.0, 115.33], [118.0, 119.62], [120.0, 121.44], [123.0, 131.45], [133.0, 134.76], [137.0, 137.89], [146.0, 146.79], [149.0, 154.3]], "keep_status": [false, true, false, false, false, false, false, true, false, true, true, true, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [44.09, 48.78, 0.0, 46.43, 0.0, 0.0, 0.0, 47.23, 0.0, 34.79, 44.43, 36.18, 35.52, 42.72, 0.0, 0.0, 0.0, 0.0, 32.37, 0.0, 0.0, 0.0, 47.62], "audiomae_on_audioset": [[["hum", 39.81], ["mains hum", 29.72], ["music", 5.38]], [["music", 37.83], ["speech", 19.52], ["hum", 11.97]], null, [["hum", 33.23], ["mains hum", 28.69], ["music", 9.84]], null, null, null, [["music", 60.08], ["hum", 5.31], ["musical instrument", 4.36]], null, [["music", 29.23], ["hum", 21.15], ["mains hum", 10.02]], [["music", 25.62], ["hum", 19.1], ["mains hum", 11.15]], [["whale vocalization", 16.69], ["music", 7.29], ["hum", 6.14]], [["hum", 36.58], ["music", 21.34], ["throbbing", 10.98]], [["music", 31.94], ["hum", 13.26], ["whale vocalization", 7.97]], null, null, null, null, [["music", 51.17], ["hum", 21.68], ["mains hum", 10.09]], null, null, null, [["mains hum", 47.34], ["hum", 34.8], ["music", 5.13]]], "duration": [2.32, 2.04, 0.44, 2.42, 0.2, 1.07, 1.11, 3.73, 0.29, 8.11, 3.62, 2.54, 2.56, 2.75, 1.11, 50.33, 1.62, 1.44, 8.45, 1.76, 0.89, 0.79, 5.3]} \ No newline at end of file diff --git a/annotations_filtered/sallI5PomoY_filtered.json b/annotations_filtered/sallI5PomoY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..999ca6d3673d744281cb98447e8dfffaecf94222 --- /dev/null +++ b/annotations_filtered/sallI5PomoY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 8.72], [9.0, 14.12], [14.0, 15.58], [18.0, 17.88], [19.0, 19.36], [46.0, 47.39], [50.0, 52.22], [55.0, 55.31], [59.0, 58.68]], "keep_status": [false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.24, 0.0, 0.0, 0.0, 0.0, 34.74, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 60.03], ["hum", 6.03], ["inside, small room", 2.26]], null, null, null, null, [["speech", 55.53], ["fart", 14.83], ["cough", 4.25]], null, null], "duration": [-0.28, 5.12, 1.58, -0.12, 0.36, 1.39, 2.22, 0.31, -0.32]} \ No newline at end of file diff --git a/annotations_filtered/sb8IU6c5obc_filtered.json b/annotations_filtered/sb8IU6c5obc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02c1843dc212f4396cfde53628c833eea42cd717 --- /dev/null +++ b/annotations_filtered/sb8IU6c5obc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.2], [5.0, 5.05], [28.0, 28.75], [33.0, 33.27], [36.0, 36.49], [38.0, 37.98], [42.0, 42.18], [42.0, 42.4], [48.0, 48.02], [49.0, 48.81], [56.0, 56.67], [90.0, 90.32], [91.0, 92.94], [93.0, 94.88], [98.0, 98.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.2, 0.05, 0.75, 0.27, 0.49, -0.02, 0.18, 0.4, 0.02, -0.19, 0.67, 0.32, 1.94, 1.88, 0.32]} \ No newline at end of file diff --git a/annotations_filtered/sbIfW_Pf9vk_filtered.json b/annotations_filtered/sbIfW_Pf9vk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ba82f086490535c75c5b9333925424914e623c0 --- /dev/null +++ b/annotations_filtered/sbIfW_Pf9vk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.3], [7.0, 7.11], [17.0, 17.71], [19.0, 19.45], [20.0, 20.92], [21.0, 21.95], [23.0, 23.67], [25.0, 25.79], [29.0, 30.25], [32.0, 33.67], [38.0, 39.12], [41.0, 42.85], [49.0, 50.65], [53.0, 54.9], [57.0, 57.65], [61.0, 63.66], [67.0, 68.59], [69.0, 71.07], [80.0, 81.16], [90.0, 91.45], [99.0, 102.63], [103.0, 104.09], [111.0, 111.21], [114.0, 115.62], [116.0, 117.86], [121.0, 121.46], [124.0, 126.18], [127.0, 128.34], [129.0, 131.5], [133.0, 138.77], [145.0, 146.06], [147.0, 148.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.94, 0.0, 90.95, 0.0, 0.0, 34.36, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 90.25, 89.9, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 23.87], ["moo", 23.28], ["creak", 13.87]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.3, 0.11, 0.71, 0.45, 0.92, 0.95, 0.67, 0.79, 1.25, 1.67, 1.12, 1.85, 1.65, 1.9, 0.65, 2.66, 1.59, 2.07, 1.16, 1.45, 3.63, 1.09, 0.21, 1.62, 1.86, 0.46, 2.18, 1.34, 2.5, 5.77, 1.06, 1.37]} \ No newline at end of file diff --git a/annotations_filtered/sbJ89LFheTs_filtered.json b/annotations_filtered/sbJ89LFheTs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc4b75d9fb83ca91aa6345a56b597f4cf9f6bf0d --- /dev/null +++ b/annotations_filtered/sbJ89LFheTs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.32], [5.0, 5.05], [5.0, 5.54], [7.0, 13.26], [14.0, 14.54], [19.0, 18.84], [21.0, 22.01], [25.0, 25.96], [28.0, 28.88], [30.0, 38.6], [40.0, 50.58], [51.0, 54.21], [56.0, 59.54], [61.0, 65.04], [67.0, 67.15], [71.0, 72.47], [75.0, 75.64], [77.0, 78.66], [81.0, 82.32], [84.0, 86.59], [87.0, 93.11], [93.0, 99.22], [100.0, 101.12], [103.0, 103.54]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [51.18, 0.0, 0.0, 45.56, 0.0, 0.0, 0.0, 0.0, 0.0, 70.72, 58.72, 59.15, 44.32, 70.02, 0.0, 0.0, 0.0, 0.0, 0.0, 38.7, 35.12, 36.78, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["sidetone", 26.51], ["speech", 25.8], ["music", 8.37]], null, null, null, null, null, null, null, null, [["speech", 51.29], ["radio", 13.66], ["music", 13.1]], null, null, null, null, null, null, [["music", 18.79], ["noise", 12.63], ["theremin", 8.14]], [["music", 45.93], ["speech", 9.98], ["radio", 9.82]], [["theremin", 42.63], ["music", 22.93], ["speech", 17.49]], null, null], "duration": [2.32, 0.05, 0.54, 6.26, 0.54, -0.16, 1.01, 0.96, 0.88, 8.6, 10.58, 3.21, 3.54, 4.04, 0.15, 1.47, 0.64, 1.66, 1.32, 2.59, 6.11, 6.22, 1.12, 0.54]} \ No newline at end of file diff --git a/annotations_filtered/sbZB1drlKWI_filtered.json b/annotations_filtered/sbZB1drlKWI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..57368a15cdb4ae801b6c4d426846fdf73749fc6d --- /dev/null +++ b/annotations_filtered/sbZB1drlKWI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.65], [11.0, 11.65], [12.0, 13.09], [15.0, 18.72], [20.0, 26.74], [32.0, 33.1], [36.0, 36.15], [37.0, 40.37], [42.0, 50.13], [51.0, 75.91], [76.0, 80.28], [81.0, 81.6]], "keep_status": [true, false, false, true, true, false, false, false, true, true, true, false], "silence_prob": [35.28, 0.0, 0.0, 36.93, 38.26, 0.0, 0.0, 30.48, 34.17, 31.92, 32.13, 0.0], "audiomae_on_audioset": [[["music", 33.84], ["boing", 7.07], ["didgeridoo", 5.53]], null, null, [["music", 29.53], ["speech", 15.89], ["didgeridoo", 8.57]], [["music", 30.67], ["clip-clop", 10.88], ["horse", 7.63]], null, null, [["cattle, bovinae", 45.11], ["moo", 29.96], ["livestock, farm animals, working animals", 23.44]], [["speech", 36.73], ["music", 16.69], ["horse", 13.72]], [["speech", 20.83], ["music", 14.55], ["clip-clop", 11.7]], [["noise", 31.11], ["hum", 10.77], ["sidetone", 9.16]], null], "duration": [2.65, 0.65, 1.09, 3.72, 6.74, 1.1, 0.15, 3.37, 8.13, 24.91, 4.28, 0.6]} \ No newline at end of file diff --git a/annotations_filtered/sbz_Xq2aEQQ_filtered.json b/annotations_filtered/sbz_Xq2aEQQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c9da98aa172ce8d51ec3961f5bc5e95a702832f4 --- /dev/null +++ b/annotations_filtered/sbz_Xq2aEQQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.13], [9.0, 10.05], [16.0, 17.29], [21.0, 21.24], [23.0, 23.21], [23.0, 23.94], [29.0, 29.3], [30.0, 30.97], [33.0, 34.77], [36.0, 36.22], [37.0, 37.96], [47.0, 47.01], [51.0, 51.38], [52.0, 52.59], [53.0, 53.55], [54.0, 55.19], [56.0, 57.57], [59.0, 59.61], [60.0, 67.37], [69.0, 70.06], [72.0, 72.82], [74.0, 74.88], [75.0, 76.05], [77.0, 77.97], [79.0, 80.57], [83.0, 83.76], [86.0, 86.81], [89.0, 90.04], [92.0, 92.08], [93.0, 93.33], [94.0, 95.32], [98.0, 98.76], [101.0, 101.46], [102.0, 103.57], [106.0, 106.42], [110.0, 109.97], [111.0, 112.73], [113.0, 114.07], [115.0, 118.08], [121.0, 121.69], [123.0, 124.16], [125.0, 126.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.09, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.13, 1.05, 1.29, 0.24, 0.21, 0.94, 0.3, 0.97, 1.77, 0.22, 0.96, 0.01, 0.38, 0.59, 0.55, 1.19, 1.57, 0.61, 7.37, 1.06, 0.82, 0.88, 1.05, 0.97, 1.57, 0.76, 0.81, 1.04, 0.08, 0.33, 1.32, 0.76, 0.46, 1.57, 0.42, -0.03, 1.73, 1.07, 3.08, 0.69, 1.16, 1.76]} \ No newline at end of file diff --git a/annotations_filtered/scEuS9-TozQ_filtered.json b/annotations_filtered/scEuS9-TozQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ab3fbb68578a6ea74765cc24d2095b8fe77eadf9 --- /dev/null +++ b/annotations_filtered/scEuS9-TozQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.74]], "keep_status": [true], "silence_prob": [47.86], "audiomae_on_audioset": [[["music", 14.3], ["eruption", 12.17], ["hum", 10.97]]], "duration": [2.74]} \ No newline at end of file diff --git a/annotations_filtered/sceJ1R4JzMU_filtered.json b/annotations_filtered/sceJ1R4JzMU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60c5eae15c6e3f8576ef72820842b888a361d408 --- /dev/null +++ b/annotations_filtered/sceJ1R4JzMU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.29], [3.0, 3.82], [8.0, 8.55], [9.0, 9.68], [11.0, 12.28], [16.0, 17.86], [19.0, 20.22], [21.0, 21.44], [22.0, 23.5], [25.0, 25.29], [27.0, 27.11], [31.0, 32.16], [36.0, 37.22], [38.0, 40.17], [41.0, 41.47], [42.0, 42.03], [42.0, 42.9], [43.0, 44.46], [45.0, 46.72], [47.0, 48.46], [50.0, 52.05], [53.0, 54.46], [55.0, 56.61], [57.0, 57.48], [60.0, 60.37], [61.0, 61.92], [63.0, 63.68], [66.0, 65.84], [67.0, 69.3], [71.0, 74.31], [75.0, 76.87], [77.0, 78.24], [80.0, 83.19], [86.0, 91.56], [94.0, 95.55], [97.0, 98.17], [99.0, 105.27], [108.0, 112.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.71, 85.54, 0.0, 0.0, 76.37, 92.15, 0.0, 0.0, 92.97, 94.95], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.29, 0.82, 0.55, 0.68, 1.28, 1.86, 1.22, 0.44, 1.5, 0.29, 0.11, 1.16, 1.22, 2.17, 0.47, 0.03, 0.9, 1.46, 1.72, 1.46, 2.05, 1.46, 1.61, 0.48, 0.37, 0.92, 0.68, -0.16, 2.3, 3.31, 1.87, 1.24, 3.19, 5.56, 1.55, 1.17, 6.27, 4.85]} \ No newline at end of file diff --git a/annotations_filtered/scrKz6PN92g_filtered.json b/annotations_filtered/scrKz6PN92g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..37eddeea67410538eb19ecb4b6411eb51ddac85e --- /dev/null +++ b/annotations_filtered/scrKz6PN92g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.0], [13.0, 21.59], [22.0, 27.41], [28.0, 32.8], [37.0, 61.94], [64.0, 64.88]], "keep_status": [false, false, false, false, false, false], "silence_prob": [99.4, 96.29, 96.54, 83.7, 59.24, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [3.0, 8.59, 5.41, 4.8, 24.94, 0.88]} \ No newline at end of file diff --git a/annotations_filtered/sd2pBde6gkw_filtered.json b/annotations_filtered/sd2pBde6gkw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ae7251de4718c02ac37cca9d01a6f0b297879b3 --- /dev/null +++ b/annotations_filtered/sd2pBde6gkw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 18.79], [19.0, 19.77], [20.0, 24.02], [28.0, 29.02], [31.0, 31.06], [38.0, 39.31], [45.0, 45.96], [47.0, 49.11], [50.0, 51.58], [53.0, 54.43], [55.0, 55.61], [57.0, 58.62], [60.0, 61.11], [62.0, 63.12], [65.0, 67.66], [68.0, 69.2], [69.0, 72.5], [79.0, 80.6], [83.0, 83.84], [85.0, 86.36], [88.0, 88.21], [94.0, 95.15], [108.0, 109.73], [110.0, 112.33], [115.0, 114.79], [118.0, 118.35], [122.0, 122.4], [126.0, 125.98], [128.0, 129.42], [132.0, 132.51], [134.0, 134.5], [135.0, 137.64], [140.0, 142.67], [145.0, 146.33], [148.0, 148.78], [149.0, 150.55], [152.0, 152.56], [153.0, 154.03], [160.0, 160.76], [162.0, 163.38], [164.0, 165.15], [169.0, 173.82], [174.0, 179.91], [181.0, 188.37], [191.0, 191.44], [194.0, 195.13], [197.0, 197.33], [198.0, 219.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [60.79, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 66.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 96.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.11, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 99.96, 62.27, 0.0, 0.0, 0.0, 62.58], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [12.79, 0.77, 4.02, 1.02, 0.06, 1.31, 0.96, 2.11, 1.58, 1.43, 0.61, 1.62, 1.11, 1.12, 2.66, 1.2, 3.5, 1.6, 0.84, 1.36, 0.21, 1.15, 1.73, 2.33, -0.21, 0.35, 0.4, -0.02, 1.42, 0.51, 0.5, 2.64, 2.67, 1.33, 0.78, 1.55, 0.56, 1.03, 0.76, 1.38, 1.15, 4.82, 5.91, 7.37, 0.44, 1.13, 0.33, 21.96]} \ No newline at end of file diff --git a/annotations_filtered/sdNPmpfgOMw_filtered.json b/annotations_filtered/sdNPmpfgOMw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..174cd73b8d573182021c58cf90630a58633c4088 --- /dev/null +++ b/annotations_filtered/sdNPmpfgOMw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.24], [5.0, 5.58], [8.0, 8.78], [11.0, 16.58], [20.0, 21.02], [23.0, 22.99], [28.0, 28.76], [32.0, 33.34], [36.0, 35.87], [38.0, 38.91], [50.0, 51.66], [59.0, 60.84], [66.0, 66.38], [72.0, 72.42], [82.0, 85.77], [88.0, 88.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 36.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.0, 0.0], "audiomae_on_audioset": [null, null, null, [["boing", 47.86], ["speech", 15.37], ["music", 13.52]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.24, 0.58, 0.78, 5.58, 1.02, -0.01, 0.76, 1.34, -0.13, 0.91, 1.66, 1.84, 0.38, 0.42, 3.77, 0.11]} \ No newline at end of file diff --git a/annotations_filtered/sd_I5ez3jwg_filtered.json b/annotations_filtered/sd_I5ez3jwg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dc0aaa07abe55f540a45cc0bc6b3fe00680c1442 --- /dev/null +++ b/annotations_filtered/sd_I5ez3jwg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.53], [9.0, 10.1], [11.0, 91.74], [92.0, 117.56]], "keep_status": [false, false, false, false], "silence_prob": [99.31, 0.0, 0.0, 36.32], "audiomae_on_audioset": [null, null, null, [["hum", 38.37], ["mains hum", 23.61], ["music", 15.6]]], "duration": [4.53, 1.1, 80.74, 25.56]} \ No newline at end of file diff --git a/annotations_filtered/sdb8G26294A_filtered.json b/annotations_filtered/sdb8G26294A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8f3b895e1e6e9b1ed6abdb8c4b978eba9cab1ebd --- /dev/null +++ b/annotations_filtered/sdb8G26294A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.47], [5.0, 5.7], [9.0, 9.91], [16.0, 23.08], [31.0, 31.21], [36.0, 35.85], [40.0, 48.12], [56.0, 60.83], [62.0, 64.02], [65.0, 68.18], [68.0, 69.79], [71.0, 71.91], [72.0, 72.77], [74.0, 75.66], [79.0, 80.18], [81.0, 82.32], [87.0, 86.81], [87.0, 87.81], [88.0, 89.7], [92.0, 97.5], [98.0, 99.76], [103.0, 105.68], [112.0, 112.65], [114.0, 115.86], [119.0, 119.53], [122.0, 124.16], [126.0, 125.95], [128.0, 128.8], [129.0, 130.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 41.66, 0.0, 0.0, 41.14, 31.88, 70.72, 82.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.44, 0.0, 85.17, 0.0, 0.0, 0.0, 87.37, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 63.81], ["musical instrument", 5.63], ["synthesizer", 3.28]], null, null, [["music", 50.62], ["didgeridoo", 38.64], ["musical instrument", 2.71]], [["music", 38.92], ["speech", 32.35], ["musical instrument", 4.48]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.47, 0.7, 0.91, 7.08, 0.21, -0.15, 8.12, 4.83, 2.02, 3.18, 1.79, 0.91, 0.77, 1.66, 1.18, 1.32, -0.19, 0.81, 1.7, 5.5, 1.76, 2.68, 0.65, 1.86, 0.53, 2.16, -0.05, 0.8, 1.79]} \ No newline at end of file diff --git a/annotations_filtered/sdc5bkFd2X4_filtered.json b/annotations_filtered/sdc5bkFd2X4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..807ba77bea5ab44a2edf6f495f74306ed2b05fee --- /dev/null +++ b/annotations_filtered/sdc5bkFd2X4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.3], [14.0, 13.96], [20.0, 20.07], [50.0, 50.53], [51.0, 51.87], [53.0, 54.03]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.3, -0.04, 0.07, 0.53, 0.87, 1.03]} \ No newline at end of file diff --git a/annotations_filtered/sdea5Iq5D_U_filtered.json b/annotations_filtered/sdea5Iq5D_U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ca2fc8a1cf5c0020716b1e8c5c1941ff3166c94 --- /dev/null +++ b/annotations_filtered/sdea5Iq5D_U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 26.94], [27.0, 44.24], [45.0, 46.38], [49.0, 50.18], [53.0, 54.99], [58.0, 58.41], [59.0, 60.88], [61.0, 62.18], [63.0, 74.8], [75.0, 135.63], [136.0, 142.4], [143.0, 144.88], [147.0, 176.22], [179.0, 181.08], [182.0, 210.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 62.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.33, 0.0, 78.72, 0.0, 66.88, 92.64, 42.65], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 68.41], ["speech", 12.86], ["groan", 1.87]]], "duration": [-0.06, 17.24, 1.38, 1.18, 1.99, 0.41, 1.88, 1.18, 11.8, 60.63, 6.4, 1.88, 29.22, 2.08, 28.19]} \ No newline at end of file diff --git a/annotations_filtered/sdkgpg4Plxo_filtered.json b/annotations_filtered/sdkgpg4Plxo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c33aa398b25dafa8b94a86c59ced262b2c31db6 --- /dev/null +++ b/annotations_filtered/sdkgpg4Plxo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 16.07], [16.0, 19.21], [20.0, 21.12], [22.0, 24.88], [26.0, 27.9], [29.0, 32.29], [33.0, 35.83], [41.0, 45.33], [47.0, 52.78], [54.0, 58.6], [62.0, 62.87], [65.0, 65.69], [67.0, 75.14], [76.0, 93.07], [96.0, 102.22], [103.0, 108.9], [110.0, 112.35]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [69.34, 40.33, 0.0, 98.51, 0.0, 73.36, 100.0, 87.74, 77.7, 99.87, 0.0, 0.0, 99.98, 99.82, 98.8, 99.98, 79.94], "audiomae_on_audioset": [null, [["speech", 46.56], ["sidetone", 7.06], ["animal", 4.47]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.07, 3.21, 1.12, 2.88, 1.9, 3.29, 2.83, 4.33, 5.78, 4.6, 0.87, 0.69, 8.14, 17.07, 6.22, 5.9, 2.35]} \ No newline at end of file diff --git a/annotations_filtered/sdtIgE33BvQ_filtered.json b/annotations_filtered/sdtIgE33BvQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d77ece7fe6482f6addf7c1a4e25e11ddca319815 --- /dev/null +++ b/annotations_filtered/sdtIgE33BvQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.21], [4.0, 4.99], [12.0, 12.53], [25.0, 25.1], [27.0, 28.59], [31.0, 33.18], [34.0, 35.01], [39.0, 44.22], [54.0, 54.13], [55.0, 54.97]], "keep_status": [false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 34.31, 0.0, 30.69, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 42.45], ["speech", 16.82], ["musical instrument", 6.42]], null, [["music", 44.21], ["speech", 25.9], ["musical instrument", 5.31]], null, null], "duration": [1.21, 0.99, 0.53, 0.1, 1.59, 2.18, 1.01, 5.22, 0.13, -0.03]} \ No newline at end of file diff --git a/annotations_filtered/sdvrA5qnZo4_filtered.json b/annotations_filtered/sdvrA5qnZo4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4a9f64f36def3cc73c49a0ce2c53c3c7afeb9d62 --- /dev/null +++ b/annotations_filtered/sdvrA5qnZo4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.02], [16.0, 16.75], [22.0, 26.91], [29.0, 29.64], [35.0, 42.79], [50.0, 64.57], [68.0, 68.93], [76.0, 76.08], [84.0, 84.25], [89.0, 89.63], [99.0, 101.9], [106.0, 107.16], [109.0, 109.39], [112.0, 112.6], [121.0, 130.92]], "keep_status": [false, false, true, false, true, true, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 46.05, 0.0, 31.19, 32.66, 0.0, 0.0, 0.0, 0.0, 30.43, 0.0, 0.0, 0.0, 93.45], "audiomae_on_audioset": [null, null, [["music", 34.61], ["bass guitar", 12.01], ["guitar", 11.84]], null, [["livestock, farm animals, working animals", 27.75], ["speech", 18.64], ["cattle, bovinae", 18.33]], [["music", 33.54], ["speech", 27.41], ["burst, pop", 1.92]], null, null, null, null, [["speech", 47.76], ["music", 10.78], ["crowd", 3.85]], null, null, null, null], "duration": [1.02, 0.75, 4.91, 0.64, 7.79, 14.57, 0.93, 0.08, 0.25, 0.63, 2.9, 1.16, 0.39, 0.6, 9.92]} \ No newline at end of file diff --git a/annotations_filtered/sdwghUH-K14_filtered.json b/annotations_filtered/sdwghUH-K14_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..35333ac8a4d994eeeec0cf105c644425d519d49c --- /dev/null +++ b/annotations_filtered/sdwghUH-K14_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.26], [10.0, 12.99], [20.0, 21.07], [28.0, 32.71], [34.0, 42.67], [46.0, 48.81], [54.0, 58.53], [60.0, 61.99], [62.0, 63.02], [75.0, 107.57], [120.0, 120.83], [122.0, 123.26]], "keep_status": [false, false, false, false, true, true, true, false, false, false, false, false], "silence_prob": [58.13, 90.78, 0.0, 57.81, 37.71, 43.43, 42.55, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 40.37], ["music", 8.78], ["explosion", 7.97]], [["hum", 32.59], ["music", 16.83], ["mains hum", 15.16]], [["music", 24.69], ["speech", 23.87], ["hum", 14.94]], null, null, null, null, null], "duration": [5.26, 2.99, 1.07, 4.71, 8.67, 2.81, 4.53, 1.99, 1.02, 32.57, 0.83, 1.26]} \ No newline at end of file diff --git a/annotations_filtered/seMHoTTskQc_filtered.json b/annotations_filtered/seMHoTTskQc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9cb4862e97400ff7944952b066644b466151cdd --- /dev/null +++ b/annotations_filtered/seMHoTTskQc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 25.95], [27.0, 27.3], [33.0, 33.98], [35.0, 35.33], [37.0, 37.83], [41.0, 41.88], [43.0, 48.07], [49.0, 54.28], [57.0, 57.16], [64.0, 64.96], [68.0, 70.66], [90.0, 91.71], [94.0, 94.95], [96.0, 100.33], [101.0, 102.44]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [34.24, 0.0, 0.0, 0.0, 0.0, 0.0, 48.31, 37.52, 0.0, 0.0, 29.12, 0.0, 0.0, 33.32, 0.0], "audiomae_on_audioset": [[["speech", 43.61], ["thunk", 18.85], ["music", 6.03]], null, null, null, null, null, [["speech", 72.27], ["fart", 2.88], ["hum", 2.01]], [["speech", 78.24], ["rowboat, canoe, kayak", 3.04], ["gurgling", 2.36]], null, null, [["fart", 20.43], ["speech", 8.59], ["groan", 7.22]], null, null, [["screaming", 16.58], ["thunk", 8.01], ["fart", 7.73]], null], "duration": [6.95, 0.3, 0.98, 0.33, 0.83, 0.88, 5.07, 5.28, 0.16, 0.96, 2.66, 1.71, 0.95, 4.33, 1.44]} \ No newline at end of file diff --git a/annotations_filtered/sehGLkGe-iI_filtered.json b/annotations_filtered/sehGLkGe-iI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d53d52ae7669f72d68d2d4bbe48d703de566aa0d --- /dev/null +++ b/annotations_filtered/sehGLkGe-iI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.14], [6.0, 8.34], [14.0, 16.12], [25.0, 30.69], [31.0, 37.4], [38.0, 95.54], [96.0, 99.2], [102.0, 107.35], [109.0, 111.99], [116.0, 124.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.56, 100.0, 100.0, 100.0, 0.0, 100.0, 100.0, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.14, 2.34, 2.12, 5.69, 6.4, 57.54, 3.2, 5.35, 2.99, 8.63]} \ No newline at end of file diff --git a/annotations_filtered/senNDipdmPo_filtered.json b/annotations_filtered/senNDipdmPo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..725f827569349d9aee82b79f9e6140eadb46ac67 --- /dev/null +++ b/annotations_filtered/senNDipdmPo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 18.93], [20.0, 41.34], [43.0, 71.29], [72.0, 72.15], [74.0, 75.03], [86.0, 87.67], [91.0, 92.89], [103.0, 120.7], [127.0, 126.89]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 98.59, 99.36, 0.0, 0.0, 0.0, 0.0, 96.04, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [15.93, 21.34, 28.29, 0.15, 1.03, 1.67, 1.89, 17.7, -0.11]} \ No newline at end of file diff --git a/annotations_filtered/seqBLjTfnl4_filtered.json b/annotations_filtered/seqBLjTfnl4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..176bcbea4eb9c3f203e280c3aa0dff08e38b4180 --- /dev/null +++ b/annotations_filtered/seqBLjTfnl4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.6], [5.0, 5.22], [8.0, 8.21], [8.0, 15.4], [16.0, 35.67], [41.0, 46.67], [49.0, 48.78], [49.0, 49.67], [50.0, 51.43], [52.0, 69.26], [73.0, 87.44], [90.0, 92.52], [97.0, 97.34], [98.0, 101.8], [104.0, 107.64], [111.0, 111.64], [113.0, 114.42], [115.0, 115.7], [117.0, 127.28], [129.0, 130.06], [138.0, 138.05], [145.0, 174.9]], "keep_status": [false, false, false, false, true, true, false, false, false, true, true, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.09, 31.36, 33.49, 0.0, 0.0, 0.0, 31.54, 30.72, 49.97, 0.0, 46.19, 33.24, 0.0, 0.0, 0.0, 43.38, 0.0, 0.0, 30.71], "audiomae_on_audioset": [null, null, null, [["music", 39.56], ["speech", 35.8], ["fly, housefly", 4.79]], [["music", 33.2], ["speech", 28.36], ["fly, housefly", 8.36]], [["grunt", 50.29], ["music", 7.64], ["livestock, farm animals, working animals", 5.33]], null, null, null, [["vehicle", 29.49], ["buzz", 22.8], ["music", 6.03]], [["vehicle", 25.51], ["music", 9.48], ["buzz", 8.17]], [["music", 74.74], ["didgeridoo", 7.84], ["theremin", 5.31]], null, [["music", 64.29], ["theremin", 10.37], ["echo", 3.68]], [["music", 38.49], ["musical instrument", 8.83], ["mains hum", 8.68]], null, null, null, [["music", 79.67], ["speech", 4.52], ["scary music", 2.21]], null, null, [["music", 72.72], ["musical instrument", 5.05], ["synthesizer", 4.17]]], "duration": [0.6, 0.22, 0.21, 7.4, 19.67, 5.67, -0.22, 0.67, 1.43, 17.26, 14.44, 2.52, 0.34, 3.8, 3.64, 0.64, 1.42, 0.7, 10.28, 1.06, 0.05, 29.9]} \ No newline at end of file diff --git a/annotations_filtered/sf2RRCNlz38_filtered.json b/annotations_filtered/sf2RRCNlz38_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e71b3545607dad32baf103c5ddb0486337073ec --- /dev/null +++ b/annotations_filtered/sf2RRCNlz38_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[80.0, 90.73], [93.0, 103.33], [105.0, 108.77], [110.0, 145.62], [149.0, 157.57], [160.0, 164.32], [165.0, 165.05], [166.0, 170.09]], "keep_status": [false, true, false, false, true, true, false, true], "silence_prob": [40.52, 39.05, 99.98, 0.0, 34.36, 34.01, 0.0, 31.19], "audiomae_on_audioset": [[["whale vocalization", 48.82], ["livestock, farm animals, working animals", 13.53], ["cattle, bovinae", 9.41]], [["animal", 16.49], ["whale vocalization", 10.54], ["speech", 9.93]], null, null, [["buzz", 26.06], ["speech", 25.58], ["fart", 14.75]], [["throbbing", 15.99], ["speech", 8.19], ["sound effect", 6.3]], null, [["music", 15.15], ["fart", 8.1], ["speech", 7.85]]], "duration": [10.73, 10.33, 3.77, 35.62, 8.57, 4.32, 0.05, 4.09]} \ No newline at end of file diff --git a/annotations_filtered/sf2eXsM6Kik_filtered.json b/annotations_filtered/sf2eXsM6Kik_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f25b3c6f8e9dbde061b174d4a93053c3c30ba42 --- /dev/null +++ b/annotations_filtered/sf2eXsM6Kik_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.0], [3.0, 12.46], [14.0, 19.26], [21.0, 21.46], [22.0, 56.44], [57.0, 61.42], [65.0, 66.01], [67.0, 67.49], [74.0, 74.48], [77.0, 84.23]], "keep_status": [false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 44.9, 67.13, 0.0, 0.0, 32.1, 0.0, 0.0, 0.0, 54.97], "audiomae_on_audioset": [null, [["music", 77.59], ["whale vocalization", 4.93], ["noise", 2.2]], null, null, null, [["music", 37.22], ["explosion", 12.38], ["hum", 11.69]], null, null, null, null], "duration": [0.0, 9.46, 5.26, 0.46, 34.44, 4.42, 1.01, 0.49, 0.48, 7.23]} \ No newline at end of file diff --git a/annotations_filtered/sf8rDpu1vCk_filtered.json b/annotations_filtered/sf8rDpu1vCk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97be9ebcc96dac3bb687bf8c9e86feb24854b32f --- /dev/null +++ b/annotations_filtered/sf8rDpu1vCk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.4], [7.0, 8.01], [11.0, 13.04], [17.0, 17.95], [23.0, 24.0], [26.0, 26.67], [29.0, 40.47], [42.0, 44.61], [46.0, 50.28], [63.0, 64.42], [70.0, 70.41], [70.0, 70.46], [73.0, 74.8], [79.0, 82.48], [87.0, 87.89], [90.0, 93.77], [96.0, 98.66], [105.0, 105.16], [109.0, 110.08], [120.0, 119.96], [125.0, 125.31]], "keep_status": [false, false, false, false, false, false, true, true, true, false, false, false, false, true, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 30.99, 0.0, 0.0, 0.0, 33.22, 29.53, 39.44, 0.0, 0.0, 0.0, 0.0, 34.01, 0.0, 38.15, 32.71, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 60.82], ["vehicle", 13.66], ["mains hum", 3.11]], null, null, null, [["vehicle", 16.96], ["siren", 10.06], ["buzzer", 9.99]], [["vehicle", 17.23], ["buzz", 11.14], ["hum", 8.25]], [["hum", 36.12], ["music", 16.64], ["mains hum", 15.39]], null, null, null, null, [["music", 24.64], ["hum", 14.75], ["throbbing", 6.02]], null, [["hum", 35.72], ["mains hum", 20.19], ["music", 5.78]], [["music", 45.76], ["noise", 13.02], ["synthesizer", 4.13]], null, null, null, null], "duration": [0.4, 1.01, 2.04, 0.95, 1.0, 0.67, 11.47, 2.61, 4.28, 1.42, 0.41, 0.46, 1.8, 3.48, 0.89, 3.77, 2.66, 0.16, 1.08, -0.04, 0.31]} \ No newline at end of file diff --git a/annotations_filtered/sf9038zMVgo_filtered.json b/annotations_filtered/sf9038zMVgo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..249413c89029da5183bb02936ce83d5d48203f57 --- /dev/null +++ b/annotations_filtered/sf9038zMVgo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.83], [22.0, 22.32], [38.0, 39.19], [58.0, 60.03], [63.0, 63.58], [64.0, 64.61], [67.0, 69.11], [81.0, 80.76], [89.0, 89.78], [103.0, 103.99], [106.0, 106.25], [107.0, 108.53], [113.0, 113.04], [115.0, 115.45], [118.0, 119.23], [121.0, 140.61], [141.0, 141.93], [145.0, 144.93], [147.0, 147.11], [152.0, 152.17], [156.0, 157.05], [181.0, 182.11], [188.0, 188.16], [189.0, 190.09], [192.0, 192.67], [193.0, 194.98], [197.0, 197.24], [199.0, 199.18], [202.0, 202.53], [204.0, 204.09], [206.0, 208.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 84.07, 0.0, 0.0, 51.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.83, 0.32, 1.19, 2.03, 0.58, 0.61, 2.11, -0.24, 0.78, 0.99, 0.25, 1.53, 0.04, 0.45, 1.23, 19.61, 0.93, -0.07, 0.11, 0.17, 1.05, 1.11, 0.16, 1.09, 0.67, 1.98, 0.24, 0.18, 0.53, 0.09, 2.82]} \ No newline at end of file diff --git a/annotations_filtered/sfCQQLSwz3s_filtered.json b/annotations_filtered/sfCQQLSwz3s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c9df236b28d3dcd3ee0a159a37829afa2e990dd --- /dev/null +++ b/annotations_filtered/sfCQQLSwz3s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[74.0, 75.44], [81.0, 81.53], [87.0, 87.94], [89.0, 90.24], [93.0, 105.9], [108.0, 119.35]], "keep_status": [false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.29, 30.66], "audiomae_on_audioset": [null, null, null, null, [["buzz", 30.57], ["mains hum", 13.98], ["speech", 7.6]], [["music", 49.99], ["speech", 9.29], ["hum", 9.12]]], "duration": [1.44, 0.53, 0.94, 1.24, 12.9, 11.35]} \ No newline at end of file diff --git a/annotations_filtered/sfHaTenaRBI_filtered.json b/annotations_filtered/sfHaTenaRBI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..464dba3aadf0539940b9c25adff8ef0c861fdea5 --- /dev/null +++ b/annotations_filtered/sfHaTenaRBI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.68], [7.0, 9.0], [23.0, 23.5], [29.0, 29.88], [38.0, 38.01], [56.0, 60.51], [63.0, 63.98], [71.0, 73.14], [75.0, 74.93], [85.0, 86.63], [88.0, 88.87], [94.0, 97.16], [98.0, 99.13], [105.0, 105.06], [109.0, 110.24], [113.0, 113.8], [119.0, 119.87]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 54.3, 0.0, 0.0, 0.0, 40.16, 0.0, 60.98, 0.0, 0.0, 0.0, 47.01, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 26.77], ["mosquito", 11.73], ["laughter", 5.76]], null, null, null, null, null, [["speech", 41.3], ["music", 36.62], ["sidetone", 2.73]], null, null, null, null, null], "duration": [0.68, 2.0, 0.5, 0.88, 0.01, 4.51, 0.98, 2.14, -0.07, 1.63, 0.87, 3.16, 1.13, 0.06, 1.24, 0.8, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/sfWe6CUZUtc_filtered.json b/annotations_filtered/sfWe6CUZUtc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a7710c21d55719fd1f0ec49a3dd96d12551a22be --- /dev/null +++ b/annotations_filtered/sfWe6CUZUtc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.08], [7.0, 10.98], [15.0, 15.62], [23.0, 24.8], [33.0, 34.64], [36.0, 36.75], [37.0, 38.77], [39.0, 39.31], [52.0, 52.25], [57.0, 57.1], [58.0, 59.29], [60.0, 60.74], [63.0, 64.23], [65.0, 68.54], [72.0, 72.32], [72.0, 74.07], [76.0, 77.3], [80.0, 80.65], [88.0, 88.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.97, 68.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.72, 0.0, 97.22, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.08, 3.98, 0.62, 1.8, 1.64, 0.75, 1.77, 0.31, 0.25, 0.1, 1.29, 0.74, 1.23, 3.54, 0.32, 2.07, 1.3, 0.65, 0.21]} \ No newline at end of file diff --git a/annotations_filtered/sfgNK5f04iY_filtered.json b/annotations_filtered/sfgNK5f04iY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c46344de8081f39230bcbc16c75dc099c8b6ae6c --- /dev/null +++ b/annotations_filtered/sfgNK5f04iY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.56], [6.0, 19.52], [23.0, 35.95], [37.0, 54.36], [56.0, 70.17], [72.0, 83.35], [84.0, 100.09], [102.0, 105.56]], "keep_status": [false, false, false, false, true, false, false, true], "silence_prob": [0.0, 30.34, 30.02, 29.76, 30.09, 30.39, 30.18, 30.74], "audiomae_on_audioset": [null, [["speech", 51.24], ["music", 22.89], ["hum", 10.1]], [["music", 66.33], ["throbbing", 7.3], ["synthesizer", 6.02]], [["music", 63.19], ["throbbing", 18.66], ["hum", 7.17]], [["hum", 29.05], ["music", 22.34], ["throbbing", 16.39]], [["mains hum", 28.96], ["music", 22.96], ["hum", 21.3]], [["music", 67.06], ["speech", 7.0], ["electronic music", 3.61]], [["music", 48.44], ["speech", 6.3], ["throbbing", 4.06]]], "duration": [1.56, 13.52, 12.95, 17.36, 14.17, 11.35, 16.09, 3.56]} \ No newline at end of file diff --git a/annotations_filtered/sgB8cpEi_zU_filtered.json b/annotations_filtered/sgB8cpEi_zU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..727b95782a71ec983d7b94caeec594b256998487 --- /dev/null +++ b/annotations_filtered/sgB8cpEi_zU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 19.08], [21.0, 21.32], [22.0, 22.82], [24.0, 24.17], [25.0, 33.94], [34.0, 52.03], [56.0, 57.43], [58.0, 93.31], [96.0, 146.45], [148.0, 148.34], [149.0, 151.85], [153.0, 154.7], [155.0, 169.25], [170.0, 170.01], [171.0, 171.0], [172.0, 175.09], [176.0, 176.44]], "keep_status": [false, false, false, false, false, true, false, false, false, false, true, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.34, 31.96, 0.0, 0.0, 0.0, 0.0, 37.63, 0.0, 37.54, 0.0, 0.0, 37.82, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 64.11], ["radio", 4.94], ["vehicle", 3.95]], [["gurgling", 13.03], ["whale vocalization", 12.55], ["eruption", 11.67]], null, null, null, null, [["radio", 40.51], ["speech", 20.01], ["sidetone", 3.35]], null, [["frog", 23.53], ["whale vocalization", 16.45], ["gurgling", 13.48]], null, null, [["speech", 20.35], ["radio", 18.83], ["rain", 6.77]], null], "duration": [1.08, 0.32, 0.82, 0.17, 8.94, 18.03, 1.43, 35.31, 50.45, 0.34, 2.85, 1.7, 14.25, 0.01, 0.0, 3.09, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/sggwHnudtH0_filtered.json b/annotations_filtered/sggwHnudtH0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..89e9de2860b6a597d0eadf0376bdaae61036913a --- /dev/null +++ b/annotations_filtered/sggwHnudtH0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 23.77], [29.0, 29.76], [31.0, 32.39], [33.0, 34.97], [37.0, 57.77], [62.0, 66.58], [67.0, 67.44], [67.0, 67.49], [68.0, 67.53], [68.0, 68.45], [70.0, 79.57], [85.0, 105.09], [110.0, 109.88], [110.0, 110.03], [112.0, 131.48], [134.0, 140.1], [142.0, 142.47], [143.0, 144.07], [145.0, 146.06], [149.0, 150.38], [152.0, 152.37], [155.0, 156.51], [157.0, 156.76], [157.0, 162.73], [168.0, 173.65]], "keep_status": [true, false, false, false, true, true, false, false, false, false, true, true, false, false, true, true, false, false, false, false, false, false, false, true, false], "silence_prob": [29.66, 0.0, 0.0, 0.0, 36.02, 29.42, 0.0, 0.0, 0.0, 0.0, 29.34, 30.15, 0.0, 0.0, 31.62, 29.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.15, 42.28], "audiomae_on_audioset": [[["music", 41.3], ["speech", 8.33], ["livestock, farm animals, working animals", 5.1]], null, null, null, [["throbbing", 25.45], ["hum", 21.48], ["music", 13.48]], [["music", 21.92], ["livestock, farm animals, working animals", 17.11], ["cattle, bovinae", 14.23]], null, null, null, null, [["music", 41.63], ["groan", 11.63], ["fart", 6.91]], [["music", 34.71], ["musical instrument", 8.32], ["effects unit", 6.27]], null, null, [["music", 52.98], ["hum", 8.84], ["gong", 5.15]], [["livestock, farm animals, working animals", 22.27], ["music", 13.41], ["groan", 9.89]], null, null, null, null, null, null, null, [["speech", 35.99], ["music", 18.3], ["hum", 9.71]], [["grunt", 39.09], ["hum", 23.13], ["burping, eructation", 9.63]]], "duration": [17.77, 0.76, 1.39, 1.97, 20.77, 4.58, 0.44, 0.49, -0.47, 0.45, 9.57, 20.09, -0.12, 0.03, 19.48, 6.1, 0.47, 1.07, 1.06, 1.38, 0.37, 1.51, -0.24, 5.73, 5.65]} \ No newline at end of file diff --git a/annotations_filtered/sh0IBg7GBeY_filtered.json b/annotations_filtered/sh0IBg7GBeY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c4f02e3d1266856d8b735c4bb2ddf2446a8e25a --- /dev/null +++ b/annotations_filtered/sh0IBg7GBeY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.51], [5.0, 9.07], [17.0, 16.92], [40.0, 51.7], [53.0, 54.46], [56.0, 63.44], [64.0, 63.95]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 61.97, 0.0, 87.37, 0.0, 50.56, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [0.51, 4.07, -0.08, 11.7, 1.46, 7.44, -0.05]} \ No newline at end of file diff --git a/annotations_filtered/sh7lb9j3k5s_filtered.json b/annotations_filtered/sh7lb9j3k5s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..617a2342232ec96a1b77d4a544bd20494ec3f230 --- /dev/null +++ b/annotations_filtered/sh7lb9j3k5s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.43], [7.0, 7.21], [8.0, 8.53], [13.0, 13.22], [19.0, 19.57], [23.0, 24.12], [29.0, 29.76], [31.0, 31.78], [32.0, 33.42], [38.0, 38.72], [40.0, 40.71], [42.0, 43.6], [44.0, 44.69], [47.0, 50.26], [52.0, 53.74], [55.0, 55.56], [58.0, 58.48], [59.0, 60.4], [61.0, 62.97], [67.0, 68.03], [77.0, 77.65], [88.0, 87.94], [88.0, 88.03], [88.0, 90.36], [91.0, 91.64], [98.0, 98.49], [108.0, 108.6], [110.0, 109.92], [111.0, 111.3], [114.0, 114.47], [117.0, 118.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 58.49], ["sidetone", 25.24], ["telephone", 2.87]], null, null, null, null, null, null, null], "duration": [0.43, 0.21, 0.53, 0.22, 0.57, 1.12, 0.76, 0.78, 1.42, 0.72, 0.71, 1.6, 0.69, 3.26, 1.74, 0.56, 0.48, 1.4, 1.97, 1.03, 0.65, -0.06, 0.03, 2.36, 0.64, 0.49, 0.6, -0.08, 0.3, 0.47, 1.02]} \ No newline at end of file diff --git a/annotations_filtered/shE7b_6NNpU_filtered.json b/annotations_filtered/shE7b_6NNpU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..193c6ab74811c964d07a383554ffff9a09305792 --- /dev/null +++ b/annotations_filtered/shE7b_6NNpU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.18], [5.0, 5.97], [8.0, 8.43], [10.0, 10.67], [13.0, 13.05], [13.0, 14.57], [17.0, 16.93], [18.0, 20.33], [21.0, 25.51], [28.0, 36.12], [37.0, 37.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 63.96, 31.84, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 36.4], ["gong", 23.64], ["timpani", 12.71]], null], "duration": [0.18, 0.97, 0.43, 0.67, 0.05, 1.57, -0.07, 2.33, 4.51, 8.12, 0.49]} \ No newline at end of file diff --git a/annotations_filtered/shO2tSVK0IU_filtered.json b/annotations_filtered/shO2tSVK0IU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e412793323f8ff9460597cb845231804cc70710d --- /dev/null +++ b/annotations_filtered/shO2tSVK0IU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 16.36], [17.0, 51.73], [52.0, 53.15], [54.0, 54.46], [58.0, 65.28], [68.0, 70.61], [76.0, 77.5], [80.0, 90.49], [91.0, 107.37], [108.0, 109.46], [110.0, 122.94], [123.0, 131.3]], "keep_status": [false, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [32.73, 0.0, 0.0, 0.0, 31.89, 51.88, 0.0, 34.31, 32.86, 0.0, 32.0, 33.21], "audiomae_on_audioset": [[["music", 73.65], ["sampler", 3.32], ["reggae", 2.69]], null, null, null, [["music", 50.11], ["didgeridoo", 10.04], ["musical instrument", 6.49]], null, null, [["music", 72.85], ["didgeridoo", 7.71], ["musical instrument", 4.69]], [["music", 70.1], ["musical instrument", 3.82], ["sampler", 3.46]], null, [["music", 41.84], ["speech", 11.17], ["synthesizer", 8.44]], [["music", 49.4], ["speech", 16.68], ["synthesizer", 8.09]]], "duration": [13.36, 34.73, 1.15, 0.46, 7.28, 2.61, 1.5, 10.49, 16.37, 1.46, 12.94, 8.3]} \ No newline at end of file diff --git a/annotations_filtered/shal5AF2Gxc_filtered.json b/annotations_filtered/shal5AF2Gxc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b501188e09501c2571d783d784cb1be05e37d74 --- /dev/null +++ b/annotations_filtered/shal5AF2Gxc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.16], [6.0, 7.38], [9.0, 9.75], [11.0, 11.79], [13.0, 14.13], [17.0, 17.42], [18.0, 18.66], [24.0, 24.73], [25.0, 30.5], [34.0, 35.11], [36.0, 40.07], [42.0, 43.19], [43.0, 44.51], [48.0, 60.22], [61.0, 64.89], [86.0, 86.09], [87.0, 110.02], [111.0, 118.4], [119.0, 120.26], [121.0, 122.25], [126.0, 127.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.91, 0.0, 41.52, 0.0, 0.0, 35.16, 43.48, 0.0, 36.52, 37.46, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 52.65], ["beatboxing", 21.12], ["music", 5.69]], null, null, [["speech", 84.75], ["beatboxing", 4.39], ["fart", 4.18]], [["speech", 11.08], ["music", 10.63], ["sheep", 5.47]], null, [["music", 34.64], ["quack", 13.83], ["animal", 6.73]], [["music", 43.04], ["speech", 7.6], ["didgeridoo", 3.36]], null, null, null], "duration": [0.16, 1.38, 0.75, 0.79, 1.13, 0.42, 0.66, 0.73, 5.5, 1.11, 4.07, 1.19, 1.51, 12.22, 3.89, 0.09, 23.02, 7.4, 1.26, 1.25, 1.18]} \ No newline at end of file diff --git a/annotations_filtered/sheRsZ2HOYI_filtered.json b/annotations_filtered/sheRsZ2HOYI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f4074580cd11e8e41c08f41b59d08347579090f7 --- /dev/null +++ b/annotations_filtered/sheRsZ2HOYI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.42], [14.0, 16.14], [16.0, 16.73], [30.0, 31.65], [32.0, 32.7], [33.0, 34.72], [36.0, 37.71], [45.0, 51.97], [69.0, 71.73], [84.0, 84.0], [84.0, 86.46], [86.0, 86.49], [87.0, 86.53], [87.0, 86.56], [87.0, 86.63], [87.0, 86.66], [87.0, 86.7], [87.0, 86.73], [87.0, 86.76], [87.0, 86.83], [88.0, 92.94], [94.0, 98.22]], "keep_status": [false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 51.5, 0.0, 0.0, 0.0, 0.0, 0.0, 35.71, 46.47, 0.0, 40.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.95, 68.54], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["noise", 26.46], ["speech", 16.26], ["music", 13.61]], [["speech", 67.35], ["sidetone", 2.86], ["music", 2.65]], null, [["speech", 35.36], ["music", 20.73], ["sidetone", 7.82]], null, null, null, null, null, null, null, null, null, [["music", 34.06], ["speech", 19.6], ["fly, housefly", 11.45]], null], "duration": [0.42, 2.14, 0.73, 1.65, 0.7, 1.72, 1.71, 6.97, 2.73, 0.0, 2.46, 0.49, -0.47, -0.44, -0.37, -0.34, -0.3, -0.27, -0.24, -0.17, 4.94, 4.22]} \ No newline at end of file diff --git a/annotations_filtered/shehrh353Oo_filtered.json b/annotations_filtered/shehrh353Oo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..785de7c3db03a6c26f7441fae49a689fb4aa2e8c --- /dev/null +++ b/annotations_filtered/shehrh353Oo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.46], [33.0, 33.57], [46.0, 47.06], [50.0, 50.04], [54.0, 56.78], [69.0, 69.08], [73.0, 72.99], [74.0, 73.9], [91.0, 91.5]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 98.1, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.46, 0.57, 1.06, 0.04, 2.78, 0.08, -0.01, -0.1, 0.5]} \ No newline at end of file diff --git a/annotations_filtered/shj7YP98Yxs_filtered.json b/annotations_filtered/shj7YP98Yxs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..24aeff35f515f2400a80b45bdd2fa71650fce32d --- /dev/null +++ b/annotations_filtered/shj7YP98Yxs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.06], [12.0, 11.99], [14.0, 14.64], [16.0, 20.93], [23.0, 29.96], [32.0, 40.49], [42.0, 48.19], [50.0, 61.15], [61.0, 61.37], [61.0, 61.43], [64.0, 70.66], [80.0, 92.1], [93.0, 103.79], [105.0, 105.49], [111.0, 112.02], [113.0, 117.27], [119.0, 125.64]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 95.09, 70.3, 55.11, 31.2, 33.43, 0.0, 0.0, 33.92, 32.67, 36.5, 0.0, 0.0, 43.13, 37.62], "audiomae_on_audioset": [null, null, null, null, null, null, [["livestock, farm animals, working animals", 40.02], ["moo", 14.96], ["cattle, bovinae", 14.22]], [["speech", 50.61], ["music", 13.31], ["sheep", 10.21]], null, null, [["music", 69.4], ["scary music", 7.12], ["soundtrack music", 3.42]], [["speech", 41.8], ["music", 21.61], ["hum", 10.0]], [["music", 56.77], ["hum", 11.28], ["speech", 5.83]], null, null, [["music", 58.84], ["scary music", 8.64], ["hum", 2.37]], [["music", 51.23], ["animal", 11.01], ["scary music", 7.93]]], "duration": [1.06, -0.01, 0.64, 4.93, 6.96, 8.49, 6.19, 11.15, 0.37, 0.43, 6.66, 12.1, 10.79, 0.49, 1.02, 4.27, 6.64]} \ No newline at end of file diff --git a/annotations_filtered/shogibE67W8_filtered.json b/annotations_filtered/shogibE67W8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4cf94f1bd0733767e380202b2b72eef448c99f7f --- /dev/null +++ b/annotations_filtered/shogibE67W8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.74], [24.0, 23.89], [27.0, 26.96], [43.0, 44.78], [45.0, 46.45], [47.0, 48.17], [49.0, 50.82], [52.0, 54.68], [61.0, 62.5], [68.0, 68.62], [72.0, 71.63], [80.0, 81.09], [82.0, 87.56], [89.0, 112.19], [113.0, 127.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.89, 0.0, 0.0, 0.0, 0.0, 99.65, 34.07, 33.18], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 37.79], ["vibraphone", 12.1], ["musical instrument", 10.3]], [["gong", 39.18], ["music", 27.57], ["singing bowl", 8.43]]], "duration": [0.74, -0.11, -0.04, 1.78, 1.45, 1.17, 1.82, 2.68, 1.5, 0.62, -0.37, 1.09, 5.56, 23.19, 14.67]} \ No newline at end of file diff --git a/annotations_filtered/siHzbnn1Bxw_filtered.json b/annotations_filtered/siHzbnn1Bxw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..440546ad52e6af80892d3af6a58de6d5dddc8d06 --- /dev/null +++ b/annotations_filtered/siHzbnn1Bxw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.9], [12.0, 22.76], [23.0, 47.24], [48.0, 75.22], [78.0, 109.95]], "keep_status": [false, true, true, false, false], "silence_prob": [0.0, 41.91, 36.8, 30.61, 0.0], "audiomae_on_audioset": [null, [["music", 24.7], ["marimba, xylophone", 7.98], ["glockenspiel", 6.84]], [["music", 46.7], ["musical instrument", 5.49], ["marimba, xylophone", 5.31]], [["theremin", 65.65], ["music", 26.35], ["musical instrument", 1.55]], null], "duration": [0.9, 10.76, 24.24, 27.22, 31.95]} \ No newline at end of file diff --git a/annotations_filtered/siTZSTZwJ0E_filtered.json b/annotations_filtered/siTZSTZwJ0E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..27fae66f67ed0526a97bbf1d790604ea72e3566e --- /dev/null +++ b/annotations_filtered/siTZSTZwJ0E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.76], [20.0, 21.25], [27.0, 28.43], [36.0, 41.37], [43.0, 44.79], [48.0, 51.12], [53.0, 53.33], [59.0, 59.83], [62.0, 63.41], [67.0, 66.97], [70.0, 72.03], [73.0, 77.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.76, 1.25, 1.43, 5.37, 1.79, 3.12, 0.33, 0.83, 1.41, -0.03, 2.03, 4.77]} \ No newline at end of file diff --git a/annotations_filtered/sidn04cetvU_filtered.json b/annotations_filtered/sidn04cetvU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..802ff4359bbb49455cf34e28e27612bcfba7cb4b --- /dev/null +++ b/annotations_filtered/sidn04cetvU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[50.0, 63.63], [67.0, 79.54], [81.0, 83.24], [87.0, 89.38], [90.0, 107.03], [108.0, 108.16]], "keep_status": [true, false, false, true, true, false], "silence_prob": [30.72, 31.22, 33.03, 30.16, 30.54, 0.0], "audiomae_on_audioset": [[["music", 32.59], ["cacophony", 7.51], ["hum", 7.12]], [["music", 42.26], ["mains hum", 17.54], ["scary music", 13.54]], [["mains hum", 33.01], ["hum", 28.54], ["music", 14.94]], [["music", 36.33], ["whale vocalization", 12.6], ["hum", 12.18]], [["music", 51.08], ["singing bowl", 12.17], ["hum", 5.18]], null], "duration": [13.63, 12.54, 2.24, 2.38, 17.03, 0.16]} \ No newline at end of file diff --git a/annotations_filtered/sj93sTcEJYA_filtered.json b/annotations_filtered/sj93sTcEJYA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..407889ad2ce8cf99c5aa034ef23b6566b1c591ea --- /dev/null +++ b/annotations_filtered/sj93sTcEJYA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 23.23], [24.0, 25.17], [31.0, 31.24], [37.0, 38.47], [45.0, 45.2], [48.0, 48.81], [53.0, 52.95], [55.0, 56.81], [59.0, 60.88], [71.0, 71.41], [73.0, 73.06], [75.0, 74.93], [86.0, 88.11], [91.0, 91.62], [93.0, 93.48], [100.0, 102.02], [106.0, 106.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [57.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.55, 0.0, 0.0, 69.74, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.23, 1.17, 0.24, 1.47, 0.2, 0.81, -0.05, 1.81, 1.88, 0.41, 0.06, -0.07, 2.11, 0.62, 0.48, 2.02, 0.89]} \ No newline at end of file diff --git a/annotations_filtered/sjEDF282UvY_filtered.json b/annotations_filtered/sjEDF282UvY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e21864d84610b8ad41c11a7ed9c5672e4530d118 --- /dev/null +++ b/annotations_filtered/sjEDF282UvY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 46.95], [47.0, 49.54], [53.0, 54.75], [55.0, 58.33], [61.0, 62.5], [69.0, 71.59], [75.0, 90.48], [92.0, 100.11], [101.0, 105.58], [106.0, 112.29], [113.0, 115.11], [118.0, 123.16], [124.0, 133.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 54.3, 0.0, 67.63, 0.0, 93.45, 90.08, 87.19, 100.0, 99.98, 97.73, 99.94, 89.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [44.95, 2.54, 1.75, 3.33, 1.5, 2.59, 15.48, 8.11, 4.58, 6.29, 2.11, 5.16, 9.95]} \ No newline at end of file diff --git a/annotations_filtered/sjPnuqcrL70_filtered.json b/annotations_filtered/sjPnuqcrL70_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60212de2eb38beb80b9824d3c44588018b1ec333 --- /dev/null +++ b/annotations_filtered/sjPnuqcrL70_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 35.92], [39.0, 39.38], [41.0, 41.28], [50.0, 57.33], [63.0, 69.33], [70.0, 86.71], [94.0, 98.69], [100.0, 100.5], [102.0, 103.64], [109.0, 110.54], [112.0, 115.18], [117.0, 117.88]], "keep_status": [false, false, false, true, false, false, true, false, false, false, false, false], "silence_prob": [74.13, 0.0, 0.0, 42.04, 68.15, 75.07, 42.13, 0.0, 0.0, 0.0, 55.39, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 17.95], ["sidetone", 16.59], ["sine wave", 11.87]], null, null, [["music", 50.27], ["theremin", 9.44], ["ambient music", 6.28]], null, null, null, null, null], "duration": [4.92, 0.38, 0.28, 7.33, 6.33, 16.71, 4.69, 0.5, 1.64, 1.54, 3.18, 0.88]} \ No newline at end of file diff --git a/annotations_filtered/sjWdByLxTuI_filtered.json b/annotations_filtered/sjWdByLxTuI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..11095b21b0968b422d2d03b74fa7804e5c3b0205 --- /dev/null +++ b/annotations_filtered/sjWdByLxTuI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.37], [10.0, 11.3], [16.0, 23.52], [26.0, 40.47], [46.0, 46.72], [49.0, 50.13], [54.0, 55.12], [55.0, 85.48], [86.0, 86.44], [86.0, 86.81], [87.0, 86.93], [87.0, 87.78], [89.0, 89.4], [91.0, 92.45], [95.0, 95.44], [102.0, 105.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.99, 99.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.76], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.37, 1.3, 7.52, 14.47, 0.72, 1.13, 1.12, 30.48, 0.44, 0.81, -0.07, 0.78, 0.4, 1.45, 0.44, 3.85]} \ No newline at end of file diff --git a/annotations_filtered/sjmh7BViBtg_filtered.json b/annotations_filtered/sjmh7BViBtg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..66c25562920154520e49e15642770362b78e12f3 --- /dev/null +++ b/annotations_filtered/sjmh7BViBtg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 27.58], [30.0, 33.84], [35.0, 35.78], [39.0, 39.61], [41.0, 41.27], [43.0, 46.21]], "keep_status": [false, false, false, false, false, false], "silence_prob": [39.83, 50.26, 0.0, 0.0, 0.0, 46.4], "audiomae_on_audioset": [[["music", 34.85], ["sonar", 29.91], ["hum", 10.19]], null, null, null, null, [["music", 55.17], ["synthesizer", 12.65], ["ambient music", 5.72]]], "duration": [16.58, 3.84, 0.78, 0.61, 0.27, 3.21]} \ No newline at end of file diff --git a/annotations_filtered/sk0mjld_eow_filtered.json b/annotations_filtered/sk0mjld_eow_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b36258fec5919e70f963f8de9ddfa777c6b8eb5b --- /dev/null +++ b/annotations_filtered/sk0mjld_eow_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 31.97], [34.0, 58.4], [60.0, 65.69], [67.0, 68.69], [73.0, 72.98], [75.0, 76.91], [82.0, 83.76], [86.0, 91.67], [93.0, 93.48], [93.0, 100.95], [102.0, 102.29], [109.0, 110.76], [114.0, 115.13], [116.0, 117.93], [119.0, 119.28], [122.0, 122.15], [122.0, 128.43], [129.0, 129.34], [130.0, 130.71], [138.0, 138.72], [141.0, 145.64], [147.0, 148.14], [150.0, 151.36], [154.0, 153.89], [155.0, 156.88], [160.0, 160.2], [163.0, 163.32], [164.0, 174.68]], "keep_status": [true, true, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [29.54, 28.84, 31.34, 0.0, 0.0, 0.0, 0.0, 34.6, 0.0, 31.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.35, 0.0, 0.0, 0.0, 37.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.22], "audiomae_on_audioset": [[["music", 53.74], ["sampler", 6.02], ["didgeridoo", 5.88]], [["music", 18.79], ["vehicle", 18.54], ["speech", 13.01]], [["speech", 11.9], ["sheep", 11.29], ["breaking", 10.53]], null, null, null, null, [["cattle, bovinae", 35.62], ["moo", 28.65], ["livestock, farm animals, working animals", 13.12]], null, [["livestock, farm animals, working animals", 27.15], ["animal", 25.88], ["cattle, bovinae", 11.07]], null, null, null, null, null, null, [["cattle, bovinae", 35.29], ["livestock, farm animals, working animals", 30.95], ["moo", 30.48]], null, null, null, [["moo", 34.06], ["cattle, bovinae", 33.88], ["livestock, farm animals, working animals", 27.54]], null, null, null, null, null, null, [["music", 34.21], ["gunshot, gunfire", 14.91], ["speech", 13.36]]], "duration": [24.97, 24.4, 5.69, 1.69, -0.02, 1.91, 1.76, 5.67, 0.48, 7.95, 0.29, 1.76, 1.13, 1.93, 0.28, 0.15, 6.43, 0.34, 0.71, 0.72, 4.64, 1.14, 1.36, -0.11, 1.88, 0.2, 0.32, 10.68]} \ No newline at end of file diff --git a/annotations_filtered/sk3soFv1wHM_filtered.json b/annotations_filtered/sk3soFv1wHM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..181cafac95170f7e170c9bcb83491d90f735bca2 --- /dev/null +++ b/annotations_filtered/sk3soFv1wHM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.31], [12.0, 12.45], [13.0, 18.28], [20.0, 20.11], [26.0, 26.45], [30.0, 32.53], [34.0, 35.95], [40.0, 42.2], [43.0, 44.93], [53.0, 54.01], [58.0, 59.36], [62.0, 63.76], [65.0, 66.33], [69.0, 70.48], [71.0, 73.4], [75.0, 75.57], [77.0, 85.11], [86.0, 87.89], [89.0, 99.99], [102.0, 107.25], [108.0, 108.94], [109.0, 109.44]], "keep_status": [false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [34.37, 0.0, 43.85, 0.0, 0.0, 34.91, 0.0, 32.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.39, 0.0, 35.59, 0.0, 31.83, 33.97, 0.0, 0.0], "audiomae_on_audioset": [[["music", 58.61], ["musical instrument", 8.01], ["guitar", 6.27]], null, [["music", 63.35], ["speech", 7.87], ["musical instrument", 5.78]], null, null, [["mains hum", 12.18], ["hum", 10.82], ["whale vocalization", 9.61]], null, [["music", 26.49], ["hum", 25.25], ["noise", 11.39]], null, null, null, null, null, null, [["music", 64.42], ["musical instrument", 4.04], ["hum", 3.78]], null, [["theremin", 40.83], ["music", 32.53], ["musical instrument", 4.3]], null, [["theremin", 56.26], ["music", 34.22], ["musical instrument", 1.36]], [["music", 48.18], ["ambient music", 14.42], ["didgeridoo", 8.99]], null, null], "duration": [3.31, 0.45, 5.28, 0.11, 0.45, 2.53, 1.95, 2.2, 1.93, 1.01, 1.36, 1.76, 1.33, 1.48, 2.4, 0.57, 8.11, 1.89, 10.99, 5.25, 0.94, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/skMchQx_U_k_filtered.json b/annotations_filtered/skMchQx_U_k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b18f8823ed3a094b5ccee94967e07f975c27c549 --- /dev/null +++ b/annotations_filtered/skMchQx_U_k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.69], [12.0, 14.59], [17.0, 23.45], [24.0, 30.94], [33.0, 35.01], [36.0, 38.21], [40.0, 81.58], [92.0, 93.31], [96.0, 97.83], [99.0, 102.02]], "keep_status": [false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 60.51, 55.53, 39.54, 68.67, 59.96, 0.0, 0.0, 0.0, 32.93], "audiomae_on_audioset": [null, null, null, [["speech", 36.43], ["sidetone", 27.6], ["hum", 16.4]], null, null, null, null, null, [["mains hum", 19.33], ["hum", 18.41], ["pulse", 16.16]]], "duration": [1.69, 2.59, 6.45, 6.94, 2.01, 2.21, 41.58, 1.31, 1.83, 3.02]} \ No newline at end of file diff --git a/annotations_filtered/skrdyoabmgA_filtered.json b/annotations_filtered/skrdyoabmgA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a0c099680df4d8cb77c3e1c32615806725e2bbe1 --- /dev/null +++ b/annotations_filtered/skrdyoabmgA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.51], [10.0, 10.15], [15.0, 16.58], [19.0, 25.93], [27.0, 28.63], [30.0, 30.65], [33.0, 33.1], [36.0, 36.05], [40.0, 40.8], [46.0, 47.28], [50.0, 51.65], [56.0, 57.11], [58.0, 59.24], [60.0, 62.07], [63.0, 65.5], [69.0, 70.33], [71.0, 71.17], [73.0, 73.35], [82.0, 85.28], [87.0, 87.17], [89.0, 89.24], [93.0, 93.34], [95.0, 96.21], [98.0, 99.45], [107.0, 109.36], [111.0, 111.13], [124.0, 124.44], [128.0, 129.59], [132.0, 133.34], [136.0, 141.27], [143.0, 142.99], [144.0, 145.32], [149.0, 150.18], [156.0, 156.76], [163.0, 165.45], [168.0, 168.81], [173.0, 172.74], [176.0, 176.17], [177.0, 178.61], [181.0, 181.72], [186.0, 193.77], [197.0, 199.25], [200.0, 202.44], [205.0, 205.66], [213.0, 214.32], [216.0, 216.8], [218.0, 218.93], [222.0, 223.82], [227.0, 227.38], [230.0, 230.61], [235.0, 235.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 72.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.74, 71.43, 0.0, 0.0, 0.0, 33.48, 0.0, 0.0, 0.0, 0.0, 0.0, 32.75, 0.0, 0.0, 0.0, 0.0, 31.61, 0.0, 0.0, 0.0, 0.0, 29.63, 0.0, 0.0, 0.0, 0.0, 0.0, 29.45, 60.51, 48.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 34.85], ["cattle, bovinae", 8.28], ["speech", 5.97]], null, null, null, null, [["music", 31.0], ["throbbing", 14.41], ["hum", 6.53]], null, null, null, null, null, [["music", 25.1], ["synthesizer", 12.87], ["effects unit", 5.84]], null, null, null, null, [["hum", 31.24], ["throbbing", 28.46], ["music", 10.7]], null, null, null, null, [["hum", 20.52], ["throbbing", 12.34], ["mains hum", 7.37]], null, null, null, null, null, [["buzz", 11.58], ["vehicle", 11.32], ["motorcycle", 10.45]], null, [["music", 38.96], ["hum", 11.32], ["ambient music", 5.13]], null, null, null, null, null, null, null, null], "duration": [0.51, 0.15, 1.58, 6.93, 1.63, 0.65, 0.1, 0.05, 0.8, 1.28, 1.65, 1.11, 1.24, 2.07, 2.5, 1.33, 0.17, 0.35, 3.28, 0.17, 0.24, 0.34, 1.21, 1.45, 2.36, 0.13, 0.44, 1.59, 1.34, 5.27, -0.01, 1.32, 1.18, 0.76, 2.45, 0.81, -0.26, 0.17, 1.61, 0.72, 7.77, 2.25, 2.44, 0.66, 1.32, 0.8, 0.93, 1.82, 0.38, 0.61, 0.92]} \ No newline at end of file diff --git a/annotations_filtered/skuMakhGnn4_filtered.json b/annotations_filtered/skuMakhGnn4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c9e1c7b3a11b3a35017ab795a8153a06b23e8c7b --- /dev/null +++ b/annotations_filtered/skuMakhGnn4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 64.44], [65.0, 104.03]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [32.44, 39.03]} \ No newline at end of file diff --git a/annotations_filtered/sl1Jjq82XUA_filtered.json b/annotations_filtered/sl1Jjq82XUA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ffa8769821df9027751f14fc064b6d756b6fbf9f --- /dev/null +++ b/annotations_filtered/sl1Jjq82XUA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 58.41], [60.0, 94.91], [96.0, 109.75], [115.0, 123.47]], "keep_status": [false, false, false, true], "silence_prob": [36.47, 0.0, 34.08, 40.22], "audiomae_on_audioset": [[["music", 61.88], ["hum", 13.96], ["mains hum", 9.0]], null, [["music", 49.28], ["speech", 27.3], ["groan", 4.13]], [["livestock, farm animals, working animals", 33.59], ["cattle, bovinae", 15.46], ["moo", 8.03]]], "duration": [23.41, 34.91, 13.75, 8.47]} \ No newline at end of file diff --git a/annotations_filtered/sloo9PMVoRE_filtered.json b/annotations_filtered/sloo9PMVoRE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..40e3ac692990abf8f17f616bc3a692bdb41dc775 --- /dev/null +++ b/annotations_filtered/sloo9PMVoRE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.48], [11.0, 11.92], [13.0, 19.13], [21.0, 21.76], [28.0, 29.1], [30.0, 30.06], [40.0, 43.11], [44.0, 44.46], [48.0, 48.52], [52.0, 57.5], [58.0, 58.45], [64.0, 66.33], [68.0, 70.56], [71.0, 71.64], [75.0, 75.34], [81.0, 81.26], [88.0, 88.35], [89.0, 89.88], [92.0, 97.33], [99.0, 106.22], [108.0, 109.11], [110.0, 117.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 77.7, 0.0, 0.0, 84.25, 0.0, 97.92, 99.05, 0.0, 0.0, 0.0, 0.0, 0.0, 87.92, 64.29, 0.0, 43.9], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 37.35], ["foghorn", 17.76], ["trombone", 8.78]]], "duration": [0.48, 0.92, 6.13, 0.76, 1.1, 0.06, 3.11, 0.46, 0.52, 5.5, 0.45, 2.33, 2.56, 0.64, 0.34, 0.26, 0.35, 0.88, 5.33, 7.22, 1.11, 7.86]} \ No newline at end of file diff --git a/annotations_filtered/sm5Zgj8kjD8_filtered.json b/annotations_filtered/sm5Zgj8kjD8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f99ff733292a7048be9b751ff767663daa2e8b3 --- /dev/null +++ b/annotations_filtered/sm5Zgj8kjD8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.07], [9.0, 12.85], [13.0, 14.25], [15.0, 16.51], [18.0, 40.78], [41.0, 43.98], [45.0, 129.98], [133.0, 149.25], [151.0, 153.62], [156.0, 159.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.99, 100.0, 0.0, 0.0, 100.0, 100.0, 0.0, 99.26, 94.07, 95.37], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [4.07, 3.85, 1.25, 1.51, 22.78, 2.98, 84.98, 16.25, 2.62, 3.58]} \ No newline at end of file diff --git a/annotations_filtered/smHHU_ONdGU_filtered.json b/annotations_filtered/smHHU_ONdGU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d20a30a2743c15300f22a7a6d0248af59fa56af3 --- /dev/null +++ b/annotations_filtered/smHHU_ONdGU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.67], [1.0, 15.35], [15.0, 15.38], [16.0, 27.7], [29.0, 37.12]], "keep_status": [false, true, false, true, true], "silence_prob": [0.0, 32.61, 0.0, 34.14, 32.52], "audiomae_on_audioset": [null, [["music", 26.64], ["hum", 16.18], ["mains hum", 9.7]], null, [["music", 35.5], ["speech", 11.04], ["theremin", 8.63]], [["music", 31.05], ["hum", 13.77], ["speech", 13.48]]], "duration": [0.67, 14.35, 0.38, 11.7, 8.12]} \ No newline at end of file diff --git a/annotations_filtered/smVge5w077g_filtered.json b/annotations_filtered/smVge5w077g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97325cd8520fe45c93fc7be818a3717cea6510c8 --- /dev/null +++ b/annotations_filtered/smVge5w077g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.05], [4.0, 4.77], [14.0, 14.47], [26.0, 25.96], [29.0, 29.73], [35.0, 36.09], [37.0, 38.2], [41.0, 41.32], [42.0, 42.5], [48.0, 51.93], [61.0, 60.76], [69.0, 69.18], [71.0, 72.98], [74.0, 74.51], [80.0, 80.62], [81.0, 81.92], [87.0, 88.4], [93.0, 94.17], [102.0, 102.96], [107.0, 108.21], [118.0, 123.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 39.21], ["speech", 29.81], ["glockenspiel", 4.06]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.05, 0.77, 0.47, -0.04, 0.73, 1.09, 1.2, 0.32, 0.5, 3.93, -0.24, 0.18, 1.98, 0.51, 0.62, 0.92, 1.4, 1.17, 0.96, 1.21, 5.26]} \ No newline at end of file diff --git a/annotations_filtered/smtDfh1TXe8_filtered.json b/annotations_filtered/smtDfh1TXe8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/smtDfh1TXe8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/smwBZ-3HAPY_filtered.json b/annotations_filtered/smwBZ-3HAPY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f5c6e51f5885a2782e33e5b47661fbb5f3c8bff --- /dev/null +++ b/annotations_filtered/smwBZ-3HAPY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.41], [9.0, 12.88], [17.0, 22.3], [23.0, 25.02], [26.0, 27.24], [28.0, 27.94], [32.0, 34.62], [41.0, 41.89], [43.0, 43.36], [44.0, 48.86], [57.0, 58.55], [63.0, 63.0], [66.0, 66.58], [67.0, 67.96], [75.0, 75.15], [77.0, 77.55], [80.0, 79.96], [81.0, 82.19], [84.0, 85.09], [86.0, 87.91], [90.0, 93.06], [94.0, 96.47], [97.0, 99.1], [104.0, 105.0], [109.0, 109.88], [116.0, 122.55], [123.0, 123.87]], "keep_status": [false, true, true, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 39.61, 39.63, 40.45, 0.0, 0.0, 35.79, 0.0, 0.0, 33.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 97.54, 74.29, 0.0, 0.0, 78.04, 0.0], "audiomae_on_audioset": [null, [["fly, housefly", 28.92], ["insect", 18.06], ["mosquito", 12.66]], [["music", 47.24], ["musical instrument", 7.18], ["animal", 5.19]], [["music", 27.36], ["speech", 19.74], ["didgeridoo", 11.57]], null, null, [["moo", 36.42], ["cattle, bovinae", 34.49], ["livestock, farm animals, working animals", 9.1]], null, null, [["speech", 29.38], ["whimper", 18.08], ["music", 16.97]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.41, 3.88, 5.3, 2.02, 1.24, -0.06, 2.62, 0.89, 0.36, 4.86, 1.55, 0.0, 0.58, 0.96, 0.15, 0.55, -0.04, 1.19, 1.09, 1.91, 3.06, 2.47, 2.1, 1.0, 0.88, 6.55, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/smxGSlqjZNk_filtered.json b/annotations_filtered/smxGSlqjZNk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..228b88dff509dff8f2a54c7ae448bede2a113148 --- /dev/null +++ b/annotations_filtered/smxGSlqjZNk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.7], [25.0, 25.84], [31.0, 34.1], [41.0, 41.82], [43.0, 43.7], [84.0, 86.61], [87.0, 91.84], [100.0, 99.93], [105.0, 105.75], [115.0, 115.87]], "keep_status": [false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 32.72, 0.0, 0.0, 32.73, 55.31, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 29.08], ["boing", 19.1], ["speech", 8.95]], null, null, [["boing", 38.34], ["music", 36.87], ["speech", 1.95]], null, null, null, null], "duration": [-0.3, 0.84, 3.1, 0.82, 0.7, 2.61, 4.84, -0.07, 0.75, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/snKDmQJqQ1E_filtered.json b/annotations_filtered/snKDmQJqQ1E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5cf25687ae1a9e445787a18e65f8eb68eb458245 --- /dev/null +++ b/annotations_filtered/snKDmQJqQ1E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 21.09], [23.0, 36.31], [39.0, 42.82], [43.0, 47.06], [47.0, 50.5], [51.0, 53.79], [55.0, 57.13], [58.0, 74.97], [78.0, 77.87], [78.0, 93.29]], "keep_status": [true, true, true, true, false, true, true, true, false, false], "silence_prob": [41.1, 39.7, 44.99, 40.17, 34.17, 47.16, 43.48, 31.98, 0.0, 31.48], "audiomae_on_audioset": [[["stomach rumble", 41.18], ["boing", 11.93], ["burping, eructation", 7.36]], [["speech", 53.71], ["hands", 5.78], ["bouncing", 4.94]], [["boing", 28.23], ["music", 21.91], ["alarm", 17.97]], [["speech", 21.77], ["hum", 13.76], ["mains hum", 10.11]], [["speech", 75.12], ["boing", 5.56], ["radio", 3.26]], [["effects unit", 14.35], ["noise", 10.71], ["music", 8.61]], [["music", 20.1], ["buzzer", 8.5], ["chirp tone", 8.18]], [["music", 41.39], ["grunt", 11.17], ["effects unit", 5.68]], null, [["music", 66.05], ["musical instrument", 9.91], ["brass instrument", 6.47]]], "duration": [7.09, 13.31, 3.82, 4.06, 3.5, 2.79, 2.13, 16.97, -0.13, 15.29]} \ No newline at end of file diff --git a/annotations_filtered/snRRa2Z3DFo_filtered.json b/annotations_filtered/snRRa2Z3DFo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70109114c13f9d6ea36c92bb8d7af739049cb06a --- /dev/null +++ b/annotations_filtered/snRRa2Z3DFo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.69], [4.0, 6.66], [7.0, 10.72], [17.0, 19.47], [22.0, 25.71], [29.0, 29.67], [30.0, 30.75], [31.0, 33.51], [34.0, 34.52]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 70.3, 59.59, 98.01, 74.29, 0.0, 0.0, 31.82, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 66.14], ["music", 15.97], ["zipper (clothing)", 1.64]], null], "duration": [1.69, 2.66, 3.72, 2.47, 3.71, 0.67, 0.75, 2.51, 0.52]} \ No newline at end of file diff --git a/annotations_filtered/snTaSJk0n_Y_filtered.json b/annotations_filtered/snTaSJk0n_Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..666a01e7db43de24ded5e9dd57b3870835217a32 --- /dev/null +++ b/annotations_filtered/snTaSJk0n_Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.42], [32.0, 32.7], [39.0, 39.58], [42.0, 42.82], [49.0, 52.37], [59.0, 59.73], [62.0, 72.2], [77.0, 77.63], [79.0, 79.47], [84.0, 105.24]], "keep_status": [false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 35.75, 0.0, 31.96, 0.0, 0.0, 30.96], "audiomae_on_audioset": [null, null, null, null, [["music", 50.26], ["throbbing", 12.42], ["synthesizer", 11.98]], null, [["music", 73.42], ["musical instrument", 8.64], ["synthesizer", 3.08]], null, null, [["throbbing", 26.52], ["cacophony", 17.99], ["music", 17.37]]], "duration": [0.42, 0.7, 0.58, 0.82, 3.37, 0.73, 10.2, 0.63, 0.47, 21.24]} \ No newline at end of file diff --git a/annotations_filtered/snTvACYp8NA_filtered.json b/annotations_filtered/snTvACYp8NA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..476fd63afdbb986a09fdd9e9628ff8f0619b3b4f --- /dev/null +++ b/annotations_filtered/snTvACYp8NA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.72], [5.0, 5.53], [6.0, 5.97], [6.0, 7.97]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [-0.28, 0.53, -0.03, 1.97]} \ No newline at end of file diff --git a/annotations_filtered/sneQ02FCals_filtered.json b/annotations_filtered/sneQ02FCals_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..91076b8ae5c912708702b432f5f3071b99e0aafb --- /dev/null +++ b/annotations_filtered/sneQ02FCals_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.93], [14.0, 21.22], [22.0, 30.55], [35.0, 35.65], [39.0, 39.39], [44.0, 44.68], [48.0, 48.41], [53.0, 54.09], [56.0, 57.82], [59.0, 59.36], [60.0, 122.18], [123.0, 123.94], [129.0, 129.56], [130.0, 133.59], [134.0, 136.61], [137.0, 137.46], [148.0, 149.23], [152.0, 152.63], [156.0, 160.07], [163.0, 163.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.58, 50.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.0, 32.48, 0.0, 0.0, 0.0, 97.92, 0.0], "audiomae_on_audioset": [null, [["music", 66.2], ["didgeridoo", 5.35], ["synthesizer", 4.49]], null, null, null, null, null, null, null, null, null, null, null, [["gong", 42.81], ["speech", 19.04], ["music", 11.03]], [["speech", 56.26], ["music", 24.03], ["boing", 4.56]], null, null, null, null, null], "duration": [1.93, 7.22, 8.55, 0.65, 0.39, 0.68, 0.41, 1.09, 1.82, 0.36, 62.18, 0.94, 0.56, 3.59, 2.61, 0.46, 1.23, 0.63, 4.07, 0.58]} \ No newline at end of file diff --git a/annotations_filtered/snqs566G_Zg_filtered.json b/annotations_filtered/snqs566G_Zg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2cccc7a4be53e0a7827f045909c06560b76eb0ab --- /dev/null +++ b/annotations_filtered/snqs566G_Zg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.3], [24.0, 24.92], [27.0, 68.12]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [0.3, 0.92, 41.12]} \ No newline at end of file diff --git a/annotations_filtered/soEFK6PSKEY_filtered.json b/annotations_filtered/soEFK6PSKEY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4d36fd586add1e89765b3f6444f8a76e37bf151a --- /dev/null +++ b/annotations_filtered/soEFK6PSKEY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.36], [13.0, 12.95], [16.0, 15.99], [19.0, 21.98], [33.0, 35.4], [35.0, 35.45], [37.0, 37.45], [41.0, 41.74], [43.0, 44.29], [45.0, 46.63], [55.0, 54.92], [56.0, 56.78], [69.0, 70.6], [74.0, 75.34], [76.0, 76.92], [79.0, 79.93], [81.0, 81.46], [86.0, 86.97], [88.0, 89.23], [104.0, 104.41], [105.0, 105.56], [109.0, 109.36], [110.0, 110.2], [115.0, 116.07], [116.0, 119.2], [122.0, 122.08]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 34.67, 37.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.3, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 58.52], ["sidetone", 18.82], ["radio", 4.39]], [["hands", 17.92], ["scratching (performance technique)", 15.01], ["music", 9.8]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.36, -0.05, -0.01, 2.98, 2.4, 0.45, 0.45, 0.74, 1.29, 1.63, -0.08, 0.78, 1.6, 1.34, 0.92, 0.93, 0.46, 0.97, 1.23, 0.41, 0.56, 0.36, 0.2, 1.07, 3.2, 0.08]} \ No newline at end of file diff --git a/annotations_filtered/soTciHbL4iA_filtered.json b/annotations_filtered/soTciHbL4iA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..44ee75ab3f71477f66991f59a016517bdee1f11a --- /dev/null +++ b/annotations_filtered/soTciHbL4iA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.35], [12.0, 12.36], [15.0, 16.14], [19.0, 19.06], [25.0, 26.25], [27.0, 27.58], [38.0, 38.58], [44.0, 44.42], [47.0, 48.27], [49.0, 50.58], [52.0, 53.49], [60.0, 60.45]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 46.2], ["frog", 6.46], ["livestock, farm animals, working animals", 4.31]], null, null, null, null, null, null, null, null, null, null, null], "duration": [3.35, 0.36, 1.14, 0.06, 1.25, 0.58, 0.58, 0.42, 1.27, 1.58, 1.49, 0.45]} \ No newline at end of file diff --git a/annotations_filtered/sohDA6TQuiE_filtered.json b/annotations_filtered/sohDA6TQuiE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f5623980d1342eef69255455ce1278bd255a584e --- /dev/null +++ b/annotations_filtered/sohDA6TQuiE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 16.01], [20.0, 28.98], [34.0, 69.8]], "keep_status": [true, true, false], "silence_prob": [30.79, 29.32, 0.0], "audiomae_on_audioset": [[["music", 33.27], ["speech", 12.61], ["throbbing", 12.58]], [["mains hum", 33.75], ["music", 16.65], ["cacophony", 15.43]], null], "duration": [10.01, 8.98, 35.8]} \ No newline at end of file diff --git a/annotations_filtered/sp0O70Q5FAQ_filtered.json b/annotations_filtered/sp0O70Q5FAQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5fb89f3269318beb8c9967758856809a08f089d4 --- /dev/null +++ b/annotations_filtered/sp0O70Q5FAQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[95.0, 95.79], [96.0, 97.66], [99.0, 107.01], [108.0, 110.25], [110.0, 113.86], [116.0, 119.87], [121.0, 121.95], [123.0, 123.84], [125.0, 125.76]], "keep_status": [false, false, true, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 44.07, 40.64, 37.67, 90.25, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["bouncing", 24.24], ["speech", 10.35], ["radio", 10.06]], [["stomach rumble", 14.69], ["horse", 6.65], ["clip-clop", 5.78]], [["fly, housefly", 24.29], ["insect", 14.14], ["speech", 10.0]], null, null, null, null], "duration": [0.79, 1.66, 8.01, 2.25, 3.86, 3.87, 0.95, 0.84, 0.76]} \ No newline at end of file diff --git a/annotations_filtered/sp2FvfOi928_filtered.json b/annotations_filtered/sp2FvfOi928_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc076f5b9760708de22384549cbd7b4ae2f18c86 --- /dev/null +++ b/annotations_filtered/sp2FvfOi928_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.67], [11.0, 12.46], [14.0, 13.93], [23.0, 25.54], [28.0, 28.7], [40.0, 40.56], [41.0, 42.63], [49.0, 51.75], [53.0, 53.32], [58.0, 58.38], [61.0, 61.08], [63.0, 62.87], [64.0, 66.97], [69.0, 72.93], [75.0, 75.14], [87.0, 87.22], [87.0, 88.4], [91.0, 92.28], [96.0, 96.18], [99.0, 99.05]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [43.0, 0.0, 0.0, 59.33, 0.0, 0.0, 0.0, 34.41, 0.0, 0.0, 0.0, 0.0, 37.33, 38.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 33.44], ["throbbing", 22.64], ["speech", 17.36]], null, null, null, null, null, null, [["music", 23.8], ["noise", 13.95], ["chuckle, chortle", 4.9]], null, null, null, null, [["squish", 10.06], ["mosquito", 9.19], ["horse", 6.97]], [["dishes, pots, and pans", 7.0], ["glass", 5.2], ["fire", 5.07]], null, null, null, null, null, null], "duration": [3.67, 1.46, -0.07, 2.54, 0.7, 0.56, 1.63, 2.75, 0.32, 0.38, 0.08, -0.13, 2.97, 3.93, 0.14, 0.22, 1.4, 1.28, 0.18, 0.05]} \ No newline at end of file diff --git a/annotations_filtered/sp4A_jU3oD0_filtered.json b/annotations_filtered/sp4A_jU3oD0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f30d3c60622eb61f51c733ad0241ee198ad5977a --- /dev/null +++ b/annotations_filtered/sp4A_jU3oD0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.79], [3.0, 3.52], [6.0, 5.68], [6.0, 7.52], [19.0, 19.77], [23.0, 23.13], [33.0, 33.61], [47.0, 46.95], [57.0, 57.38], [63.0, 63.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [-0.21, 0.52, -0.32, 1.52, 0.77, 0.13, 0.61, -0.05, 0.38, 0.26]} \ No newline at end of file diff --git a/annotations_filtered/sp8Ufx3Ej24_filtered.json b/annotations_filtered/sp8Ufx3Ej24_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d435f61853289ba6571bd6090d68d46b1b73f825 --- /dev/null +++ b/annotations_filtered/sp8Ufx3Ej24_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.98], [19.0, 20.46], [21.0, 22.28], [26.0, 27.3], [30.0, 34.52], [36.0, 36.37], [39.0, 40.96], [46.0, 47.76], [49.0, 50.4], [57.0, 58.18], [73.0, 76.3], [79.0, 80.13], [82.0, 85.51], [88.0, 88.43], [92.0, 93.06], [97.0, 100.06], [102.0, 104.82], [110.0, 111.59], [113.0, 114.4], [116.0, 119.55], [123.0, 123.4], [125.0, 125.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 98.01, 0.0, 98.93, 0.0, 0.0, 99.31, 98.73, 0.0, 0.0, 96.54, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.02, 1.46, 1.28, 1.3, 4.52, 0.37, 1.96, 1.76, 1.4, 1.18, 3.3, 1.13, 3.51, 0.43, 1.06, 3.06, 2.82, 1.59, 1.4, 3.55, 0.4, 0.29]} \ No newline at end of file diff --git a/annotations_filtered/spAkj5YYnIo_filtered.json b/annotations_filtered/spAkj5YYnIo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6383a3398f6df2e8da4578d9ebeedd1397d23547 --- /dev/null +++ b/annotations_filtered/spAkj5YYnIo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.61], [7.0, 9.15], [12.0, 14.71], [16.0, 16.85], [25.0, 26.06], [28.0, 28.65], [31.0, 32.39], [36.0, 39.8], [44.0, 58.85], [61.0, 60.94], [63.0, 62.83], [65.0, 65.64], [68.0, 71.54], [73.0, 73.55], [75.0, 76.92], [90.0, 89.82], [90.0, 90.75], [91.0, 91.5], [93.0, 93.63], [94.0, 96.77], [100.0, 101.33], [102.0, 102.81], [104.0, 104.97], [106.0, 106.46], [110.0, 109.81], [122.0, 123.09], [128.0, 129.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 85.9, 98.36, 0.0, 0.0, 0.0, 0.0, 99.99, 99.62, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.61, 2.15, 2.71, 0.85, 1.06, 0.65, 1.39, 3.8, 14.85, -0.06, -0.17, 0.64, 3.54, 0.55, 1.92, -0.18, 0.75, 0.5, 0.63, 2.77, 1.33, 0.81, 0.97, 0.46, -0.19, 1.09, 1.54]} \ No newline at end of file diff --git a/annotations_filtered/spI-9R3B6zk_filtered.json b/annotations_filtered/spI-9R3B6zk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e835d22b878918089ce068c3c80dc4ca60f0889c --- /dev/null +++ b/annotations_filtered/spI-9R3B6zk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.54], [12.0, 13.46], [16.0, 16.38], [21.0, 21.56], [25.0, 26.38], [27.0, 31.09], [32.0, 59.63], [60.0, 74.65], [78.0, 82.58], [85.0, 87.07], [88.0, 91.1], [92.0, 99.32], [100.0, 103.47], [107.0, 107.08], [108.0, 109.88]], "keep_status": [false, false, false, false, false, true, false, false, true, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 32.06, 31.04, 30.69, 29.52, 39.58, 49.27, 46.02, 44.6, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 43.28], ["speech", 21.27], ["cowbell", 5.26]], [["music", 50.07], ["speech", 33.85], ["burst, pop", 1.65]], [["music", 74.51], ["speech", 16.8], ["boing", 2.33]], [["music", 55.34], ["dubstep", 6.83], ["groan", 4.51]], [["speech", 20.44], ["music", 14.78], ["hum", 10.73]], [["music", 41.8], ["speech", 17.7], ["foghorn", 11.43]], [["music", 63.64], ["synthesizer", 6.72], ["throbbing", 3.42]], [["music", 47.13], ["theremin", 5.41], ["synthesizer", 3.48]], null, null], "duration": [1.54, 1.46, 0.38, 0.56, 1.38, 4.09, 27.63, 14.65, 4.58, 2.07, 3.1, 7.32, 3.47, 0.08, 1.88]} \ No newline at end of file diff --git a/annotations_filtered/spbfax8dOTk_filtered.json b/annotations_filtered/spbfax8dOTk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5dc500dab384d1e34ca2264d90e46a39b4a43754 --- /dev/null +++ b/annotations_filtered/spbfax8dOTk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[71.0, 83.49], [86.0, 91.81]], "keep_status": [true, true], "silence_prob": [43.79, 37.14], "audiomae_on_audioset": [[["hum", 25.36], ["music", 19.01], ["speech", 18.14]], [["buzz", 37.5], ["hum", 16.12], ["music", 14.73]]], "duration": [12.49, 5.81]} \ No newline at end of file diff --git a/annotations_filtered/spwoWkSEmsE_filtered.json b/annotations_filtered/spwoWkSEmsE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a7801d1437f6b392c73b04e28d339a9bccc95a7 --- /dev/null +++ b/annotations_filtered/spwoWkSEmsE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.08], [5.0, 6.91], [8.0, 9.46], [10.0, 10.47], [11.0, 12.78], [15.0, 17.0], [18.0, 19.36], [20.0, 21.56], [23.0, 23.4], [25.0, 25.81], [33.0, 33.56], [36.0, 37.13], [41.0, 40.95], [42.0, 43.12], [44.0, 45.5], [46.0, 47.56], [48.0, 50.11], [53.0, 53.92]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 40.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.4, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 29.52], ["music", 12.19], ["singing bowl", 6.52]], null, null, null, null, null, null, null, null, null, null, [["speech", 23.77], ["moo", 8.99], ["inside, small room", 6.7]], null], "duration": [1.08, 1.91, 1.46, 0.47, 1.78, 2.0, 1.36, 1.56, 0.4, 0.81, 0.56, 1.13, -0.05, 1.12, 1.5, 1.56, 2.11, 0.92]} \ No newline at end of file diff --git a/annotations_filtered/spy6L78o3-A_filtered.json b/annotations_filtered/spy6L78o3-A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..691065ca956998c0c255b51d6beb166e9ead9923 --- /dev/null +++ b/annotations_filtered/spy6L78o3-A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 32.19], [39.0, 43.38], [48.0, 49.2], [51.0, 51.81], [64.0, 65.08], [67.0, 76.52], [82.0, 84.5], [89.0, 111.0], [120.0, 125.15], [131.0, 132.17], [134.0, 136.63], [137.0, 138.84], [148.0, 154.84], [157.0, 158.06], [161.0, 189.31]], "keep_status": [false, false, false, false, false, false, true, true, true, false, false, false, true, false, true], "silence_prob": [30.89, 31.56, 0.0, 0.0, 0.0, 29.87, 29.39, 28.69, 30.64, 0.0, 30.54, 0.0, 31.77, 0.0, 28.69], "audiomae_on_audioset": [[["music", 80.78], ["electronic music", 2.58], ["boing", 1.68]], [["music", 45.27], ["speech", 28.88], ["fart", 8.24]], null, null, null, [["speech", 56.43], ["music", 7.5], ["vehicle", 6.6]], [["music", 22.91], ["sound effect", 6.74], ["siren", 5.37]], [["music", 33.01], ["speech", 15.36], ["livestock, farm animals, working animals", 8.67]], [["music", 37.8], ["vehicle", 9.14], ["buzz", 7.39]], null, [["music", 58.37], ["speech", 23.74], ["electronic music", 4.08]], null, [["music", 42.26], ["vehicle", 12.29], ["car", 9.46]], null, [["music", 31.64], ["vehicle", 18.09], ["car", 9.64]]], "duration": [3.19, 4.38, 1.2, 0.81, 1.08, 9.52, 2.5, 22.0, 5.15, 1.17, 2.63, 1.84, 6.84, 1.06, 28.31]} \ No newline at end of file diff --git a/annotations_filtered/sqLiTaVHPdo_filtered.json b/annotations_filtered/sqLiTaVHPdo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1ae4c2e2c6546199c6398dc6107283bb213ab40 --- /dev/null +++ b/annotations_filtered/sqLiTaVHPdo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.8], [17.0, 18.42], [19.0, 19.95], [21.0, 21.2], [46.0, 45.91], [48.0, 49.17], [51.0, 51.98], [53.0, 55.61], [62.0, 61.64], [71.0, 71.78], [73.0, 73.9], [74.0, 76.79], [91.0, 91.44], [95.0, 95.18], [100.0, 100.47], [103.0, 103.06], [104.0, 105.06], [106.0, 106.86], [108.0, 108.5], [110.0, 110.1], [119.0, 119.25], [120.0, 121.19], [156.0, 156.84], [157.0, 157.96]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.37, 0.0, 0.0, 0.0, 40.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 26.14], ["creak", 7.73], ["guitar", 4.11]], null, null, null, [["music", 57.15], ["speech", 23.69], ["synthesizer", 3.25]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.8, 1.42, 0.95, 0.2, -0.09, 1.17, 0.98, 2.61, -0.36, 0.78, 0.9, 2.79, 0.44, 0.18, 0.47, 0.06, 1.06, 0.86, 0.5, 0.1, 0.25, 1.19, 0.84, 0.96]} \ No newline at end of file diff --git a/annotations_filtered/sqZ6ZrVIemM_filtered.json b/annotations_filtered/sqZ6ZrVIemM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0507902286e69fcf0f8e131882b00a4ea99710c1 --- /dev/null +++ b/annotations_filtered/sqZ6ZrVIemM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.21], [13.0, 19.2], [37.0, 46.3], [47.0, 49.4], [50.0, 54.41], [55.0, 62.87], [63.0, 63.59], [64.0, 67.29], [73.0, 89.26], [90.0, 90.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [96.04, 97.43, 99.4, 96.04, 98.51, 98.86, 0.0, 99.16, 89.9, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [2.21, 6.2, 9.3, 2.4, 4.41, 7.87, 0.59, 3.29, 16.26, 0.15]} \ No newline at end of file diff --git a/annotations_filtered/sqhPvOlgzjo_filtered.json b/annotations_filtered/sqhPvOlgzjo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..499373a273b12bfad660cf0e2c373dd0c0a079bb --- /dev/null +++ b/annotations_filtered/sqhPvOlgzjo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.78], [5.0, 6.37], [15.0, 16.26], [18.0, 19.45], [21.0, 23.01], [24.0, 26.03], [28.0, 30.81], [32.0, 33.79], [34.0, 72.03], [73.0, 92.62], [94.0, 129.37], [130.0, 131.63], [132.0, 131.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.97, 100.0, 99.95, 0.0, 0.0, 99.85, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.78, 1.37, 1.26, 1.45, 2.01, 2.03, 2.81, 1.79, 38.03, 19.62, 35.37, 1.63, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/sqmzvduQ-JY_filtered.json b/annotations_filtered/sqmzvduQ-JY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd485e93e9d3ef1aa6820a9e20dd1eb4f0916040 --- /dev/null +++ b/annotations_filtered/sqmzvduQ-JY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.81], [2.0, 4.02], [5.0, 6.05], [8.0, 8.63], [10.0, 10.23], [11.0, 11.38], [13.0, 14.66], [15.0, 15.4], [17.0, 18.13], [20.0, 23.21], [25.0, 25.54], [29.0, 28.65], [31.0, 30.97], [32.0, 32.44], [34.0, 33.96], [35.0, 35.8], [37.0, 39.73], [42.0, 42.77], [45.0, 46.67], [50.0, 49.72], [51.0, 52.17], [52.0, 57.32], [59.0, 61.65], [64.0, 65.21], [69.0, 76.1], [79.0, 88.82], [90.0, 95.54], [97.0, 99.08], [103.0, 103.25], [104.0, 104.19], [105.0, 105.68], [108.0, 109.26], [110.0, 111.15], [114.0, 114.52], [115.0, 116.31], [117.0, 118.07], [119.0, 123.5], [124.0, 126.32], [129.0, 130.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 46.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.77, 0.0, 0.0, 0.0, 0.0, 35.37, 99.98, 0.0, 99.8, 70.3, 88.83, 99.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.87, 48.74, 0.0], "audiomae_on_audioset": [null, [["sidetone", 86.13], ["dial tone", 4.52], ["speech", 3.12]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 16.84], ["speech", 15.41], ["explosion", 10.58]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 55.53], ["speech", 28.55], ["busy signal", 2.05]], null], "duration": [0.81, 2.02, 1.05, 0.63, 0.23, 0.38, 1.66, 0.4, 1.13, 3.21, 0.54, -0.35, -0.03, 0.44, -0.04, 0.8, 2.73, 0.77, 1.67, -0.28, 1.17, 5.32, 2.65, 1.21, 7.1, 9.82, 5.54, 2.08, 0.25, 0.19, 0.68, 1.26, 1.15, 0.52, 1.31, 1.07, 4.5, 2.32, 1.54]} \ No newline at end of file diff --git a/annotations_filtered/srDyToPqozI_filtered.json b/annotations_filtered/srDyToPqozI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec7aca847dcf1bcaa073e1d7b80dcc3e04258109 --- /dev/null +++ b/annotations_filtered/srDyToPqozI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 82.43], [87.0, 97.9], [99.0, 125.54]], "keep_status": [false, false, false], "silence_prob": [0.0, 32.12, 32.68], "audiomae_on_audioset": [null, [["music", 58.13], ["throbbing", 8.69], ["drum machine", 5.19]], [["music", 46.26], ["hum", 21.79], ["throbbing", 11.7]]], "duration": [73.43, 10.9, 26.54]} \ No newline at end of file diff --git a/annotations_filtered/srLwGlDe598_filtered.json b/annotations_filtered/srLwGlDe598_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..08bdf809154a8c53315ce90216405e34972241a2 --- /dev/null +++ b/annotations_filtered/srLwGlDe598_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.58], [5.0, 7.37], [15.0, 15.58], [18.0, 19.95], [21.0, 31.11], [33.0, 36.48], [41.0, 41.64], [46.0, 46.04], [48.0, 47.83], [49.0, 78.95], [80.0, 87.29], [89.0, 122.72]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 60.32, 0.0, 0.0, 39.75, 62.78, 0.0, 0.0, 0.0, 41.26, 51.66, 0.0], "audiomae_on_audioset": [null, null, null, null, [["buzz", 12.63], ["glass", 12.02], ["explosion", 7.85]], null, null, null, null, [["telephone dialing, dtmf", 25.76], ["speech", 11.86], ["sidetone", 6.88]], null, null], "duration": [0.58, 2.37, 0.58, 1.95, 10.11, 3.48, 0.64, 0.04, -0.17, 29.95, 7.29, 33.72]} \ No newline at end of file diff --git a/annotations_filtered/srR56T9-j5M_filtered.json b/annotations_filtered/srR56T9-j5M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..29fb298f2b2f235bc4b92efe7e523fd001e50b02 --- /dev/null +++ b/annotations_filtered/srR56T9-j5M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 30.23], [34.0, 34.5], [36.0, 38.8], [56.0, 56.93], [59.0, 59.81], [64.0, 64.39], [69.0, 70.06], [75.0, 77.36], [81.0, 82.68], [91.0, 99.4], [110.0, 110.27], [113.0, 117.71], [123.0, 124.28]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [35.63, 0.0, 33.39, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 44.12, 0.0, 30.16, 0.0], "audiomae_on_audioset": [[["music", 42.29], ["musical instrument", 11.59], ["speech", 11.24]], null, [["music", 41.49], ["synthesizer", 11.37], ["echo", 8.36]], null, null, null, null, null, null, [["music", 70.04], ["theremin", 3.77], ["didgeridoo", 3.45]], null, [["music", 79.83], ["didgeridoo", 6.44], ["musical instrument", 1.59]], null], "duration": [2.23, 0.5, 2.8, 0.93, 0.81, 0.39, 1.06, 2.36, 1.68, 8.4, 0.27, 4.71, 1.28]} \ No newline at end of file diff --git a/annotations_filtered/srpCm9gPmZI_filtered.json b/annotations_filtered/srpCm9gPmZI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6e410ab4136d6b37d2f61c3e0cec94ccd9854704 --- /dev/null +++ b/annotations_filtered/srpCm9gPmZI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.16], [5.0, 5.88], [7.0, 8.68], [9.0, 9.58], [10.0, 10.13], [12.0, 12.97], [14.0, 32.8], [34.0, 36.56], [41.0, 52.95], [53.0, 53.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 27.91, 27.95, 27.94, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 75.93], ["electronic music", 3.72], ["drum machine", 3.53]], [["music", 67.92], ["dubstep", 2.97], ["echo", 2.71]], [["music", 88.79], ["electronic music", 1.3], ["funk", 0.94]], null], "duration": [0.16, 0.88, 1.68, 0.58, 0.13, 0.97, 18.8, 2.56, 11.95, 0.2]} \ No newline at end of file diff --git a/annotations_filtered/ssgm3-sCY-Y_filtered.json b/annotations_filtered/ssgm3-sCY-Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..432f61a404cb4a080dff940a6e6125df84c5c446 --- /dev/null +++ b/annotations_filtered/ssgm3-sCY-Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.13], [4.0, 5.41], [7.0, 7.33], [12.0, 17.1], [22.0, 93.99], [94.0, 103.91]], "keep_status": [false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 40.02, 0.0, 30.35], "audiomae_on_audioset": [null, null, null, [["music", 41.51], ["hum", 18.87], ["throbbing", 8.5]], null, [["music", 29.63], ["theremin", 26.61], ["hum", 17.11]]], "duration": [1.13, 1.41, 0.33, 5.1, 71.99, 9.91]} \ No newline at end of file diff --git a/annotations_filtered/ssukL9a99JA_filtered.json b/annotations_filtered/ssukL9a99JA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3c50bce3e9793751d7ffbd32fbe72b3bbe53ea8f --- /dev/null +++ b/annotations_filtered/ssukL9a99JA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.65], [8.0, 8.36], [10.0, 11.79], [13.0, 14.4], [15.0, 18.81], [20.0, 20.56], [21.0, 22.28], [23.0, 23.3], [25.0, 25.49], [27.0, 27.09], [33.0, 35.65], [39.0, 39.72], [40.0, 40.8], [42.0, 43.93], [47.0, 47.56], [50.0, 51.87], [55.0, 55.43], [59.0, 59.64], [60.0, 60.4], [61.0, 61.4], [62.0, 62.8], [66.0, 67.8], [69.0, 75.69], [77.0, 80.57], [83.0, 82.65], [84.0, 85.24], [86.0, 87.12], [88.0, 90.02], [98.0, 99.33], [101.0, 101.04], [106.0, 106.39], [107.0, 109.11], [111.0, 113.0], [114.0, 116.23], [120.0, 122.69], [125.0, 125.39], [126.0, 126.59], [128.0, 131.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 76.53, 0.0, 0.0, 0.0, 0.0, 0.0, 99.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.57, 99.9, 0.0, 0.0, 0.0, 63.74, 0.0, 0.0, 0.0, 93.29, 89.19, 77.2, 99.95, 0.0, 0.0, 73.67], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.65, 0.36, 1.79, 1.4, 3.81, 0.56, 1.28, 0.3, 0.49, 0.09, 2.65, 0.72, 0.8, 1.93, 0.56, 1.87, 0.43, 0.64, 0.4, 0.4, 0.8, 1.8, 6.69, 3.57, -0.35, 1.24, 1.12, 2.02, 1.33, 0.04, 0.39, 2.11, 2.0, 2.23, 2.69, 0.39, 0.59, 3.23]} \ No newline at end of file diff --git a/annotations_filtered/ssxqmxjrx2c_filtered.json b/annotations_filtered/ssxqmxjrx2c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f51f05e52e79c71db7bb3b512dd26a0c5430b19 --- /dev/null +++ b/annotations_filtered/ssxqmxjrx2c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.83], [21.0, 21.09], [36.0, 38.53], [40.0, 41.49], [45.0, 46.57], [50.0, 50.25], [51.0, 51.19], [55.0, 55.39], [58.0, 59.17], [60.0, 59.78], [63.0, 65.2], [67.0, 67.59], [69.0, 69.96], [79.0, 80.79], [90.0, 90.31], [91.0, 91.35], [97.0, 96.87], [101.0, 102.81], [105.0, 107.7], [113.0, 113.59], [115.0, 116.01], [117.0, 118.08], [119.0, 125.12], [126.0, 131.11], [131.0, 134.3], [135.0, 136.32], [143.0, 144.29], [145.0, 147.55], [151.0, 152.56], [154.0, 154.16], [154.0, 156.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 38.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.97, 0.0, 0.0, 0.0, 75.88, 52.33, 33.12, 0.0, 0.0, 56.1, 0.0, 0.0, 34.47], "audiomae_on_audioset": [null, null, [["speech", 79.56], ["sidetone", 6.82], ["dial tone", 5.4]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 66.91], ["dial tone", 4.89], ["busy signal", 4.82]], null, null, null, null, null, [["music", 10.8], ["synthesizer", 8.48], ["throbbing", 8.22]]], "duration": [0.83, 0.09, 2.53, 1.49, 1.57, 0.25, 0.19, 0.39, 1.17, -0.22, 2.2, 0.59, 0.96, 1.79, 0.31, 0.35, -0.13, 1.81, 2.7, 0.59, 1.01, 1.08, 6.12, 5.11, 3.3, 1.32, 1.29, 2.55, 1.56, 0.16, 2.15]} \ No newline at end of file diff --git a/annotations_filtered/st8QRZbJdPY_filtered.json b/annotations_filtered/st8QRZbJdPY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e17d1db1ce1084b7f831cb1dd13f8a04f1ca6e1 --- /dev/null +++ b/annotations_filtered/st8QRZbJdPY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.31], [13.0, 21.69], [22.0, 22.76], [24.0, 24.38], [26.0, 26.38], [33.0, 33.71], [35.0, 35.75], [36.0, 37.79], [40.0, 42.74], [43.0, 43.7], [45.0, 44.9], [49.0, 50.13], [52.0, 52.46], [55.0, 55.53], [56.0, 57.06], [58.0, 59.83], [62.0, 64.37], [65.0, 66.16], [68.0, 69.87], [72.0, 73.58], [75.0, 76.71], [79.0, 80.18], [81.0, 81.92], [83.0, 83.42], [84.0, 85.28], [86.0, 87.32], [88.0, 91.79], [93.0, 93.92], [96.0, 97.39], [98.0, 99.32], [101.0, 101.76], [103.0, 103.49], [104.0, 105.29], [107.0, 123.65], [126.0, 126.37], [127.0, 127.74], [129.0, 130.13], [132.0, 147.06], [149.0, 148.76], [149.0, 149.71], [152.0, 158.09], [160.0, 161.27], [162.0, 164.34], [165.0, 166.92], [168.0, 170.99], [176.0, 176.76], [188.0, 188.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 82.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.8, 0.0, 0.0, 0.0, 70.3, 0.0, 0.0, 87.92, 0.0, 99.84, 0.0, 99.52, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.31, 8.69, 0.76, 0.38, 0.38, 0.71, 0.75, 1.79, 2.74, 0.7, -0.1, 1.13, 0.46, 0.53, 1.06, 1.83, 2.37, 1.16, 1.87, 1.58, 1.71, 1.18, 0.92, 0.42, 1.28, 1.32, 3.79, 0.92, 1.39, 1.32, 0.76, 0.49, 1.29, 16.65, 0.37, 0.74, 1.13, 15.06, -0.24, 0.71, 6.09, 1.27, 2.34, 1.92, 2.99, 0.76, 0.32]} \ No newline at end of file diff --git a/annotations_filtered/stSweLZol7U_filtered.json b/annotations_filtered/stSweLZol7U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d17a0193cb3a2d878c91f98cade7740c39242d0b --- /dev/null +++ b/annotations_filtered/stSweLZol7U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 21.56], [25.0, 25.49], [29.0, 35.78], [38.0, 41.59], [44.0, 44.76], [48.0, 48.84], [51.0, 55.92], [66.0, 70.39], [74.0, 78.8], [83.0, 83.93], [86.0, 86.22], [89.0, 98.79], [105.0, 110.69], [112.0, 115.37], [116.0, 117.73], [118.0, 121.2], [123.0, 126.62], [128.0, 135.94], [137.0, 140.48], [141.0, 142.5], [145.0, 146.21], [147.0, 148.68], [152.0, 155.95], [157.0, 160.24], [162.0, 162.95]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, true, true, false, true, false, false, false, false, false, false], "silence_prob": [75.07, 0.0, 75.39, 67.89, 0.0, 0.0, 43.48, 85.54, 79.07, 0.0, 0.0, 79.24, 62.17, 39.37, 0.0, 41.64, 44.63, 40.47, 39.64, 0.0, 0.0, 0.0, 32.15, 33.2, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["hum", 10.94], ["noise", 8.9], ["speech", 8.14]], null, null, null, null, null, null, [["hum", 39.46], ["music", 16.92], ["mains hum", 11.92]], null, [["music", 49.82], ["musical instrument", 8.24], ["didgeridoo", 4.04]], [["music", 31.91], ["hum", 20.75], ["throbbing", 10.12]], [["music", 54.07], ["hum", 13.09], ["throbbing", 6.07]], [["didgeridoo", 40.28], ["music", 12.75], ["throbbing", 5.52]], null, null, null, [["music", 52.18], ["didgeridoo", 22.52], ["musical instrument", 6.66]], [["music", 63.44], ["speech", 11.52], ["guitar", 8.11]], null], "duration": [3.56, 0.49, 6.78, 3.59, 0.76, 0.84, 4.92, 4.39, 4.8, 0.93, 0.22, 9.79, 5.69, 3.37, 1.73, 3.2, 3.62, 7.94, 3.48, 1.5, 1.21, 1.68, 3.95, 3.24, 0.95]} \ No newline at end of file diff --git a/annotations_filtered/stelirVdNdI_filtered.json b/annotations_filtered/stelirVdNdI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1413849ed9af5142bafe1184fae1c1b81b5c8647 --- /dev/null +++ b/annotations_filtered/stelirVdNdI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 26.11], [27.0, 27.89], [29.0, 29.94], [31.0, 32.07], [35.0, 47.04], [50.0, 50.14], [52.0, 51.7], [61.0, 63.17], [70.0, 70.83], [91.0, 91.07], [98.0, 98.37], [103.0, 107.32], [108.0, 108.72], [114.0, 114.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [74.44, 0.0, 0.0, 0.0, 33.49, 0.0, 0.0, 38.97, 0.0, 0.0, 0.0, 52.05, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 46.58], ["sidetone", 22.89], ["speech", 13.65]], null, null, [["speech", 42.29], ["sidetone", 26.28], ["hum", 7.2]], null, null, null, null, null, null], "duration": [4.11, 0.89, 0.94, 1.07, 12.04, 0.14, -0.3, 2.17, 0.83, 0.07, 0.37, 4.32, 0.72, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/stoxd02ubG4_filtered.json b/annotations_filtered/stoxd02ubG4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..68c4120e5f7ad10aeb78b16e9ceaf58d2dcf8d50 --- /dev/null +++ b/annotations_filtered/stoxd02ubG4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.36], [9.0, 10.03], [16.0, 17.09], [19.0, 21.14], [23.0, 23.85], [25.0, 27.08], [28.0, 29.46], [33.0, 43.41], [45.0, 49.03], [53.0, 53.76], [56.0, 65.45], [67.0, 80.06], [82.0, 82.14], [83.0, 84.2], [85.0, 85.13], [86.0, 86.61], [87.0, 88.75], [90.0, 91.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 87.37, 0.0, 97.0, 0.0, 53.59, 83.7, 0.0, 76.53, 98.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.36, 1.03, 1.09, 2.14, 0.85, 2.08, 1.46, 10.41, 4.03, 0.76, 9.45, 13.06, 0.14, 1.2, 0.13, 0.61, 1.75, 1.03]} \ No newline at end of file diff --git a/annotations_filtered/su2njbUCQhg_filtered.json b/annotations_filtered/su2njbUCQhg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3c7102973daae3f7031471adc535f06de8929aeb --- /dev/null +++ b/annotations_filtered/su2njbUCQhg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.18], [28.0, 29.13], [30.0, 31.38], [32.0, 38.11], [48.0, 48.68], [50.0, 51.07], [54.0, 53.81]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 36.99, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["cattle, bovinae", 52.12], ["moo", 27.27], ["livestock, farm animals, working animals", 17.28]], null, null, null], "duration": [0.18, 1.13, 1.38, 6.11, 0.68, 1.07, -0.19]} \ No newline at end of file diff --git a/annotations_filtered/su64KIPecuo_filtered.json b/annotations_filtered/su64KIPecuo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4a0f91745e1a727017396764e1a70b49d76abcc7 --- /dev/null +++ b/annotations_filtered/su64KIPecuo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 26.7], [28.0, 27.78], [28.0, 29.35], [30.0, 31.28], [37.0, 42.33], [43.0, 44.36], [45.0, 46.35], [60.0, 59.86], [61.0, 60.89], [70.0, 70.53], [71.0, 71.51], [79.0, 86.16], [90.0, 90.63], [104.0, 104.46], [105.0, 106.51], [115.0, 117.32]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 45.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.24, 0.0, 0.0, 0.0, 40.12], "audiomae_on_audioset": [null, null, null, null, [["music", 10.03], ["sonar", 8.14], ["telephone", 7.26]], null, null, null, null, null, null, [["fly, housefly", 33.21], ["bee, wasp, etc.", 28.23], ["insect", 11.62]], null, null, null, [["speech", 13.28], ["hum", 8.17], ["vehicle", 4.95]]], "duration": [-0.3, -0.22, 1.35, 1.28, 5.33, 1.36, 1.35, -0.14, -0.11, 0.53, 0.51, 7.16, 0.63, 0.46, 1.51, 2.32]} \ No newline at end of file diff --git a/annotations_filtered/suYDvQwikn4_filtered.json b/annotations_filtered/suYDvQwikn4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4035668dd8b2267386983a825d9a75c432b95cf7 --- /dev/null +++ b/annotations_filtered/suYDvQwikn4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.95], [15.0, 16.14], [19.0, 20.07], [22.0, 23.21], [27.0, 28.93], [31.0, 40.88], [45.0, 49.01], [53.0, 55.34], [57.0, 66.07], [68.0, 68.49], [72.0, 89.04], [91.0, 91.72], [94.0, 94.56], [97.0, 110.51], [111.0, 114.69], [121.0, 130.28], [133.0, 133.88], [136.0, 141.1], [143.0, 152.15], [153.0, 155.26], [158.0, 161.81], [163.0, 174.31], [174.0, 175.15], [176.0, 176.4], [177.0, 177.62]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 32.81, 66.51, 70.44, 28.76, 0.0, 40.71, 0.0, 0.0, 46.97, 57.25, 49.78, 0.0, 33.88, 30.36, 51.12, 54.3, 37.69, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["whack, thwack", 39.2], ["speech", 31.93], ["thunk", 17.59]], null, null, [["speech", 34.73], ["music", 27.94], ["drum", 5.75]], null, [["music", 67.93], ["speech", 15.99], ["synthesizer", 2.18]], null, null, [["music", 57.47], ["throbbing", 12.02], ["hum", 10.77]], null, [["music", 62.64], ["synthesizer", 5.82], ["hum", 2.6]], null, [["music", 32.15], ["hum", 21.14], ["mains hum", 14.16]], [["throbbing", 39.54], ["music", 33.76], ["hum", 5.73]], null, null, [["fart", 23.45], ["music", 20.15], ["hum", 9.39]], null, null, null], "duration": [0.95, 1.14, 1.07, 1.21, 1.93, 9.88, 4.01, 2.34, 9.07, 0.49, 17.04, 0.72, 0.56, 13.51, 3.69, 9.28, 0.88, 5.1, 9.15, 2.26, 3.81, 11.31, 1.15, 0.4, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/sua9tcQ14hs_filtered.json b/annotations_filtered/sua9tcQ14hs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/sua9tcQ14hs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/suvJai5IC6c_filtered.json b/annotations_filtered/suvJai5IC6c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad76f3c8f0a97cd3a1be32be0aa8a83260ca0b2d --- /dev/null +++ b/annotations_filtered/suvJai5IC6c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.55], [19.0, 19.28], [22.0, 23.3], [26.0, 26.37], [34.0, 34.45], [39.0, 40.39], [42.0, 43.01], [50.0, 50.45], [51.0, 51.44], [52.0, 52.44], [52.0, 52.96], [58.0, 59.1], [60.0, 59.98], [67.0, 67.64], [69.0, 69.36], [78.0, 79.54], [85.0, 85.51], [93.0, 93.04], [94.0, 94.24], [111.0, 112.67], [113.0, 115.5], [118.0, 118.71], [121.0, 121.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.98, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.55, 0.28, 1.3, 0.37, 0.45, 1.39, 1.01, 0.45, 0.44, 0.44, 0.96, 1.1, -0.02, 0.64, 0.36, 1.54, 0.51, 0.04, 0.24, 1.67, 2.5, 0.71, 0.31]} \ No newline at end of file diff --git a/annotations_filtered/sv9XNFpRdhg_filtered.json b/annotations_filtered/sv9XNFpRdhg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..daf79d8580013348e4e6a9b1110afb243d370503 --- /dev/null +++ b/annotations_filtered/sv9XNFpRdhg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.46], [13.0, 12.68], [20.0, 22.42], [37.0, 37.0], [42.0, 44.49], [45.0, 49.71], [51.0, 53.15], [55.0, 55.19], [56.0, 57.92], [60.0, 62.45], [63.0, 64.94], [69.0, 71.86], [73.0, 75.14], [80.0, 81.13], [82.0, 83.52], [85.0, 85.21], [87.0, 87.84], [89.0, 90.17], [93.0, 94.91], [96.0, 98.24], [100.0, 99.94], [105.0, 106.74], [108.0, 109.73], [112.0, 112.72], [118.0, 118.4], [119.0, 121.05], [123.0, 123.8], [126.0, 127.09], [129.0, 130.77], [132.0, 131.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 50.11, 0.0, 100.0, 95.09, 100.0, 0.0, 0.0, 100.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.46, -0.32, 2.42, 0.0, 2.49, 4.71, 2.15, 0.19, 1.92, 2.45, 1.94, 2.86, 2.14, 1.13, 1.52, 0.21, 0.84, 1.17, 1.91, 2.24, -0.06, 1.74, 1.73, 0.72, 0.4, 2.05, 0.8, 1.09, 1.77, -0.28]} \ No newline at end of file diff --git a/annotations_filtered/svBPXPXgpqc_filtered.json b/annotations_filtered/svBPXPXgpqc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fde25114764e6b770ca832559876c692c98e02a1 --- /dev/null +++ b/annotations_filtered/svBPXPXgpqc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.41], [15.0, 21.95], [24.0, 31.01], [32.0, 32.44], [34.0, 42.08], [43.0, 44.51], [46.0, 46.08], [48.0, 48.52], [51.0, 52.32], [53.0, 73.6], [74.0, 99.18]], "keep_status": [false, false, true, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 43.64, 46.83, 0.0, 84.25, 0.0, 0.0, 0.0, 0.0, 35.25, 32.38], "audiomae_on_audioset": [null, [["music", 69.66], ["pizzicato", 3.62], ["musical instrument", 3.52]], [["music", 22.63], ["livestock, farm animals, working animals", 14.33], ["cattle, bovinae", 12.72]], null, null, null, null, null, null, [["music", 38.35], ["speech", 25.65], ["basketball bounce", 4.68]], [["whack, thwack", 15.09], ["music", 14.11], ["livestock, farm animals, working animals", 12.37]]], "duration": [1.41, 6.95, 7.01, 0.44, 8.08, 1.51, 0.08, 0.52, 1.32, 20.6, 25.18]} \ No newline at end of file diff --git a/annotations_filtered/svXObgE9fXc_filtered.json b/annotations_filtered/svXObgE9fXc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ff194b30a25c348b64ed5e4cb545fe27a48b291e --- /dev/null +++ b/annotations_filtered/svXObgE9fXc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 35.9], [36.0, 64.15], [67.0, 87.51], [89.0, 88.97], [90.0, 96.9]], "keep_status": [false, false, true, false, true], "silence_prob": [28.54, 28.28, 28.48, 0.0, 28.3], "audiomae_on_audioset": [[["music", 35.36], ["speech", 29.85], ["hum", 11.14]], [["music", 72.76], ["meow", 7.69], ["whack, thwack", 3.21]], [["music", 22.67], ["throbbing", 18.65], ["mains hum", 14.16]], null, [["music", 24.48], ["speech", 17.04], ["mains hum", 13.12]]], "duration": [7.9, 28.15, 20.51, -0.03, 6.9]} \ No newline at end of file diff --git a/annotations_filtered/svwcgrDZVPw_filtered.json b/annotations_filtered/svwcgrDZVPw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ba508c9c66f2d5c724295f24bce070d68806956 --- /dev/null +++ b/annotations_filtered/svwcgrDZVPw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.46], [5.0, 9.14], [48.0, 57.94], [90.0, 90.27], [103.0, 102.81], [105.0, 107.47], [111.0, 111.42], [117.0, 117.68], [124.0, 123.7], [140.0, 139.97], [141.0, 157.37], [160.0, 164.59], [170.0, 170.48], [174.0, 176.07], [179.0, 180.3], [181.0, 183.93], [185.0, 189.4], [190.0, 192.62], [193.0, 195.39], [196.0, 197.34]], "keep_status": [false, false, true, false, false, true, false, false, false, false, true, false, false, false, false, true, true, true, false, false], "silence_prob": [0.0, 35.71, 47.54, 0.0, 0.0, 39.5, 0.0, 0.0, 0.0, 0.0, 31.75, 58.64, 0.0, 53.16, 0.0, 33.6, 32.97, 46.5, 79.94, 0.0], "audiomae_on_audioset": [null, [["music", 62.8], ["theremin", 15.62], ["musical instrument", 3.59]], [["music", 36.38], ["effects unit", 8.98], ["musical instrument", 6.9]], null, null, [["music", 16.48], ["boing", 8.56], ["speech", 7.48]], null, null, null, null, [["music", 39.55], ["noise", 18.1], ["cacophony", 5.25]], null, null, null, null, [["music", 18.71], ["speech", 15.33], ["cattle, bovinae", 14.35]], [["music", 46.76], ["speech", 11.37], ["trombone", 2.22]], [["speech", 31.15], ["music", 22.28], ["gong", 5.35]], null, null], "duration": [0.46, 4.14, 9.94, 0.27, -0.19, 2.47, 0.42, 0.68, -0.3, -0.03, 16.37, 4.59, 0.48, 2.07, 1.3, 2.93, 4.4, 2.62, 2.39, 1.34]} \ No newline at end of file diff --git a/annotations_filtered/svytEWJK6Qk_filtered.json b/annotations_filtered/svytEWJK6Qk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ca49feee9f2dda3926c7193948998cfb27365c3 --- /dev/null +++ b/annotations_filtered/svytEWJK6Qk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.48], [24.0, 24.16], [32.0, 32.29], [33.0, 33.57], [34.0, 34.08], [39.0, 40.37], [52.0, 52.83], [58.0, 61.15], [64.0, 66.07], [67.0, 67.8], [74.0, 75.0], [89.0, 89.58], [124.0, 125.56], [144.0, 144.54], [155.0, 156.02], [157.0, 159.58], [161.0, 162.97], [164.0, 163.9], [164.0, 164.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.29, 61.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.21, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.48, 0.16, 0.29, 0.57, 0.08, 1.37, 0.83, 3.15, 2.07, 0.8, 1.0, 0.58, 1.56, 0.54, 1.02, 2.58, 1.97, -0.1, 0.64]} \ No newline at end of file diff --git a/annotations_filtered/sw-oQlitqCY_filtered.json b/annotations_filtered/sw-oQlitqCY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..346f67cea0eab32edca0f6b8615791d1220f9436 --- /dev/null +++ b/annotations_filtered/sw-oQlitqCY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.42], [9.0, 9.22], [10.0, 22.05], [23.0, 23.85], [25.0, 27.08], [30.0, 29.94], [33.0, 34.16], [37.0, 36.91], [38.0, 42.96], [48.0, 57.69], [61.0, 73.85], [80.0, 80.33], [83.0, 83.02], [83.0, 91.13], [96.0, 108.94], [111.0, 112.19], [116.0, 117.1]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, false, true, false, false, false], "silence_prob": [85.9, 0.0, 33.93, 0.0, 36.51, 0.0, 0.0, 0.0, 34.36, 34.98, 32.95, 0.0, 0.0, 32.41, 30.98, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 63.67], ["speech", 9.11], ["synthesizer", 6.42]], null, [["speech", 34.15], ["boing", 19.65], ["music", 17.64]], null, null, null, [["music", 28.7], ["didgeridoo", 27.03], ["boing", 10.96]], [["music", 38.22], ["livestock, farm animals, working animals", 19.82], ["boing", 8.24]], [["livestock, farm animals, working animals", 33.95], ["cattle, bovinae", 25.96], ["moo", 20.43]], null, null, [["speech", 26.86], ["groan", 24.0], ["music", 11.66]], [["music", 62.0], ["sound effect", 4.93], ["synthesizer", 3.43]], null, null], "duration": [4.42, 0.22, 12.05, 0.85, 2.08, -0.06, 1.16, -0.09, 4.96, 9.69, 12.85, 0.33, 0.02, 8.13, 12.94, 1.19, 1.1]} \ No newline at end of file diff --git a/annotations_filtered/sw1tJoYrs7M_filtered.json b/annotations_filtered/sw1tJoYrs7M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad00d4795bfcb0c6daf40f590bd419c4796d528a --- /dev/null +++ b/annotations_filtered/sw1tJoYrs7M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.22], [19.0, 20.33], [22.0, 22.84], [25.0, 24.97], [26.0, 38.85], [46.0, 46.18], [48.0, 48.22], [51.0, 51.9], [54.0, 54.89], [58.0, 58.19], [59.0, 59.21], [61.0, 61.26], [63.0, 63.95], [68.0, 69.21], [70.0, 71.68], [72.0, 73.45], [77.0, 90.41], [91.0, 92.37], [105.0, 104.75], [106.0, 106.29], [107.0, 107.81], [109.0, 109.68], [111.0, 112.4], [114.0, 129.69], [131.0, 144.02], [145.0, 146.6], [151.0, 152.0], [153.0, 153.33], [154.0, 154.21], [157.0, 158.62], [160.0, 160.34], [161.0, 182.26], [183.0, 193.33], [200.0, 200.03], [200.0, 201.55], [209.0, 210.05]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.11, 58.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.84, 34.1, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["noise", 33.18], ["vehicle", 14.83], ["aircraft", 7.62]], null, null, null, null, null, null, null, null, null, null, null, [["jet engine", 18.38], ["vehicle", 14.37], ["microwave oven", 5.22]], null, null, null, null, null, null, [["mains hum", 34.06], ["hum", 27.07], ["white noise", 11.31]], null, null, null, null, null, null, null, [["music", 50.42], ["theremin", 24.35], ["musical instrument", 6.77]], [["hum", 26.58], ["music", 25.16], ["mains hum", 10.24]], null, null, null], "duration": [1.22, 1.33, 0.84, -0.03, 12.85, 0.18, 0.22, 0.9, 0.89, 0.19, 0.21, 0.26, 0.95, 1.21, 1.68, 1.45, 13.41, 1.37, -0.25, 0.29, 0.81, 0.68, 1.4, 15.69, 13.02, 1.6, 1.0, 0.33, 0.21, 1.62, 0.34, 21.26, 10.33, 0.03, 1.55, 1.05]} \ No newline at end of file diff --git a/annotations_filtered/swEgflM5Ol4_filtered.json b/annotations_filtered/swEgflM5Ol4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41aef4ed90883fe1ae69807915177029fb1ec3b1 --- /dev/null +++ b/annotations_filtered/swEgflM5Ol4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.91], [14.0, 31.55], [32.0, 33.94], [35.0, 39.53], [41.0, 50.08], [53.0, 54.41], [70.0, 70.33], [78.0, 78.61], [83.0, 83.56], [85.0, 85.94], [87.0, 87.66], [90.0, 98.12], [100.0, 101.71], [107.0, 107.65], [109.0, 113.26], [114.0, 120.66], [121.0, 125.27], [131.0, 131.33], [132.0, 133.79], [136.0, 137.56], [142.0, 149.71], [151.0, 182.01], [184.0, 184.64], [186.0, 188.47], [192.0, 192.03], [192.0, 192.06]], "keep_status": [false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 33.54, 0.0, 48.14, 31.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.59, 0.0, 0.0, 33.92, 31.06, 30.18, 0.0, 0.0, 0.0, 33.78, 0.0, 0.0, 32.64, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 48.62], ["hum", 17.75], ["throbbing", 9.28]], null, [["hum", 21.12], ["bee, wasp, etc.", 19.93], ["mains hum", 14.67]], [["whale vocalization", 20.25], ["buzz", 16.83], ["noise", 13.78]], null, null, null, null, null, null, [["explosion", 40.25], ["artillery fire", 33.26], ["burst, pop", 8.35]], null, null, [["bee, wasp, etc.", 35.85], ["fly, housefly", 27.81], ["insect", 20.25]], [["mains hum", 27.87], ["hum", 21.96], ["speech", 19.14]], [["speech", 30.15], ["music", 11.07], ["buzz", 3.31]], null, null, null, [["animal", 21.82], ["speech", 13.29], ["hum", 7.87]], null, null, [["speech", 73.14], ["radio", 4.48], ["hum", 3.53]], null, null], "duration": [0.91, 17.55, 1.94, 4.53, 9.08, 1.41, 0.33, 0.61, 0.56, 0.94, 0.66, 8.12, 1.71, 0.65, 4.26, 6.66, 4.27, 0.33, 1.79, 1.56, 7.71, 31.01, 0.64, 2.47, 0.03, 0.06]} \ No newline at end of file diff --git a/annotations_filtered/swOuQBjbiLU_filtered.json b/annotations_filtered/swOuQBjbiLU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/swOuQBjbiLU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/swo423cXQuE_filtered.json b/annotations_filtered/swo423cXQuE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..420f8d58c4b2159ba61e81a8a64bee935d6c6404 --- /dev/null +++ b/annotations_filtered/swo423cXQuE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.99], [23.0, 29.08], [30.0, 38.4], [39.0, 39.5], [49.0, 50.62], [53.0, 54.36], [55.0, 55.29], [56.0, 78.21], [80.0, 81.57], [83.0, 83.24], [86.0, 86.36], [89.0, 89.13], [91.0, 91.39], [94.0, 96.55], [98.0, 98.59], [100.0, 100.8], [101.0, 105.76], [107.0, 107.57], [108.0, 111.7], [112.0, 117.19], [118.0, 119.43], [121.0, 124.02], [124.0, 124.73], [129.0, 129.07], [130.0, 129.93], [133.0, 134.18], [138.0, 139.78], [140.0, 140.48], [141.0, 143.04], [144.0, 144.61], [146.0, 146.1], [150.0, 155.16], [155.0, 158.18], [159.0, 159.27], [163.0, 167.98], [169.0, 173.96], [174.0, 176.93], [180.0, 182.92], [186.0, 187.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 86.27, 0.0, 100.0, 99.94, 0.0, 96.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.08, 0.0, 0.0, 99.96, 95.23, 0.0, 100.0, 70.16, 92.48, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.99, 6.08, 8.4, 0.5, 1.62, 1.36, 0.29, 22.21, 1.57, 0.24, 0.36, 0.13, 0.39, 2.55, 0.59, 0.8, 4.76, 0.57, 3.7, 5.19, 1.43, 3.02, 0.73, 0.07, -0.07, 1.18, 1.78, 0.48, 2.04, 0.61, 0.1, 5.16, 3.18, 0.27, 4.98, 4.96, 2.93, 2.92, 1.19]} \ No newline at end of file diff --git a/annotations_filtered/swpveBgb0Zs_filtered.json b/annotations_filtered/swpveBgb0Zs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..623d3705c1d70eabb2a1f7616ece4fa20ebbaf97 --- /dev/null +++ b/annotations_filtered/swpveBgb0Zs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 22.57], [25.0, 25.47], [32.0, 32.24], [34.0, 34.25]], "keep_status": [false, false, false, false], "silence_prob": [37.51, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 74.54], ["fart", 2.96], ["sidetone", 2.62]], null, null, null], "duration": [9.57, 0.47, 0.24, 0.25]} \ No newline at end of file diff --git a/annotations_filtered/sx-obtKU1jM_filtered.json b/annotations_filtered/sx-obtKU1jM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e3d128faf413d962281e978f1592a3c94aa0f19 --- /dev/null +++ b/annotations_filtered/sx-obtKU1jM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 24.87], [26.0, 33.08], [35.0, 46.48], [49.0, 80.43], [83.0, 83.59], [84.0, 85.04], [85.0, 85.08], [87.0, 97.31]], "keep_status": [true, true, false, false, false, false, false, true], "silence_prob": [30.56, 37.01, 30.22, 0.0, 0.0, 0.0, 0.0, 29.9], "audiomae_on_audioset": [[["music", 60.42], ["sound effect", 3.31], ["noise", 3.17]], [["speech", 43.33], ["fly, housefly", 9.99], ["fart", 9.03]], [["speech", 62.17], ["music", 13.6], ["didgeridoo", 6.15]], null, null, null, null, [["music", 36.52], ["synthesizer", 7.67], ["speech", 6.99]]], "duration": [19.87, 7.08, 11.48, 31.43, 0.59, 1.04, 0.08, 10.31]} \ No newline at end of file diff --git a/annotations_filtered/sxNHNxmgzJU_filtered.json b/annotations_filtered/sxNHNxmgzJU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..83f980477fb650da11fb53366a85f862071406da --- /dev/null +++ b/annotations_filtered/sxNHNxmgzJU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.33], [10.0, 22.17], [25.0, 26.64], [27.0, 42.89], [44.0, 51.38], [54.0, 57.23], [59.0, 60.84], [62.0, 63.04], [65.0, 65.8], [67.0, 70.41], [71.0, 72.59], [76.0, 76.76], [77.0, 81.78], [83.0, 89.28], [90.0, 92.33], [93.0, 96.92], [98.0, 100.26], [105.0, 107.77], [109.0, 114.57], [117.0, 121.56], [123.0, 127.52], [128.0, 130.22], [131.0, 139.97], [140.0, 140.0], [140.0, 168.76]], "keep_status": [false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 38.43, 0.0, 43.43, 37.95, 34.27, 0.0, 0.0, 0.0, 54.23, 0.0, 0.0, 59.24, 77.36, 60.14, 63.74, 70.02, 62.17, 55.31, 58.98, 59.59, 42.39, 61.37, 0.0, 30.36], "audiomae_on_audioset": [null, [["music", 57.19], ["musical instrument", 4.63], ["fly, housefly", 4.34]], null, [["music", 62.13], ["hum", 6.07], ["speech", 4.86]], [["music", 78.21], ["musical instrument", 3.38], ["theremin", 2.0]], [["music", 58.81], ["musical instrument", 4.51], ["synthesizer", 3.79]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 28.53], ["speech", 19.94], ["theremin", 9.36]], null, null, [["music", 58.16], ["ambient music", 16.01], ["theremin", 5.49]]], "duration": [1.33, 12.17, 1.64, 15.89, 7.38, 3.23, 1.84, 1.04, 0.8, 3.41, 1.59, 0.76, 4.78, 6.28, 2.33, 3.92, 2.26, 2.77, 5.57, 4.56, 4.52, 2.22, 8.97, 0.0, 28.76]} \ No newline at end of file diff --git a/annotations_filtered/sxo7GjhsghQ_filtered.json b/annotations_filtered/sxo7GjhsghQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..26466c59344bc3232d360bddf4edf48155c15464 --- /dev/null +++ b/annotations_filtered/sxo7GjhsghQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.27], [10.0, 14.88], [15.0, 21.96], [22.0, 22.47], [24.0, 35.31], [39.0, 40.59], [41.0, 42.31], [44.0, 53.27], [55.0, 55.49], [56.0, 56.49], [58.0, 58.73]], "keep_status": [false, false, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 99.88, 51.07, 0.0, 30.14, 0.0, 0.0, 43.61, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 47.34], ["artillery fire", 9.74], ["explosion", 7.8]], null, null, [["creak", 39.39], ["mechanisms", 16.46], ["noise", 10.39]], null, null, null], "duration": [1.27, 4.88, 6.96, 0.47, 11.31, 1.59, 1.31, 9.27, 0.49, 0.49, 0.73]} \ No newline at end of file diff --git a/annotations_filtered/sxtENaaaPpQ_filtered.json b/annotations_filtered/sxtENaaaPpQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..927b2b1ee9e5987e7da230885197ae9ad7d5e21f --- /dev/null +++ b/annotations_filtered/sxtENaaaPpQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.52], [9.0, 10.07], [11.0, 13.51], [15.0, 16.78], [19.0, 21.73], [22.0, 26.16], [34.0, 34.33], [36.0, 37.81], [39.0, 41.42], [43.0, 44.54], [47.0, 48.12], [48.0, 50.52], [51.0, 51.76], [53.0, 53.22], [56.0, 58.01], [60.0, 60.15], [61.0, 61.75], [62.0, 63.02], [66.0, 66.23], [67.0, 67.8], [68.0, 69.03], [69.0, 71.61], [73.0, 75.15], [76.0, 76.6], [78.0, 79.89], [83.0, 84.25], [85.0, 86.09], [87.0, 88.47], [89.0, 91.67], [92.0, 93.39], [94.0, 96.58], [98.0, 98.25], [102.0, 103.18], [104.0, 106.22], [108.0, 108.43], [117.0, 118.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 100.0, 99.96, 0.0, 0.0, 100.0, 0.0, 0.0, 95.91, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.42, 99.96, 0.0, 0.0, 0.0, 0.0, 0.0, 99.82, 0.0, 99.94, 0.0, 0.0, 95.78, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.52, 1.07, 2.51, 1.78, 2.73, 4.16, 0.33, 1.81, 2.42, 1.54, 1.12, 2.52, 0.76, 0.22, 2.01, 0.15, 0.75, 1.02, 0.23, 0.8, 1.03, 2.61, 2.15, 0.6, 1.89, 1.25, 1.09, 1.47, 2.67, 1.39, 2.58, 0.25, 1.18, 2.22, 0.43, 1.86]} \ No newline at end of file diff --git a/annotations_filtered/sy7Lx7jY2SU_filtered.json b/annotations_filtered/sy7Lx7jY2SU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8edaf8ba135fa76ac0239a321a069403638a5b19 --- /dev/null +++ b/annotations_filtered/sy7Lx7jY2SU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.8], [3.0, 3.75], [6.0, 31.5], [34.0, 34.32], [34.0, 34.35], [34.0, 34.38], [34.0, 34.42], [34.0, 42.79], [44.0, 44.46], [46.0, 46.94], [47.0, 55.43], [55.0, 55.48], [56.0, 55.54], [56.0, 63.71], [75.0, 77.25], [79.0, 81.95], [93.0, 93.83], [105.0, 111.87], [118.0, 121.95], [122.0, 122.52], [126.0, 127.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, true, true, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 36.51, 0.0, 0.0, 0.0, 0.0, 32.83, 0.0, 0.0, 34.79, 0.0, 0.0, 31.6, 34.15, 30.35, 0.0, 33.58, 31.13, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["hum", 62.16], ["mains hum", 11.91], ["music", 9.2]], null, null, null, null, [["music", 51.76], ["speech", 15.25], ["throbbing", 9.61]], null, null, [["hum", 28.75], ["throbbing", 24.56], ["music", 16.22]], null, null, [["music", 24.3], ["speech", 22.5], ["hum", 15.4]], [["music", 41.91], ["whale vocalization", 10.19], ["cattle, bovinae", 8.9]], [["speech", 39.66], ["explosion", 15.7], ["burst, pop", 9.0]], null, [["music", 31.48], ["speech", 29.24], ["throbbing", 11.18]], [["speech", 32.03], ["music", 26.96], ["hum", 6.94]], null, null], "duration": [0.8, 0.75, 25.5, 0.32, 0.35, 0.38, 0.42, 8.79, 0.46, 0.94, 8.43, 0.48, -0.46, 7.71, 2.25, 2.95, 0.83, 6.87, 3.95, 0.52, 1.2]} \ No newline at end of file diff --git a/annotations_filtered/sz8itUBsCTk_filtered.json b/annotations_filtered/sz8itUBsCTk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2d1eb1e442ddf8c9451b1eb98bf841171043b14d --- /dev/null +++ b/annotations_filtered/sz8itUBsCTk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 49.22], [58.0, 62.24]], "keep_status": [true, false], "silence_prob": [34.49, 31.01], "audiomae_on_audioset": [[["music", 25.69], ["noise", 10.79], ["didgeridoo", 9.2]], [["cattle, bovinae", 32.92], ["moo", 29.72], ["livestock, farm animals, working animals", 12.54]]], "duration": [18.22, 4.24]} \ No newline at end of file diff --git a/annotations_filtered/szIOuIIbVfQ_filtered.json b/annotations_filtered/szIOuIIbVfQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/szIOuIIbVfQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/szLCkEBB6xs_filtered.json b/annotations_filtered/szLCkEBB6xs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f2f519b4b07aec72ce9a48605cfadcc488031210 --- /dev/null +++ b/annotations_filtered/szLCkEBB6xs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 26.97], [28.0, 40.05], [45.0, 55.02], [55.0, 57.65], [58.0, 57.72], [62.0, 64.5], [68.0, 67.83], [68.0, 88.89], [91.0, 98.83], [105.0, 112.5], [117.0, 123.04]], "keep_status": [false, true, false, true, false, true, false, true, false, true, false], "silence_prob": [0.0, 34.34, 37.66, 32.3, 0.0, 33.09, 0.0, 33.56, 54.43, 33.7, 32.4], "audiomae_on_audioset": [null, [["music", 57.05], ["theremin", 8.87], ["speech", 3.9]], [["music", 62.16], ["theremin", 7.43], ["brass instrument", 3.35]], [["music", 57.14], ["theremin", 5.82], ["musical instrument", 3.07]], null, [["music", 38.6], ["didgeridoo", 15.9], ["musical instrument", 5.84]], null, [["music", 40.98], ["double bass", 10.14], ["bowed string instrument", 9.95]], null, [["music", 48.21], ["bowed string instrument", 7.22], ["musical instrument", 6.14]], [["music", 64.66], ["theremin", 5.75], ["musical instrument", 4.37]]], "duration": [0.97, 12.05, 10.02, 2.65, -0.28, 2.5, -0.17, 20.89, 7.83, 7.5, 6.04]} \ No newline at end of file diff --git a/annotations_filtered/szNrOdjjhkw_filtered.json b/annotations_filtered/szNrOdjjhkw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f5f433c4fc0d78fe92fa1bb26a5ee01b662b7d62 --- /dev/null +++ b/annotations_filtered/szNrOdjjhkw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.78], [6.0, 8.92], [11.0, 14.3], [16.0, 16.6], [19.0, 21.66], [25.0, 25.14], [29.0, 30.11], [33.0, 34.67], [40.0, 41.98], [46.0, 47.29], [48.0, 49.2], [51.0, 51.39], [53.0, 54.67], [60.0, 61.06], [63.0, 63.54], [64.0, 66.66], [71.0, 71.86], [73.0, 73.36], [82.0, 83.98], [84.0, 85.24], [86.0, 87.05], [87.0, 87.62], [89.0, 89.34], [100.0, 100.72], [101.0, 111.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.31, 99.59, 93.91, 0.0, 98.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 68.56], ["cacophony", 6.43], ["hum", 5.25]]], "duration": [2.78, 2.92, 3.3, 0.6, 2.66, 0.14, 1.11, 1.67, 1.98, 1.29, 1.2, 0.39, 1.67, 1.06, 0.54, 2.66, 0.86, 0.36, 1.98, 1.24, 1.05, 0.62, 0.34, 0.72, 10.67]} \ No newline at end of file diff --git a/annotations_filtered/szpq76d4ipk_filtered.json b/annotations_filtered/szpq76d4ipk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6daec19106890154d37182f458c0a5fd1bcd303f --- /dev/null +++ b/annotations_filtered/szpq76d4ipk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 36.98], [39.0, 41.5], [42.0, 63.73], [65.0, 65.45]], "keep_status": [false, true, true, false], "silence_prob": [0.0, 30.05, 29.48, 0.0], "audiomae_on_audioset": [null, [["music", 63.41], ["throbbing", 2.96], ["electronic music", 2.64]], [["music", 59.96], ["wild animals", 4.37], ["electronic music", 3.21]], null], "duration": [-0.02, 2.5, 21.73, 0.45]} \ No newline at end of file diff --git a/annotations_filtered/t--mSXDeETc_filtered.json b/annotations_filtered/t--mSXDeETc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bf27ba7048e4e33b58101795a8540233cac576e1 --- /dev/null +++ b/annotations_filtered/t--mSXDeETc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 25.46], [26.0, 27.65], [30.0, 42.69], [45.0, 49.1], [52.0, 53.01], [53.0, 54.8], [56.0, 57.25], [58.0, 57.92], [59.0, 59.44], [61.0, 61.47], [65.0, 65.2], [65.0, 65.65], [66.0, 66.66], [70.0, 70.61], [74.0, 74.65], [81.0, 81.67], [84.0, 83.69], [86.0, 86.76], [95.0, 96.33], [97.0, 99.6], [102.0, 102.66], [105.0, 104.97], [110.0, 112.7], [113.0, 114.54], [115.0, 117.1], [118.0, 119.74], [123.0, 125.24], [126.0, 127.53], [132.0, 131.87], [132.0, 132.48], [136.0, 136.11], [136.0, 137.34], [141.0, 141.79], [142.0, 143.04], [143.0, 148.39], [150.0, 151.73], [153.0, 152.93], [156.0, 158.82], [160.0, 161.28], [162.0, 162.41], [165.0, 168.51], [169.0, 171.75]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.55, 29.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.14, 0.0, 0.0, 58.3, 0.0, 58.13, 0.0, 92.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.1, 0.0, 0.0, 68.28, 0.0, 0.0, 98.93, 35.37], "audiomae_on_audioset": [null, null, [["music", 49.53], ["didgeridoo", 7.23], ["effects unit", 5.93]], [["crack", 39.1], ["breaking", 31.07], ["crackle", 3.35]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 10.3], ["noise", 10.08], ["hum", 9.83]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 72.07], ["radio", 2.85], ["snicker", 2.82]]], "duration": [0.46, 1.65, 12.69, 4.1, 1.01, 1.8, 1.25, -0.08, 0.44, 0.47, 0.2, 0.65, 0.66, 0.61, 0.65, 0.67, -0.31, 0.76, 1.33, 2.6, 0.66, -0.03, 2.7, 1.54, 2.1, 1.74, 2.24, 1.53, -0.13, 0.48, 0.11, 1.34, 0.79, 1.04, 5.39, 1.73, -0.07, 2.82, 1.28, 0.41, 3.51, 2.75]} \ No newline at end of file diff --git a/annotations_filtered/t-B2zR5O5Ys_filtered.json b/annotations_filtered/t-B2zR5O5Ys_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b116c03910c6a56573252fd849b6cca955a61236 --- /dev/null +++ b/annotations_filtered/t-B2zR5O5Ys_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 14.35], [23.0, 24.17], [52.0, 59.49], [77.0, 81.31], [93.0, 92.75], [98.0, 99.98], [124.0, 127.14], [129.0, 128.78]], "keep_status": [true, false, true, false, false, false, false, false], "silence_prob": [29.41, 0.0, 33.09, 37.82, 0.0, 0.0, 31.99, 0.0], "audiomae_on_audioset": [[["music", 34.41], ["guitar", 12.41], ["musical instrument", 11.07]], null, [["music", 58.5], ["throbbing", 5.48], ["cacophony", 5.25]], [["music", 67.52], ["theremin", 7.81], ["synthesizer", 2.24]], null, null, [["music", 80.85], ["synthesizer", 5.65], ["electronic music", 3.77]], null], "duration": [3.35, 1.17, 7.49, 4.31, -0.25, 1.98, 3.14, -0.22]} \ No newline at end of file diff --git a/annotations_filtered/t-T4RYRUNWk_filtered.json b/annotations_filtered/t-T4RYRUNWk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..16b93aef53a5ece07faafc5027773a1debf1c09b --- /dev/null +++ b/annotations_filtered/t-T4RYRUNWk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.31], [9.0, 8.65], [9.0, 10.37], [15.0, 18.33], [19.0, 22.65], [24.0, 34.94], [38.0, 38.75], [41.0, 46.16], [65.0, 64.99], [65.0, 65.21], [65.0, 66.31], [77.0, 79.03], [104.0, 105.9], [121.0, 122.25], [124.0, 124.31], [125.0, 125.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 86.64, 71.72, 51.28, 0.0, 68.41, 0.0, 0.0, 0.0, 63.42, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.31, -0.35, 1.37, 3.33, 3.65, 10.94, 0.75, 5.16, -0.01, 0.21, 1.31, 2.03, 1.9, 1.25, 0.31, 0.96]} \ No newline at end of file diff --git a/annotations_filtered/t-dJ4I7rGp8_filtered.json b/annotations_filtered/t-dJ4I7rGp8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2b01acb26dd0884f625e2d3096bcfb9b8975b59b --- /dev/null +++ b/annotations_filtered/t-dJ4I7rGp8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.89], [9.0, 20.41], [22.0, 23.19], [25.0, 25.98], [36.0, 36.04], [50.0, 50.23], [61.0, 62.18], [66.0, 73.14], [74.0, 74.36], [77.0, 81.45], [82.0, 83.29], [90.0, 90.34], [97.0, 99.64], [104.0, 108.11], [109.0, 124.78], [127.0, 127.7], [130.0, 140.34], [142.0, 142.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 37.78, 0.0, 0.0, 0.0, 0.0, 0.0, 74.13, 0.0, 37.5, 0.0, 0.0, 71.29, 34.39, 42.06, 0.0, 33.78, 0.0], "audiomae_on_audioset": [null, [["speech", 55.06], ["music", 21.77], ["groan", 5.06]], null, null, null, null, null, null, null, [["speech", 58.09], ["fart", 22.88], ["boing", 2.8]], null, null, null, [["music", 29.86], ["speech", 13.33], ["crowd", 9.42]], [["music", 63.09], ["electronic music", 2.15], ["carnatic music", 1.71]], null, [["music", 78.73], ["theremin", 10.65], ["electronic music", 0.94]], null], "duration": [1.89, 11.41, 1.19, 0.98, 0.04, 0.23, 1.18, 7.14, 0.36, 4.45, 1.29, 0.34, 2.64, 4.11, 15.78, 0.7, 10.34, 0.82]} \ No newline at end of file diff --git a/annotations_filtered/t-lIuwPGT9w_filtered.json b/annotations_filtered/t-lIuwPGT9w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73fa6b85a1b6f9e712e901eb08f37bda7b9f5aaf --- /dev/null +++ b/annotations_filtered/t-lIuwPGT9w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.95], [11.0, 11.75], [15.0, 16.12], [19.0, 19.35], [20.0, 21.29], [22.0, 25.19], [25.0, 25.24], [25.0, 36.56], [38.0, 45.1], [47.0, 47.75], [49.0, 48.84], [51.0, 51.26], [53.0, 57.65], [59.0, 63.19], [65.0, 65.84], [67.0, 84.23], [85.0, 87.51], [90.0, 96.82], [99.0, 99.81], [103.0, 162.97]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, true, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 62.89, 0.0, 48.56, 47.58, 0.0, 0.0, 0.0, 53.59, 30.31, 0.0, 31.92, 31.28, 28.8, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 44.1], ["hum", 21.19], ["throbbing", 9.42]], [["hum", 30.45], ["music", 18.7], ["mains hum", 10.18]], null, null, null, null, [["animal", 51.95], ["roaring cats (lions, tigers)", 11.31], ["wild animals", 6.63]], null, [["music", 21.6], ["fly, housefly", 15.81], ["hum", 11.18]], [["music", 23.41], ["whale vocalization", 14.0], ["hum", 13.71]], [["speech", 38.43], ["music", 16.21], ["sidetone", 9.69]], null, null], "duration": [0.95, 0.75, 1.12, 0.35, 1.29, 3.19, 0.24, 11.56, 7.1, 0.75, -0.16, 0.26, 4.65, 4.19, 0.84, 17.23, 2.51, 6.82, 0.81, 59.97]} \ No newline at end of file diff --git a/annotations_filtered/t-t8eVDckH8_filtered.json b/annotations_filtered/t-t8eVDckH8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c534c73855a8aa4c63d32fa9565b7a15a3e03c56 --- /dev/null +++ b/annotations_filtered/t-t8eVDckH8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.66], [2.0, 2.73], [3.0, 11.06], [14.0, 17.56], [23.0, 33.4], [36.0, 63.56], [64.0, 68.37], [69.0, 70.01], [70.0, 96.13], [99.0, 100.38], [100.0, 100.41], [103.0, 153.17], [157.0, 173.38], [174.0, 185.48], [186.0, 219.65]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 28.15, 28.3, 28.11, 28.22, 28.37, 0.0, 28.22, 0.0, 0.0, 0.0, 28.23, 28.65, 0.0], "audiomae_on_audioset": [null, null, [["music", 54.48], ["vehicle", 12.07], ["motorcycle", 8.11]], [["music", 64.74], ["electronic music", 4.95], ["sound effect", 3.98]], [["music", 40.36], ["speech", 16.49], ["electronic music", 6.98]], [["music", 79.8], ["electronic music", 5.42], ["techno", 3.63]], [["music", 65.91], ["speech", 11.43], ["electronic music", 3.61]], null, [["music", 54.71], ["speech", 10.21], ["vehicle", 6.94]], null, null, null, [["music", 65.33], ["throbbing", 7.8], ["electronic music", 5.77]], [["mains hum", 52.9], ["music", 16.99], ["hum", 11.39]], null], "duration": [-0.34, 0.73, 8.06, 3.56, 10.4, 27.56, 4.37, 1.01, 26.13, 1.38, 0.41, 50.17, 16.38, 11.48, 33.65]} \ No newline at end of file diff --git a/annotations_filtered/t09QqjBkg0c_filtered.json b/annotations_filtered/t09QqjBkg0c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..988ede081e0071872418729966d316826ac94523 --- /dev/null +++ b/annotations_filtered/t09QqjBkg0c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[157.0, 157.37], [159.0, 159.49], [160.0, 162.57]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 62.17], "audiomae_on_audioset": [null, null, null], "duration": [0.37, 0.49, 2.57]} \ No newline at end of file diff --git a/annotations_filtered/t0Hr0YA9_H0_filtered.json b/annotations_filtered/t0Hr0YA9_H0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..89a235aea014fcdb4a94234aaf173b83365f82bc --- /dev/null +++ b/annotations_filtered/t0Hr0YA9_H0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 16.31], [26.0, 26.5], [27.0, 29.03], [30.0, 31.82], [40.0, 42.74], [43.0, 44.36], [45.0, 45.86], [50.0, 50.45], [59.0, 59.8], [61.0, 62.83], [68.0, 69.42], [73.0, 74.19], [79.0, 79.17], [80.0, 81.38], [82.0, 82.17], [85.0, 85.75], [92.0, 92.74], [93.0, 93.82], [94.0, 95.5], [96.0, 96.69], [101.0, 101.61], [120.0, 124.06]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [47.27, 0.0, 47.35, 0.0, 53.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.93], "audiomae_on_audioset": [[["music", 30.09], ["speech", 14.48], ["outside, urban or manmade", 4.5]], null, [["speech", 29.31], ["laughter", 15.15], ["fart", 6.41]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["grunt", 15.12], ["fart", 12.82], ["music", 11.22]]], "duration": [2.31, 0.5, 2.03, 1.82, 2.74, 1.36, 0.86, 0.45, 0.8, 1.83, 1.42, 1.19, 0.17, 1.38, 0.17, 0.75, 0.74, 0.82, 1.5, 0.69, 0.61, 4.06]} \ No newline at end of file diff --git a/annotations_filtered/t0R7IRtvvFA_filtered.json b/annotations_filtered/t0R7IRtvvFA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0b4ab1a31bcd55bee0718f0357e4ae2edd90543c --- /dev/null +++ b/annotations_filtered/t0R7IRtvvFA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.84], [9.0, 11.13], [14.0, 14.67], [18.0, 19.36], [21.0, 20.85], [27.0, 27.08], [48.0, 49.23], [49.0, 91.02], [91.0, 91.37], [94.0, 93.9], [95.0, 95.3], [96.0, 97.85], [101.0, 119.7]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 41.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.68], "audiomae_on_audioset": [null, [["speech", 56.51], ["didgeridoo", 7.04], ["fart", 5.35]], null, null, null, null, null, null, null, null, null, null, [["music", 81.51], ["electronic music", 2.45], ["trance music", 2.17]]], "duration": [0.84, 2.13, 0.67, 1.36, -0.15, 0.08, 1.23, 42.02, 0.37, -0.1, 0.3, 1.85, 18.7]} \ No newline at end of file diff --git a/annotations_filtered/t0Yf_fvD-lY_filtered.json b/annotations_filtered/t0Yf_fvD-lY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eb405b7a75c33b231a56034dc24d3d4618a66885 --- /dev/null +++ b/annotations_filtered/t0Yf_fvD-lY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.07], [10.0, 22.69], [29.0, 32.14], [39.0, 41.1], [43.0, 49.13], [54.0, 55.9], [60.0, 62.92], [63.0, 84.0], [87.0, 88.43], [90.0, 91.52], [106.0, 106.35], [108.0, 107.89], [108.0, 107.99], [108.0, 108.03], [108.0, 110.12], [112.0, 111.91], [113.0, 114.05], [118.0, 118.45], [119.0, 119.48], [129.0, 129.37], [132.0, 132.14]], "keep_status": [true, true, true, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [35.59, 30.38, 31.03, 43.71, 31.63, 0.0, 30.34, 29.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 50.46], ["musical instrument", 9.36], ["synthesizer", 7.76]], [["music", 30.22], ["hum", 20.39], ["mains hum", 12.68]], [["speech", 18.6], ["crowd", 16.69], ["eruption", 10.56]], [["music", 64.77], ["synthesizer", 6.05], ["musical instrument", 2.68]], [["music", 53.65], ["throbbing", 13.99], ["boing", 4.34]], null, [["music", 43.31], ["synthesizer", 7.27], ["bird", 6.61]], [["music", 21.44], ["livestock, farm animals, working animals", 21.38], ["cattle, bovinae", 14.25]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.07, 12.69, 3.14, 2.1, 6.13, 1.9, 2.92, 21.0, 1.43, 1.52, 0.35, -0.11, -0.01, 0.03, 2.12, -0.09, 1.05, 0.45, 0.48, 0.37, 0.14]} \ No newline at end of file diff --git a/annotations_filtered/t0oqEjxOUww_filtered.json b/annotations_filtered/t0oqEjxOUww_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7b5b986b139691a683586ec40fd19bb67920e0b --- /dev/null +++ b/annotations_filtered/t0oqEjxOUww_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.88], [5.0, 10.23], [13.0, 14.69], [19.0, 20.31], [22.0, 23.18], [26.0, 26.28], [28.0, 29.03], [30.0, 61.67], [62.0, 63.05], [65.0, 69.42], [72.0, 73.45], [80.0, 81.36], [84.0, 85.53], [90.0, 90.64], [95.0, 96.63], [100.0, 100.77], [102.0, 102.52], [107.0, 118.13], [119.0, 120.29], [129.0, 129.05], [131.0, 131.57], [137.0, 141.42], [143.0, 143.78], [147.0, 147.93], [149.0, 152.0], [154.0, 155.02], [159.0, 159.81], [166.0, 172.42], [177.0, 177.47], [178.0, 183.52], [184.0, 184.59], [185.0, 185.75], [187.0, 200.18], [202.0, 205.78], [207.0, 207.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 77.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.6, 0.0, 0.0, 0.0, 88.1, 0.0, 0.0, 95.78, 0.0, 0.0, 60.05, 0.0, 31.14, 0.0, 0.0, 39.86, 92.8, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 57.54], ["music", 14.75], ["didgeridoo", 4.58]], null, null, [["cattle, bovinae", 44.88], ["livestock, farm animals, working animals", 29.33], ["moo", 19.94]], null, null], "duration": [0.88, 5.23, 1.69, 1.31, 1.18, 0.28, 1.03, 31.67, 1.05, 4.42, 1.45, 1.36, 1.53, 0.64, 1.63, 0.77, 0.52, 11.13, 1.29, 0.05, 0.57, 4.42, 0.78, 0.93, 3.0, 1.02, 0.81, 6.42, 0.47, 5.52, 0.59, 0.75, 13.18, 3.78, 0.49]} \ No newline at end of file diff --git a/annotations_filtered/t0qYTDYyNvs_filtered.json b/annotations_filtered/t0qYTDYyNvs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8c12f16f540f54afc0f4d4846ea928ad0942dd58 --- /dev/null +++ b/annotations_filtered/t0qYTDYyNvs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.72], [5.0, 6.94], [10.0, 10.15], [13.0, 13.47], [19.0, 21.3], [22.0, 23.45], [27.0, 28.27], [30.0, 66.87], [68.0, 73.85], [76.0, 78.56], [80.0, 84.96], [86.0, 86.75], [90.0, 92.85], [93.0, 94.32], [96.0, 97.8], [99.0, 104.03], [105.0, 104.94], [111.0, 112.43], [116.0, 117.8], [126.0, 126.89], [128.0, 130.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 54.1, 0.0, 0.0, 0.0, 54.17, 56.93, 58.55, 0.0, 52.62, 0.0, 0.0, 36.85, 0.0, 0.0, 0.0, 0.0, 53.1], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 46.54], ["didgeridoo", 22.48], ["speech", 10.28]], null, null, null, null, null], "duration": [0.72, 1.94, 0.15, 0.47, 2.3, 1.45, 1.27, 36.87, 5.85, 2.56, 4.96, 0.75, 2.85, 1.32, 1.8, 5.03, -0.06, 1.43, 1.8, 0.89, 2.15]} \ No newline at end of file diff --git a/annotations_filtered/t0tIXAlLX8s_filtered.json b/annotations_filtered/t0tIXAlLX8s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b7561337796d0c011601b9c312e2c5229f3084f --- /dev/null +++ b/annotations_filtered/t0tIXAlLX8s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.67], [13.0, 15.62], [16.0, 16.63], [24.0, 32.36], [34.0, 36.36], [38.0, 39.38], [41.0, 48.34], [52.0, 123.16], [130.0, 130.1], [131.0, 131.63], [142.0, 143.6], [145.0, 145.34], [149.0, 151.11]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 37.64, 0.0, 31.03, 30.82, 0.0, 30.21, 0.0, 0.0, 0.0, 0.0, 0.0, 32.45], "audiomae_on_audioset": [null, [["speech", 75.25], ["gears", 3.05], ["mechanisms", 2.65]], null, [["speech", 27.61], ["mains hum", 16.66], ["hum", 13.77]], [["music", 43.7], ["speech", 29.6], ["electronic music", 4.38]], null, [["music", 84.45], ["hum", 3.07], ["didgeridoo", 2.72]], null, null, null, null, null, [["speech", 43.58], ["siren", 6.81], ["music", 6.5]]], "duration": [0.67, 2.62, 0.63, 8.36, 2.36, 1.38, 7.34, 71.16, 0.1, 0.63, 1.6, 0.34, 2.11]} \ No newline at end of file diff --git a/annotations_filtered/t15VVQjK16Y_filtered.json b/annotations_filtered/t15VVQjK16Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/t15VVQjK16Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/t1JsC1ur2X8_filtered.json b/annotations_filtered/t1JsC1ur2X8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7282cf5f6396b9fee5282deee796776d8f0cd261 --- /dev/null +++ b/annotations_filtered/t1JsC1ur2X8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 15.11], [18.0, 21.27], [23.0, 23.11], [25.0, 30.92], [32.0, 33.49], [36.0, 38.52], [41.0, 42.67], [45.0, 47.53], [51.0, 58.6], [61.0, 116.5]], "keep_status": [true, false, false, true, false, false, false, false, false, false], "silence_prob": [40.79, 42.42, 0.0, 38.98, 0.0, 35.51, 0.0, 34.37, 34.39, 0.0], "audiomae_on_audioset": [[["hum", 27.6], ["music", 24.49], ["mains hum", 8.62]], [["music", 62.45], ["guitar", 5.19], ["effects unit", 3.54]], null, [["music", 52.14], ["mains hum", 6.1], ["effects unit", 4.36]], null, [["mains hum", 46.29], ["hum", 25.03], ["music", 7.0]], null, [["music", 71.07], ["effects unit", 4.26], ["hum", 2.47]], [["music", 78.72], ["musical instrument", 3.31], ["guitar", 2.27]], null], "duration": [7.11, 3.27, 0.11, 5.92, 1.49, 2.52, 1.67, 2.53, 7.6, 55.5]} \ No newline at end of file diff --git a/annotations_filtered/t1RkYJaG9bo_filtered.json b/annotations_filtered/t1RkYJaG9bo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e4526c44f17e7a31835feab3cd2aa8f08426b57 --- /dev/null +++ b/annotations_filtered/t1RkYJaG9bo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.35], [11.0, 11.6], [13.0, 13.8], [15.0, 16.09], [17.0, 17.71], [19.0, 19.79], [29.0, 29.89], [39.0, 39.63], [111.0, 111.57], [113.0, 113.9], [146.0, 146.28], [149.0, 149.4], [151.0, 151.46], [157.0, 157.44], [159.0, 161.2], [179.0, 178.83], [191.0, 194.76], [213.0, 217.61], [222.0, 224.07], [227.0, 229.9], [232.0, 237.9], [239.0, 240.75], [242.0, 250.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.82, 0.0, 32.0, 99.36, 64.86, 50.91, 41.54, 0.0, 55.67], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 68.32], ["speech", 7.62], ["swing music", 2.69]], null, null, null, [["music", 58.27], ["theremin", 13.39], ["singing", 2.07]], null, null], "duration": [0.35, 0.6, 0.8, 1.09, 0.71, 0.79, 0.89, 0.63, 0.57, 0.9, 0.28, 0.4, 0.46, 0.44, 2.2, -0.17, 3.76, 4.61, 2.07, 2.9, 5.9, 1.75, 8.7]} \ No newline at end of file diff --git a/annotations_filtered/t1TC-pegncQ_filtered.json b/annotations_filtered/t1TC-pegncQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a0a85b9c8b908957d182246031051a94d2704f6a --- /dev/null +++ b/annotations_filtered/t1TC-pegncQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.48], [6.0, 6.99], [8.0, 8.5], [11.0, 10.66], [11.0, 12.5], [14.0, 20.88], [25.0, 27.89], [31.0, 33.61], [34.0, 35.53], [37.0, 37.37], [41.0, 42.13], [45.0, 47.48], [48.0, 48.39], [49.0, 51.68], [59.0, 60.67], [65.0, 67.39], [69.0, 69.99], [70.0, 79.76], [81.0, 83.44], [86.0, 95.71], [97.0, 110.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.16, 95.64, 86.09, 0.0, 0.0, 0.0, 95.64, 0.0, 85.35, 0.0, 75.72, 0.0, 75.72, 57.89, 70.02, 96.42], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.48, 0.99, 0.5, -0.34, 1.5, 6.88, 2.89, 2.61, 1.53, 0.37, 1.13, 2.48, 0.39, 2.68, 1.67, 2.39, 0.99, 9.76, 2.44, 9.71, 13.64]} \ No newline at end of file diff --git a/annotations_filtered/t1Wk3H5Xur0_filtered.json b/annotations_filtered/t1Wk3H5Xur0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..516ad5ce7c22ca3f8b5e7ca8111362b9c98c5711 --- /dev/null +++ b/annotations_filtered/t1Wk3H5Xur0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.02], [5.0, 6.59], [13.0, 13.41], [14.0, 16.38], [17.0, 19.41], [24.0, 25.51], [28.0, 28.26], [34.0, 35.19], [37.0, 37.76], [42.0, 43.55], [48.0, 48.83], [51.0, 51.41], [53.0, 53.89], [61.0, 62.24], [69.0, 72.06], [74.0, 76.62], [79.0, 79.84], [85.0, 85.14], [89.0, 90.69], [98.0, 98.42], [109.0, 110.52], [132.0, 133.39], [160.0, 160.57], [163.0, 163.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 51.23, 99.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.43, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.02, 1.59, 0.41, 2.38, 2.41, 1.51, 0.26, 1.19, 0.76, 1.55, 0.83, 0.41, 0.89, 1.24, 3.06, 2.62, 0.84, 0.14, 1.69, 0.42, 1.52, 1.39, 0.57, 0.07]} \ No newline at end of file diff --git a/annotations_filtered/t1gkRAWvxOs_filtered.json b/annotations_filtered/t1gkRAWvxOs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..517428587fafd76640964d866e29d0a64b8f59e4 --- /dev/null +++ b/annotations_filtered/t1gkRAWvxOs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.36], [2.0, 2.52], [5.0, 6.57], [7.0, 8.92], [10.0, 10.81], [12.0, 12.53], [16.0, 17.41], [20.0, 21.46], [26.0, 26.96], [35.0, 35.45], [42.0, 42.11], [51.0, 51.93], [74.0, 74.53], [75.0, 75.64], [87.0, 87.88], [89.0, 89.85], [100.0, 100.48], [106.0, 109.04], [114.0, 115.5], [117.0, 117.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.85, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 24.91], ["hum", 22.67], ["sidetone", 13.89]], null, null], "duration": [0.36, 0.52, 1.57, 1.92, 0.81, 0.53, 1.41, 1.46, 0.96, 0.45, 0.11, 0.93, 0.53, 0.64, 0.88, 0.85, 0.48, 3.04, 1.5, 0.15]} \ No newline at end of file diff --git a/annotations_filtered/t1x6i73klIs_filtered.json b/annotations_filtered/t1x6i73klIs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9da21367e33aee0504ae8f117c9c467c3222c3df --- /dev/null +++ b/annotations_filtered/t1x6i73klIs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.86], [16.0, 16.41], [18.0, 18.12], [19.0, 19.63], [21.0, 22.25], [24.0, 25.03], [27.0, 29.08], [30.0, 33.22], [35.0, 35.77], [37.0, 37.32], [38.0, 38.26], [39.0, 51.22], [52.0, 54.04], [59.0, 60.03], [62.0, 63.36], [64.0, 64.67], [65.0, 66.95], [68.0, 68.44], [71.0, 71.32], [72.0, 75.14], [78.0, 79.35], [80.0, 82.05], [84.0, 84.11], [85.0, 88.32], [90.0, 90.98], [92.0, 93.09], [96.0, 97.97], [100.0, 101.04], [102.0, 102.66], [103.0, 103.79], [105.0, 107.22], [109.0, 109.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 72.9, 0.0, 0.0, 0.0, 55.25, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.16, 0.0, 95.23, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.92, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.86, 0.41, 0.12, 0.63, 1.25, 1.03, 2.08, 3.22, 0.77, 0.32, 0.26, 12.22, 2.04, 1.03, 1.36, 0.67, 1.95, 0.44, 0.32, 3.14, 1.35, 2.05, 0.11, 3.32, 0.98, 1.09, 1.97, 1.04, 0.66, 0.79, 2.22, 0.61]} \ No newline at end of file diff --git a/annotations_filtered/t2NytKIhd68_filtered.json b/annotations_filtered/t2NytKIhd68_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc55fed4fc6002ad96daac216c20deb181776c6e --- /dev/null +++ b/annotations_filtered/t2NytKIhd68_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.42], [7.0, 22.81], [23.0, 23.95], [28.0, 28.49], [31.0, 37.13], [39.0, 39.65], [41.0, 45.08], [48.0, 51.56], [53.0, 53.43], [55.0, 70.58], [73.0, 76.08], [79.0, 82.86], [85.0, 85.43], [110.0, 115.43], [121.0, 121.1], [123.0, 123.57], [124.0, 125.09], [145.0, 150.35], [157.0, 158.16]], "keep_status": [true, true, false, false, true, false, true, true, false, true, true, true, false, true, false, false, false, false, false], "silence_prob": [35.94, 34.4, 0.0, 0.0, 32.22, 0.0, 32.37, 35.13, 0.0, 30.32, 32.74, 34.28, 0.0, 37.9, 0.0, 0.0, 0.0, 28.9, 0.0], "audiomae_on_audioset": [[["whale vocalization", 27.91], ["speech", 9.51], ["livestock, farm animals, working animals", 9.38]], [["speech", 31.4], ["hum", 13.53], ["mains hum", 10.15]], null, null, [["speech", 16.65], ["music", 13.55], ["vehicle", 2.56]], null, [["music", 34.18], ["hum", 9.64], ["mains hum", 8.39]], [["fly, housefly", 23.15], ["bee, wasp, etc.", 16.39], ["insect", 11.08]], null, [["insect", 23.5], ["fly, housefly", 21.03], ["buzz", 15.49]], [["fly, housefly", 23.89], ["mains hum", 9.04], ["insect", 7.64]], [["mains hum", 17.01], ["hum", 16.37], ["buzz", 9.1]], null, [["thunk", 31.18], ["hum", 22.98], ["mains hum", 8.25]], null, null, null, [["cattle, bovinae", 36.18], ["speech", 18.64], ["moo", 16.96]], null], "duration": [3.42, 15.81, 0.95, 0.49, 6.13, 0.65, 4.08, 3.56, 0.43, 15.58, 3.08, 3.86, 0.43, 5.43, 0.1, 0.57, 1.09, 5.35, 1.16]} \ No newline at end of file diff --git a/annotations_filtered/t2QvuZpxmeo_filtered.json b/annotations_filtered/t2QvuZpxmeo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc8ab528a4bb42ee977c586bc2575767a4f121ef --- /dev/null +++ b/annotations_filtered/t2QvuZpxmeo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 19.14], [20.0, 24.0], [25.0, 33.69], [35.0, 45.17], [46.0, 48.24], [49.0, 61.77], [64.0, 65.7], [67.0, 76.28], [77.0, 78.46], [80.0, 80.74], [83.0, 84.5], [88.0, 88.25], [91.0, 91.57], [92.0, 96.42]], "keep_status": [true, false, false, true, false, true, false, true, false, false, false, false, false, true], "silence_prob": [39.85, 87.0, 37.69, 48.95, 90.6, 43.77, 0.0, 36.36, 0.0, 0.0, 0.0, 0.0, 0.0, 42.51], "audiomae_on_audioset": [[["music", 37.79], ["gong", 11.95], ["whale vocalization", 7.4]], null, [["music", 64.1], ["guitar", 6.62], ["musical instrument", 5.34]], [["speech", 36.93], ["patter", 13.49], ["whale vocalization", 8.79]], null, [["speech", 23.07], ["insect", 21.63], ["fly, housefly", 16.3]], null, [["frog", 28.44], ["animal", 20.66], ["whale vocalization", 19.2]], null, null, null, null, null, [["whale vocalization", 28.83], ["livestock, farm animals, working animals", 15.47], ["cattle, bovinae", 13.83]]], "duration": [6.14, 4.0, 8.69, 10.17, 2.24, 12.77, 1.7, 9.28, 1.46, 0.74, 1.5, 0.25, 0.57, 4.42]} \ No newline at end of file diff --git a/annotations_filtered/t31U3QAkClM_filtered.json b/annotations_filtered/t31U3QAkClM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f8ac02f7af107d1eb3417476df164fa62709ef3b --- /dev/null +++ b/annotations_filtered/t31U3QAkClM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 98.09], [99.0, 111.27], [113.0, 135.01], [136.0, 136.02], [137.0, 145.49], [146.0, 186.98]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 99.68, 98.86, 0.0, 82.79, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [84.09, 12.27, 22.01, 0.02, 8.49, 40.98]} \ No newline at end of file diff --git a/annotations_filtered/t3XewsVnx9E_filtered.json b/annotations_filtered/t3XewsVnx9E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..acdfe19a79453123e6323ea388592d12539b1a4e --- /dev/null +++ b/annotations_filtered/t3XewsVnx9E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.17], [12.0, 12.75], [15.0, 16.24], [19.0, 19.7], [22.0, 23.01], [33.0, 34.18], [44.0, 44.88], [48.0, 51.97], [70.0, 71.27], [76.0, 80.03], [80.0, 80.08], [93.0, 92.87], [99.0, 99.96], [113.0, 113.41], [119.0, 122.66], [128.0, 130.45], [135.0, 135.94], [137.0, 137.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.91, 0.0, 49.68, 0.0, 0.0, 0.0, 0.0, 45.43, 45.65, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 83.28], ["yodeling", 1.98], ["singing", 1.58]], null, null, null, null, [["music", 76.71], ["yodeling", 5.98], ["singing", 1.58]], [["music", 84.88], ["theremin", 5.04], ["didgeridoo", 1.28]], null, null], "duration": [1.17, 0.75, 1.24, 0.7, 1.01, 1.18, 0.88, 3.97, 1.27, 4.03, 0.08, -0.13, 0.96, 0.41, 3.66, 2.45, 0.94, 0.24]} \ No newline at end of file diff --git a/annotations_filtered/t3c_a9M1E7s_filtered.json b/annotations_filtered/t3c_a9M1E7s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3b228458976d22854fbdcf045a527c2ec866fec --- /dev/null +++ b/annotations_filtered/t3c_a9M1E7s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 24.9], [30.0, 30.48], [32.0, 36.14], [38.0, 40.39], [41.0, 50.6], [52.0, 52.07], [53.0, 54.11], [56.0, 56.35], [58.0, 58.65], [61.0, 61.1], [62.0, 66.01], [67.0, 67.44], [73.0, 73.63], [74.0, 76.5], [78.0, 80.01]], "keep_status": [false, false, true, true, true, false, false, false, false, false, true, false, false, false, false], "silence_prob": [38.84, 0.0, 35.8, 36.81, 35.78, 0.0, 0.0, 0.0, 0.0, 0.0, 40.06, 0.0, 0.0, 67.25, 97.54], "audiomae_on_audioset": [[["music", 43.87], ["didgeridoo", 22.27], ["gong", 18.74]], null, [["music", 39.59], ["speech", 16.48], ["musical instrument", 12.56]], [["music", 51.14], ["gong", 7.89], ["musical instrument", 7.41]], [["speech", 19.05], ["didgeridoo", 17.34], ["music", 13.24]], null, null, null, null, null, [["boing", 44.66], ["thunk", 5.12], ["speech", 3.96]], null, null, null, null], "duration": [9.9, 0.48, 4.14, 2.39, 9.6, 0.07, 1.11, 0.35, 0.65, 0.1, 4.01, 0.44, 0.63, 2.5, 2.01]} \ No newline at end of file diff --git a/annotations_filtered/t3dmXdp2O0Q_filtered.json b/annotations_filtered/t3dmXdp2O0Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7af81fe915eb6a38fbf1598b5f4f916693682755 --- /dev/null +++ b/annotations_filtered/t3dmXdp2O0Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 30.97], [31.0, 104.73], [105.0, 118.96], [119.0, 123.13]], "keep_status": [false, false, false, true], "silence_prob": [97.73, 0.0, 36.66, 37.08], "audiomae_on_audioset": [null, null, [["speech", 73.18], ["rumble", 5.85], ["hum", 1.98]], [["speech", 42.53], ["rumble", 14.17], ["sidetone", 8.73]]], "duration": [27.97, 73.73, 13.96, 4.13]} \ No newline at end of file diff --git a/annotations_filtered/t3gqjXINvac_filtered.json b/annotations_filtered/t3gqjXINvac_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..69fefbb4f0b79a547701ef468a8edb9df4ebe59d --- /dev/null +++ b/annotations_filtered/t3gqjXINvac_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.15], [12.0, 12.33], [30.0, 30.6], [31.0, 33.32], [36.0, 39.83], [43.0, 44.09], [52.0, 52.88], [54.0, 54.65], [55.0, 56.3], [57.0, 58.89], [60.0, 61.72], [63.0, 63.76], [66.0, 66.38], [72.0, 73.03], [75.0, 76.06], [77.0, 78.61], [80.0, 80.74], [82.0, 84.33], [87.0, 86.88], [108.0, 109.86], [115.0, 116.61], [117.0, 118.86], [120.0, 120.99], [126.0, 127.68], [128.0, 129.59], [130.0, 133.35], [134.0, 135.67], [139.0, 142.67], [144.0, 145.08], [147.0, 148.9], [149.0, 150.97], [157.0, 158.55], [161.0, 162.63], [164.0, 164.37], [165.0, 165.94], [166.0, 170.73], [172.0, 173.33], [174.0, 183.57], [185.0, 185.4]], "keep_status": [false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [92.97, 0.0, 0.0, 37.12, 44.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.7, 0.0, 47.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.54, 0.0, 65.55, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 21.65], ["speech", 17.38], ["sidetone", 16.41]], [["speech", 14.13], ["burping, eructation", 13.22], ["fly, housefly", 8.24]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 49.19], ["sine wave", 4.65], ["insect", 3.57]], null, null, null, null, null, null, null, null, null, null, null], "duration": [2.15, 0.33, 0.6, 2.32, 3.83, 1.09, 0.88, 0.65, 1.3, 1.89, 1.72, 0.76, 0.38, 1.03, 1.06, 1.61, 0.74, 2.33, -0.12, 1.86, 1.61, 1.86, 0.99, 1.68, 1.59, 3.35, 1.67, 3.67, 1.08, 1.9, 1.97, 1.55, 1.63, 0.37, 0.94, 4.73, 1.33, 9.57, 0.4]} \ No newline at end of file diff --git a/annotations_filtered/t3mwyiOBDrk_filtered.json b/annotations_filtered/t3mwyiOBDrk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c98491cd0f81fcd2d277c96096605ac46e1a0dd3 --- /dev/null +++ b/annotations_filtered/t3mwyiOBDrk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 15.16], [16.0, 17.27], [18.0, 19.55], [20.0, 21.1], [22.0, 23.94], [25.0, 26.15], [28.0, 27.97], [30.0, 70.93], [84.0, 122.93], [124.0, 127.26], [129.0, 131.87], [133.0, 134.38], [135.0, 135.58], [137.0, 137.08], [138.0, 140.21], [141.0, 145.57], [150.0, 151.56], [160.0, 160.61], [165.0, 165.91], [166.0, 167.36], [168.0, 172.18], [174.0, 177.48]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.13, 56.03, 0.0, 0.0, 0.0, 82.43, 99.52, 0.0, 0.0, 0.0, 0.0, 91.64, 86.45], "audiomae_on_audioset": [[["livestock, farm animals, working animals", 21.44], ["whale vocalization", 20.05], ["moo", 8.94]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.16, 1.27, 1.55, 1.1, 1.94, 1.15, -0.03, 40.93, 38.93, 3.26, 2.87, 1.38, 0.58, 0.08, 2.21, 4.57, 1.56, 0.61, 0.91, 1.36, 4.18, 3.48]} \ No newline at end of file diff --git a/annotations_filtered/t3ttyoPvivk_filtered.json b/annotations_filtered/t3ttyoPvivk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e10fe0e4e0df07e23f37fbf908d31906cc6f3119 --- /dev/null +++ b/annotations_filtered/t3ttyoPvivk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 29.19], [35.0, 110.88], [115.0, 115.57], [120.0, 120.46], [121.0, 121.53], [123.0, 123.33], [125.0, 125.44], [130.0, 130.32]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [47.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 55.39], ["effects unit", 13.92], ["guitar", 7.43]], null, null, null, null, null, null, null], "duration": [27.19, 75.88, 0.57, 0.46, 0.53, 0.33, 0.44, 0.32]} \ No newline at end of file diff --git a/annotations_filtered/t45uy-QuRDU_filtered.json b/annotations_filtered/t45uy-QuRDU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd68f6c1ba59acf23ee405302caa461834f49e18 --- /dev/null +++ b/annotations_filtered/t45uy-QuRDU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.83], [2.0, 3.16], [19.0, 20.73], [22.0, 23.57], [28.0, 31.08], [36.0, 41.62], [42.0, 47.46], [50.0, 55.44], [56.0, 56.56], [57.0, 58.45], [65.0, 65.89], [68.0, 68.3]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 78.04, 36.2, 30.9, 32.99, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 62.16], ["speech", 10.98], ["hum", 2.82]], [["music", 62.07], ["animal", 4.57], ["theremin", 2.58]], [["music", 34.59], ["cattle, bovinae", 12.32], ["moo", 9.73]], null, null, null, null], "duration": [0.83, 1.16, 1.73, 1.57, 3.08, 5.62, 5.46, 5.44, 0.56, 1.45, 0.89, 0.3]} \ No newline at end of file diff --git a/annotations_filtered/t4DCOpG1oNE_filtered.json b/annotations_filtered/t4DCOpG1oNE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02a2724f0c7ba830eb8b4231e75e2d3ab0679b91 --- /dev/null +++ b/annotations_filtered/t4DCOpG1oNE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.82], [7.0, 13.44], [14.0, 16.58], [22.0, 21.81], [24.0, 25.32], [27.0, 27.38], [32.0, 32.93], [34.0, 42.31], [44.0, 45.96], [47.0, 47.61], [54.0, 54.75], [56.0, 56.98], [61.0, 62.29], [64.0, 66.39], [68.0, 70.16], [72.0, 75.71], [78.0, 79.78]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 30.45, 31.43, 0.0, 0.0, 0.0, 0.0, 52.22, 0.0, 0.0, 0.0, 0.0, 0.0, 70.86, 36.5, 30.67, 0.0], "audiomae_on_audioset": [null, [["music", 48.08], ["hum", 8.49], ["synthesizer", 7.06]], [["theremin", 42.83], ["music", 38.37], ["didgeridoo", 2.64]], null, null, null, null, null, null, null, null, null, null, null, [["music", 49.58], ["synthesizer", 16.83], ["musical instrument", 3.7]], [["music", 73.38], ["throbbing", 4.63], ["hum", 3.05]], null], "duration": [1.82, 6.44, 2.58, -0.19, 1.32, 0.38, 0.93, 8.31, 1.96, 0.61, 0.75, 0.98, 1.29, 2.39, 2.16, 3.71, 1.78]} \ No newline at end of file diff --git a/annotations_filtered/t4M3hbVh3U4_filtered.json b/annotations_filtered/t4M3hbVh3U4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ab925d585c68f60603ee2ec8e884bdd4b8c23c34 --- /dev/null +++ b/annotations_filtered/t4M3hbVh3U4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.63], [8.0, 7.86], [9.0, 16.28], [18.0, 18.91], [19.0, 22.11], [42.0, 41.89], [42.0, 52.96], [60.0, 60.99], [65.0, 65.89], [69.0, 71.2], [76.0, 76.59], [80.0, 81.35], [83.0, 83.89], [86.0, 87.34], [90.0, 89.77], [92.0, 91.86], [92.0, 100.77], [115.0, 116.43]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 33.97, 0.0, 35.59, 0.0, 32.01, 0.0, 0.0, 32.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.08, 0.0], "audiomae_on_audioset": [null, null, [["speech", 65.52], ["explosion", 11.6], ["noise", 7.55]], null, [["speech", 24.95], ["animal", 18.96], ["roaring cats (lions, tigers)", 8.81]], null, [["speech", 38.59], ["machine gun", 23.9], ["gunshot, gunfire", 19.86]], null, null, [["speech", 52.31], ["eruption", 9.67], ["sidetone", 4.36]], null, null, null, null, null, null, [["explosion", 64.49], ["speech", 16.38], ["burst, pop", 6.05]], null], "duration": [0.63, -0.14, 7.28, 0.91, 3.11, -0.11, 10.96, 0.99, 0.89, 2.2, 0.59, 1.35, 0.89, 1.34, -0.23, -0.14, 8.77, 1.43]} \ No newline at end of file diff --git a/annotations_filtered/t4U-Q2nd6u4_filtered.json b/annotations_filtered/t4U-Q2nd6u4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e1a87f52889a4c7bfdc026c217bec495f918905b --- /dev/null +++ b/annotations_filtered/t4U-Q2nd6u4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.75], [5.0, 16.38], [18.0, 18.89], [20.0, 22.49], [25.0, 26.65], [28.0, 28.05], [38.0, 38.99], [42.0, 42.26], [44.0, 44.59], [47.0, 47.17], [49.0, 49.5], [50.0, 51.39], [53.0, 54.46], [56.0, 56.46], [58.0, 60.27], [61.0, 61.33], [67.0, 69.42], [72.0, 74.58], [76.0, 76.74], [81.0, 82.76], [83.0, 87.17], [89.0, 107.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 81.35, 0.0, 89.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.96, 0.0, 98.19, 98.19, 0.0, 0.0, 33.82, 74.76], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 52.92], ["music", 11.46], ["fart", 5.4]], null], "duration": [0.75, 11.38, 0.89, 2.49, 1.65, 0.05, 0.99, 0.26, 0.59, 0.17, 0.5, 1.39, 1.46, 0.46, 2.27, 0.33, 2.42, 2.58, 0.74, 1.76, 4.17, 18.86]} \ No newline at end of file diff --git a/annotations_filtered/t4WP3bODmfo_filtered.json b/annotations_filtered/t4WP3bODmfo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d825621927316967c9c3a33ca494ade83f84d05 --- /dev/null +++ b/annotations_filtered/t4WP3bODmfo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 6.84], [8.0, 10.44], [25.0, 32.85], [38.0, 39.19], [43.0, 45.25], [45.0, 45.28], [63.0, 63.59], [64.0, 64.0], [67.0, 79.79], [84.0, 84.35], [85.0, 87.83], [95.0, 95.89], [99.0, 99.01], [108.0, 115.3]], "keep_status": [false, true, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 36.82, 32.56, 0.0, 31.95, 0.0, 0.0, 0.0, 32.85, 0.0, 31.64, 0.0, 0.0, 34.2], "audiomae_on_audioset": [null, [["music", 48.89], ["zither", 8.1], ["musical instrument", 4.8]], [["music", 73.42], ["funny music", 3.06], ["musical instrument", 1.97]], null, [["music", 83.53], ["guitar", 4.1], ["musical instrument", 3.21]], null, null, null, [["music", 83.59], ["clarinet", 2.59], ["musical instrument", 2.19]], null, [["music", 41.42], ["musical instrument", 11.0], ["guitar", 6.04]], null, null, [["music", 75.8], ["musical instrument", 2.17], ["guitar", 1.86]]], "duration": [-0.16, 2.44, 7.85, 1.19, 2.25, 0.28, 0.59, 0.0, 12.79, 0.35, 2.83, 0.89, 0.01, 7.3]} \ No newline at end of file diff --git a/annotations_filtered/t4_obOCNYls_filtered.json b/annotations_filtered/t4_obOCNYls_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3bad0c61677f470bc1d8a980d770570f2feb3053 --- /dev/null +++ b/annotations_filtered/t4_obOCNYls_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.86], [5.0, 5.81], [8.0, 9.64], [11.0, 11.62], [13.0, 13.91], [15.0, 17.52], [18.0, 20.22], [24.0, 25.17], [26.0, 26.97], [28.0, 30.03], [31.0, 32.02], [33.0, 36.09], [37.0, 37.98], [39.0, 41.42], [43.0, 44.12], [47.0, 49.32]], "keep_status": [false, false, false, false, false, true, true, false, false, true, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 43.87, 41.1, 0.0, 0.0, 48.06, 0.0, 46.79, 0.0, 35.84, 0.0, 43.35], "audiomae_on_audioset": [null, null, null, null, null, [["rain", 29.83], ["rain on surface", 21.79], ["raindrop", 9.34]], [["rain on surface", 38.63], ["rain", 21.21], ["thunderstorm", 9.91]], null, null, [["hum", 23.39], ["throbbing", 15.88], ["static", 6.79]], null, [["rain", 33.16], ["rain on surface", 29.45], ["raindrop", 18.03]], null, [["speech", 34.3], ["rain on surface", 14.57], ["rain", 13.1]], null, [["rain on surface", 23.79], ["rain", 23.72], ["raindrop", 7.89]]], "duration": [0.86, 0.81, 1.64, 0.62, 0.91, 2.52, 2.22, 1.17, 0.97, 2.03, 1.02, 3.09, 0.98, 2.42, 1.12, 2.32]} \ No newline at end of file diff --git a/annotations_filtered/t4fqGbC2mQM_filtered.json b/annotations_filtered/t4fqGbC2mQM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6896afbecb2606f4bd7b05db5c61ed7d9f848ffe --- /dev/null +++ b/annotations_filtered/t4fqGbC2mQM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 14.99], [16.0, 18.62], [20.0, 51.76], [53.0, 103.03], [105.0, 108.85], [111.0, 111.21], [112.0, 113.64], [116.0, 117.85], [119.0, 119.47], [121.0, 121.1], [122.0, 124.34], [131.0, 134.57], [136.0, 137.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 96.29, 0.0, 0.0, 94.52, 0.0, 0.0, 0.0, 0.0, 0.0, 94.66, 93.76, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.99, 2.62, 31.76, 50.03, 3.85, 0.21, 1.64, 1.85, 0.47, 0.1, 2.34, 3.57, 1.29]} \ No newline at end of file diff --git a/annotations_filtered/t4qrfjEgdt4_filtered.json b/annotations_filtered/t4qrfjEgdt4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..06089f07dc7f2be413b32ba4362b4063d7d252b4 --- /dev/null +++ b/annotations_filtered/t4qrfjEgdt4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.09], [7.0, 8.31], [10.0, 11.92], [14.0, 17.14], [18.0, 19.4], [21.0, 22.45], [23.0, 25.57], [32.0, 33.0], [34.0, 64.15], [67.0, 69.47], [70.0, 70.66], [72.0, 72.91], [85.0, 84.97], [97.0, 96.74], [97.0, 97.26], [99.0, 100.57], [102.0, 103.37], [105.0, 106.49], [107.0, 107.06], [109.0, 109.53], [111.0, 112.89], [114.0, 116.94], [119.0, 119.26], [121.0, 124.19], [126.0, 126.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 71.14, 0.0, 0.0, 43.96, 0.0, 0.0, 40.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.95, 0.0, 64.07, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 77.5], ["chirp tone", 3.06], ["inside, small room", 2.92]], null, null, [["chirp tone", 57.39], ["sine wave", 29.97], ["tuning fork", 2.22]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.09, 1.31, 1.92, 3.14, 1.4, 1.45, 2.57, 1.0, 30.15, 2.47, 0.66, 0.91, -0.03, -0.26, 0.26, 1.57, 1.37, 1.49, 0.06, 0.53, 1.89, 2.94, 0.26, 3.19, 0.69]} \ No newline at end of file diff --git a/annotations_filtered/t4zyH4BsmgQ_filtered.json b/annotations_filtered/t4zyH4BsmgQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4830b50ae496736d06f9e5ca142439af2c22bb84 --- /dev/null +++ b/annotations_filtered/t4zyH4BsmgQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.63], [18.0, 18.5], [25.0, 35.36], [36.0, 37.47], [41.0, 40.74], [43.0, 52.93], [68.0, 71.71]], "keep_status": [true, false, true, false, false, true, true], "silence_prob": [32.74, 0.0, 30.88, 0.0, 0.0, 32.61, 36.49], "audiomae_on_audioset": [[["music", 54.95], ["synthesizer", 8.77], ["hum", 5.65]], null, [["speech", 47.1], ["music", 12.66], ["clang", 8.49]], null, null, [["speech", 29.36], ["music", 19.34], ["hum", 18.14]], [["music", 18.93], ["hum", 11.21], ["throbbing", 8.31]]], "duration": [4.63, 0.5, 10.36, 1.47, -0.26, 9.93, 3.71]} \ No newline at end of file diff --git a/annotations_filtered/t5GdZx7AS-E_filtered.json b/annotations_filtered/t5GdZx7AS-E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c28cd632f8e85d6ca4dd57f5a8111caa408413e3 --- /dev/null +++ b/annotations_filtered/t5GdZx7AS-E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.67], [5.0, 6.64], [7.0, 11.1], [11.0, 17.19], [18.0, 32.86], [34.0, 45.96], [48.0, 50.84], [52.0, 58.18], [60.0, 61.1], [64.0, 102.44], [104.0, 115.23], [122.0, 125.76], [126.0, 127.7], [129.0, 130.44], [131.0, 137.52], [138.0, 146.45], [147.0, 158.08], [158.0, 167.07], [171.0, 172.44], [174.0, 183.22]], "keep_status": [true, false, true, false, true, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [44.57, 0.0, 44.99, 46.72, 44.78, 32.6, 46.05, 34.38, 0.0, 0.0, 31.14, 34.65, 0.0, 0.0, 33.05, 29.51, 36.05, 37.63, 0.0, 29.66], "audiomae_on_audioset": [[["music", 39.3], ["speech", 10.44], ["didgeridoo", 4.32]], null, [["music", 40.96], ["speech", 15.92], ["synthesizer", 6.39]], [["music", 50.62], ["didgeridoo", 25.58], ["speech", 2.2]], [["music", 55.42], ["didgeridoo", 7.9], ["ambient music", 4.27]], [["speech", 27.36], ["music", 13.52], ["explosion", 9.88]], [["music", 40.72], ["speech", 31.17], ["synthesizer", 2.02]], [["music", 38.87], ["hum", 17.3], ["throbbing", 9.58]], null, null, [["music", 80.71], ["soundtrack music", 3.01], ["throbbing", 2.33]], [["hum", 38.12], ["music", 23.19], ["mains hum", 20.81]], null, null, [["speech", 41.78], ["music", 34.46], ["hum", 3.71]], [["music", 74.97], ["throbbing", 3.95], ["hum", 3.93]], [["music", 49.35], ["hum", 11.23], ["sonar", 11.07]], [["music", 44.45], ["hum", 19.69], ["mains hum", 15.05]], null, [["hum", 51.56], ["mains hum", 36.7], ["music", 4.72]]], "duration": [2.67, 1.64, 4.1, 6.19, 14.86, 11.96, 2.84, 6.18, 1.1, 38.44, 11.23, 3.76, 1.7, 1.44, 6.52, 8.45, 11.08, 9.07, 1.44, 9.22]} \ No newline at end of file diff --git a/annotations_filtered/t5KEbS5soMA_filtered.json b/annotations_filtered/t5KEbS5soMA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..22e80b8da39839fa9910a8c72ad6de147279bd06 --- /dev/null +++ b/annotations_filtered/t5KEbS5soMA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.78], [7.0, 16.93], [17.0, 17.44], [17.0, 19.38], [20.0, 25.71], [27.0, 28.98], [32.0, 31.85], [33.0, 34.86], [38.0, 38.18], [40.0, 41.89], [58.0, 58.56], [59.0, 92.64], [100.0, 103.18], [105.0, 105.34], [106.0, 106.39], [108.0, 109.49], [119.0, 120.23], [124.0, 124.5]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 56.78, 0.0, 56.86, 46.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.69, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 21.0], ["fart", 8.92], ["fly, housefly", 7.33]], null, null, null, null, null, null, null, [["music", 36.07], ["hum", 5.64], ["throbbing", 3.31]], null, null, null, null, null], "duration": [0.78, 9.93, 0.44, 2.38, 5.71, 1.98, -0.15, 1.86, 0.18, 1.89, 0.56, 33.64, 3.18, 0.34, 0.39, 1.49, 1.23, 0.5]} \ No newline at end of file diff --git a/annotations_filtered/t5eRT32QWdg_filtered.json b/annotations_filtered/t5eRT32QWdg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/t5eRT32QWdg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/t5nBikdQ1kE_filtered.json b/annotations_filtered/t5nBikdQ1kE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1987b7db3093d083e9926b059323c475f8438230 --- /dev/null +++ b/annotations_filtered/t5nBikdQ1kE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[46.0, 46.62], [50.0, 51.7], [53.0, 54.21], [56.0, 55.7], [57.0, 57.4], [58.0, 58.83], [62.0, 62.43], [64.0, 65.48], [67.0, 66.61], [69.0, 68.82], [71.0, 71.41], [79.0, 80.33], [88.0, 89.45], [95.0, 96.28], [100.0, 100.63], [102.0, 109.41], [111.0, 113.34], [114.0, 114.3], [116.0, 117.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.2, 44.15, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 43.99], ["mains hum", 11.28], ["ambient music", 7.91]], [["speech", 22.42], ["vehicle", 9.84], ["hum", 8.54]], null, null], "duration": [0.62, 1.7, 1.21, -0.3, 0.4, 0.83, 0.43, 1.48, -0.39, -0.18, 0.41, 1.33, 1.45, 1.28, 0.63, 7.41, 2.34, 0.3, 1.9]} \ No newline at end of file diff --git a/annotations_filtered/t5qkPMvpDfg_filtered.json b/annotations_filtered/t5qkPMvpDfg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..05a8fb80d1193b026ea05f9a10757b2fefa66263 --- /dev/null +++ b/annotations_filtered/t5qkPMvpDfg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 22.77], [27.0, 27.84], [29.0, 30.6], [32.0, 33.39], [35.0, 35.72], [36.0, 37.61], [40.0, 42.82], [50.0, 53.84], [56.0, 57.1], [59.0, 60.35], [63.0, 63.48], [66.0, 65.8], [66.0, 69.99], [75.0, 77.63], [79.0, 84.99], [85.0, 86.12], [89.0, 89.67], [92.0, 93.09], [94.0, 94.46], [96.0, 97.34], [101.0, 102.47], [106.0, 106.81], [110.0, 114.62], [115.0, 114.79], [115.0, 115.06], [115.0, 118.5], [121.0, 121.49], [122.0, 129.07]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.61, 0.0, 0.0, 0.0, 0.0, 0.0, 35.22, 68.67, 0.0, 0.0, 0.0, 0.0, 64.29, 99.36, 63.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.66, 0.0, 0.0, 98.59, 0.0, 88.46], "audiomae_on_audioset": [[["music", 43.24], ["crowd", 10.17], ["speech", 7.14]], null, null, null, null, null, [["music", 30.79], ["speech", 21.96], ["sidetone", 20.55]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.77, 0.84, 1.6, 1.39, 0.72, 1.61, 2.82, 3.84, 1.1, 1.35, 0.48, -0.2, 3.99, 2.63, 5.99, 1.12, 0.67, 1.09, 0.46, 1.34, 1.47, 0.81, 4.62, -0.21, 0.06, 3.5, 0.49, 7.07]} \ No newline at end of file diff --git a/annotations_filtered/t5vDcrQIig0_filtered.json b/annotations_filtered/t5vDcrQIig0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af1b830f53d3bb653aa68f6bda558a82b9c45755 --- /dev/null +++ b/annotations_filtered/t5vDcrQIig0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.46], [14.0, 17.22], [18.0, 19.95], [22.0, 21.76], [25.0, 25.76], [27.0, 29.08], [29.0, 39.78], [41.0, 49.47], [51.0, 58.08], [59.0, 66.16], [69.0, 71.27], [73.0, 73.6], [75.0, 79.95], [82.0, 87.71], [89.0, 92.47], [93.0, 93.73], [114.0, 118.0], [120.0, 121.36], [123.0, 125.31], [127.0, 128.56], [131.0, 131.43], [133.0, 133.27], [137.0, 137.73], [143.0, 142.94], [154.0, 154.14], [158.0, 159.06], [162.0, 162.23], [163.0, 164.49]], "keep_status": [false, true, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 44.37, 0.0, 0.0, 0.0, 44.32, 45.14, 54.97, 47.27, 44.78, 66.88, 0.0, 32.53, 63.96, 99.78, 0.0, 100.0, 0.0, 59.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 46.08], ["musical instrument", 8.01], ["marimba, xylophone", 4.22]], null, null, null, [["music", 54.16], ["synthesizer", 5.16], ["musical instrument", 4.43]], [["music", 54.32], ["speech", 27.21], ["radio", 3.36]], null, [["speech", 42.44], ["music", 28.73], ["marimba, xylophone", 2.91]], [["music", 39.04], ["speech", 20.3], ["musical instrument", 5.22]], null, null, [["music", 53.52], ["musical instrument", 11.24], ["piano", 10.58]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.46, 3.22, 1.95, -0.24, 0.76, 2.08, 10.78, 8.47, 7.08, 7.16, 2.27, 0.6, 4.95, 5.71, 3.47, 0.73, 4.0, 1.36, 2.31, 1.56, 0.43, 0.27, 0.73, -0.06, 0.14, 1.06, 0.23, 1.49]} \ No newline at end of file diff --git a/annotations_filtered/t5xpX6krGmE_filtered.json b/annotations_filtered/t5xpX6krGmE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..115d422f5ebad0fe7c275a800a751310f8beb8c3 --- /dev/null +++ b/annotations_filtered/t5xpX6krGmE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.43], [7.0, 7.47], [10.0, 10.42], [10.0, 10.89], [14.0, 18.6], [19.0, 101.78], [103.0, 103.65], [104.0, 104.65], [105.0, 114.84]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 39.61, 0.0, 0.0, 0.0, 34.55], "audiomae_on_audioset": [null, null, null, null, [["whale vocalization", 60.22], ["mosquito", 9.89], ["fly, housefly", 8.13]], null, null, null, [["music", 62.6], ["throbbing", 8.07], ["electronic music", 5.07]]], "duration": [0.43, 0.47, 0.42, 0.89, 4.6, 82.78, 0.65, 0.65, 9.84]} \ No newline at end of file diff --git a/annotations_filtered/t5zLt-NZrtI_filtered.json b/annotations_filtered/t5zLt-NZrtI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4d114fd0bb6a987e508b425a357c98d75d87d24c --- /dev/null +++ b/annotations_filtered/t5zLt-NZrtI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.73], [2.0, 3.21], [5.0, 5.64], [7.0, 7.53], [11.0, 12.12], [16.0, 17.52], [22.0, 23.55], [27.0, 29.51], [31.0, 37.54], [44.0, 46.08], [47.0, 47.7], [51.0, 51.16], [54.0, 54.3], [59.0, 60.37], [62.0, 62.5], [63.0, 65.11], [69.0, 73.01], [76.0, 77.45], [78.0, 81.04], [81.0, 84.6], [88.0, 94.98], [96.0, 98.93], [113.0, 113.32], [119.0, 119.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.41, 67.76, 54.5, 0.0, 0.0, 0.0, 0.0, 0.0, 90.25, 95.09, 0.0, 72.75, 76.53, 99.95, 96.42, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.73, 1.21, 0.64, 0.53, 1.12, 1.52, 1.55, 2.51, 6.54, 2.08, 0.7, 0.16, 0.3, 1.37, 0.5, 2.11, 4.01, 1.45, 3.04, 3.6, 6.98, 2.93, 0.32, 0.77]} \ No newline at end of file diff --git a/annotations_filtered/t5zrRGTShZA_filtered.json b/annotations_filtered/t5zrRGTShZA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..64b5f3c1f0b012c1eb9f205867b1a74ac1351ac9 --- /dev/null +++ b/annotations_filtered/t5zrRGTShZA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.78], [2.0, 2.84], [5.0, 5.9], [7.0, 7.72], [9.0, 9.41], [11.0, 11.87], [12.0, 12.63], [15.0, 15.97], [17.0, 17.34], [23.0, 24.9], [27.0, 27.7], [30.0, 30.21], [33.0, 32.88], [33.0, 33.61], [41.0, 40.81], [42.0, 41.93], [44.0, 43.68], [45.0, 45.32], [47.0, 47.43], [48.0, 48.88], [50.0, 50.01], [52.0, 52.47], [53.0, 53.35], [59.0, 60.45], [61.0, 61.25], [63.0, 63.36], [67.0, 67.26], [67.0, 67.47], [69.0, 70.87], [71.0, 72.81], [73.0, 73.21], [73.0, 75.02], [75.0, 76.5], [78.0, 78.68], [85.0, 85.67], [87.0, 96.18], [96.0, 96.8], [97.0, 96.85], [97.0, 100.74], [103.0, 103.6], [110.0, 110.56], [112.0, 114.72], [116.0, 117.12], [119.0, 126.23], [139.0, 148.8], [164.0, 167.14], [168.0, 168.44], [168.0, 170.16], [172.0, 173.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.0, 0.0, 0.0, 0.0, 67.63, 0.0, 0.0, 57.01, 0.0, 0.0, 61.47, 0.0, 51.55, 34.09, 38.67, 0.0, 34.93, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 31.49], ["whimper", 14.51], ["speech", 3.53]], [["music", 45.42], ["carnatic music", 24.35], ["musical instrument", 3.64]], null, [["music", 55.39], ["carnatic music", 9.3], ["theremin", 6.12]], null], "duration": [0.78, 0.84, 0.9, 0.72, 0.41, 0.87, 0.63, 0.97, 0.34, 1.9, 0.7, 0.21, -0.12, 0.61, -0.19, -0.07, -0.32, 0.32, 0.43, 0.88, 0.01, 0.47, 0.35, 1.45, 0.25, 0.36, 0.26, 0.47, 1.87, 1.81, 0.21, 2.02, 1.5, 0.68, 0.67, 9.18, 0.8, -0.15, 3.74, 0.6, 0.56, 2.72, 1.12, 7.23, 9.8, 3.14, 0.44, 2.16, 1.11]} \ No newline at end of file diff --git a/annotations_filtered/t69ZfcWPZFY_filtered.json b/annotations_filtered/t69ZfcWPZFY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b25414fef9c6c6290a4d68627fed60cd8210a1c4 --- /dev/null +++ b/annotations_filtered/t69ZfcWPZFY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.15], [19.0, 19.94], [21.0, 22.18], [23.0, 23.48], [24.0, 26.91], [27.0, 28.51], [35.0, 35.51], [39.0, 39.77], [42.0, 42.4], [46.0, 47.41], [50.0, 51.61], [64.0, 65.08], [67.0, 66.88], [69.0, 68.69], [69.0, 70.87], [73.0, 74.93], [76.0, 89.41], [100.0, 99.86], [100.0, 101.43], [102.0, 104.09], [107.0, 109.88], [112.0, 115.08], [118.0, 119.03], [121.0, 121.53]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.76, 0.0, 0.0, 32.2, 28.61, 33.48, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["ding", 19.36], ["clang", 16.84], ["coin (dropping)", 12.23]], null, null, null, null, null, null, null, null, null, null, null, [["music", 37.09], ["speech", 30.86], ["synthesizer", 3.26]], null, null, [["music", 59.04], ["speech", 21.57], ["electronic music", 1.37]], [["music", 22.34], ["jingle bell", 15.25], ["speech", 11.35]], [["music", 44.36], ["speech", 11.4], ["sidetone", 5.43]], null, null], "duration": [1.15, 0.94, 1.18, 0.48, 2.91, 1.51, 0.51, 0.77, 0.4, 1.41, 1.61, 1.08, -0.12, -0.31, 1.87, 1.93, 13.41, -0.14, 1.43, 2.09, 2.88, 3.08, 1.03, 0.53]} \ No newline at end of file diff --git a/annotations_filtered/t6FIm6TCkCE_filtered.json b/annotations_filtered/t6FIm6TCkCE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/t6FIm6TCkCE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/t6UyEPrqaQI_filtered.json b/annotations_filtered/t6UyEPrqaQI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a0f44bf69a5b28db0b826ae8836125387e507b23 --- /dev/null +++ b/annotations_filtered/t6UyEPrqaQI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.82], [12.0, 13.39], [14.0, 16.07], [27.0, 41.71], [42.0, 43.21], [49.0, 54.11], [55.0, 55.41], [59.0, 61.99], [63.0, 64.5], [65.0, 73.89], [74.0, 75.3], [78.0, 91.49], [95.0, 149.72], [151.0, 180.59], [182.0, 181.99], [182.0, 182.39], [184.0, 186.83], [187.0, 188.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false], "silence_prob": [99.1, 0.0, 87.92, 87.74, 0.0, 66.03, 0.0, 90.43, 0.0, 58.81, 0.0, 29.78, 0.0, 28.7, 0.0, 0.0, 42.69, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 27.63], ["gong", 18.15], ["music", 12.22]], null, [["music", 39.87], ["scary music", 26.17], ["hum", 4.48]], null, null, [["music", 32.32], ["whale vocalization", 17.86], ["speech", 8.94]], null], "duration": [2.82, 1.39, 2.07, 14.71, 1.21, 5.11, 0.41, 2.99, 1.5, 8.89, 1.3, 13.49, 54.72, 29.59, -0.01, 0.39, 2.83, 1.74]} \ No newline at end of file diff --git a/annotations_filtered/t6bhgzR3gkY_filtered.json b/annotations_filtered/t6bhgzR3gkY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5aa45d05fedbd18f256d5ed44eba4080e4d9259b --- /dev/null +++ b/annotations_filtered/t6bhgzR3gkY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.25], [4.0, 4.63], [7.0, 7.2], [10.0, 11.1], [25.0, 26.79]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [0.25, 0.63, 0.2, 1.1, 1.79]} \ No newline at end of file diff --git a/annotations_filtered/t6nqp5MdMp0_filtered.json b/annotations_filtered/t6nqp5MdMp0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e9c50a7def1735b04302f982c11f256e7fbb042 --- /dev/null +++ b/annotations_filtered/t6nqp5MdMp0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.46], [11.0, 11.97], [21.0, 23.82], [28.0, 29.17], [29.0, 30.06], [31.0, 43.77], [46.0, 66.55], [69.0, 94.83], [96.0, 103.77], [106.0, 126.54], [129.0, 136.19], [138.0, 138.67], [141.0, 143.06], [144.0, 175.44], [176.0, 176.28], [178.0, 178.28]], "keep_status": [false, false, true, false, false, false, true, false, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 31.18, 0.0, 0.0, 29.94, 29.08, 29.25, 28.42, 28.75, 28.42, 0.0, 29.03, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 49.57], ["throbbing", 6.91], ["vehicle", 6.59]], null, null, [["music", 62.29], ["hum", 13.02], ["mains hum", 9.49]], [["explosion", 32.5], ["speech", 13.13], ["burst, pop", 8.8]], [["speech", 58.1], ["music", 13.44], ["throbbing", 4.95]], [["music", 28.17], ["cacophony", 8.37], ["sound effect", 4.91]], [["speech", 53.61], ["music", 22.07], ["sound effect", 2.53]], [["speech", 67.32], ["music", 15.25], ["sound effect", 1.91]], null, [["music", 33.66], ["speech", 17.25], ["throbbing", 3.98]], null, null, null], "duration": [1.46, 0.97, 2.82, 1.17, 1.06, 12.77, 20.55, 25.83, 7.77, 20.54, 7.19, 0.67, 2.06, 31.44, 0.28, 0.28]} \ No newline at end of file diff --git a/annotations_filtered/t6wgyc8p_hY_filtered.json b/annotations_filtered/t6wgyc8p_hY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dad75a0bb8a4bf21a6a022fb673c0a238292d08e --- /dev/null +++ b/annotations_filtered/t6wgyc8p_hY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.27], [8.0, 8.95], [11.0, 12.04], [17.0, 18.2], [25.0, 27.4], [32.0, 34.1], [43.0, 44.31], [47.0, 47.78], [91.0, 91.56], [93.0, 94.59], [95.0, 96.08], [97.0, 96.67], [105.0, 104.95], [110.0, 111.27], [114.0, 114.47], [115.0, 121.56], [122.0, 124.68], [128.0, 128.11], [128.0, 129.36], [131.0, 135.63], [137.0, 140.51], [141.0, 142.08], [145.0, 146.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 59.59, 50.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.56, 41.28, 0.0, 0.0, 89.19, 47.54, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["whale vocalization", 51.1], ["speech", 6.3], ["music", 6.23]], null, null, null, [["speech", 33.21], ["sine wave", 23.78], ["sidetone", 19.81]], null, null], "duration": [0.27, 0.95, 1.04, 1.2, 2.4, 2.1, 1.31, 0.78, 0.56, 1.59, 1.08, -0.33, -0.05, 1.27, 0.47, 6.56, 2.68, 0.11, 1.36, 4.63, 3.51, 1.08, 1.04]} \ No newline at end of file diff --git a/annotations_filtered/t794eVHOIvo_filtered.json b/annotations_filtered/t794eVHOIvo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..336eedecca210c0bd9f70405dbb8418e5b651bb2 --- /dev/null +++ b/annotations_filtered/t794eVHOIvo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 9.83], [10.0, 11.64], [12.0, 17.44], [19.0, 19.67], [21.0, 21.61]], "keep_status": [false, false, false, false, false], "silence_prob": [63.21, 0.0, 78.38, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [4.83, 1.64, 5.44, 0.67, 0.61]} \ No newline at end of file diff --git a/annotations_filtered/t7DgbPjFOfY_filtered.json b/annotations_filtered/t7DgbPjFOfY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..360f98e48dd57deb299527d38f73ea46ff72f6ad --- /dev/null +++ b/annotations_filtered/t7DgbPjFOfY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 22.05], [24.0, 24.11], [98.0, 98.54], [103.0, 103.79], [105.0, 106.56], [107.0, 107.32]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [1.05, 0.11, 0.54, 0.79, 1.56, 0.32]} \ No newline at end of file diff --git a/annotations_filtered/t7OQIn7Yuvc_filtered.json b/annotations_filtered/t7OQIn7Yuvc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a1ae9715f0bed69abbd7ac9c07da5581f74e382e --- /dev/null +++ b/annotations_filtered/t7OQIn7Yuvc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.12], [6.0, 8.04], [12.0, 17.78], [18.0, 23.73], [26.0, 25.93], [28.0, 43.82], [46.0, 48.51], [51.0, 52.93], [54.0, 54.33], [58.0, 59.09], [61.0, 70.85], [71.0, 76.03], [81.0, 85.24], [86.0, 87.17], [90.0, 102.96], [104.0, 114.44], [118.0, 122.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, true], "silence_prob": [0.0, 97.83, 50.21, 53.28, 0.0, 70.16, 97.0, 0.0, 0.0, 0.0, 53.4, 47.9, 43.18, 0.0, 35.08, 29.31, 29.18], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 27.86], ["hum", 16.72], ["mains hum", 14.22]], [["speech", 37.94], ["music", 28.43], ["synthesizer", 6.08]], null, [["speech", 57.47], ["sidetone", 15.55], ["music", 14.04]], [["hum", 12.71], ["vehicle", 10.6], ["speech", 9.08]], [["speech", 29.45], ["music", 23.55], ["throbbing", 5.08]]], "duration": [1.12, 2.04, 5.78, 5.73, -0.07, 15.82, 2.51, 1.93, 0.33, 1.09, 9.85, 5.03, 4.24, 1.17, 12.96, 10.44, 4.64]} \ No newline at end of file diff --git a/annotations_filtered/t7S_kRqYshw_filtered.json b/annotations_filtered/t7S_kRqYshw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4652e7c94f1b10ea41054efffc4765a26c57b391 --- /dev/null +++ b/annotations_filtered/t7S_kRqYshw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.18], [8.0, 11.13], [13.0, 14.55], [16.0, 33.44], [33.0, 33.49], [36.0, 37.05], [40.0, 85.55], [87.0, 89.9], [92.0, 126.64]], "keep_status": [true, true, false, false, false, false, false, false, false], "silence_prob": [49.68, 43.61, 0.0, 51.07, 0.0, 0.0, 0.0, 55.74, 0.0], "audiomae_on_audioset": [[["music", 20.0], ["hum", 7.7], ["ambient music", 6.79]], [["music", 10.27], ["sonar", 6.29], ["sheep", 5.08]], null, null, null, null, null, null, null], "duration": [2.18, 3.13, 1.55, 17.44, 0.49, 1.05, 45.55, 2.9, 34.64]} \ No newline at end of file diff --git a/annotations_filtered/t8HQInlblys_filtered.json b/annotations_filtered/t8HQInlblys_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9135b0001dce1f13d76dc8873ad6e42721328c00 --- /dev/null +++ b/annotations_filtered/t8HQInlblys_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.15], [9.0, 10.17], [11.0, 11.47], [13.0, 14.08], [16.0, 18.44], [22.0, 22.4], [23.0, 25.2], [25.0, 26.03], [28.0, 28.02], [30.0, 31.09], [32.0, 37.81], [39.0, 42.87], [46.0, 83.32], [84.0, 84.99], [86.0, 86.64], [87.0, 87.83], [89.0, 89.13], [90.0, 91.18], [94.0, 96.57], [97.0, 97.65], [98.0, 101.83]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 47.2, 0.0, 53.16, 0.0, 0.0, 0.0, 46.05, 40.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.38, 0.0, 41.22], "audiomae_on_audioset": [null, null, null, null, [["insect", 40.33], ["cricket", 17.07], ["music", 9.89]], null, null, null, null, null, [["insect", 44.21], ["cricket", 37.79], ["music", 5.95]], [["music", 21.08], ["insect", 20.25], ["cricket", 18.8]], null, null, null, null, null, null, [["sidetone", 27.08], ["boing", 21.48], ["music", 6.62]], null, [["speech", 30.24], ["inside, small room", 8.47], ["hum", 6.23]]], "duration": [0.15, 1.17, 0.47, 1.08, 2.44, 0.4, 2.2, 1.03, 0.02, 1.09, 5.81, 3.87, 37.32, 0.99, 0.64, 0.83, 0.13, 1.18, 2.57, 0.65, 3.83]} \ No newline at end of file diff --git a/annotations_filtered/t8Ql94ApRSI_filtered.json b/annotations_filtered/t8Ql94ApRSI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1413ea07c02b86099ebaf7f2fe89338c03f5205e --- /dev/null +++ b/annotations_filtered/t8Ql94ApRSI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.05], [9.0, 9.39], [17.0, 27.01], [29.0, 29.08], [30.0, 30.03], [31.0, 33.27], [33.0, 40.59], [42.0, 44.69], [46.0, 46.36], [47.0, 47.83], [51.0, 51.7], [52.0, 53.3], [54.0, 54.35], [57.0, 59.83], [61.0, 65.37], [66.0, 67.26]], "keep_status": [false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 60.6, 0.0, 0.0, 34.01, 39.28, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 77.87, 65.67, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["noise", 29.09], ["sound effect", 14.02], ["grunt", 7.49]], [["screaming", 30.53], ["groan", 18.76], ["throbbing", 4.72]], null, null, null, null, null, null, null, null, null], "duration": [1.05, 0.39, 10.01, 0.08, 0.03, 2.27, 7.59, 2.69, 0.36, 0.83, 0.7, 1.3, 0.35, 2.83, 4.37, 1.26]} \ No newline at end of file diff --git a/annotations_filtered/t8eNpwLPwog_filtered.json b/annotations_filtered/t8eNpwLPwog_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b78b9066563835a20c4c0d32f0fb72129ca767b3 --- /dev/null +++ b/annotations_filtered/t8eNpwLPwog_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.32], [9.0, 12.82], [13.0, 37.56]], "keep_status": [false, true, false], "silence_prob": [0.0, 30.37, 35.25], "audiomae_on_audioset": [null, [["speech", 24.54], ["hum", 19.21], ["mains hum", 12.73]], [["mains hum", 50.63], ["hum", 35.44], ["insect", 2.97]]], "duration": [0.32, 3.82, 24.56]} \ No newline at end of file diff --git a/annotations_filtered/t8loKEw-wlA_filtered.json b/annotations_filtered/t8loKEw-wlA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b7c0e1440f3bb6c294610e3b483987d2b7eb932 --- /dev/null +++ b/annotations_filtered/t8loKEw-wlA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 6.89], [9.0, 8.85], [14.0, 17.96], [21.0, 24.7], [27.0, 28.93], [30.0, 30.45], [33.0, 33.13], [44.0, 46.52], [49.0, 50.55], [53.0, 56.94], [58.0, 58.24], [62.0, 68.52], [73.0, 79.14], [81.0, 88.8], [93.0, 97.21]], "keep_status": [false, false, true, true, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 34.44, 32.27, 0.0, 0.0, 0.0, 37.88, 0.0, 33.77, 0.0, 32.44, 32.94, 31.21, 31.61], "audiomae_on_audioset": [null, null, [["music", 41.39], ["hum", 9.31], ["theremin", 7.6]], [["music", 25.11], ["speech", 23.44], ["theremin", 17.89]], null, null, null, [["hum", 35.69], ["music", 23.18], ["mains hum", 21.25]], null, [["throbbing", 31.51], ["music", 24.48], ["hum", 19.43]], null, [["hum", 45.38], ["mains hum", 44.84], ["throbbing", 2.54]], [["music", 32.21], ["noise", 21.0], ["hum", 14.67]], [["hum", 38.52], ["mains hum", 31.84], ["noise", 6.4]], [["music", 26.18], ["hum", 8.61], ["mains hum", 8.04]]], "duration": [-0.11, -0.15, 3.96, 3.7, 1.93, 0.45, 0.13, 2.52, 1.55, 3.94, 0.24, 6.52, 6.14, 7.8, 4.21]} \ No newline at end of file diff --git a/annotations_filtered/t8vRwv9kRjg_filtered.json b/annotations_filtered/t8vRwv9kRjg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b78316bc45cdec5951396d660b077d4decb91335 --- /dev/null +++ b/annotations_filtered/t8vRwv9kRjg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 23.52], [26.0, 50.46], [51.0, 56.67], [62.0, 72.55], [78.0, 78.98], [80.0, 80.67], [87.0, 88.42], [94.0, 94.81], [96.0, 98.51], [103.0, 104.21], [105.0, 105.71], [106.0, 108.01], [112.0, 115.86], [117.0, 117.22], [122.0, 125.41], [125.0, 142.97], [144.0, 147.19], [149.0, 150.47], [153.0, 162.65], [163.0, 168.49], [173.0, 174.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [33.56, 96.54, 97.33, 84.98, 0.0, 0.0, 0.0, 0.0, 97.33, 0.0, 0.0, 62.37, 70.86, 0.0, 99.62, 61.08, 61.57, 0.0, 51.88, 50.02, 0.0], "audiomae_on_audioset": [[["mains hum", 36.02], ["hum", 24.81], ["music", 15.12]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [19.52, 24.46, 5.67, 10.55, 0.98, 0.67, 1.42, 0.81, 2.51, 1.21, 0.71, 2.01, 3.86, 0.22, 3.41, 17.97, 3.19, 1.47, 9.65, 5.49, 1.58]} \ No newline at end of file diff --git a/annotations_filtered/t9BqiLLt9SI_filtered.json b/annotations_filtered/t9BqiLLt9SI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..705ad5b3dd209473b0f7f3d77380dd310a57e959 --- /dev/null +++ b/annotations_filtered/t9BqiLLt9SI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.7], [7.0, 11.77], [14.0, 15.48], [20.0, 23.48], [24.0, 25.78], [29.0, 30.54], [33.0, 33.54], [36.0, 40.1], [42.0, 45.49], [47.0, 48.52], [57.0, 57.72], [65.0, 65.94], [71.0, 73.36], [74.0, 74.97], [77.0, 77.84], [80.0, 81.04], [82.0, 83.86], [85.0, 85.26], [92.0, 93.11], [95.0, 97.53], [100.0, 101.6], [103.0, 104.19], [109.0, 109.24]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 44.57, 0.0, 40.75, 0.0, 0.0, 0.0, 91.47, 33.52, 0.0, 0.0, 0.0, 57.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.61, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 30.97], ["effects unit", 16.78], ["guitar", 8.72]], null, [["sidetone", 18.65], ["hum", 15.41], ["mains hum", 12.55]], null, null, null, null, [["sidetone", 78.49], ["speech", 10.25], ["radio", 4.45]], null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 19.51], ["frog", 15.31], ["insect", 13.01]], null, null, null], "duration": [1.7, 4.77, 1.48, 3.48, 1.78, 1.54, 0.54, 4.1, 3.49, 1.52, 0.72, 0.94, 2.36, 0.97, 0.84, 1.04, 1.86, 0.26, 1.11, 2.53, 1.6, 1.19, 0.24]} \ No newline at end of file diff --git a/annotations_filtered/t9P2B7NUPfM_filtered.json b/annotations_filtered/t9P2B7NUPfM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8f1c44a36391f47c5f64c00b0b525dc1fac626ec --- /dev/null +++ b/annotations_filtered/t9P2B7NUPfM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.89], [10.0, 10.88], [12.0, 17.02], [18.0, 18.77], [20.0, 21.29], [23.0, 24.27], [25.0, 25.96], [29.0, 30.28], [31.0, 33.56], [36.0, 38.55], [39.0, 41.79], [44.0, 47.11], [48.0, 56.91], [58.0, 64.13], [64.0, 65.28], [68.0, 67.85], [76.0, 79.56], [86.0, 86.51], [93.0, 98.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 85.35, 0.0, 0.0, 0.0, 0.0, 0.0, 49.92, 99.95, 100.0, 38.17, 30.59, 30.57, 0.0, 0.0, 30.69, 0.0, 62.37], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 88.3], ["sidetone", 2.98], ["dial tone", 2.96]], null, null, [["throbbing", 19.12], ["hum", 18.48], ["noise", 11.67]], [["music", 32.88], ["sidetone", 27.61], ["speech", 16.44]], [["music", 74.37], ["musical instrument", 8.47], ["synthesizer", 3.66]], null, null, [["music", 69.56], ["theremin", 4.54], ["shout", 4.5]], null, null], "duration": [0.89, 0.88, 5.02, 0.77, 1.29, 1.27, 0.96, 1.28, 2.56, 2.55, 2.79, 3.11, 8.91, 6.13, 1.28, -0.15, 3.56, 0.51, 5.32]} \ No newline at end of file diff --git a/annotations_filtered/t9XjAhGr8us_filtered.json b/annotations_filtered/t9XjAhGr8us_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..645c125cab37d71b41cea046efbb1102f0292fb9 --- /dev/null +++ b/annotations_filtered/t9XjAhGr8us_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[44.0, 44.69], [45.0, 45.33], [46.0, 46.14], [50.0, 51.68], [69.0, 70.56], [85.0, 85.72]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.69, 0.33, 0.14, 1.68, 1.56, 0.72]} \ No newline at end of file diff --git a/annotations_filtered/t9eDVFrQDXM_filtered.json b/annotations_filtered/t9eDVFrQDXM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..396081717bfd4a196e19feb2c5e162d8d4ce93a9 --- /dev/null +++ b/annotations_filtered/t9eDVFrQDXM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.57], [6.0, 7.03], [12.0, 13.46], [16.0, 17.76], [21.0, 20.83], [30.0, 30.59], [37.0, 37.47], [39.0, 41.91], [43.0, 44.31], [49.0, 50.46], [52.0, 52.98], [54.0, 54.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.63, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.57, 1.03, 1.46, 1.76, -0.17, 0.59, 0.47, 2.91, 1.31, 1.46, 0.98, 0.97]} \ No newline at end of file diff --git a/annotations_filtered/t9f5FmSQeB4_filtered.json b/annotations_filtered/t9f5FmSQeB4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e307ae1137ba8b1359ea811a04caf672ef50a891 --- /dev/null +++ b/annotations_filtered/t9f5FmSQeB4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.42], [4.0, 4.46], [6.0, 13.49], [18.0, 19.47], [26.0, 26.2], [28.0, 29.2], [34.0, 34.94], [37.0, 39.33], [40.0, 41.98], [44.0, 45.54], [46.0, 47.65], [49.0, 50.85], [55.0, 55.0], [56.0, 56.94], [59.0, 72.28], [79.0, 79.41], [82.0, 83.19], [84.0, 87.71], [91.0, 95.23], [96.0, 96.63], [97.0, 98.96], [100.0, 102.36], [105.0, 106.95], [109.0, 112.8], [113.0, 113.19], [114.0, 115.5], [116.0, 117.39], [118.0, 118.18], [119.0, 119.37], [120.0, 120.21], [121.0, 124.55]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 98.51, 0.0, 0.0, 0.0, 0.0, 49.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.52, 0.0, 0.0, 91.47, 99.73, 0.0, 0.0, 30.21, 0.0, 60.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.04], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["arrow", 20.85], ["cap gun", 15.2], ["tuning fork", 13.24]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["whistle", 47.48], ["crow", 17.51], ["bird", 5.7]], null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 17.22], ["speech", 12.33], ["animal", 7.91]]], "duration": [0.42, 0.46, 7.49, 1.47, 0.2, 1.2, 0.94, 2.33, 1.98, 1.54, 1.65, 1.85, 0.0, 0.94, 13.28, 0.41, 1.19, 3.71, 4.23, 0.63, 1.96, 2.36, 1.95, 3.8, 0.19, 1.5, 1.39, 0.18, 0.37, 0.21, 3.55]} \ No newline at end of file diff --git a/annotations_filtered/t9vWi2ItxMc_filtered.json b/annotations_filtered/t9vWi2ItxMc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e38415c4d240d2b50bb585d9daa1f8b4237509e0 --- /dev/null +++ b/annotations_filtered/t9vWi2ItxMc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.29], [7.0, 7.32], [11.0, 11.11], [17.0, 17.07], [19.0, 19.43], [20.0, 21.61], [22.0, 24.65], [27.0, 27.36], [28.0, 29.69], [32.0, 35.48], [38.0, 38.97], [50.0, 49.86], [53.0, 59.16], [60.0, 59.97], [71.0, 70.66], [72.0, 71.71], [73.0, 73.68], [74.0, 74.88], [77.0, 77.41], [80.0, 79.79], [94.0, 94.9], [102.0, 101.66], [111.0, 111.7], [118.0, 123.03], [124.0, 124.43], [124.0, 124.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.11, 0.0, 0.0, 62.27, 0.0, 0.0, 74.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.75, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["didgeridoo", 66.29], ["speech", 14.5], ["music", 7.58]], null, null], "duration": [0.29, 0.32, 0.11, 0.07, 0.43, 1.61, 2.65, 0.36, 1.69, 3.48, 0.97, -0.14, 6.16, -0.03, -0.34, -0.29, 0.68, 0.88, 0.41, -0.21, 0.9, -0.34, 0.7, 5.03, 0.43, 0.46]} \ No newline at end of file diff --git a/annotations_filtered/tAHCa87P8YI_filtered.json b/annotations_filtered/tAHCa87P8YI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b74015a26206bbec94aaad1cac2c99b678abd7c8 --- /dev/null +++ b/annotations_filtered/tAHCa87P8YI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 20.39], [22.0, 27.75], [30.0, 31.02], [32.0, 42.47], [51.0, 51.65], [58.0, 61.05], [62.0, 62.56], [64.0, 66.48], [70.0, 69.99], [71.0, 74.24], [77.0, 77.87], [90.0, 90.21], [91.0, 92.28], [100.0, 101.19], [104.0, 104.41], [105.0, 110.51], [113.0, 113.48], [115.0, 122.0], [123.0, 123.63], [131.0, 131.53], [138.0, 139.36], [140.0, 142.79]], "keep_status": [true, true, false, true, false, true, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [41.72, 43.61, 0.0, 33.52, 0.0, 35.98, 0.0, 36.86, 0.0, 33.88, 0.0, 0.0, 0.0, 0.0, 0.0, 32.88, 0.0, 30.64, 0.0, 0.0, 0.0, 49.36], "audiomae_on_audioset": [[["whale vocalization", 34.98], ["speech", 21.84], ["hum", 5.34]], [["hum", 39.52], ["whale vocalization", 15.9], ["music", 9.68]], null, [["music", 34.26], ["hum", 17.14], ["synthesizer", 7.82]], null, [["throbbing", 28.59], ["hum", 15.33], ["noise", 14.94]], null, [["throbbing", 38.14], ["hum", 25.01], ["music", 8.61]], null, [["music", 18.69], ["throbbing", 11.96], ["hum", 9.72]], null, null, null, null, null, [["sidetone", 67.97], ["speech", 18.77], ["music", 2.72]], null, [["music", 27.02], ["speech", 18.82], ["throbbing", 13.55]], null, null, null, [["music", 32.63], ["whale vocalization", 8.79], ["didgeridoo", 7.69]]], "duration": [3.39, 5.75, 1.02, 10.47, 0.65, 3.05, 0.56, 2.48, -0.01, 3.24, 0.87, 0.21, 1.28, 1.19, 0.41, 5.51, 0.48, 7.0, 0.63, 0.53, 1.36, 2.79]} \ No newline at end of file diff --git a/annotations_filtered/tANIXMqv77U_filtered.json b/annotations_filtered/tANIXMqv77U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..00b23342735b2d0cb0b2cf969351921d07225dbf --- /dev/null +++ b/annotations_filtered/tANIXMqv77U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 10.34], [12.0, 13.27], [15.0, 16.8], [20.0, 20.02], [21.0, 21.3], [26.0, 26.82], [31.0, 33.4], [35.0, 38.58], [41.0, 42.33], [43.0, 51.26], [54.0, 56.2], [59.0, 64.47], [65.0, 67.85], [69.0, 74.97], [77.0, 78.68], [80.0, 86.19], [87.0, 123.85], [124.0, 126.62], [128.0, 131.5], [132.0, 135.4], [137.0, 138.28], [139.0, 140.19], [141.0, 143.78], [147.0, 150.3], [153.0, 158.14], [159.0, 163.32], [170.0, 173.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.88, 100.0, 0.0, 100.0, 100.0, 99.82, 100.0, 100.0, 0.0, 100.0, 0.0, 100.0, 100.0, 96.42, 0.0, 0.0, 99.05, 100.0, 100.0, 99.94, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.34, 1.27, 1.8, 0.02, 0.3, 0.82, 2.4, 3.58, 1.33, 8.26, 2.2, 5.47, 2.85, 5.97, 1.68, 6.19, 36.85, 2.62, 3.5, 3.4, 1.28, 1.19, 2.78, 3.3, 5.14, 4.32, 3.04]} \ No newline at end of file diff --git a/annotations_filtered/tAx_zjVXTOs_filtered.json b/annotations_filtered/tAx_zjVXTOs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..215c60753727e3ee1a8abcbeee31dd03f11e31ee --- /dev/null +++ b/annotations_filtered/tAx_zjVXTOs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 10.57], [11.0, 25.14], [28.0, 28.09], [29.0, 45.84], [46.0, 47.95], [48.0, 50.58], [53.0, 53.37], [55.0, 55.48], [57.0, 59.68], [60.0, 61.74], [63.0, 64.72], [68.0, 69.55], [73.0, 73.97], [75.0, 83.39], [89.0, 91.1], [92.0, 92.38], [93.0, 94.85], [96.0, 97.61], [98.0, 98.17], [99.0, 100.21], [104.0, 104.18], [105.0, 105.61], [107.0, 107.55], [110.0, 110.93], [112.0, 114.03], [117.0, 122.3], [124.0, 123.8], [128.0, 128.39]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [100.0, 91.47, 0.0, 58.64, 0.0, 49.64, 0.0, 0.0, 77.87, 0.0, 0.0, 0.0, 0.0, 46.36, 57.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.54, 28.43, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 55.72], ["sidetone", 5.8], ["music", 5.76]], null, null, null, null, null, null, null, [["synthesizer", 27.53], ["noise", 11.62], ["throbbing", 7.87]], null, null, null, null, null, null, null, null, null, null, [["speech", 17.78], ["vehicle", 13.37], ["music", 7.76]], [["speech", 29.55], ["music", 25.05], ["hum", 4.6]], null, null], "duration": [5.57, 14.14, 0.09, 16.84, 1.95, 2.58, 0.37, 0.48, 2.68, 1.74, 1.72, 1.55, 0.97, 8.39, 2.1, 0.38, 1.85, 1.61, 0.17, 1.21, 0.18, 0.61, 0.55, 0.93, 2.03, 5.3, -0.2, 0.39]} \ No newline at end of file diff --git a/annotations_filtered/tB0th8vNLxo_filtered.json b/annotations_filtered/tB0th8vNLxo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..460dd0d7d12e4c2df47d0d9d1ccfd83af25eaeb4 --- /dev/null +++ b/annotations_filtered/tB0th8vNLxo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 9.04], [16.0, 17.79], [19.0, 28.21], [29.0, 30.5], [32.0, 35.67], [37.0, 41.27], [42.0, 49.59], [51.0, 53.47], [55.0, 58.41], [60.0, 64.03], [65.0, 69.36], [71.0, 73.6], [77.0, 80.7], [84.0, 84.81], [88.0, 87.96], [88.0, 95.17], [97.0, 100.45], [102.0, 106.57], [108.0, 115.87], [117.0, 119.37], [120.0, 122.22], [123.0, 126.1]], "keep_status": [false, false, false, false, true, true, true, true, false, false, true, true, true, false, false, false, false, false, false, true, false, false], "silence_prob": [92.8, 0.0, 36.29, 0.0, 33.54, 35.71, 35.61, 37.11, 43.25, 34.07, 32.62, 36.19, 34.56, 0.0, 0.0, 31.83, 36.15, 32.91, 32.33, 35.99, 50.81, 53.65], "audiomae_on_audioset": [null, null, [["singing bowl", 42.41], ["music", 35.96], ["ambient music", 4.59]], null, [["music", 47.98], ["musical instrument", 8.31], ["singing bowl", 7.18]], [["singing bowl", 35.66], ["music", 16.69], ["hum", 14.34]], [["singing bowl", 37.58], ["music", 14.29], ["gong", 6.28]], [["music", 30.64], ["harp", 24.85], ["musical instrument", 6.72]], [["singing bowl", 66.95], ["music", 4.99], ["chirp tone", 3.59]], [["music", 62.21], ["speech", 5.5], ["hum", 3.59]], [["music", 40.43], ["marimba, xylophone", 7.16], ["singing bowl", 5.96]], [["music", 28.43], ["quack", 10.1], ["singing bowl", 7.99]], [["music", 47.65], ["theremin", 9.34], ["singing bowl", 7.03]], null, null, [["hum", 40.3], ["music", 19.6], ["mains hum", 15.7]], [["music", 46.18], ["hum", 15.73], ["mains hum", 8.38]], [["music", 60.8], ["synthesizer", 6.12], ["ambient music", 6.07]], [["music", 63.04], ["ambient music", 14.02], ["synthesizer", 6.17]], [["speech", 20.24], ["music", 20.0], ["singing bowl", 10.93]], null, null], "duration": [6.04, 1.79, 9.21, 1.5, 3.67, 4.27, 7.59, 2.47, 3.41, 4.03, 4.36, 2.6, 3.7, 0.81, -0.04, 7.17, 3.45, 4.57, 7.87, 2.37, 2.22, 3.1]} \ No newline at end of file diff --git a/annotations_filtered/tB6Uj2RGhPU_filtered.json b/annotations_filtered/tB6Uj2RGhPU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b27711618ed55781eb20de9135834dfa59af9321 --- /dev/null +++ b/annotations_filtered/tB6Uj2RGhPU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.98], [11.0, 11.01], [13.0, 13.46], [15.0, 17.71], [20.0, 20.17], [21.0, 21.17], [24.0, 27.31], [29.0, 29.49], [30.0, 31.04], [33.0, 38.53], [39.0, 41.2], [42.0, 43.61], [45.0, 46.67], [47.0, 48.88], [49.0, 51.24], [54.0, 56.52], [57.0, 58.65], [60.0, 60.67], [64.0, 65.48], [66.0, 75.59], [77.0, 77.48], [78.0, 78.46], [79.0, 80.97], [84.0, 85.4], [88.0, 88.25], [91.0, 91.32], [92.0, 93.88], [98.0, 98.9], [100.0, 103.03], [106.0, 109.26], [112.0, 114.39], [115.0, 116.07], [119.0, 119.79], [124.0, 124.66], [128.0, 130.5]], "keep_status": [false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 46.29, 0.0, 0.0, 37.56, 0.0, 0.0, 38.06, 55.18, 0.0, 0.0, 0.0, 40.57, 41.36, 0.0, 0.0, 0.0, 58.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.71, 43.25, 37.34, 0.0, 0.0, 0.0, 43.64], "audiomae_on_audioset": [null, null, null, [["telephone", 17.87], ["rowboat, canoe, kayak", 11.89], ["telephone dialing, dtmf", 7.41]], null, null, [["sidetone", 50.35], ["speech", 29.93], ["telephone", 7.69]], null, null, [["music", 25.18], ["effects unit", 15.24], ["noise", 13.85]], null, null, null, null, [["speech", 74.75], ["sidetone", 6.66], ["radio", 4.22]], [["speech", 62.22], ["telephone", 10.35], ["radio", 6.86]], null, null, null, null, null, null, null, null, null, null, null, null, [["skateboard", 11.0], ["wood", 9.69], ["thunk", 8.72]], [["radio", 31.09], ["sidetone", 13.01], ["noise", 12.8]], [["music", 55.31], ["synthesizer", 11.02], ["cacophony", 2.62]], null, null, null, [["music", 49.86], ["synthesizer", 17.55], ["cacophony", 4.59]]], "duration": [1.98, 0.01, 0.46, 2.71, 0.17, 0.17, 3.31, 0.49, 1.04, 5.53, 2.2, 1.61, 1.67, 1.88, 2.24, 2.52, 1.65, 0.67, 1.48, 9.59, 0.48, 0.46, 1.97, 1.4, 0.25, 0.32, 1.88, 0.9, 3.03, 3.26, 2.39, 1.07, 0.79, 0.66, 2.5]} \ No newline at end of file diff --git a/annotations_filtered/tB9_C5zQLZw_filtered.json b/annotations_filtered/tB9_C5zQLZw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f2e407a1dbdde8514cc1b68c80ea011516c69f72 --- /dev/null +++ b/annotations_filtered/tB9_C5zQLZw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[97.0, 114.59], [116.0, 119.13]], "keep_status": [true, true], "silence_prob": [32.33, 36.86], "audiomae_on_audioset": [[["music", 32.01], ["hum", 17.26], ["throbbing", 13.01]], [["music", 45.75], ["speech", 16.53], ["throbbing", 5.11]]], "duration": [17.59, 3.13]} \ No newline at end of file diff --git a/annotations_filtered/tBMAuUeeqdE_filtered.json b/annotations_filtered/tBMAuUeeqdE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..827405f721f5aa4ca6369653efdde77707752f39 --- /dev/null +++ b/annotations_filtered/tBMAuUeeqdE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 33.99], [36.0, 37.13], [38.0, 39.12], [41.0, 50.7], [51.0, 50.73], [51.0, 64.81], [66.0, 68.1], [69.0, 70.55], [71.0, 73.72], [74.0, 90.49], [92.0, 95.54], [97.0, 99.05], [101.0, 102.29], [103.0, 119.15], [123.0, 123.43], [124.0, 126.32], [128.0, 128.22], [131.0, 132.27], [133.0, 138.65], [139.0, 144.91], [146.0, 153.99]], "keep_status": [true, false, false, false, false, true, true, false, true, true, false, false, false, true, false, true, false, false, true, false, false], "silence_prob": [30.25, 0.0, 0.0, 29.93, 0.0, 30.81, 48.48, 0.0, 42.74, 33.85, 53.28, 52.8, 0.0, 31.63, 0.0, 46.15, 0.0, 0.0, 38.3, 43.66, 54.5], "audiomae_on_audioset": [[["music", 30.65], ["whack, thwack", 14.25], ["speech", 12.22]], null, null, [["whack, thwack", 28.28], ["speech", 24.59], ["music", 19.77]], null, [["whack, thwack", 14.16], ["speech", 12.79], ["music", 12.32]], [["music", 35.97], ["rumble", 4.68], ["speech", 3.1]], null, [["mains hum", 25.95], ["hum", 23.37], ["music", 13.69]], [["hum", 25.13], ["music", 22.68], ["throbbing", 15.84]], null, null, null, [["fart", 31.59], ["whack, thwack", 21.67], ["speech", 13.48]], null, [["speech", 30.11], ["music", 21.72], ["hum", 9.5]], null, null, [["speech", 22.97], ["whack, thwack", 19.41], ["breaking", 10.05]], [["speech", 40.18], ["hum", 18.5], ["mains hum", 14.32]], null], "duration": [12.99, 1.13, 1.12, 9.7, -0.27, 13.81, 2.1, 1.55, 2.72, 16.49, 3.54, 2.05, 1.29, 16.15, 0.43, 2.32, 0.22, 1.27, 5.65, 5.91, 7.99]} \ No newline at end of file diff --git a/annotations_filtered/tBNjWDkNbms_filtered.json b/annotations_filtered/tBNjWDkNbms_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..46242c1fd8d14cd6281783e496f362078b07df26 --- /dev/null +++ b/annotations_filtered/tBNjWDkNbms_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.91], [13.0, 16.83], [19.0, 20.51], [22.0, 24.76], [27.0, 28.59], [29.0, 30.01], [33.0, 33.15], [35.0, 36.24], [37.0, 38.48], [43.0, 43.04], [44.0, 44.04], [44.0, 44.86], [53.0, 53.42], [55.0, 56.81], [58.0, 59.44], [61.0, 61.18], [67.0, 69.06], [72.0, 74.6], [75.0, 78.29], [79.0, 80.6], [84.0, 84.38], [89.0, 89.8], [91.0, 92.06], [96.0, 98.36], [99.0, 108.95], [110.0, 111.5], [114.0, 118.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.98, 99.96, 0.0, 99.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.9, 99.98, 99.88, 0.0, 0.0, 0.0, 0.0, 99.91, 90.95, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.91, 3.83, 1.51, 2.76, 1.59, 1.01, 0.15, 1.24, 1.48, 0.04, 0.04, 0.86, 0.42, 1.81, 1.44, 0.18, 2.06, 2.6, 3.29, 1.6, 0.38, 0.8, 1.06, 2.36, 9.95, 1.5, 4.88]} \ No newline at end of file diff --git a/annotations_filtered/tBOZNOYMHEg_filtered.json b/annotations_filtered/tBOZNOYMHEg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3594972de23ce6972edf0875c47c43c1975b745 --- /dev/null +++ b/annotations_filtered/tBOZNOYMHEg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.7], [13.0, 16.41], [18.0, 19.52], [20.0, 22.55], [23.0, 34.7]], "keep_status": [false, true, false, false, true], "silence_prob": [0.0, 34.57, 0.0, 44.99, 29.11], "audiomae_on_audioset": [null, [["singing bowl", 29.6], ["music", 23.12], ["speech", 4.38]], null, [["speech", 37.68], ["music", 27.09], ["singing bowl", 8.57]], [["music", 28.05], ["musical instrument", 9.57], ["sonar", 9.26]]], "duration": [0.7, 3.41, 1.52, 2.55, 11.7]} \ No newline at end of file diff --git a/annotations_filtered/tBSbjKyamRo_filtered.json b/annotations_filtered/tBSbjKyamRo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42c4e05dfd63a2c41d2652a1c676aad9fc3a771a --- /dev/null +++ b/annotations_filtered/tBSbjKyamRo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.64], [11.0, 11.33], [12.0, 12.6], [14.0, 13.61], [16.0, 17.07], [18.0, 18.28], [21.0, 22.6], [23.0, 24.76], [26.0, 26.32], [27.0, 28.07], [29.0, 30.15], [31.0, 32.1], [33.0, 33.1], [35.0, 38.15], [40.0, 41.12], [44.0, 44.74], [45.0, 48.84], [50.0, 51.65], [52.0, 55.95], [57.0, 58.01], [59.0, 61.64], [63.0, 63.93], [65.0, 65.67], [67.0, 69.57], [70.0, 70.92], [72.0, 72.79], [74.0, 74.17], [79.0, 81.99], [84.0, 85.56], [88.0, 90.14], [92.0, 94.14], [96.0, 97.98], [105.0, 106.2], [109.0, 111.08], [112.0, 113.68], [121.0, 126.64], [128.0, 129.98], [132.0, 132.88], [138.0, 139.97], [141.0, 141.52], [146.0, 146.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.48, 0.0, 0.0, 66.39, 0.0, 47.27, 0.0, 41.54, 0.0, 0.0, 79.41, 0.0, 0.0, 0.0, 62.78, 0.0, 46.54, 55.04, 0.0, 0.0, 44.29, 0.0, 31.79, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 52.59], ["insect", 23.03], ["bee, wasp, etc.", 18.48]], null, [["insect", 22.17], ["fly, housefly", 22.03], ["speech", 10.55]], null, null, null, null, null, null, null, null, [["music", 17.33], ["speech", 10.63], ["hum", 6.77]], null, null, null, [["mains hum", 37.34], ["hum", 34.94], ["music", 5.58]], null, [["hum", 51.97], ["mains hum", 37.87], ["throbbing", 4.48]], null, null, null, null, null], "duration": [0.64, 0.33, 0.6, -0.39, 1.07, 0.28, 1.6, 1.76, 0.32, 1.07, 1.15, 1.1, 0.1, 3.15, 1.12, 0.74, 3.84, 1.65, 3.95, 1.01, 2.64, 0.93, 0.67, 2.57, 0.92, 0.79, 0.17, 2.99, 1.56, 2.14, 2.14, 1.98, 1.2, 2.08, 1.68, 5.64, 1.98, 0.88, 1.97, 0.52, 0.91]} \ No newline at end of file diff --git a/annotations_filtered/tBeJkq_by_8_filtered.json b/annotations_filtered/tBeJkq_by_8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..758b7df04cd6ff4b381076c729b055900a4807fe --- /dev/null +++ b/annotations_filtered/tBeJkq_by_8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 16.65], [18.0, 26.06], [27.0, 27.85], [29.0, 48.73], [51.0, 58.85], [60.0, 63.04], [81.0, 81.67], [83.0, 84.23], [85.0, 85.89], [87.0, 87.22], [90.0, 90.76], [92.0, 93.61], [95.0, 95.71], [97.0, 98.12], [99.0, 100.13], [104.0, 105.31], [111.0, 113.07], [114.0, 115.33], [115.0, 122.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [97.73, 92.15, 0.0, 99.78, 97.92, 98.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.05, 0.0, 99.85], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.65, 8.06, 0.85, 19.73, 7.85, 3.04, 0.67, 1.23, 0.89, 0.22, 0.76, 1.61, 0.71, 1.12, 1.13, 1.31, 2.07, 1.33, 7.67]} \ No newline at end of file diff --git a/annotations_filtered/tBw_BTLbjJI_filtered.json b/annotations_filtered/tBw_BTLbjJI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af234d3fcbfa8f06ba902de885ba685c944378e9 --- /dev/null +++ b/annotations_filtered/tBw_BTLbjJI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 8.75], [21.0, 21.12], [27.0, 27.14], [29.0, 29.22], [33.0, 33.89], [35.0, 34.86], [35.0, 36.76], [44.0, 45.89], [47.0, 51.76], [55.0, 57.87], [59.0, 59.05], [63.0, 62.68], [65.0, 66.04], [71.0, 72.59], [74.0, 75.69], [76.0, 77.18], [80.0, 81.35], [84.0, 84.84], [85.0, 86.49], [95.0, 99.33], [100.0, 105.04], [106.0, 108.53], [111.0, 111.81], [113.0, 112.72], [119.0, 121.9], [126.0, 126.59], [131.0, 131.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.91, 99.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 99.85, 0.0, 0.0, 60.7, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.25, 0.12, 0.14, 0.22, 0.89, -0.14, 1.76, 1.89, 4.76, 2.87, 0.05, -0.32, 1.04, 1.59, 1.69, 1.18, 1.35, 0.84, 1.49, 4.33, 5.04, 2.53, 0.81, -0.28, 2.9, 0.59, 0.84]} \ No newline at end of file diff --git a/annotations_filtered/tCb_6mO6CmE_filtered.json b/annotations_filtered/tCb_6mO6CmE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf7886cb29357804d1e0da19612126f39f083687 --- /dev/null +++ b/annotations_filtered/tCb_6mO6CmE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 17.47], [19.0, 23.43], [28.0, 30.99], [33.0, 41.67], [42.0, 73.79], [76.0, 76.6], [78.0, 84.55], [86.0, 86.56], [88.0, 88.84], [92.0, 97.26], [102.0, 150.2], [152.0, 158.48], [161.0, 166.99]], "keep_status": [true, true, true, false, false, false, false, false, false, false, false, false, true], "silence_prob": [30.06, 29.97, 30.15, 30.04, 0.0, 0.0, 31.83, 0.0, 0.0, 33.03, 0.0, 30.23, 31.09], "audiomae_on_audioset": [[["vehicle", 28.16], ["music", 16.14], ["skidding", 8.69]], [["music", 45.34], ["hum", 13.0], ["throbbing", 7.99]], [["music", 23.24], ["cattle, bovinae", 13.93], ["livestock, farm animals, working animals", 11.21]], [["music", 54.89], ["race car, auto racing", 8.62], ["car", 6.78]], null, null, [["music", 32.22], ["throbbing", 27.73], ["hum", 16.8]], null, null, [["music", 48.02], ["throbbing", 22.17], ["hum", 9.44]], null, [["hum", 33.9], ["throbbing", 23.41], ["music", 20.6]], [["music", 26.02], ["throbbing", 13.02], ["hum", 9.12]]], "duration": [2.47, 4.43, 2.99, 8.67, 31.79, 0.6, 6.55, 0.56, 0.84, 5.26, 48.2, 6.48, 5.99]} \ No newline at end of file diff --git a/annotations_filtered/tCjohxqJ-0c_filtered.json b/annotations_filtered/tCjohxqJ-0c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..27a3930a2d1466d2fd45886da33a9e43f1c8095b --- /dev/null +++ b/annotations_filtered/tCjohxqJ-0c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 21.32], [21.0, 21.39], [22.0, 24.51], [32.0, 34.21], [36.0, 36.95], [40.0, 41.5], [43.0, 43.58], [46.0, 51.29], [54.0, 56.51], [59.0, 66.83], [71.0, 95.23], [96.0, 96.13], [97.0, 108.51], [110.0, 116.95], [121.0, 122.32]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.15, 0.0, 29.48, 29.9, 0.0, 0.0, 0.0, 29.58, 29.79, 29.13, 29.01, 0.0, 29.02, 29.15, 0.0], "audiomae_on_audioset": [[["music", 71.79], ["musical instrument", 3.05], ["echo", 2.69]], null, [["music", 32.17], ["echo", 17.66], ["drum and bass", 5.64]], [["music", 70.6], ["musical instrument", 4.6], ["echo", 4.44]], null, null, null, [["music", 76.27], ["musical instrument", 4.59], ["didgeridoo", 3.7]], [["clarinet", 35.93], ["music", 29.22], ["steelpan", 10.32]], [["music", 82.44], ["musical instrument", 3.36], ["music of latin america", 1.55]], [["music", 86.53], ["glockenspiel", 0.96], ["marimba, xylophone", 0.85]], null, [["music", 56.92], ["theremin", 21.41], ["musical instrument", 6.28]], [["music", 72.19], ["musical instrument", 8.78], ["echo", 1.72]], null], "duration": [15.32, 0.39, 2.51, 2.21, 0.95, 1.5, 0.58, 5.29, 2.51, 7.83, 24.23, 0.13, 11.51, 6.95, 1.32]} \ No newline at end of file diff --git a/annotations_filtered/tCtZfBVS1Tg_filtered.json b/annotations_filtered/tCtZfBVS1Tg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d5be91ebc00ea68b50ac0f75c16d4f0615d1bc1b --- /dev/null +++ b/annotations_filtered/tCtZfBVS1Tg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.08], [20.0, 19.63], [23.0, 23.6], [26.0, 27.11], [32.0, 39.33], [44.0, 47.01], [52.0, 56.2], [58.0, 60.34], [62.0, 64.27], [69.0, 75.03], [76.0, 77.19], [78.0, 79.88], [82.0, 83.49], [85.0, 87.4], [89.0, 90.34], [91.0, 104.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 98.44, 97.83, 99.99, 96.54, 99.1, 99.36, 0.0, 0.0, 0.0, 100.0, 0.0, 42.3], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 28.31], ["rumble", 18.23], ["mains hum", 8.46]]], "duration": [0.08, -0.37, 0.6, 1.11, 7.33, 3.01, 4.2, 2.34, 2.27, 6.03, 1.19, 1.88, 1.49, 2.4, 1.34, 13.65]} \ No newline at end of file diff --git a/annotations_filtered/tD3vc9KZ9lQ_filtered.json b/annotations_filtered/tD3vc9KZ9lQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6266c833b6f64f65f45bdf5a81e0e2055666038e --- /dev/null +++ b/annotations_filtered/tD3vc9KZ9lQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 12.07], [19.0, 35.77], [36.0, 37.07], [39.0, 39.33], [42.0, 43.53], [45.0, 100.45], [104.0, 104.87]], "keep_status": [false, true, false, false, false, false, false], "silence_prob": [74.13, 42.69, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 24.17], ["hum", 18.49], ["mains hum", 10.04]], null, null, null, null, null], "duration": [9.07, 16.77, 1.07, 0.33, 1.53, 55.45, 0.87]} \ No newline at end of file diff --git a/annotations_filtered/tD8f4Xk30bg_filtered.json b/annotations_filtered/tD8f4Xk30bg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c82b590785a32417bb3a477c24fc0899bc96adaa --- /dev/null +++ b/annotations_filtered/tD8f4Xk30bg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.01], [15.0, 15.62], [23.0, 22.94], [70.0, 70.68], [79.0, 80.15], [82.0, 82.21], [83.0, 83.61], [84.0, 85.36], [86.0, 91.2]], "keep_status": [false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.48], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 28.4], ["speech", 16.8], ["explosion", 7.43]]], "duration": [1.01, 0.62, -0.06, 0.68, 1.15, 0.21, 0.61, 1.36, 5.2]} \ No newline at end of file diff --git a/annotations_filtered/tD9DfbbK6OE_filtered.json b/annotations_filtered/tD9DfbbK6OE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8bb228c7ff5a24e93f21bfae9d82d18d69dc987 --- /dev/null +++ b/annotations_filtered/tD9DfbbK6OE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.74], [8.0, 11.04], [14.0, 14.1], [19.0, 25.05], [26.0, 26.52], [27.0, 53.5], [55.0, 55.04], [59.0, 76.37], [80.0, 87.27], [89.0, 89.38], [91.0, 95.93], [99.0, 119.33], [121.0, 121.37], [121.0, 139.8], [142.0, 142.87], [148.0, 154.68], [156.0, 163.36], [165.0, 166.04]], "keep_status": [false, true, false, false, false, false, false, true, false, false, true, true, false, true, false, false, true, false], "silence_prob": [0.0, 47.54, 0.0, 64.18, 0.0, 40.28, 0.0, 31.97, 31.59, 0.0, 34.46, 34.93, 0.0, 32.74, 0.0, 38.59, 46.29, 0.0], "audiomae_on_audioset": [null, [["whale vocalization", 25.78], ["theremin", 20.74], ["animal", 8.01]], null, null, null, [["music", 51.61], ["theremin", 23.16], ["musical instrument", 4.95]], null, [["music", 46.54], ["theremin", 15.74], ["animal", 3.88]], [["speech", 51.39], ["music", 22.18], ["whale vocalization", 1.84]], null, [["music", 34.22], ["speech", 17.53], ["theremin", 11.39]], [["bee, wasp, etc.", 16.71], ["animal", 14.26], ["music", 13.43]], null, [["music", 48.91], ["theremin", 13.2], ["animal", 4.26]], null, [["music", 39.84], ["theremin", 20.55], ["speech", 9.72]], [["music", 47.14], ["theremin", 5.35], ["speech", 5.18]], null], "duration": [0.74, 3.04, 0.1, 6.05, 0.52, 26.5, 0.04, 17.37, 7.27, 0.38, 4.93, 20.33, 0.37, 18.8, 0.87, 6.68, 7.36, 1.04]} \ No newline at end of file diff --git a/annotations_filtered/tDD6wnNN-IQ_filtered.json b/annotations_filtered/tDD6wnNN-IQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3712bf39fdd629f1ac7b4d0b8b9232f94a5e722b --- /dev/null +++ b/annotations_filtered/tDD6wnNN-IQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 31.26], [32.0, 33.57], [34.0, 36.36], [37.0, 37.72], [38.0, 38.35], [39.0, 40.68], [41.0, 42.08], [42.0, 43.39], [44.0, 45.37], [54.0, 57.91], [61.0, 62.68], [72.0, 75.15], [78.0, 78.58], [81.0, 82.16], [85.0, 84.94], [88.0, 89.21], [92.0, 92.45], [95.0, 95.42], [102.0, 102.91], [115.0, 117.81]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [54.17, 0.0, 52.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.83, 0.0, 32.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.55], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 32.95], ["inside, small room", 17.74], ["cough", 5.19]], null, [["speech", 41.62], ["radio", 7.01], ["whack, thwack", 6.46]], null, null, null, null, null, null, null, [["speech", 44.2], ["beatboxing", 25.69], ["radio", 2.44]]], "duration": [3.26, 1.57, 2.36, 0.72, 0.35, 1.68, 1.08, 1.39, 1.37, 3.91, 1.68, 3.15, 0.58, 1.16, -0.06, 1.21, 0.45, 0.42, 0.91, 2.81]} \ No newline at end of file diff --git a/annotations_filtered/tDW4X-r1dQI_filtered.json b/annotations_filtered/tDW4X-r1dQI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5801a02a801af1d2cdfbfcce41cb28407b1724d4 --- /dev/null +++ b/annotations_filtered/tDW4X-r1dQI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.45], [16.0, 25.27], [35.0, 49.23], [73.0, 92.45], [101.0, 110.08], [115.0, 115.21], [116.0, 115.75], [117.0, 129.95]], "keep_status": [false, true, true, false, true, false, false, true], "silence_prob": [0.0, 32.37, 30.79, 29.54, 34.03, 0.0, 0.0, 30.96], "audiomae_on_audioset": [null, [["music", 32.87], ["speech", 10.26], ["vehicle", 7.92]], [["music", 48.36], ["speech", 5.84], ["animal", 4.74]], [["livestock, farm animals, working animals", 31.67], ["moo", 26.64], ["cattle, bovinae", 21.13]], [["hum", 17.04], ["speech", 15.11], ["music", 9.43]], null, null, [["cattle, bovinae", 12.46], ["livestock, farm animals, working animals", 11.42], ["speech", 11.41]]], "duration": [0.45, 9.27, 14.23, 19.45, 9.08, 0.21, -0.25, 12.95]} \ No newline at end of file diff --git a/annotations_filtered/tDWQvA6IhG8_filtered.json b/annotations_filtered/tDWQvA6IhG8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a31d5c74ce01a2e80f38a48eb08553bc4c497d0 --- /dev/null +++ b/annotations_filtered/tDWQvA6IhG8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.81], [9.0, 10.18], [11.0, 11.1], [12.0, 24.97], [26.0, 26.97], [27.0, 78.48], [79.0, 80.3]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [50.66, 0.0, 0.0, 36.56, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 57.23], ["theremin", 10.36], ["ambient music", 4.09]], null, null, null], "duration": [3.81, 1.18, 0.1, 12.97, 0.97, 51.48, 1.3]} \ No newline at end of file diff --git a/annotations_filtered/tDlL6QWvKNk_filtered.json b/annotations_filtered/tDlL6QWvKNk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c78de0a007f14811caa5f7e9a397cc01315bf383 --- /dev/null +++ b/annotations_filtered/tDlL6QWvKNk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.23], [12.0, 13.19], [14.0, 14.81], [16.0, 16.41], [21.0, 22.86], [24.0, 24.75], [27.0, 27.51], [29.0, 29.76], [31.0, 32.09], [37.0, 42.63], [43.0, 44.29], [46.0, 46.4], [48.0, 49.99], [53.0, 53.49], [54.0, 54.63], [60.0, 60.59], [61.0, 61.94], [63.0, 63.37], [64.0, 65.3], [66.0, 67.02], [68.0, 74.07], [75.0, 76.57], [79.0, 80.25], [81.0, 81.46], [83.0, 83.12], [83.0, 85.67], [86.0, 89.14], [90.0, 93.61], [95.0, 95.39], [98.0, 99.96], [102.0, 103.44], [104.0, 104.3], [105.0, 105.44], [106.0, 123.65], [124.0, 124.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 62.27, 83.7, 79.07, 0.0, 0.0, 0.0, 0.0, 0.0, 54.5, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.23, 1.19, 0.81, 0.41, 1.86, 0.75, 0.51, 0.76, 1.09, 5.63, 1.29, 0.4, 1.99, 0.49, 0.63, 0.59, 0.94, 0.37, 1.3, 1.02, 6.07, 1.57, 1.25, 0.46, 0.12, 2.67, 3.14, 3.61, 0.39, 1.96, 1.44, 0.3, 0.44, 17.65, 0.9]} \ No newline at end of file diff --git a/annotations_filtered/tDpyGID-qHI_filtered.json b/annotations_filtered/tDpyGID-qHI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4b216caec46edad359699f2dc6b5a2b81d020a2e --- /dev/null +++ b/annotations_filtered/tDpyGID-qHI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.34], [11.0, 12.73], [14.0, 15.31], [16.0, 15.96], [19.0, 20.04], [21.0, 21.27], [23.0, 23.4], [25.0, 28.0], [29.0, 29.74], [36.0, 36.9], [39.0, 38.91], [40.0, 41.25], [45.0, 45.23], [46.0, 46.03], [51.0, 50.85], [51.0, 51.22], [52.0, 52.68], [54.0, 54.63], [56.0, 57.23], [58.0, 58.51], [60.0, 61.8], [62.0, 63.59], [69.0, 69.43], [70.0, 70.43], [71.0, 71.47], [73.0, 74.16], [75.0, 75.29], [75.0, 75.76], [77.0, 77.09], [77.0, 78.41], [79.0, 80.81], [81.0, 83.51], [89.0, 89.82], [93.0, 94.39], [96.0, 98.2], [101.0, 101.51], [104.0, 104.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.36, 0.0, 0.0, 99.99, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.34, 1.73, 1.31, -0.04, 1.04, 0.27, 0.4, 3.0, 0.74, 0.9, -0.09, 1.25, 0.23, 0.03, -0.15, 0.22, 0.68, 0.63, 1.23, 0.51, 1.8, 1.59, 0.43, 0.43, 0.47, 1.16, 0.29, 0.76, 0.09, 1.41, 1.81, 2.51, 0.82, 1.39, 2.2, 0.51, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/tEWLG9sG1VM_filtered.json b/annotations_filtered/tEWLG9sG1VM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70ff86d91020127be1ec98c90b7165c1052c6bac --- /dev/null +++ b/annotations_filtered/tEWLG9sG1VM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.41], [13.0, 13.56], [14.0, 17.05], [18.0, 19.36], [21.0, 99.64], [101.0, 101.58], [104.0, 104.75]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.4, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [1.41, 0.56, 3.05, 1.36, 78.64, 0.58, 0.75]} \ No newline at end of file diff --git a/annotations_filtered/tEs0OuspG4w_filtered.json b/annotations_filtered/tEs0OuspG4w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..984de5b8d43a1d7383f76925715362525cd3712a --- /dev/null +++ b/annotations_filtered/tEs0OuspG4w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[47.0, 54.8], [55.0, 59.63], [61.0, 61.32], [63.0, 67.39], [68.0, 68.49], [69.0, 71.19], [73.0, 73.14], [76.0, 83.94], [97.0, 97.01], [97.0, 97.5], [103.0, 109.56], [111.0, 128.24], [136.0, 141.13], [146.0, 148.29]], "keep_status": [false, false, false, true, false, false, false, false, false, false, true, true, true, true], "silence_prob": [90.43, 52.98, 0.0, 37.81, 0.0, 53.16, 0.0, 31.68, 0.0, 0.0, 28.13, 28.94, 28.32, 29.05], "audiomae_on_audioset": [null, null, null, [["whale vocalization", 17.31], ["frog", 13.63], ["music", 12.16]], null, null, null, [["music", 55.53], ["thunk", 9.64], ["thump, thud", 6.44]], null, null, [["sheep", 17.65], ["speech", 16.24], ["groan", 13.22]], [["hum", 36.21], ["music", 12.28], ["whale vocalization", 11.41]], [["speech", 30.1], ["music", 17.54], ["animal", 4.65]], [["music", 31.58], ["didgeridoo", 19.2], ["throbbing", 4.09]]], "duration": [7.8, 4.63, 0.32, 4.39, 0.49, 2.19, 0.14, 7.94, 0.01, 0.5, 6.56, 17.24, 5.13, 2.29]} \ No newline at end of file diff --git a/annotations_filtered/tEyY-ijoyaQ_filtered.json b/annotations_filtered/tEyY-ijoyaQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc82089faa0af5921513ea1b981257d04629253c --- /dev/null +++ b/annotations_filtered/tEyY-ijoyaQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.94], [9.0, 9.96], [10.0, 11.18], [14.0, 14.37], [15.0, 16.58], [18.0, 18.42], [19.0, 21.81], [23.0, 23.55], [24.0, 24.51], [32.0, 33.59], [34.0, 35.83], [38.0, 41.03], [62.0, 83.22], [84.0, 87.44], [89.0, 89.56], [94.0, 96.26], [98.0, 98.78], [100.0, 100.21], [101.0, 100.85], [104.0, 105.26], [110.0, 110.1], [110.0, 111.94], [115.0, 116.82], [118.0, 118.56], [120.0, 120.61], [122.0, 122.62], [124.0, 125.19], [126.0, 134.45], [135.0, 141.34], [142.0, 144.71], [148.0, 149.0], [150.0, 151.17], [152.0, 155.02], [157.0, 161.42], [165.0, 167.49], [170.0, 175.83], [178.0, 178.77], [180.0, 185.41], [187.0, 189.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.71, 0.0, 0.0, 0.0, 0.0, 41.64, 43.1, 43.15, 0.0, 34.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.18, 51.18, 59.68, 0.0, 0.0, 53.97, 71.14, 70.86, 55.04, 0.0, 82.79, 73.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 59.56], ["beatboxing", 8.75], ["vocal music", 5.71]], [["music", 13.32], ["speech", 12.15], ["beatboxing", 9.66]], [["music", 72.08], ["didgeridoo", 6.07], ["bass guitar", 4.68]], null, [["sidetone", 41.55], ["speech", 25.54], ["mains hum", 5.26]], null, null, null, null, null, null, null, null, null, null, null, [["music", 42.73], ["synthesizer", 7.52], ["singing bowl", 5.77]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.94, 0.96, 1.18, 0.37, 1.58, 0.42, 2.81, 0.55, 0.51, 1.59, 1.83, 3.03, 21.22, 3.44, 0.56, 2.26, 0.78, 0.21, -0.15, 1.26, 0.1, 1.94, 1.82, 0.56, 0.61, 0.62, 1.19, 8.45, 6.34, 2.71, 1.0, 1.17, 3.02, 4.42, 2.49, 5.83, 0.77, 5.41, 2.78]} \ No newline at end of file diff --git a/annotations_filtered/tF3eceBqcik_filtered.json b/annotations_filtered/tF3eceBqcik_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f2c6c0a1c4511907ea92dff25e8aa167de0a339d --- /dev/null +++ b/annotations_filtered/tF3eceBqcik_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.49], [4.0, 4.56], [5.0, 5.66], [6.0, 8.41], [13.0, 13.53], [15.0, 16.56], [27.0, 27.14], [38.0, 38.25], [49.0, 51.48], [52.0, 53.87], [64.0, 64.81], [82.0, 82.54], [83.0, 84.1], [87.0, 87.25], [88.0, 91.23], [92.0, 92.92], [96.0, 97.68], [114.0, 115.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 51.66, 0.0, 0.0, 0.0, 0.0, 75.88, 0.0, 0.0, 0.0, 0.0, 0.0, 45.4, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 43.16], ["music", 10.75], ["whale vocalization", 2.15]], null, null, null], "duration": [0.49, 0.56, 0.66, 2.41, 0.53, 1.56, 0.14, 0.25, 2.48, 1.87, 0.81, 0.54, 1.1, 0.25, 3.23, 0.92, 1.68, 1.62]} \ No newline at end of file diff --git a/annotations_filtered/tF6XBuvWdPs_filtered.json b/annotations_filtered/tF6XBuvWdPs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6694707a3ad8ad3ef2a073f48ee71126124d276c --- /dev/null +++ b/annotations_filtered/tF6XBuvWdPs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.32], [5.0, 5.75], [9.0, 8.85], [11.0, 11.57], [16.0, 16.34], [18.0, 17.95], [22.0, 22.05], [23.0, 23.28], [25.0, 25.05], [29.0, 29.2], [32.0, 32.78], [34.0, 34.38], [38.0, 38.85], [40.0, 41.15], [43.0, 43.56], [46.0, 46.4], [54.0, 54.06], [55.0, 56.02], [57.0, 58.68], [62.0, 62.07], [64.0, 63.75], [68.0, 69.65], [74.0, 74.06], [77.0, 78.88], [84.0, 84.77], [86.0, 86.0], [90.0, 91.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.32, 0.75, -0.15, 0.57, 0.34, -0.05, 0.05, 0.28, 0.05, 0.2, 0.78, 0.38, 0.85, 1.15, 0.56, 0.4, 0.06, 1.02, 1.68, 0.07, -0.25, 1.65, 0.06, 1.88, 0.77, 0.0, 1.08]} \ No newline at end of file diff --git a/annotations_filtered/tFAX4TdV6ak_filtered.json b/annotations_filtered/tFAX4TdV6ak_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..20e2c09ac790bc7e2d79cb0e023531a6925432f3 --- /dev/null +++ b/annotations_filtered/tFAX4TdV6ak_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.08], [8.0, 10.56], [12.0, 14.74], [17.0, 19.67], [23.0, 26.35], [29.0, 30.92], [32.0, 34.91], [36.0, 38.52], [41.0, 42.74], [43.0, 49.17], [49.0, 50.77], [52.0, 55.97], [57.0, 65.64], [67.0, 68.88], [70.0, 72.96], [74.0, 75.64], [77.0, 82.38], [83.0, 99.59], [100.0, 114.37], [115.0, 124.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 68.67, 95.78, 99.95, 99.97, 0.0, 99.16, 94.66, 0.0, 96.42, 0.0, 99.36, 99.26, 0.0, 95.37, 0.0, 77.53, 98.66, 95.23, 97.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.08, 2.56, 2.74, 2.67, 3.35, 1.92, 2.91, 2.52, 1.74, 6.17, 1.77, 3.97, 8.64, 1.88, 2.96, 1.64, 5.38, 16.59, 14.37, 9.43]} \ No newline at end of file diff --git a/annotations_filtered/tFBSGc3v7BI_filtered.json b/annotations_filtered/tFBSGc3v7BI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a03f6d7257e3d3301c5a5c62a31e1b37fd09d945 --- /dev/null +++ b/annotations_filtered/tFBSGc3v7BI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.57], [4.0, 4.8], [6.0, 7.74], [9.0, 9.21], [14.0, 17.27], [20.0, 25.22], [26.0, 27.16], [29.0, 30.77], [35.0, 35.5], [36.0, 38.28], [40.0, 41.3], [48.0, 49.89], [56.0, 56.59], [61.0, 60.67], [67.0, 67.22], [70.0, 70.04], [78.0, 80.18], [83.0, 83.81], [86.0, 87.29], [96.0, 97.21], [124.0, 125.27], [128.0, 128.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 87.55, 97.64, 0.0, 0.0, 0.0, 65.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.96, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.57, 0.8, 1.74, 0.21, 3.27, 5.22, 1.16, 1.77, 0.5, 2.28, 1.3, 1.89, 0.59, -0.33, 0.22, 0.04, 2.18, 0.81, 1.29, 1.21, 1.27, 0.97]} \ No newline at end of file diff --git a/annotations_filtered/tFEKMdUMjEk_filtered.json b/annotations_filtered/tFEKMdUMjEk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..809dd77e041df8479d052120f1342c3ad7c6bfd0 --- /dev/null +++ b/annotations_filtered/tFEKMdUMjEk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.6], [10.0, 12.6], [15.0, 17.58], [22.0, 22.67], [26.0, 27.94], [29.0, 31.11], [33.0, 35.4], [42.0, 42.43], [43.0, 43.48], [44.0, 47.07], [50.0, 51.83], [53.0, 55.04], [55.0, 59.39], [60.0, 64.29], [65.0, 68.77], [70.0, 74.26], [75.0, 87.2], [87.0, 118.98], [120.0, 122.12], [123.0, 128.73], [129.0, 133.81]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 52.05, 100.0, 0.0, 0.0, 100.0, 64.07, 0.0, 0.0, 99.87, 0.0, 38.87, 66.63, 78.55, 59.42, 84.25, 49.45, 0.0, 41.42, 37.3, 31.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 72.06], ["sidetone", 3.85], ["hum", 3.09]], null, null, null, null, [["speech", 27.3], ["singing bowl", 25.55], ["music", 15.82]], null, [["music", 32.24], ["theremin", 27.83], ["ambient music", 11.94]], [["music", 48.39], ["theremin", 14.38], ["synthesizer", 6.54]], [["music", 36.65], ["speech", 33.48], ["foghorn", 9.94]]], "duration": [0.6, 2.6, 2.58, 0.67, 1.94, 2.11, 2.4, 0.43, 0.48, 3.07, 1.83, 2.04, 4.39, 4.29, 3.77, 4.26, 12.2, 31.98, 2.12, 5.73, 4.81]} \ No newline at end of file diff --git a/annotations_filtered/tFeew6TgM8w_filtered.json b/annotations_filtered/tFeew6TgM8w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8c552b006ddcfe2a7b93246e5758903c2f330f0e --- /dev/null +++ b/annotations_filtered/tFeew6TgM8w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.81], [23.0, 23.14], [24.0, 24.78], [30.0, 30.55], [31.0, 35.31], [39.0, 44.46], [46.0, 47.06], [50.0, 62.43], [65.0, 83.37], [85.0, 95.55]], "keep_status": [false, false, false, false, false, true, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.05, 30.99, 0.0, 31.59, 30.24, 30.42], "audiomae_on_audioset": [null, null, null, null, [["speech", 67.94], ["music", 9.22], ["hum", 3.1]], [["music", 60.33], ["speech", 4.02], ["whack, thwack", 3.65]], null, [["hum", 31.44], ["mains hum", 27.35], ["music", 12.45]], [["speech", 34.53], ["music", 22.54], ["thump, thud", 5.86]], [["music", 28.66], ["hum", 19.43], ["throbbing", 7.04]]], "duration": [0.81, 0.14, 0.78, 0.55, 4.31, 5.46, 1.06, 12.43, 18.37, 10.55]} \ No newline at end of file diff --git a/annotations_filtered/tFkpixS3QZQ_filtered.json b/annotations_filtered/tFkpixS3QZQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..442028d46aa8588cfd5d61050e73381b7d435ac9 --- /dev/null +++ b/annotations_filtered/tFkpixS3QZQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[39.0, 40.9], [44.0, 54.99], [55.0, 57.64], [62.0, 89.67], [90.0, 90.96], [91.0, 100.36], [101.0, 102.15], [103.0, 103.44], [104.0, 117.14], [126.0, 126.84], [129.0, 130.25]], "keep_status": [false, true, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 31.41, 41.42, 32.01, 0.0, 33.81, 0.0, 0.0, 37.81, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 41.63], ["speech", 6.85], ["hum", 4.08]], [["music", 56.83], ["ambient music", 14.81], ["scary music", 13.34]], [["music", 71.25], ["scary music", 10.16], ["hum", 6.08]], null, [["mains hum", 37.41], ["hum", 35.89], ["speech", 11.74]], null, null, [["music", 42.23], ["electronic music", 10.48], ["hum", 7.9]], null, null], "duration": [1.9, 10.99, 2.64, 27.67, 0.96, 9.36, 1.15, 0.44, 13.14, 0.84, 1.25]} \ No newline at end of file diff --git a/annotations_filtered/tG1crFI87ro_filtered.json b/annotations_filtered/tG1crFI87ro_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f19c9891b7625b05080f9a61af0a48019a30ec8d --- /dev/null +++ b/annotations_filtered/tG1crFI87ro_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.65], [5.0, 11.38], [18.0, 18.57], [21.0, 21.3], [22.0, 23.11], [28.0, 28.86], [32.0, 40.39], [44.0, 49.06], [52.0, 59.31], [60.0, 86.41], [91.0, 95.44], [98.0, 97.87], [98.0, 98.32], [100.0, 100.3], [101.0, 103.11], [104.0, 105.19], [107.0, 107.99], [116.0, 115.79], [128.0, 128.26], [138.0, 142.11], [143.0, 145.03], [148.0, 148.95], [150.0, 150.92], [156.0, 156.42], [162.0, 164.54], [166.0, 167.27], [170.0, 170.24], [172.0, 172.47], [174.0, 176.49]], "keep_status": [true, true, false, false, false, false, true, true, false, true, false, false, false, false, false, false, false, false, false, true, true, false, false, false, true, false, false, false, false], "silence_prob": [33.73, 34.16, 0.0, 0.0, 0.0, 0.0, 29.94, 28.55, 31.31, 34.89, 31.7, 0.0, 0.0, 0.0, 40.86, 0.0, 0.0, 0.0, 0.0, 32.61, 31.92, 0.0, 0.0, 0.0, 35.41, 0.0, 0.0, 0.0, 64.07], "audiomae_on_audioset": [[["music", 44.25], ["theremin", 10.42], ["clarinet", 4.57]], [["music", 37.22], ["hum", 15.31], ["speech", 12.01]], null, null, null, null, [["fly, housefly", 13.34], ["mains hum", 8.95], ["boat, water vehicle", 8.74]], [["speech", 48.16], ["music", 7.39], ["foghorn", 4.41]], [["livestock, farm animals, working animals", 46.75], ["cattle, bovinae", 30.08], ["moo", 10.36]], [["cattle, bovinae", 21.76], ["livestock, farm animals, working animals", 15.73], ["moo", 14.41]], [["music", 40.89], ["throbbing", 34.32], ["hum", 9.94]], null, null, null, [["throbbing", 58.42], ["music", 22.78], ["hum", 5.85]], null, null, null, null, [["cattle, bovinae", 29.98], ["moo", 19.3], ["livestock, farm animals, working animals", 13.93]], [["speech", 29.43], ["sidetone", 12.51], ["boing", 6.64]], null, null, null, [["hum", 31.5], ["speech", 14.61], ["throbbing", 6.31]], null, null, null, null], "duration": [2.65, 6.38, 0.57, 0.3, 1.11, 0.86, 8.39, 5.06, 7.31, 26.41, 4.44, -0.13, 0.32, 0.3, 2.11, 1.19, 0.99, -0.21, 0.26, 4.11, 2.03, 0.95, 0.92, 0.42, 2.54, 1.27, 0.24, 0.47, 2.49]} \ No newline at end of file diff --git a/annotations_filtered/tG2qsoC_-hs_filtered.json b/annotations_filtered/tG2qsoC_-hs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..894a4ea9055aa1eaf025c474a1c56c44f048d5e3 --- /dev/null +++ b/annotations_filtered/tG2qsoC_-hs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.62], [8.0, 12.85], [14.0, 16.04], [17.0, 26.33], [27.0, 27.38], [28.0, 28.05], [29.0, 29.96], [32.0, 32.83], [38.0, 40.26], [43.0, 43.97], [47.0, 47.8], [49.0, 49.25], [52.0, 52.61], [58.0, 58.31], [61.0, 61.79], [65.0, 66.24], [76.0, 76.23], [82.0, 82.51], [84.0, 84.52], [86.0, 86.07], [93.0, 93.36], [103.0, 102.98], [106.0, 109.24], [110.0, 111.06], [113.0, 113.02], [120.0, 120.43], [124.0, 124.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 99.73, 99.4, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.92, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.62, 4.85, 2.04, 9.33, 0.38, 0.05, 0.96, 0.83, 2.26, 0.97, 0.8, 0.25, 0.61, 0.31, 0.79, 1.24, 0.23, 0.51, 0.52, 0.07, 0.36, -0.02, 3.24, 1.06, 0.02, 0.43, 0.24]} \ No newline at end of file diff --git a/annotations_filtered/tGDO-9hfaiI_filtered.json b/annotations_filtered/tGDO-9hfaiI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a2f24cac8657cd4a6f7c9da7eda1c9213cb929ee --- /dev/null +++ b/annotations_filtered/tGDO-9hfaiI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.58], [6.0, 6.4], [7.0, 8.53], [9.0, 11.82], [12.0, 16.5], [20.0, 20.82], [25.0, 26.4], [27.0, 27.09], [29.0, 28.81], [36.0, 36.02], [38.0, 38.82], [46.0, 46.06], [55.0, 55.93], [57.0, 57.65], [58.0, 59.43], [62.0, 61.96], [63.0, 64.03], [65.0, 65.21], [68.0, 68.44], [76.0, 75.84], [78.0, 78.68], [80.0, 80.35], [82.0, 82.0], [84.0, 83.91], [85.0, 85.83], [90.0, 89.73]], "keep_status": [false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.78, 33.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 28.98], ["rowboat, canoe, kayak", 14.49], ["vehicle", 7.18]], [["livestock, farm animals, working animals", 24.47], ["cattle, bovinae", 16.56], ["speech", 11.73]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.58, 0.4, 1.53, 2.82, 4.5, 0.82, 1.4, 0.09, -0.19, 0.02, 0.82, 0.06, 0.93, 0.65, 1.43, -0.04, 1.03, 0.21, 0.44, -0.16, 0.68, 0.35, 0.0, -0.09, 0.83, -0.27]} \ No newline at end of file diff --git a/annotations_filtered/tGNBdjVO04Y_filtered.json b/annotations_filtered/tGNBdjVO04Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..311f75a1386ecd59c65d75cdd56caeeb4d0e678c --- /dev/null +++ b/annotations_filtered/tGNBdjVO04Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.21], [5.0, 5.83], [7.0, 8.28], [11.0, 23.08], [24.0, 23.94], [35.0, 37.74], [38.0, 38.74], [39.0, 40.27], [44.0, 44.02], [46.0, 46.3], [51.0, 52.14], [55.0, 55.59], [59.0, 60.18], [68.0, 70.36], [71.0, 72.05], [78.0, 79.49], [82.0, 82.39], [88.0, 88.28], [89.0, 94.31], [96.0, 96.15], [97.0, 98.58], [101.0, 101.66], [104.0, 107.64]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 29.29, 0.0, 47.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.36, 0.0, 0.0, 0.0, 0.0, 50.51, 0.0, 0.0, 0.0, 56.25], "audiomae_on_audioset": [null, null, null, [["music", 53.73], ["effects unit", 11.51], ["musical instrument", 5.68]], null, [["music", 46.87], ["hum", 10.4], ["synthesizer", 7.27]], null, null, null, null, null, null, null, [["hum", 43.42], ["mains hum", 43.4], ["throbbing", 2.46]], null, null, null, null, null, null, null, null, null], "duration": [1.21, 0.83, 1.28, 12.08, -0.06, 2.74, 0.74, 1.27, 0.02, 0.3, 1.14, 0.59, 1.18, 2.36, 1.05, 1.49, 0.39, 0.28, 5.31, 0.15, 1.58, 0.66, 3.64]} \ No newline at end of file diff --git a/annotations_filtered/tGYc5woadps_filtered.json b/annotations_filtered/tGYc5woadps_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..845e2aedac28ff1dd61477970a062e2258a18710 --- /dev/null +++ b/annotations_filtered/tGYc5woadps_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.97], [3.0, 4.04], [6.0, 8.04], [10.0, 11.48], [12.0, 13.66], [16.0, 16.33], [17.0, 18.6], [20.0, 20.16], [21.0, 22.5], [24.0, 25.14], [27.0, 27.38], [31.0, 33.12], [35.0, 36.49], [38.0, 38.7], [40.0, 42.2], [43.0, 45.23], [48.0, 50.19], [52.0, 52.14], [53.0, 54.68], [56.0, 56.76], [57.0, 58.46], [60.0, 62.87], [65.0, 65.67], [67.0, 68.81], [70.0, 71.24], [72.0, 74.61], [76.0, 77.77], [80.0, 81.77], [84.0, 83.86], [88.0, 88.74], [93.0, 95.57], [97.0, 99.6], [103.0, 105.43], [107.0, 107.84], [109.0, 109.81], [112.0, 114.59], [116.0, 115.97], [118.0, 120.33], [123.0, 124.07], [126.0, 128.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 53.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.22, 0.0, 0.0, 98.99, 57.89, 99.88, 0.0, 0.0, 0.0, 0.0, 94.81, 0.0, 0.0, 0.0, 97.33, 0.0, 0.0, 0.0, 0.0, 75.07, 42.53, 97.83, 0.0, 0.0, 99.9, 0.0, 99.62, 0.0, 99.44], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 49.3], ["tuning fork", 12.51], ["sidetone", 6.21]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 43.76], ["cattle, bovinae", 4.68], ["moo", 4.33]], null, null, null, null, null, null, null, null], "duration": [0.97, 1.04, 2.04, 1.48, 1.66, 0.33, 1.6, 0.16, 1.5, 1.14, 0.38, 2.12, 1.49, 0.7, 2.2, 2.23, 2.19, 0.14, 1.68, 0.76, 1.46, 2.87, 0.67, 1.81, 1.24, 2.61, 1.77, 1.77, -0.14, 0.74, 2.57, 2.6, 2.43, 0.84, 0.81, 2.59, -0.03, 2.33, 1.07, 2.48]} \ No newline at end of file diff --git a/annotations_filtered/tGg3h7NtiXs_filtered.json b/annotations_filtered/tGg3h7NtiXs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b80c5149cd6034bfab87e890b5f280c5ed1ad6f --- /dev/null +++ b/annotations_filtered/tGg3h7NtiXs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 40.58], [44.0, 51.11]], "keep_status": [false, true], "silence_prob": [31.99, 46.12], "audiomae_on_audioset": [[["mains hum", 32.2], ["hum", 27.49], ["music", 11.91]], [["animal", 26.9], ["fart", 13.24], ["wild animals", 9.19]]], "duration": [15.58, 7.11]} \ No newline at end of file diff --git a/annotations_filtered/tGxxl7LOe_4_filtered.json b/annotations_filtered/tGxxl7LOe_4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..33d373fa4ce084989fba14297856954b257acf0c --- /dev/null +++ b/annotations_filtered/tGxxl7LOe_4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 6.88], [8.0, 24.88], [25.0, 25.93], [27.0, 27.7], [29.0, 28.98], [29.0, 30.13], [30.0, 30.94], [39.0, 40.54], [42.0, 48.68], [50.0, 59.66], [70.0, 69.87], [71.0, 86.98], [99.0, 98.83], [105.0, 104.94]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [68.15, 39.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.09, 39.0, 0.0, 45.49, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 39.49], ["speech", 21.12], ["mains hum", 8.32]], null, null, null, null, null, null, [["speech", 56.66], ["screaming", 12.44], ["groan", 4.93]], [["speech", 62.4], ["whack, thwack", 8.45], ["ping", 5.0]], null, [["music", 47.58], ["marimba, xylophone", 7.67], ["glockenspiel", 7.09]], null, null], "duration": [5.88, 16.88, 0.93, 0.7, -0.02, 1.13, 0.94, 1.54, 6.68, 9.66, -0.13, 15.98, -0.17, -0.06]} \ No newline at end of file diff --git a/annotations_filtered/tH4JJtuyLp4_filtered.json b/annotations_filtered/tH4JJtuyLp4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce350f0342f2ab6e9c3ef9df30ec13025ad9df75 --- /dev/null +++ b/annotations_filtered/tH4JJtuyLp4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.42], [27.0, 27.7]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [0.42, 0.7]} \ No newline at end of file diff --git a/annotations_filtered/tHHqfGeeXps_filtered.json b/annotations_filtered/tHHqfGeeXps_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9773dadc774fe89f24b34ac76f46992a0c4fab9f --- /dev/null +++ b/annotations_filtered/tHHqfGeeXps_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 17.39], [18.0, 18.76], [22.0, 27.89], [34.0, 34.79], [41.0, 41.3], [44.0, 46.01], [48.0, 49.77], [60.0, 60.42], [60.0, 60.45], [73.0, 75.49], [77.0, 77.11], [82.0, 87.79], [90.0, 90.26], [95.0, 98.05], [99.0, 99.82], [100.0, 105.56], [111.0, 111.5], [112.0, 112.24], [119.0, 119.38], [124.0, 124.63], [125.0, 127.43]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [31.6, 0.0, 38.3, 0.0, 0.0, 99.84, 0.0, 0.0, 0.0, 46.61, 0.0, 31.5, 0.0, 30.41, 0.0, 31.33, 0.0, 0.0, 0.0, 0.0, 31.13], "audiomae_on_audioset": [[["music", 41.14], ["speech", 6.2], ["throbbing", 5.81]], null, [["boing", 23.37], ["hum", 14.57], ["mains hum", 8.57]], null, null, null, null, null, null, [["chirp tone", 55.42], ["sine wave", 8.51], ["boing", 6.95]], null, [["music", 66.29], ["didgeridoo", 10.6], ["synthesizer", 4.1]], null, [["moo", 48.02], ["cattle, bovinae", 34.44], ["livestock, farm animals, working animals", 16.99]], null, [["moo", 20.3], ["cattle, bovinae", 14.99], ["speech", 12.35]], null, null, null, null, [["music", 65.24], ["guitar", 5.35], ["musical instrument", 3.23]]], "duration": [3.39, 0.76, 5.89, 0.79, 0.3, 2.01, 1.77, 0.42, 0.45, 2.49, 0.11, 5.79, 0.26, 3.05, 0.82, 5.56, 0.5, 0.24, 0.38, 0.63, 2.43]} \ No newline at end of file diff --git a/annotations_filtered/tHe6ar-X2cQ_filtered.json b/annotations_filtered/tHe6ar-X2cQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..930058bce51f9bbbedc7250a4733edc054fe0c26 --- /dev/null +++ b/annotations_filtered/tHe6ar-X2cQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.24], [8.0, 8.36], [10.0, 10.25], [11.0, 11.92], [15.0, 15.09], [22.0, 21.88], [26.0, 25.98], [29.0, 29.52], [30.0, 31.21], [32.0, 36.31], [37.0, 38.91], [43.0, 50.84], [52.0, 52.68], [54.0, 53.86], [55.0, 55.8], [57.0, 56.98], [60.0, 60.62], [62.0, 63.14], [65.0, 66.01], [67.0, 68.49], [70.0, 70.06], [70.0, 71.05], [72.0, 72.06], [73.0, 73.23], [76.0, 75.83], [82.0, 82.14], [93.0, 93.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [37.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.89, 0.0, 61.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["moo", 42.01], ["cattle, bovinae", 24.73], ["livestock, farm animals, working animals", 16.02]], null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 34.21], ["cattle, bovinae", 22.01], ["moo", 13.87]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.24, 0.36, 0.25, 0.92, 0.09, -0.12, -0.02, 0.52, 1.21, 4.31, 1.91, 7.84, 0.68, -0.14, 0.8, -0.02, 0.62, 1.14, 1.01, 1.49, 0.06, 1.05, 0.06, 0.23, -0.17, 0.14, 0.53]} \ No newline at end of file diff --git a/annotations_filtered/tIB4z4uMeNs_filtered.json b/annotations_filtered/tIB4z4uMeNs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4b715a6006434cae8776b2963af5411322338390 --- /dev/null +++ b/annotations_filtered/tIB4z4uMeNs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.91], [3.0, 5.39], [6.0, 7.89], [9.0, 9.1], [10.0, 13.85], [15.0, 19.85], [21.0, 23.94], [28.0, 28.46], [31.0, 31.33], [33.0, 34.13], [36.0, 36.98], [38.0, 39.6], [41.0, 44.24], [46.0, 45.94], [48.0, 50.4], [52.0, 52.44], [53.0, 53.47], [54.0, 55.44], [56.0, 56.84], [58.0, 58.73], [61.0, 61.42], [62.0, 62.75], [68.0, 73.55], [75.0, 77.97], [81.0, 81.51], [83.0, 83.44], [87.0, 88.26], [91.0, 92.06], [95.0, 95.67], [99.0, 99.44], [101.0, 101.56], [105.0, 107.55], [108.0, 109.65], [111.0, 113.51], [114.0, 114.86], [117.0, 117.07], [119.0, 120.14], [122.0, 122.91], [124.0, 124.39]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 85.17, 0.0, 0.0, 100.0, 39.0, 94.52, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 44.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.6, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 41.96], ["wind instrument, woodwind instrument", 7.5], ["effects unit", 4.81]], null, null, null, null, null, null, null, null, [["music", 60.15], ["musical instrument", 9.39], ["theremin", 7.02]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.09, 2.39, 1.89, 0.1, 3.85, 4.85, 2.94, 0.46, 0.33, 1.13, 0.98, 1.6, 3.24, -0.06, 2.4, 0.44, 0.47, 1.44, 0.84, 0.73, 0.42, 0.75, 5.55, 2.97, 0.51, 0.44, 1.26, 1.06, 0.67, 0.44, 0.56, 2.55, 1.65, 2.51, 0.86, 0.07, 1.14, 0.91, 0.39]} \ No newline at end of file diff --git a/annotations_filtered/tImxhYu2PG8_filtered.json b/annotations_filtered/tImxhYu2PG8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..076554f245f6bef00f1c7f369321f0f00e1d4a32 --- /dev/null +++ b/annotations_filtered/tImxhYu2PG8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.98], [3.0, 3.57], [5.0, 6.18], [7.0, 10.44], [12.0, 12.9], [14.0, 15.33], [17.0, 22.23], [24.0, 24.78], [26.0, 28.54], [30.0, 34.16], [35.0, 35.75], [36.0, 38.7], [39.0, 47.06], [49.0, 51.29], [52.0, 54.09], [55.0, 55.75], [58.0, 59.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 96.54, 0.0, 0.0, 97.22, 0.0, 61.67, 66.88, 0.0, 88.46, 80.82, 97.83, 64.97, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.98, 0.57, 1.18, 3.44, 0.9, 1.33, 5.23, 0.78, 2.54, 4.16, 0.75, 2.7, 8.06, 2.29, 2.09, 0.75, 1.29]} \ No newline at end of file diff --git a/annotations_filtered/tIy7sQGKtJA_filtered.json b/annotations_filtered/tIy7sQGKtJA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..51b1b9b3740d4cc1b68dcfeb8adb81254f82ce5d --- /dev/null +++ b/annotations_filtered/tIy7sQGKtJA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 22.6], [24.0, 58.38], [63.0, 64.02], [68.0, 79.24], [81.0, 81.36]], "keep_status": [false, false, false, false, false], "silence_prob": [37.19, 0.0, 0.0, 33.77, 0.0], "audiomae_on_audioset": [[["music", 57.1], ["speech", 11.02], ["whale vocalization", 5.33]], null, null, [["music", 50.43], ["speech", 16.0], ["mains hum", 7.27]], null], "duration": [10.6, 34.38, 1.02, 11.24, 0.36]} \ No newline at end of file diff --git a/annotations_filtered/tJ1uXsPXyao_filtered.json b/annotations_filtered/tJ1uXsPXyao_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b60751d33c4b3b537345249baa013078b962271d --- /dev/null +++ b/annotations_filtered/tJ1uXsPXyao_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [7.0, 11.7], [13.0, 16.51], [17.0, 18.01], [21.0, 22.27], [25.0, 26.94], [36.0, 44.9], [46.0, 51.66], [55.0, 65.26], [66.0, 78.04], [80.0, 81.73], [83.0, 85.29], [86.0, 88.57], [95.0, 95.52], [97.0, 99.33], [101.0, 102.9], [103.0, 108.48], [111.0, 112.21], [114.0, 114.86], [116.0, 145.86]], "keep_status": [false, false, true, false, false, false, true, true, false, false, false, true, false, false, true, false, true, false, false, false], "silence_prob": [0.0, 28.74, 29.38, 0.0, 0.0, 0.0, 28.8, 30.06, 30.33, 29.33, 0.0, 32.44, 30.5, 0.0, 32.75, 0.0, 29.23, 0.0, 0.0, 29.11], "audiomae_on_audioset": [null, [["speech", 64.76], ["explosion", 10.19], ["outside, rural or natural", 2.49]], [["speech", 32.84], ["music", 24.97], ["throbbing", 3.73]], null, null, null, [["music", 45.85], ["hum", 8.07], ["cacophony", 4.14]], [["speech", 21.07], ["hum", 19.57], ["whale vocalization", 18.06]], [["throbbing", 40.66], ["hum", 20.84], ["music", 19.15]], [["music", 54.86], ["throbbing", 15.35], ["hum", 13.45]], null, [["music", 32.39], ["speech", 26.56], ["musical instrument", 2.84]], [["cattle, bovinae", 46.21], ["moo", 39.6], ["livestock, farm animals, working animals", 13.51]], null, [["cattle, bovinae", 29.58], ["moo", 13.27], ["cowbell", 12.23]], null, [["vehicle", 21.81], ["speech", 21.72], ["motorboat, speedboat", 19.84]], null, null, [["hum", 34.97], ["mains hum", 27.57], ["music", 13.49]]], "duration": [0.5, 4.7, 3.51, 1.01, 1.27, 1.94, 8.9, 5.66, 10.26, 12.04, 1.73, 2.29, 2.57, 0.52, 2.33, 1.9, 5.48, 1.21, 0.86, 29.86]} \ No newline at end of file diff --git a/annotations_filtered/tJ4H77qrLjI_filtered.json b/annotations_filtered/tJ4H77qrLjI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..136699e331b10c3c59868dd4ee9cabc2f5011add --- /dev/null +++ b/annotations_filtered/tJ4H77qrLjI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 17.32], [21.0, 21.1], [22.0, 40.8], [53.0, 53.23], [56.0, 65.91], [67.0, 69.8], [72.0, 74.26], [78.0, 78.43], [81.0, 88.53], [98.0, 115.47], [118.0, 124.56], [125.0, 130.2], [133.0, 138.18], [140.0, 161.05]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, true, false, true], "silence_prob": [35.92, 0.0, 33.11, 0.0, 34.49, 34.78, 44.29, 0.0, 36.82, 35.66, 34.37, 35.0, 32.06, 32.49], "audiomae_on_audioset": [[["music", 57.92], ["didgeridoo", 8.28], ["synthesizer", 7.58]], null, [["speech", 47.33], ["music", 27.82], ["quack", 5.59]], null, [["speech", 42.34], ["music", 20.46], ["vehicle", 13.25]], [["music", 41.3], ["speech", 21.02], ["trombone", 7.79]], [["music", 61.6], ["musical instrument", 6.29], ["brass instrument", 3.25]], null, [["fly, housefly", 27.59], ["speech", 16.98], ["mosquito", 12.87]], [["speech", 54.28], ["music", 17.14], ["vehicle", 4.11]], [["speech", 62.78], ["aircraft", 9.88], ["vehicle", 6.6]], [["music", 47.79], ["trombone", 10.09], ["musical instrument", 6.56]], [["music", 46.65], ["speech", 31.29], ["musical instrument", 1.79]], [["music", 53.43], ["trombone", 6.57], ["brass instrument", 3.78]]], "duration": [9.32, 0.1, 18.8, 0.23, 9.91, 2.8, 2.26, 0.43, 7.53, 17.47, 6.56, 5.2, 5.18, 21.05]} \ No newline at end of file diff --git a/annotations_filtered/tJBeQ9Ewo3o_filtered.json b/annotations_filtered/tJBeQ9Ewo3o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..90d4ee775539508eb8af34c61b57297841d7254f --- /dev/null +++ b/annotations_filtered/tJBeQ9Ewo3o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.72], [6.0, 5.93], [11.0, 11.52], [13.0, 15.06], [16.0, 30.4], [35.0, 35.63], [37.0, 39.33], [39.0, 42.31], [44.0, 45.81], [49.0, 55.16], [57.0, 67.09], [67.0, 71.15], [72.0, 73.85], [75.0, 96.45], [97.0, 97.24], [100.0, 101.78], [103.0, 103.67], [105.0, 105.97], [108.0, 109.05], [117.0, 117.8], [119.0, 119.85], [121.0, 122.08], [123.0, 126.05], [126.0, 127.45]], "keep_status": [false, false, false, true, true, false, true, false, false, false, true, true, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 42.35, 28.78, 0.0, 30.46, 29.42, 0.0, 29.04, 29.03, 30.74, 0.0, 29.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.71, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 45.06], ["hum", 6.85], ["noise", 2.4]], [["hum", 27.54], ["music", 23.07], ["mains hum", 15.34]], null, [["music", 40.13], ["speech", 26.43], ["vehicle", 3.29]], [["cattle, bovinae", 47.98], ["moo", 28.86], ["livestock, farm animals, working animals", 9.66]], null, [["livestock, farm animals, working animals", 45.63], ["cattle, bovinae", 22.43], ["moo", 17.64]], [["livestock, farm animals, working animals", 22.69], ["cattle, bovinae", 21.61], ["wild animals", 14.23]], [["fly, housefly", 30.0], ["mosquito", 25.88], ["insect", 9.02]], null, [["vehicle", 16.48], ["music", 14.22], ["speech", 11.53]], null, null, null, null, null, null, null, null, null, null], "duration": [-0.28, -0.07, 0.52, 2.06, 14.4, 0.63, 2.33, 3.31, 1.81, 6.16, 10.09, 4.15, 1.85, 21.45, 0.24, 1.78, 0.67, 0.97, 1.05, 0.8, 0.85, 1.08, 3.05, 1.45]} \ No newline at end of file diff --git a/annotations_filtered/tJHkiRzd05M_filtered.json b/annotations_filtered/tJHkiRzd05M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..47ff7e4eab9b87d0c9464c1208199fa960901cdb --- /dev/null +++ b/annotations_filtered/tJHkiRzd05M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.43], [5.0, 7.16], [8.0, 8.16], [13.0, 18.86], [20.0, 21.83], [29.0, 31.7], [34.0, 34.11], [39.0, 39.75], [48.0, 51.36], [52.0, 52.49], [53.0, 54.51], [63.0, 63.32], [64.0, 66.66], [67.0, 68.1], [69.0, 69.87], [77.0, 77.41], [79.0, 79.81], [83.0, 83.81], [106.0, 106.78], [110.0, 110.51], [113.0, 113.04], [124.0, 126.32], [129.0, 129.84], [143.0, 143.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 52.22, 0.0, 42.62, 0.0, 54.56, 0.0, 0.0, 55.31, 0.0, 0.0, 0.0, 49.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.18, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 60.8], ["musical instrument", 5.92], ["cello", 4.68]], null, null, null, null, null, null, null, null, [["mosquito", 51.95], ["fly, housefly", 20.88], ["insect", 12.91]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.43, 2.16, 0.16, 5.86, 1.83, 2.7, 0.11, 0.75, 3.36, 0.49, 1.51, 0.32, 2.66, 1.1, 0.87, 0.41, 0.81, 0.81, 0.78, 0.51, 0.04, 2.32, 0.84, 0.45]} \ No newline at end of file diff --git a/annotations_filtered/tJLdaKUBGzo_filtered.json b/annotations_filtered/tJLdaKUBGzo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7c52c80d4b7ca992c276fcfd0326254f692d4465 --- /dev/null +++ b/annotations_filtered/tJLdaKUBGzo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.18], [12.0, 13.42], [14.0, 16.29], [18.0, 18.89], [21.0, 25.35], [27.0, 29.96], [32.0, 34.89], [37.0, 39.66], [41.0, 42.25], [44.0, 47.02], [48.0, 51.26], [52.0, 59.29], [62.0, 64.4], [65.0, 67.0], [73.0, 75.3], [77.0, 77.95], [82.0, 84.84], [87.0, 89.23], [90.0, 91.03], [91.0, 92.82], [94.0, 97.63], [99.0, 103.33], [105.0, 110.52], [116.0, 117.8], [119.0, 120.04], [122.0, 122.89], [124.0, 125.05], [126.0, 127.67], [129.0, 129.86], [132.0, 137.29], [139.0, 139.65], [140.0, 140.32], [141.0, 141.13], [142.0, 143.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [97.0, 0.0, 73.36, 0.0, 97.0, 91.81, 97.73, 92.64, 0.0, 99.4, 99.52, 99.48, 69.74, 98.59, 96.66, 0.0, 98.36, 97.73, 0.0, 0.0, 99.4, 99.52, 99.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.82, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.18, 1.42, 2.29, 0.89, 4.35, 2.96, 2.89, 2.66, 1.25, 3.02, 3.26, 7.29, 2.4, 2.0, 2.3, 0.95, 2.84, 2.23, 1.03, 1.82, 3.63, 4.33, 5.52, 1.8, 1.04, 0.89, 1.05, 1.67, 0.86, 5.29, 0.65, 0.32, 0.13, 1.83]} \ No newline at end of file diff --git a/annotations_filtered/tJPokP3FVl8_filtered.json b/annotations_filtered/tJPokP3FVl8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17b47024f9d185c8d322ce5ad4e20e1d6314ade7 --- /dev/null +++ b/annotations_filtered/tJPokP3FVl8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 28.66], [31.0, 43.92], [46.0, 67.14], [68.0, 89.01], [92.0, 94.81], [99.0, 99.89], [102.0, 112.14], [112.0, 135.24], [138.0, 141.71]], "keep_status": [true, true, true, true, true, false, false, true, true], "silence_prob": [38.19, 43.08, 34.71, 40.33, 30.09, 0.0, 30.07, 30.9, 34.11], "audiomae_on_audioset": [[["speech", 24.18], ["music", 19.23], ["grunt", 16.91]], [["music", 44.43], ["whale vocalization", 12.72], ["animal", 9.83]], [["sonar", 29.05], ["hum", 16.3], ["music", 7.19]], [["music", 42.93], ["speech", 17.11], ["clang", 8.23]], [["fart", 24.39], ["fly, housefly", 24.31], ["mosquito", 14.23]], null, [["animal", 40.46], ["wild animals", 19.87], ["roaring cats (lions, tigers)", 10.75]], [["music", 44.96], ["speech", 7.84], ["groan", 7.28]], [["explosion", 25.06], ["eruption", 13.23], ["hum", 11.57]]], "duration": [12.66, 12.92, 21.14, 21.01, 2.81, 0.89, 10.14, 23.24, 3.71]} \ No newline at end of file diff --git a/annotations_filtered/tJimPUh3vmQ_filtered.json b/annotations_filtered/tJimPUh3vmQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..800e9633a6327083afdb6af6f83ef1bb2d94ac6b --- /dev/null +++ b/annotations_filtered/tJimPUh3vmQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 23.77], [25.0, 39.63], [46.0, 58.9], [61.0, 119.53], [123.0, 125.44]], "keep_status": [false, false, false, false, false], "silence_prob": [99.71, 73.36, 83.52, 0.0, 60.7], "audiomae_on_audioset": [null, null, null, null, null], "duration": [3.77, 14.63, 12.9, 58.53, 2.44]} \ No newline at end of file diff --git a/annotations_filtered/tJya-fbl4R8_filtered.json b/annotations_filtered/tJya-fbl4R8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2d1f1c6292ce5ad298e4c45ca4a695ee85885e89 --- /dev/null +++ b/annotations_filtered/tJya-fbl4R8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[43.0, 44.34], [45.0, 60.79], [62.0, 69.36], [70.0, 71.96], [74.0, 74.39], [75.0, 77.09], [79.0, 83.0], [84.0, 85.83], [87.0, 97.66], [99.0, 102.56], [104.0, 106.15], [107.0, 108.84], [109.0, 115.37], [117.0, 124.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 99.97, 0.0, 0.0, 99.88, 73.97, 0.0, 84.62, 100.0, 100.0, 0.0, 75.55, 82.61], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.34, 15.79, 7.36, 1.96, 0.39, 2.09, 4.0, 1.83, 10.66, 3.56, 2.15, 1.84, 6.37, 7.65]} \ No newline at end of file diff --git a/annotations_filtered/tK49SBXBK_U_filtered.json b/annotations_filtered/tK49SBXBK_U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f72bfd6f1b8806dad56b855c8841315bffd53e3 --- /dev/null +++ b/annotations_filtered/tK49SBXBK_U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.93], [7.0, 8.99], [10.0, 10.72], [15.0, 14.71], [15.0, 15.35], [16.0, 16.44], [18.0, 18.23], [25.0, 25.52], [26.0, 27.19], [29.0, 29.4], [33.0, 34.26], [39.0, 38.94], [40.0, 42.01], [45.0, 64.17], [65.0, 65.08], [66.0, 81.01], [83.0, 83.02], [84.0, 84.5], [87.0, 87.15], [96.0, 96.89], [98.0, 98.59], [102.0, 124.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.73, 44.57, 0.0, 71.57, 0.0, 0.0, 0.0, 0.0, 0.0, 60.79], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 66.69], ["musical instrument", 7.16], ["brass instrument", 5.15]], null, null, null, null, null, null, null, null], "duration": [0.93, 1.99, 0.72, -0.29, 0.35, 0.44, 0.23, 0.52, 1.19, 0.4, 1.26, -0.06, 2.01, 19.17, 0.08, 15.01, 0.02, 0.5, 0.15, 0.89, 0.59, 22.43]} \ No newline at end of file diff --git a/annotations_filtered/tKei1kTWmKU_filtered.json b/annotations_filtered/tKei1kTWmKU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95db936e2a341af2328c89bbaedada4b89282afd --- /dev/null +++ b/annotations_filtered/tKei1kTWmKU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 72.03], [74.0, 100.84], [101.0, 102.41], [104.0, 111.2], [112.0, 112.89], [115.0, 129.22], [133.0, 139.75]], "keep_status": [false, true, false, true, false, true, false], "silence_prob": [0.0, 33.31, 0.0, 46.83, 0.0, 32.18, 78.21], "audiomae_on_audioset": [null, [["music", 43.12], ["throbbing", 18.84], ["hum", 6.56]], null, [["whale vocalization", 11.74], ["fly, housefly", 11.19], ["speech", 11.16]], null, [["whale vocalization", 25.09], ["music", 11.91], ["speech", 7.65]], null], "duration": [37.03, 26.84, 1.41, 7.2, 0.89, 14.22, 6.75]} \ No newline at end of file diff --git a/annotations_filtered/tKjyNywkBEQ_filtered.json b/annotations_filtered/tKjyNywkBEQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c36a93e24c54b035f9a3ad3feb307ee23a643fa0 --- /dev/null +++ b/annotations_filtered/tKjyNywkBEQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.54], [8.0, 19.3], [20.0, 21.88], [23.0, 23.55], [24.0, 24.68], [26.0, 26.38], [31.0, 32.41], [33.0, 51.65], [55.0, 56.49], [73.0, 73.03], [78.0, 78.39], [90.0, 91.3], [101.0, 101.78], [116.0, 116.67], [118.0, 118.61], [120.0, 121.0], [133.0, 139.75], [141.0, 143.88], [144.0, 146.1], [147.0, 148.17], [153.0, 153.69], [155.0, 155.22], [156.0, 166.23], [167.0, 167.8], [169.0, 172.99], [175.0, 177.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 36.39, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.33, 77.2, 50.02, 0.0, 0.0, 0.0, 95.64, 0.0, 99.99, 90.6], "audiomae_on_audioset": [null, [["speech", 67.99], ["whale vocalization", 9.57], ["music", 2.45]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 83.04], ["fireworks", 2.04], ["firecracker", 1.31]], null, null, null, null, null, null, null, null, null], "duration": [1.54, 11.3, 1.88, 0.55, 0.68, 0.38, 1.41, 18.65, 1.49, 0.03, 0.39, 1.3, 0.78, 0.67, 0.61, 1.0, 6.75, 2.88, 2.1, 1.17, 0.69, 0.22, 10.23, 0.8, 3.99, 2.94]} \ No newline at end of file diff --git a/annotations_filtered/tLXNDzc-2fA_filtered.json b/annotations_filtered/tLXNDzc-2fA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..968a5b67145c9c0b1b13ffd84957a18e16249282 --- /dev/null +++ b/annotations_filtered/tLXNDzc-2fA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 63.44], [67.0, 118.44], [123.0, 123.9], [124.0, 126.96], [129.0, 173.72], [176.0, 176.47], [177.0, 212.33], [218.0, 219.69], [222.0, 222.79], [227.0, 228.73], [231.0, 231.3]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 37.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 32.42], ["didgeridoo", 11.79], ["hum", 6.37]], null, null, null, null, null, null, null], "duration": [37.44, 51.44, 0.9, 2.96, 44.72, 0.47, 35.33, 1.69, 0.79, 1.73, 0.3]} \ No newline at end of file diff --git a/annotations_filtered/tLiJueTgu44_filtered.json b/annotations_filtered/tLiJueTgu44_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f71e926b56d74ae682d2246a9accce0d50b23968 --- /dev/null +++ b/annotations_filtered/tLiJueTgu44_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 45.86], [48.0, 76.45], [77.0, 82.73], [84.0, 107.28], [108.0, 131.82]], "keep_status": [true, true, false, false, false], "silence_prob": [36.91, 31.11, 74.44, 79.59, 56.1], "audiomae_on_audioset": [[["speech", 33.85], ["vehicle", 14.97], ["animal", 2.86]], [["machine gun", 27.33], ["speech", 22.17], ["gunshot, gunfire", 7.59]], null, null, null], "duration": [29.86, 28.45, 5.73, 23.28, 23.82]} \ No newline at end of file diff --git a/annotations_filtered/tLiM-49DJ7k_filtered.json b/annotations_filtered/tLiM-49DJ7k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48d2c19773182271be3f29143e054ba747aa117f --- /dev/null +++ b/annotations_filtered/tLiM-49DJ7k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.97], [8.0, 8.87], [9.0, 10.64], [13.0, 14.42], [21.0, 22.45], [23.0, 23.7], [24.0, 46.92], [53.0, 69.9], [72.0, 74.82], [78.0, 78.51], [100.0, 100.47], [102.0, 104.31], [107.0, 135.4], [137.0, 138.72], [140.0, 140.21]], "keep_status": [false, false, false, false, false, false, true, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.75, 32.42, 47.62, 0.0, 0.0, 87.55, 29.81, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 33.38], ["moo", 18.47], ["cattle, bovinae", 14.39]], [["whale vocalization", 17.63], ["music", 15.99], ["theremin", 9.15]], [["moo", 16.69], ["busy signal", 15.73], ["cattle, bovinae", 12.06]], null, null, null, [["music", 59.94], ["thunk", 10.97], ["thump, thud", 3.83]], null, null], "duration": [0.97, 0.87, 1.64, 1.42, 1.45, 0.7, 22.92, 16.9, 2.82, 0.51, 0.47, 2.31, 28.4, 1.72, 0.21]} \ No newline at end of file diff --git a/annotations_filtered/tLzcAofC4WA_filtered.json b/annotations_filtered/tLzcAofC4WA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cea1192c851ac7ff35349f492becf3d5c063c6d3 --- /dev/null +++ b/annotations_filtered/tLzcAofC4WA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.15], [13.0, 14.12], [15.0, 17.05], [18.0, 20.04], [23.0, 22.99], [24.0, 25.81], [28.0, 29.62], [35.0, 35.24], [36.0, 37.99], [39.0, 40.22], [44.0, 44.32], [47.0, 47.58], [50.0, 50.8], [60.0, 60.67], [63.0, 63.07], [66.0, 65.8], [68.0, 68.37], [69.0, 72.59], [95.0, 95.57], [99.0, 99.47], [101.0, 101.07], [106.0, 106.47], [108.0, 108.04], [108.0, 109.38], [120.0, 121.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 45.02, 58.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 68.03], ["rumble", 2.91], ["music", 2.61]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 20.75], ["speech", 15.97], ["whale vocalization", 11.59]], null, null, null, null, null, null, null], "duration": [1.15, 1.12, 2.05, 2.04, -0.01, 1.81, 1.62, 0.24, 1.99, 1.22, 0.32, 0.58, 0.8, 0.67, 0.07, -0.2, 0.37, 3.59, 0.57, 0.47, 0.07, 0.47, 0.04, 1.38, 1.58]} \ No newline at end of file diff --git a/annotations_filtered/tM3Zg8m373Y_filtered.json b/annotations_filtered/tM3Zg8m373Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..feb73baae9b09d4554431e05069f6b3bd0aad9c1 --- /dev/null +++ b/annotations_filtered/tM3Zg8m373Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.17], [8.0, 8.83], [11.0, 11.64], [15.0, 15.62], [20.0, 21.25], [31.0, 38.77]], "keep_status": [false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 37.24], "audiomae_on_audioset": [null, null, null, null, null, [["fart", 20.37], ["hum", 11.41], ["speech", 7.57]]], "duration": [1.17, 0.83, 0.64, 0.62, 1.25, 7.77]} \ No newline at end of file diff --git a/annotations_filtered/tM47HMT8GGE_filtered.json b/annotations_filtered/tM47HMT8GGE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d338184061c69b01ae739754ab7db613f613c5bb --- /dev/null +++ b/annotations_filtered/tM47HMT8GGE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 138.37]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [113.37]} \ No newline at end of file diff --git a/annotations_filtered/tMB7LgnO2Wo_filtered.json b/annotations_filtered/tMB7LgnO2Wo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92d12569d2e91bf5b4a789d0d03b76eac15f8a9e --- /dev/null +++ b/annotations_filtered/tMB7LgnO2Wo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.86], [4.0, 5.02], [7.0, 9.04], [11.0, 11.55], [14.0, 16.85], [20.0, 21.03], [21.0, 21.49], [22.0, 21.91], [23.0, 25.51], [26.0, 27.53], [29.0, 32.68], [34.0, 34.48], [36.0, 37.61], [41.0, 42.85], [48.0, 48.09], [49.0, 52.0], [53.0, 55.8], [57.0, 59.05], [60.0, 61.67], [64.0, 63.9], [65.0, 66.48], [69.0, 71.05], [72.0, 77.13], [81.0, 81.4], [85.0, 85.45], [87.0, 88.43], [91.0, 92.55], [94.0, 97.34], [99.0, 100.79], [104.0, 109.76]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 41.93, 0.0, 51.6, 0.0, 0.0, 0.0, 53.78, 0.0, 57.97, 0.0, 0.0, 0.0, 0.0, 80.29, 40.21, 41.89, 0.0, 0.0, 0.0, 70.86, 70.58, 0.0, 0.0, 0.0, 0.0, 69.88, 0.0, 57.56], "audiomae_on_audioset": [null, null, [["speech", 37.21], ["music", 21.31], ["singing bowl", 11.31]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 51.84], ["music", 13.53], ["hum", 6.62]], [["music", 27.3], ["gong", 24.26], ["singing bowl", 10.1]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.14, 1.02, 2.04, 0.55, 2.85, 1.03, 0.49, -0.09, 2.51, 1.53, 3.68, 0.48, 1.61, 1.85, 0.09, 3.0, 2.8, 2.05, 1.67, -0.1, 1.48, 2.05, 5.13, 0.4, 0.45, 1.43, 1.55, 3.34, 1.79, 5.76]} \ No newline at end of file diff --git a/annotations_filtered/tMIO48oFmHc_filtered.json b/annotations_filtered/tMIO48oFmHc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..553151b6fb87c81348d3f944446f9a1919bc3438 --- /dev/null +++ b/annotations_filtered/tMIO48oFmHc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.71], [12.0, 12.29], [15.0, 15.97], [22.0, 22.23], [29.0, 29.19], [30.0, 31.02], [34.0, 36.48], [37.0, 41.76], [50.0, 52.86], [55.0, 55.41], [59.0, 59.46], [69.0, 71.1], [75.0, 76.03], [78.0, 79.88], [83.0, 83.73], [85.0, 86.36], [94.0, 94.44], [96.0, 96.04], [98.0, 99.18], [100.0, 100.62], [103.0, 104.14], [106.0, 112.94], [114.0, 121.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.59, 58.13, 35.03, 0.0, 0.0, 88.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.33, 83.34], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 74.93], ["sidetone", 5.15], ["radio", 5.14]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.71, 0.29, 0.97, 0.23, 0.19, 1.02, 2.48, 4.76, 2.86, 0.41, 0.46, 2.1, 1.03, 1.88, 0.73, 1.36, 0.44, 0.04, 1.18, 0.62, 1.14, 6.94, 7.49]} \ No newline at end of file diff --git a/annotations_filtered/tMYOmMWbUME_filtered.json b/annotations_filtered/tMYOmMWbUME_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0434d204722f5dbd8c8fd21956135f80c44b4b5e --- /dev/null +++ b/annotations_filtered/tMYOmMWbUME_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.05], [14.0, 15.67], [20.0, 19.79], [21.0, 21.52], [28.0, 30.23], [32.0, 35.36], [38.0, 38.21], [39.0, 39.41], [42.0, 41.91], [43.0, 44.42], [46.0, 54.33], [59.0, 62.01], [67.0, 75.36], [80.0, 81.28], [82.0, 92.45], [94.0, 95.94], [97.0, 105.07], [106.0, 109.12], [117.0, 118.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 74.76, 87.37, 0.0, 0.0, 0.0, 0.0, 99.85, 89.54, 36.95, 0.0, 74.29, 0.0, 87.0, 59.24, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["eruption", 13.46], ["speech", 9.63], ["fart", 6.93]], null, null, null, null, null, null], "duration": [1.05, 1.67, -0.21, 0.52, 2.23, 3.36, 0.21, 0.41, -0.09, 1.42, 8.33, 3.01, 8.36, 1.28, 10.45, 1.94, 8.07, 3.12, 1.52]} \ No newline at end of file diff --git a/annotations_filtered/tMaXLU_KG-k_filtered.json b/annotations_filtered/tMaXLU_KG-k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d1c6993d397fa88ae23562b38b948077e03e7f5 --- /dev/null +++ b/annotations_filtered/tMaXLU_KG-k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.79], [4.0, 6.78], [8.0, 8.02], [8.0, 12.73], [14.0, 14.86], [15.0, 20.88], [22.0, 23.06], [27.0, 29.46], [30.0, 35.75], [38.0, 60.18], [63.0, 62.97], [66.0, 66.36], [69.0, 69.13], [71.0, 71.86], [72.0, 72.87], [74.0, 75.63], [79.0, 80.67], [85.0, 85.56], [87.0, 88.87], [90.0, 90.63], [92.0, 92.11], [95.0, 95.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 98.51, 0.0, 59.59, 0.0, 97.83, 0.0, 99.96, 94.22, 94.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.79, 2.78, 0.02, 4.73, 0.86, 5.88, 1.06, 2.46, 5.75, 22.18, -0.03, 0.36, 0.13, 0.86, 0.87, 1.63, 1.67, 0.56, 1.87, 0.63, 0.11, 0.47]} \ No newline at end of file diff --git a/annotations_filtered/tMcUZSJ3xDY_filtered.json b/annotations_filtered/tMcUZSJ3xDY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa89db9da6960903df6a1a37aa9042131825f284 --- /dev/null +++ b/annotations_filtered/tMcUZSJ3xDY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 56.83], [64.0, 67.69], [76.0, 153.47]], "keep_status": [false, false, false], "silence_prob": [0.0, 29.75, 0.0], "audiomae_on_audioset": [null, [["music", 59.24], ["speech", 13.85], ["throbbing", 5.35]], null], "duration": [40.83, 3.69, 77.47]} \ No newline at end of file diff --git a/annotations_filtered/tMw_xOuU9DA_filtered.json b/annotations_filtered/tMw_xOuU9DA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..054b1ce3fb6344a526e247a01aeec042a9776de9 --- /dev/null +++ b/annotations_filtered/tMw_xOuU9DA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[63.0, 72.03], [74.0, 82.8], [85.0, 111.25], [114.0, 115.13]], "keep_status": [true, false, true, false], "silence_prob": [30.45, 37.9, 31.05, 0.0], "audiomae_on_audioset": [[["speech", 34.05], ["music", 21.07], ["hum", 11.67]], [["music", 41.15], ["hum", 29.49], ["mains hum", 8.64]], [["hum", 13.08], ["mains hum", 12.46], ["buzz", 10.0]], null], "duration": [9.03, 8.8, 26.25, 1.13]} \ No newline at end of file diff --git a/annotations_filtered/tN4mmLewz_E_filtered.json b/annotations_filtered/tN4mmLewz_E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f099bf8adf445104a70e2045894c43e293df412 --- /dev/null +++ b/annotations_filtered/tN4mmLewz_E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.06], [9.0, 8.92], [10.0, 10.61], [13.0, 13.47], [17.0, 18.76], [20.0, 19.75], [20.0, 20.88], [22.0, 22.42], [26.0, 26.54], [27.0, 27.36], [28.0, 28.32], [29.0, 29.37], [30.0, 30.28], [31.0, 31.29], [33.0, 33.62], [36.0, 36.96], [64.0, 64.96], [73.0, 73.26], [84.0, 84.69], [87.0, 88.16], [106.0, 106.71], [108.0, 108.24], [109.0, 109.09], [111.0, 111.05], [114.0, 114.86], [116.0, 115.99], [119.0, 120.61], [124.0, 124.23], [132.0, 132.73], [134.0, 135.31], [139.0, 144.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.7], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["civil defense siren", 39.14], ["siren", 17.65], ["effects unit", 16.17]]], "duration": [1.06, -0.08, 0.61, 0.47, 1.76, -0.25, 0.88, 0.42, 0.54, 0.36, 0.32, 0.37, 0.28, 0.29, 0.62, 0.96, 0.96, 0.26, 0.69, 1.16, 0.71, 0.24, 0.09, 0.05, 0.86, -0.01, 1.61, 0.23, 0.73, 1.31, 5.91]} \ No newline at end of file diff --git a/annotations_filtered/tNZKO_68_WI_filtered.json b/annotations_filtered/tNZKO_68_WI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e8b1cd030fc591f81ae57844c891bb7b00063c60 --- /dev/null +++ b/annotations_filtered/tNZKO_68_WI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[124.0, 125.52], [127.0, 128.61]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [1.52, 1.61]} \ No newline at end of file diff --git a/annotations_filtered/tNuPwipxx94_filtered.json b/annotations_filtered/tNuPwipxx94_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c493df7e8c7b2729ec72151aa34ba2ec94c9f6e4 --- /dev/null +++ b/annotations_filtered/tNuPwipxx94_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.73], [3.0, 4.04], [7.0, 7.55], [12.0, 12.83], [14.0, 15.72], [17.0, 17.47], [20.0, 21.36], [23.0, 23.31], [26.0, 25.98], [28.0, 31.56], [32.0, 33.61], [35.0, 35.88], [38.0, 38.23], [39.0, 39.41], [42.0, 42.52], [50.0, 51.19], [53.0, 53.96], [54.0, 55.38], [56.0, 58.29], [61.0, 61.91], [63.0, 67.63], [69.0, 70.02], [71.0, 71.69], [72.0, 76.1], [77.0, 80.03], [81.0, 81.78], [83.0, 83.49], [85.0, 86.34], [87.0, 87.29], [89.0, 90.63], [92.0, 92.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.46, 0.0, 91.3, 0.0, 0.0, 75.88, 84.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.73, 1.04, 0.55, 0.83, 1.72, 0.47, 1.36, 0.31, -0.02, 3.56, 1.61, 0.88, 0.23, 0.41, 0.52, 1.19, 0.96, 1.38, 2.29, 0.91, 4.63, 1.02, 0.69, 4.1, 3.03, 0.78, 0.49, 1.34, 0.29, 1.63, 0.28]} \ No newline at end of file diff --git a/annotations_filtered/tNvDa9kTDUw_filtered.json b/annotations_filtered/tNvDa9kTDUw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c8587725a03d79c2a483741c37957ce7cc8d5aa6 --- /dev/null +++ b/annotations_filtered/tNvDa9kTDUw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.74], [33.0, 36.8], [44.0, 44.0], [46.0, 46.58], [47.0, 50.82], [56.0, 56.51]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 36.19, 0.0, 0.0, 34.35, 0.0], "audiomae_on_audioset": [null, [["music", 74.75], ["yodeling", 3.54], ["synthesizer", 2.82]], null, null, [["music", 70.15], ["musical instrument", 2.84], ["funk", 2.4]], null], "duration": [0.74, 3.8, 0.0, 0.58, 3.82, 0.51]} \ No newline at end of file diff --git a/annotations_filtered/tOcnYAE2i4Q_filtered.json b/annotations_filtered/tOcnYAE2i4Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45d6e2617ab32f2a39352f5ab1e65665136b4e39 --- /dev/null +++ b/annotations_filtered/tOcnYAE2i4Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.78], [20.0, 20.51], [24.0, 24.49], [25.0, 24.73], [29.0, 31.38], [35.0, 36.85], [38.0, 38.8], [48.0, 49.64], [69.0, 70.75], [76.0, 77.5], [81.0, 81.41], [84.0, 85.6], [87.0, 100.62], [120.0, 120.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.66, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 53.33], ["ambient music", 18.78], ["singing bowl", 5.77]], null], "duration": [1.78, 0.51, 0.49, -0.27, 2.38, 1.85, 0.8, 1.64, 1.75, 1.5, 0.41, 1.6, 13.62, 0.38]} \ No newline at end of file diff --git a/annotations_filtered/tPJ9WsQhpMw_filtered.json b/annotations_filtered/tPJ9WsQhpMw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d5d6d4896675fcc3ab128a4aa3892fbf661a343 --- /dev/null +++ b/annotations_filtered/tPJ9WsQhpMw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.77], [21.0, 21.14], [22.0, 22.59], [30.0, 33.74], [37.0, 46.52], [56.0, 110.29], [111.0, 111.92], [113.0, 115.69], [117.0, 119.94], [120.0, 121.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 84.98, 50.97, 0.0, 0.0, 78.21, 99.1, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.77, 0.14, 0.59, 3.74, 9.52, 54.29, 0.92, 2.69, 2.94, 1.69]} \ No newline at end of file diff --git a/annotations_filtered/tPJJlCdrJ0M_filtered.json b/annotations_filtered/tPJJlCdrJ0M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f27139329cb2e149996e91d3780a9920cdfbc8b1 --- /dev/null +++ b/annotations_filtered/tPJJlCdrJ0M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.47], [6.0, 11.82], [18.0, 28.86], [31.0, 31.23], [31.0, 33.0], [38.0, 40.78], [44.0, 54.82], [57.0, 58.21], [60.0, 62.19], [65.0, 67.63], [69.0, 69.42], [73.0, 76.2], [77.0, 101.97], [103.0, 116.24], [116.0, 117.86], [119.0, 126.98], [128.0, 132.19]], "keep_status": [false, true, true, false, true, true, false, false, true, true, false, false, true, true, false, false, true], "silence_prob": [0.0, 29.65, 29.79, 0.0, 32.15, 29.84, 30.74, 0.0, 30.78, 30.23, 0.0, 30.13, 30.23, 33.92, 0.0, 30.29, 32.26], "audiomae_on_audioset": [null, [["speech", 33.37], ["music", 14.83], ["hum", 14.75]], [["music", 42.6], ["speech", 22.15], ["explosion", 2.44]], null, [["music", 39.11], ["speech", 11.53], ["throbbing", 6.95]], [["music", 53.76], ["hum", 8.22], ["throbbing", 6.04]], [["music", 75.35], ["breaking", 4.32], ["buzz", 2.89]], null, [["music", 33.11], ["speech", 22.85], ["theremin", 7.38]], [["sound effect", 19.48], ["music", 16.1], ["groan", 8.21]], null, [["music", 70.92], ["speech", 3.04], ["noise", 3.0]], [["music", 45.68], ["speech", 14.15], ["sine wave", 5.8]], [["music", 44.62], ["boing", 9.34], ["clarinet", 9.26]], null, [["music", 42.96], ["hum", 15.12], ["throbbing", 12.4]], [["music", 48.29], ["speech", 8.75], ["double bass", 8.23]]], "duration": [1.47, 5.82, 10.86, 0.23, 2.0, 2.78, 10.82, 1.21, 2.19, 2.63, 0.42, 3.2, 24.97, 13.24, 1.86, 7.98, 4.19]} \ No newline at end of file diff --git a/annotations_filtered/tPgRnFg8ZTU_filtered.json b/annotations_filtered/tPgRnFg8ZTU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e390ccf1adb886d6ac968661cf0789fa98a83d8 --- /dev/null +++ b/annotations_filtered/tPgRnFg8ZTU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.31], [26.0, 30.35], [32.0, 32.48], [36.0, 53.3], [54.0, 54.38], [54.0, 65.89], [69.0, 73.08], [73.0, 74.22], [77.0, 87.22], [88.0, 96.33], [102.0, 103.01], [103.0, 113.21], [115.0, 138.32]], "keep_status": [false, true, false, true, false, false, true, false, false, true, false, true, true], "silence_prob": [0.0, 40.7, 0.0, 44.49, 0.0, 43.87, 44.18, 0.0, 40.71, 45.21, 0.0, 42.62, 40.59], "audiomae_on_audioset": [null, [["music", 24.53], ["moo", 10.86], ["cattle, bovinae", 7.83]], null, [["music", 57.77], ["didgeridoo", 3.51], ["electronic music", 3.17]], null, [["music", 83.34], ["didgeridoo", 1.25], ["soundtrack music", 1.13]], [["music", 47.29], ["throbbing", 6.86], ["electronic music", 3.1]], null, [["music", 72.36], ["didgeridoo", 3.76], ["boing", 2.56]], [["music", 39.64], ["cattle, bovinae", 13.99], ["moo", 12.02]], null, [["music", 35.22], ["sidetone", 18.9], ["whale vocalization", 11.55]], [["music", 48.63], ["throbbing", 10.88], ["electronic music", 3.2]]], "duration": [0.31, 4.35, 0.48, 17.3, 0.38, 11.89, 4.08, 1.22, 10.22, 8.33, 1.01, 10.21, 23.32]} \ No newline at end of file diff --git a/annotations_filtered/tPgwaQKNKRk_filtered.json b/annotations_filtered/tPgwaQKNKRk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..98ca1727b23f58c088fb99bc90496af87cb7daf2 --- /dev/null +++ b/annotations_filtered/tPgwaQKNKRk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.02], [11.0, 16.77], [19.0, 19.31], [20.0, 22.54], [23.0, 22.64], [23.0, 23.28], [28.0, 27.87], [28.0, 27.9], [28.0, 31.36], [46.0, 50.11], [60.0, 61.74], [64.0, 68.76], [71.0, 79.79], [90.0, 90.93], [92.0, 99.87], [105.0, 105.6], [106.0, 106.96], [108.0, 115.05], [117.0, 117.0], [117.0, 117.1], [120.0, 120.16], [124.0, 124.19], [126.0, 126.01]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 57.4, 0.0, 67.25, 0.0, 0.0, 0.0, 0.0, 38.68, 37.67, 0.0, 36.47, 37.24, 0.0, 68.41, 0.0, 0.0, 84.43, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 30.6], ["music", 21.06], ["boing", 15.76]], [["music", 58.42], ["boing", 12.95], ["speech", 11.22]], null, [["music", 35.99], ["speech", 20.65], ["sidetone", 8.39]], [["music", 79.39], ["synthesizer", 3.1], ["musical instrument", 2.49]], null, null, null, null, null, null, null, null, null, null], "duration": [0.02, 5.77, 0.31, 2.54, -0.36, 0.28, -0.13, -0.1, 3.36, 4.11, 1.74, 4.76, 8.79, 0.93, 7.87, 0.6, 0.96, 7.05, 0.0, 0.1, 0.16, 0.19, 0.01]} \ No newline at end of file diff --git a/annotations_filtered/tPy34tjLOyk_filtered.json b/annotations_filtered/tPy34tjLOyk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09acb39ac5997f0535fa0b20f6cdf9fca437d9e7 --- /dev/null +++ b/annotations_filtered/tPy34tjLOyk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.28], [6.0, 7.94], [14.0, 13.88], [16.0, 17.39], [29.0, 29.22], [37.0, 36.96], [41.0, 41.22], [43.0, 42.85], [45.0, 46.72], [47.0, 47.44], [48.0, 49.08], [50.0, 49.91], [50.0, 51.75], [57.0, 59.39], [62.0, 64.07], [64.0, 65.77], [67.0, 67.59], [69.0, 70.02], [75.0, 75.57], [79.0, 80.2], [85.0, 85.43], [97.0, 98.46], [111.0, 113.83], [115.0, 116.07], [117.0, 121.04], [123.0, 124.09], [124.0, 126.96], [129.0, 129.09], [130.0, 130.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.94, 98.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.51, 0.0, 71.43, 0.0, 42.22, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 23.75], ["cough", 11.4], ["laughter", 7.62]], null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 23.42], ["speech", 23.11], ["music", 18.69]], null, null], "duration": [0.28, 1.94, -0.12, 1.39, 0.22, -0.04, 0.22, -0.15, 1.72, 0.44, 1.08, -0.09, 1.75, 2.39, 2.07, 1.77, 0.59, 1.02, 0.57, 1.2, 0.43, 1.46, 2.83, 1.07, 4.04, 1.09, 2.96, 0.09, 0.77]} \ No newline at end of file diff --git a/annotations_filtered/tQJTJdTM0Wk_filtered.json b/annotations_filtered/tQJTJdTM0Wk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..61a3b2bf34e2c4517e982ea8f972e452ec7c9dd2 --- /dev/null +++ b/annotations_filtered/tQJTJdTM0Wk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.64], [11.0, 36.8], [37.0, 59.9], [62.0, 74.88], [77.0, 78.24], [79.0, 79.73], [81.0, 82.19], [84.0, 85.11], [88.0, 91.29], [93.0, 94.2], [99.0, 101.06], [102.0, 103.3], [105.0, 105.68], [110.0, 110.47], [114.0, 118.2], [119.0, 120.29], [123.0, 125.12], [126.0, 128.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [45.88, 33.28, 37.93, 94.22, 0.0, 0.0, 0.0, 0.0, 84.43, 0.0, 97.83, 0.0, 0.0, 0.0, 96.04, 0.0, 98.01, 93.6], "audiomae_on_audioset": [[["music", 33.23], ["hum", 25.3], ["throbbing", 12.0]], [["music", 56.38], ["hum", 10.38], ["mains hum", 9.42]], [["music", 81.12], ["hum", 2.82], ["theremin", 2.53]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.64, 25.8, 22.9, 12.88, 1.24, 0.73, 1.19, 1.11, 3.29, 1.2, 2.06, 1.3, 0.68, 0.47, 4.2, 1.29, 2.12, 2.36]} \ No newline at end of file diff --git a/annotations_filtered/tQl5ypxi69U_filtered.json b/annotations_filtered/tQl5ypxi69U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e8df86c082b75ab8cb5cb11ac311761b8320edd --- /dev/null +++ b/annotations_filtered/tQl5ypxi69U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 34.33], [36.0, 35.7], [37.0, 44.42], [45.0, 52.96], [54.0, 62.85], [63.0, 77.79], [79.0, 79.64], [86.0, 91.32]], "keep_status": [true, false, false, false, true, true, false, false], "silence_prob": [34.1, 0.0, 33.98, 36.42, 34.3, 30.92, 0.0, 29.97], "audiomae_on_audioset": [[["mains hum", 33.52], ["hum", 21.97], ["speech", 8.0]], null, [["speech", 33.87], ["mains hum", 21.25], ["hum", 18.84]], [["mains hum", 45.01], ["hum", 36.37], ["music", 4.11]], [["speech", 29.78], ["music", 26.86], ["hum", 11.73]], [["music", 38.67], ["hum", 20.72], ["mains hum", 10.36]], null, [["speech", 42.68], ["aircraft", 17.66], ["vehicle", 11.57]]], "duration": [4.33, -0.3, 7.42, 7.96, 8.85, 14.79, 0.64, 5.32]} \ No newline at end of file diff --git a/annotations_filtered/tQlujXWP-5c_filtered.json b/annotations_filtered/tQlujXWP-5c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bbf14b4313554e4218f5dc7298cd3cc904c37949 --- /dev/null +++ b/annotations_filtered/tQlujXWP-5c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.97], [9.0, 12.87], [14.0, 16.48], [17.0, 29.51], [30.0, 46.18], [48.0, 55.78], [57.0, 73.77], [77.0, 77.52], [78.0, 78.46], [78.0, 82.39], [83.0, 90.66], [92.0, 95.39], [96.0, 98.59], [99.0, 105.17], [106.0, 112.21], [114.0, 114.91], [116.0, 117.17], [118.0, 118.56]], "keep_status": [false, true, false, false, false, true, false, false, false, false, false, false, true, true, true, false, false, false], "silence_prob": [0.0, 39.0, 70.16, 39.3, 39.07, 31.88, 43.35, 0.0, 0.0, 35.31, 47.5, 50.51, 44.29, 41.72, 30.45, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["whale vocalization", 30.52], ["hum", 9.37], ["squish", 6.89]], null, [["speech", 85.71], ["hum", 3.2], ["inside, small room", 1.43]], [["speech", 65.11], ["whale vocalization", 6.25], ["liquid", 2.67]], [["speech", 48.1], ["whack, thwack", 13.15], ["sidetone", 5.69]], [["liquid", 37.03], ["water", 23.26], ["glass", 9.77]], null, null, [["whale vocalization", 33.78], ["animal", 25.02], ["speech", 11.33]], [["speech", 71.22], ["sidetone", 5.08], ["dial tone", 3.72]], null, [["speech", 16.96], ["fly, housefly", 7.79], ["insect", 7.57]], [["whale vocalization", 35.55], ["speech", 20.78], ["burping, eructation", 5.68]], [["hum", 27.88], ["mains hum", 8.82], ["throbbing", 5.15]], null, null, null], "duration": [1.97, 3.87, 2.48, 12.51, 16.18, 7.78, 16.77, 0.52, 0.46, 4.39, 7.66, 3.39, 2.59, 6.17, 6.21, 0.91, 1.17, 0.56]} \ No newline at end of file diff --git a/annotations_filtered/tRHVMi3LxZE_filtered.json b/annotations_filtered/tRHVMi3LxZE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..221f2f575fb125fb2e5f5991b14ead541208e942 --- /dev/null +++ b/annotations_filtered/tRHVMi3LxZE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 40.81], [45.0, 47.8], [50.0, 52.76], [54.0, 55.93], [57.0, 82.38], [87.0, 89.85], [91.0, 108.99]], "keep_status": [true, true, true, false, true, false, true], "silence_prob": [43.38, 44.99, 36.84, 0.0, 33.78, 32.36, 29.58], "audiomae_on_audioset": [[["steam whistle", 28.36], ["speech", 19.86], ["train", 5.97]], [["music", 26.94], ["speech", 20.16], ["sidetone", 14.57]], [["music", 25.51], ["effects unit", 14.34], ["echo", 10.59]], null, [["music", 23.72], ["explosion", 14.49], ["musical instrument", 9.74]], [["steam whistle", 67.78], ["wind instrument, woodwind instrument", 7.87], ["music", 5.04]], [["vehicle", 9.54], ["music", 9.3], ["hum", 8.7]]], "duration": [4.81, 2.8, 2.76, 1.93, 25.38, 2.85, 17.99]} \ No newline at end of file diff --git a/annotations_filtered/tRRQX1SXcMM_filtered.json b/annotations_filtered/tRRQX1SXcMM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..66548c72bbcc53b0d371d1b23e44fd12746c76db --- /dev/null +++ b/annotations_filtered/tRRQX1SXcMM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 23.45], [26.0, 26.74], [30.0, 38.96], [40.0, 43.9], [46.0, 62.13], [65.0, 85.55], [87.0, 88.01], [91.0, 97.28], [99.0, 99.71], [100.0, 117.59]], "keep_status": [true, false, false, false, false, false, false, false, false, false], "silence_prob": [42.91, 0.0, 30.62, 31.82, 38.71, 39.6, 0.0, 35.22, 0.0, 37.97], "audiomae_on_audioset": [[["speech", 56.86], ["vehicle", 6.28], ["sidetone", 5.65]], null, [["speech", 60.26], ["explosion", 17.02], ["music", 2.64]], [["hum", 39.38], ["mains hum", 17.71], ["throbbing", 14.31]], [["hum", 27.65], ["music", 22.92], ["whale vocalization", 22.57]], [["music", 64.15], ["whale vocalization", 30.36], ["soundtrack music", 1.15]], null, [["music", 61.04], ["whale vocalization", 27.55], ["electronic music", 1.97]], null, [["whale vocalization", 56.6], ["music", 35.97], ["theremin", 1.16]]], "duration": [14.45, 0.74, 8.96, 3.9, 16.13, 20.55, 1.01, 6.28, 0.71, 17.59]} \ No newline at end of file diff --git a/annotations_filtered/tRwyOQw5zcw_filtered.json b/annotations_filtered/tRwyOQw5zcw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..33e35d2c53b7ba876fada4749c29dc4e8bb100ce --- /dev/null +++ b/annotations_filtered/tRwyOQw5zcw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.12], [13.0, 13.39], [14.0, 17.29], [27.0, 27.33], [31.0, 31.48], [41.0, 41.22], [42.0, 42.45], [51.0, 52.24], [56.0, 57.7], [59.0, 59.98], [62.0, 63.1], [64.0, 64.67], [66.0, 66.46], [71.0, 71.02], [72.0, 72.86], [75.0, 75.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 88.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.12, 0.39, 3.29, 0.33, 0.48, 0.22, 0.45, 1.24, 1.7, 0.98, 1.1, 0.67, 0.46, 0.02, 0.86, 0.07]} \ No newline at end of file diff --git a/annotations_filtered/tRx8N7mJU9g_filtered.json b/annotations_filtered/tRx8N7mJU9g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_filtered/tRx8N7mJU9g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_filtered/tS36ZnWoR70_filtered.json b/annotations_filtered/tS36ZnWoR70_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa08342a68ba4b17c4df89e2863607937c7d5c64 --- /dev/null +++ b/annotations_filtered/tS36ZnWoR70_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.85], [6.0, 8.41], [11.0, 11.08], [12.0, 12.48], [14.0, 14.93], [17.0, 18.1], [20.0, 22.27], [24.0, 24.04], [26.0, 27.35], [30.0, 32.46], [35.0, 38.35], [41.0, 41.61], [45.0, 47.41], [49.0, 50.38], [52.0, 53.64], [55.0, 56.35], [59.0, 60.44], [64.0, 66.07], [68.0, 69.06], [70.0, 71.85], [74.0, 75.1], [76.0, 81.31], [84.0, 83.94], [86.0, 86.41], [88.0, 90.71], [93.0, 94.02], [98.0, 99.59], [102.0, 102.1], [104.0, 106.56], [108.0, 108.99], [112.0, 113.24], [117.0, 118.57], [120.0, 120.83], [122.0, 123.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [84.8, 91.47, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 99.96, 99.95, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 94.81, 0.0, 0.0, 97.11, 0.0, 0.0, 0.0, 50.91, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.85, 2.41, 0.08, 0.48, 0.93, 1.1, 2.27, 0.04, 1.35, 2.46, 3.35, 0.61, 2.41, 1.38, 1.64, 1.35, 1.44, 2.07, 1.06, 1.85, 1.1, 5.31, -0.06, 0.41, 2.71, 1.02, 1.59, 0.1, 2.56, 0.99, 1.24, 1.57, 0.83, 1.47]} \ No newline at end of file diff --git a/annotations_filtered/tSXp2wB6kXQ_filtered.json b/annotations_filtered/tSXp2wB6kXQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..44007cb9cebc66918de0c44ef07efb6960eb0663 --- /dev/null +++ b/annotations_filtered/tSXp2wB6kXQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.4], [11.0, 24.39], [25.0, 26.08], [30.0, 30.59], [33.0, 33.45], [36.0, 37.1], [44.0, 46.09], [48.0, 49.0], [50.0, 50.13], [51.0, 76.27], [80.0, 80.52], [83.0, 83.66], [87.0, 87.51], [89.0, 89.36], [98.0, 98.76], [108.0, 108.73], [113.0, 114.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 53.4, 0.0, 0.0, 0.0, 0.0, 78.21, 0.0, 0.0, 61.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.4, 13.39, 1.08, 0.59, 0.45, 1.1, 2.09, 1.0, 0.13, 25.27, 0.52, 0.66, 0.51, 0.36, 0.76, 0.73, 1.45]} \ No newline at end of file diff --git a/annotations_filtered/tSpOMNC3WtQ_filtered.json b/annotations_filtered/tSpOMNC3WtQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d93ce705864196944eec27c068d736e9837b6c8c --- /dev/null +++ b/annotations_filtered/tSpOMNC3WtQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 15.38], [18.0, 18.13], [19.0, 26.38], [31.0, 32.44], [36.0, 36.37], [46.0, 46.58], [49.0, 60.89], [66.0, 73.6], [79.0, 79.57]], "keep_status": [false, false, false, false, false, false, true, false, false], "silence_prob": [99.99, 0.0, 46.83, 0.0, 0.0, 0.0, 37.81, 38.33, 0.0], "audiomae_on_audioset": [null, null, [["speech", 68.73], ["sidetone", 6.08], ["radio", 4.48]], null, null, null, [["music", 38.39], ["bleat", 12.93], ["sheep", 12.89]], [["music", 55.54], ["speech", 14.2], ["radio", 7.35]], null], "duration": [2.38, 0.13, 7.38, 1.44, 0.37, 0.58, 11.89, 7.6, 0.57]} \ No newline at end of file diff --git a/annotations_filtered/tTFOv5oFe3E_filtered.json b/annotations_filtered/tTFOv5oFe3E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..124c5734a52bb163240f2ce7f6ce48b38803f089 --- /dev/null +++ b/annotations_filtered/tTFOv5oFe3E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 25.71], [27.0, 27.51], [29.0, 29.76], [31.0, 32.49], [34.0, 34.94], [37.0, 38.31], [39.0, 40.2], [41.0, 55.07], [56.0, 59.44], [60.0, 78.6], [79.0, 80.1], [81.0, 93.75], [95.0, 96.16], [99.0, 100.62], [102.0, 103.49], [104.0, 104.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [90.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.59, 81.0, 99.36, 0.0, 99.36, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [15.71, 0.51, 0.76, 1.49, 0.94, 1.31, 1.2, 14.07, 3.44, 18.6, 1.1, 12.75, 1.16, 1.62, 1.49, 0.41]} \ No newline at end of file diff --git a/annotations_filtered/tTVFP-9AdMk_filtered.json b/annotations_filtered/tTVFP-9AdMk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a4f0281662521cd2e2562f00b12dc8537799cfa --- /dev/null +++ b/annotations_filtered/tTVFP-9AdMk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.65], [17.0, 18.27], [24.0, 23.99], [30.0, 30.65], [33.0, 34.13], [35.0, 35.65], [43.0, 42.79], [45.0, 45.76], [50.0, 50.45], [55.0, 57.55], [66.0, 67.68], [69.0, 69.87], [71.0, 71.42], [73.0, 73.21], [74.0, 74.11], [77.0, 76.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 73.26], ["livestock, farm animals, working animals", 2.68], ["baby laughter", 2.27]], null, null, null, null, null, null], "duration": [0.65, 1.27, -0.01, 0.65, 1.13, 0.65, -0.21, 0.76, 0.45, 2.55, 1.68, 0.87, 0.42, 0.21, 0.11, -0.41]} \ No newline at end of file diff --git a/annotations_filtered/tTbqVFrvn0E_filtered.json b/annotations_filtered/tTbqVFrvn0E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa824974c7815cebf1af00656c5e81c2c181199c --- /dev/null +++ b/annotations_filtered/tTbqVFrvn0E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.92], [3.0, 4.21], [5.0, 6.32], [9.0, 11.31], [12.0, 13.27], [13.0, 13.86], [15.0, 18.01], [18.0, 19.63], [21.0, 22.17], [23.0, 23.95], [25.0, 25.83], [26.0, 27.41], [30.0, 34.77], [36.0, 37.42], [38.0, 39.02], [41.0, 41.28], [47.0, 47.98], [56.0, 56.79], [59.0, 59.1], [69.0, 69.5], [71.0, 71.44], [74.0, 74.34], [91.0, 91.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 83.16, 0.0, 0.0, 97.43, 0.0, 0.0, 0.0, 0.0, 0.0, 95.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.92, 1.21, 1.32, 2.31, 1.27, 0.86, 3.01, 1.63, 1.17, 0.95, 0.83, 1.41, 4.77, 1.42, 1.02, 0.28, 0.98, 0.79, 0.1, 0.5, 0.44, 0.34, 0.91]} \ No newline at end of file diff --git a/annotations_filtered/tTrgUKsKetY_filtered.json b/annotations_filtered/tTrgUKsKetY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..793a0a8c2735b3ae677e5e7a624d28a5fcd67fd3 --- /dev/null +++ b/annotations_filtered/tTrgUKsKetY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 16.98], [20.0, 23.31], [24.0, 24.33], [26.0, 26.67], [28.0, 29.19], [30.0, 30.97], [32.0, 32.49], [34.0, 35.19], [43.0, 43.09], [54.0, 54.31], [60.0, 60.45], [71.0, 80.03], [84.0, 92.26], [95.0, 100.5], [104.0, 137.27], [140.0, 142.28], [145.0, 145.45], [146.0, 146.84], [148.0, 148.68], [150.0, 150.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 68.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.09, 32.27, 30.53, 0.0, 60.7, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 74.45], ["buzz", 8.23], ["vehicle", 3.58]], [["white noise", 19.09], ["hum", 14.7], ["mains hum", 10.01]], [["livestock, farm animals, working animals", 56.7], ["cattle, bovinae", 24.23], ["moo", 14.43]], null, null, null, null, null, null], "duration": [-0.02, 3.31, 0.33, 0.67, 1.19, 0.97, 0.49, 1.19, 0.09, 0.31, 0.45, 9.03, 8.26, 5.5, 33.27, 2.28, 0.45, 0.84, 0.68, 0.58]} \ No newline at end of file diff --git a/annotations_filtered/tUaOBgXp_Pg_filtered.json b/annotations_filtered/tUaOBgXp_Pg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba412bb311ed0330833543916cce2c7b9c4584aa --- /dev/null +++ b/annotations_filtered/tUaOBgXp_Pg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.83], [13.0, 57.15], [58.0, 59.37], [60.0, 62.26], [64.0, 67.39], [69.0, 70.53], [77.0, 80.87], [85.0, 84.75], [90.0, 90.76], [94.0, 98.0]], "keep_status": [false, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 42.88, 40.38, 0.0, 41.52, 0.0, 0.0, 29.48], "audiomae_on_audioset": [null, null, null, [["music", 12.43], ["noise", 9.59], ["white noise", 9.16]], [["speech", 33.77], ["music", 30.08], ["sidetone", 9.06]], null, [["music", 52.31], ["fart", 4.22], ["fly, housefly", 2.56]], null, null, [["music", 61.59], ["speech", 6.98], ["throbbing", 5.49]]], "duration": [1.83, 44.15, 1.37, 2.26, 3.39, 1.53, 3.87, -0.25, 0.76, 4.0]} \ No newline at end of file diff --git a/annotations_filtered/tUiVEKK8rWM_filtered.json b/annotations_filtered/tUiVEKK8rWM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dc9ff6193ce9907ff74749b77c6938913215c09a --- /dev/null +++ b/annotations_filtered/tUiVEKK8rWM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.38], [3.0, 4.04], [4.0, 4.29], [4.0, 4.43], [7.0, 7.94], [16.0, 16.21], [20.0, 20.48], [23.0, 23.67], [30.0, 30.89], [38.0, 38.62], [42.0, 42.69], [44.0, 44.32], [45.0, 46.52], [49.0, 50.21], [52.0, 53.28], [55.0, 55.46], [67.0, 67.61], [69.0, 69.53], [76.0, 76.08], [78.0, 78.46], [79.0, 82.26], [83.0, 84.7], [87.0, 87.39], [88.0, 89.28], [92.0, 92.25], [103.0, 111.69], [113.0, 118.88], [120.0, 121.88], [124.0, 124.39], [127.0, 128.02], [129.0, 134.57], [138.0, 141.17], [142.0, 143.24], [144.0, 144.64], [148.0, 148.0], [153.0, 153.64], [155.0, 155.22], [157.0, 157.2], [158.0, 159.07], [160.0, 161.08], [166.0, 166.99], [170.0, 171.02], [177.0, 178.31], [182.0, 183.03], [184.0, 183.93], [187.0, 187.79], [193.0, 194.09], [198.0, 198.91], [202.0, 202.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.87, 0.0, 0.0, 0.0, 0.0, 59.96, 88.28, 0.0, 0.0, 0.0, 96.42, 82.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.38, 1.04, 0.29, 0.43, 0.94, 0.21, 0.48, 0.67, 0.89, 0.62, 0.69, 0.32, 1.52, 1.21, 1.28, 0.46, 0.61, 0.53, 0.08, 0.46, 3.26, 1.7, 0.39, 1.28, 0.25, 8.69, 5.88, 1.88, 0.39, 1.02, 5.57, 3.17, 1.24, 0.64, 0.0, 0.64, 0.22, 0.2, 1.07, 1.08, 0.99, 1.02, 1.31, 1.03, -0.07, 0.79, 1.09, 0.91, 0.27]} \ No newline at end of file diff --git a/annotations_filtered/tUkE9qaVgmo_filtered.json b/annotations_filtered/tUkE9qaVgmo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0606b7cc05f24e9bcb2ba64cf1a0ca6515d9c34e --- /dev/null +++ b/annotations_filtered/tUkE9qaVgmo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.43], [6.0, 6.96], [15.0, 17.81], [22.0, 24.24], [25.0, 25.03], [26.0, 26.96], [29.0, 29.39], [34.0, 34.77], [37.0, 38.5], [43.0, 44.73], [46.0, 46.8], [55.0, 55.46], [63.0, 63.98], [65.0, 65.5], [68.0, 68.96], [70.0, 70.56], [71.0, 71.19], [73.0, 72.55], [73.0, 76.0], [81.0, 81.57], [82.0, 82.68], [84.0, 87.35], [88.0, 88.62], [93.0, 95.03], [96.0, 98.69], [106.0, 112.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 98.1, 96.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.41, 0.0, 0.0, 43.79, 0.0, 48.87, 40.68, 30.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 13.79], ["noise", 12.05], ["frog", 11.91]], null, null, [["cattle, bovinae", 38.23], ["moo", 20.64], ["caw", 11.59]], null, [["fart", 19.9], ["telephone", 10.53], ["speech", 10.06]], [["frog", 50.75], ["croak", 35.18], ["speech", 5.4]], [["speech", 26.2], ["baby cry, infant cry", 25.51], ["whimper", 16.84]]], "duration": [0.43, 0.96, 2.81, 2.24, 0.03, 0.96, 0.39, 0.77, 1.5, 1.73, 0.8, 0.46, 0.98, 0.5, 0.96, 0.56, 0.19, -0.45, 3.0, 0.57, 0.68, 3.35, 0.62, 2.03, 2.69, 6.95]} \ No newline at end of file diff --git a/annotations_filtered/tUuzV9kwSBE_filtered.json b/annotations_filtered/tUuzV9kwSBE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..913a111ead7198f8630316d95484499910d1d5cb --- /dev/null +++ b/annotations_filtered/tUuzV9kwSBE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.14], [10.0, 12.83], [30.0, 32.43], [32.0, 32.46], [49.0, 55.16], [57.0, 56.96], [60.0, 59.93], [60.0, 60.89], [63.0, 63.81], [64.0, 67.71], [68.0, 67.76], [69.0, 70.68], [82.0, 83.08], [89.0, 90.1], [93.0, 94.53], [105.0, 112.13], [112.0, 112.56], [115.0, 117.36]], "keep_status": [false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 35.16, 37.17, 0.0, 34.06, 0.0, 0.0, 0.0, 0.0, 34.04, 0.0, 0.0, 0.0, 0.0, 0.0, 32.94, 0.0, 31.82], "audiomae_on_audioset": [null, [["music", 36.7], ["boing", 13.43], ["quack", 11.42]], [["music", 41.52], ["didgeridoo", 19.84], ["speech", 8.7]], null, [["music", 28.18], ["speech", 27.99], ["whack, thwack", 11.14]], null, null, null, null, [["music", 45.22], ["speech", 24.58], ["boing", 4.94]], null, null, null, null, null, [["speech", 66.35], ["music", 4.42], ["hubbub, speech noise, speech babble", 3.72]], null, [["speech", 55.06], ["crowd", 10.29], ["outside, urban or manmade", 8.13]]], "duration": [0.14, 2.83, 2.43, 0.46, 6.16, -0.04, -0.07, 0.89, 0.81, 3.71, -0.24, 1.68, 1.08, 1.1, 1.53, 7.13, 0.56, 2.36]} \ No newline at end of file diff --git a/annotations_filtered/tV7wQ19UBqg_filtered.json b/annotations_filtered/tV7wQ19UBqg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..86bcb91979c82523269e6902acffa19ddf2968e3 --- /dev/null +++ b/annotations_filtered/tV7wQ19UBqg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 17.9], [40.0, 75.79], [76.0, 77.94], [81.0, 82.09], [87.0, 95.61], [97.0, 100.11], [101.0, 102.29], [103.0, 105.92], [108.0, 122.15], [124.0, 125.24], [125.0, 131.9], [133.0, 136.97], [139.0, 139.99], [143.0, 144.71], [146.0, 149.79], [151.0, 151.16], [153.0, 155.11], [160.0, 161.33], [162.0, 162.11], [163.0, 164.52], [168.0, 171.9], [176.0, 178.98], [180.0, 180.3], [184.0, 184.91], [185.0, 189.73], [191.0, 197.99], [199.0, 203.17], [208.0, 211.86], [212.0, 216.67], [219.0, 221.0], [224.0, 225.41], [229.0, 231.33], [232.0, 233.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [37.86, 0.0, 0.0, 0.0, 100.0, 98.36, 0.0, 99.9, 99.71, 0.0, 91.47, 99.9, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 98.99, 100.0, 0.0, 0.0, 92.31, 99.85, 99.98, 97.11, 99.87, 100.0, 0.0, 97.92, 0.0], "audiomae_on_audioset": [[["speech", 68.57], ["breaking", 10.87], ["whack, thwack", 4.93]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.9, 35.79, 1.94, 1.09, 8.61, 3.11, 1.29, 2.92, 14.15, 1.24, 6.9, 3.97, 0.99, 1.71, 3.79, 0.16, 2.11, 1.33, 0.11, 1.52, 3.9, 2.98, 0.3, 0.91, 4.73, 6.99, 4.17, 3.86, 4.67, 2.0, 1.41, 2.33, 1.44]} \ No newline at end of file diff --git a/annotations_filtered/tVBVeXfbo6k_filtered.json b/annotations_filtered/tVBVeXfbo6k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60827a13f618dcba4ccc8d798620d1f14b646e78 --- /dev/null +++ b/annotations_filtered/tVBVeXfbo6k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 28.49], [31.0, 33.45], [35.0, 35.43], [37.0, 46.87], [50.0, 53.05], [66.0, 81.63], [82.0, 84.5], [86.0, 89.7], [92.0, 92.38], [106.0, 107.38], [110.0, 111.69], [112.0, 116.06]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [49.64, 87.92, 0.0, 33.55, 34.59, 36.7, 38.95, 99.78, 0.0, 0.0, 0.0, 61.87], "audiomae_on_audioset": [[["music", 62.4], ["theremin", 8.23], ["synthesizer", 3.69]], null, null, [["music", 69.96], ["fart", 4.52], ["groan", 4.44]], [["music", 46.84], ["didgeridoo", 18.07], ["throbbing", 7.02]], [["groan", 47.58], ["music", 39.06], ["speech", 3.09]], [["whack, thwack", 23.31], ["clang", 13.18], ["arrow", 10.87]], null, null, null, null, null], "duration": [20.49, 2.45, 0.43, 9.87, 3.05, 15.63, 2.5, 3.7, 0.38, 1.38, 1.69, 4.06]} \ No newline at end of file diff --git a/annotations_filtered/tVRPz6-Tkww_filtered.json b/annotations_filtered/tVRPz6-Tkww_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4873116444eb799f9a5617786dfb99f678042a39 --- /dev/null +++ b/annotations_filtered/tVRPz6-Tkww_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 10.34], [11.0, 19.14], [21.0, 23.13], [24.0, 32.61], [33.0, 73.06], [74.0, 73.75], [74.0, 78.51], [79.0, 81.5], [83.0, 85.04], [90.0, 90.66], [93.0, 96.01], [98.0, 99.99], [105.0, 109.11], [111.0, 117.0], [118.0, 120.68], [123.0, 130.54]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.27, 50.66, 98.86, 44.9, 0.0, 0.0, 67.0, 84.8, 33.55, 0.0, 98.86, 0.0, 98.36, 82.97, 95.37, 45.95], "audiomae_on_audioset": [null, null, null, [["insect", 10.79], ["hum", 9.66], ["music", 9.47]], null, null, null, null, [["animal", 42.69], ["whale vocalization", 37.47], ["roaring cats (lions, tigers)", 5.43]], null, null, null, null, null, null, [["speech", 81.4], ["whale vocalization", 4.62], ["sidetone", 1.98]]], "duration": [5.34, 8.14, 2.13, 8.61, 40.06, -0.25, 4.51, 2.5, 2.04, 0.66, 3.01, 1.99, 4.11, 6.0, 2.68, 7.54]} \ No newline at end of file diff --git a/annotations_filtered/tVfrMp_MWw4_filtered.json b/annotations_filtered/tVfrMp_MWw4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a83ccb517e752e814461e47e379df82a491dbc76 --- /dev/null +++ b/annotations_filtered/tVfrMp_MWw4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.67], [4.0, 4.29], [6.0, 7.32], [10.0, 14.03], [16.0, 18.91], [21.0, 21.42], [24.0, 24.93], [27.0, 29.57], [30.0, 33.32], [34.0, 34.79], [36.0, 37.45], [40.0, 41.66], [43.0, 43.46], [46.0, 48.63], [50.0, 53.15], [55.0, 55.0], [57.0, 56.89], [58.0, 59.64], [62.0, 63.46], [69.0, 69.06], [71.0, 71.56], [73.0, 73.87], [76.0, 81.97], [84.0, 86.59], [88.0, 88.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.56, 97.73, 0.0, 0.0, 90.6, 88.83, 0.0, 0.0, 0.0, 0.0, 67.51, 75.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.38, 82.43, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.67, 0.29, 1.32, 4.03, 2.91, 0.42, 0.93, 2.57, 3.32, 0.79, 1.45, 1.66, 0.46, 2.63, 3.15, 0.0, -0.11, 1.64, 1.46, 0.06, 0.56, 0.87, 5.97, 2.59, 0.91]} \ No newline at end of file diff --git a/annotations_filtered/tVl78xgPyow_filtered.json b/annotations_filtered/tVl78xgPyow_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a7be66b8fbc91ae85a1ef1f513cf2977fb8a8082 --- /dev/null +++ b/annotations_filtered/tVl78xgPyow_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.47], [4.0, 5.49], [9.0, 10.35], [13.0, 33.59]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 59.86], "audiomae_on_audioset": [null, null, null, null], "duration": [1.47, 1.49, 1.35, 20.59]} \ No newline at end of file diff --git a/annotations_filtered/tVubEM2oUj4_filtered.json b/annotations_filtered/tVubEM2oUj4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3bc38317c99f1e509ced6320496543d27da65ee2 --- /dev/null +++ b/annotations_filtered/tVubEM2oUj4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.49], [9.0, 9.85], [17.0, 17.54], [29.0, 31.5], [33.0, 34.77], [37.0, 36.78], [37.0, 37.84], [38.0, 40.2], [45.0, 46.04], [53.0, 55.34], [56.0, 59.48], [61.0, 65.7], [67.0, 75.54], [76.0, 76.65], [78.0, 78.26], [79.0, 79.81], [82.0, 82.54], [85.0, 85.48], [88.0, 90.24], [91.0, 91.54], [96.0, 96.74], [98.0, 99.45], [101.0, 114.42], [116.0, 130.25], [132.0, 139.13], [141.0, 141.44], [143.0, 146.52], [150.0, 150.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 100.0, 99.87, 80.46, 0.0, 0.0, 0.0, 0.0, 0.0, 81.89, 0.0, 0.0, 0.0, 99.76, 99.84, 99.76, 0.0, 99.95, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.49, 0.85, 0.54, 2.5, 1.77, -0.22, 0.84, 2.2, 1.04, 2.34, 3.48, 4.7, 8.54, 0.65, 0.26, 0.81, 0.54, 0.48, 2.24, 0.54, 0.74, 1.45, 13.42, 14.25, 7.13, 0.44, 3.52, 0.16]} \ No newline at end of file diff --git a/annotations_filtered/tVxYCeRXzGo_filtered.json b/annotations_filtered/tVxYCeRXzGo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9945591bb87955c00964853aa6d26d523e5fc096 --- /dev/null +++ b/annotations_filtered/tVxYCeRXzGo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.83], [6.0, 7.03], [8.0, 9.61], [10.0, 11.79], [13.0, 14.98], [23.0, 25.78], [27.0, 28.56], [35.0, 36.98], [53.0, 54.97], [56.0, 56.81], [57.0, 58.7], [65.0, 65.67], [80.0, 80.65], [85.0, 86.0], [96.0, 97.68], [101.0, 101.88], [106.0, 106.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 68.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.83, 1.03, 1.61, 1.79, 1.98, 2.78, 1.56, 1.98, 1.97, 0.81, 1.7, 0.67, 0.65, 1.0, 1.68, 0.88, 0.88]} \ No newline at end of file diff --git a/annotations_filtered/tWEBbYoDaU8_filtered.json b/annotations_filtered/tWEBbYoDaU8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d94c0690747ffa7a3268139bd4ce633a8dad2ff --- /dev/null +++ b/annotations_filtered/tWEBbYoDaU8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.72], [5.0, 6.07], [7.0, 7.77], [10.0, 10.18], [11.0, 11.72], [16.0, 16.87], [20.0, 19.79], [21.0, 22.27], [30.0, 33.59], [37.0, 43.09], [44.0, 46.7], [49.0, 53.59], [56.0, 56.73], [61.0, 62.45], [69.0, 70.06], [77.0, 86.98], [88.0, 88.43], [89.0, 124.87], [127.0, 127.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.0, 62.07, 44.99, 53.72, 0.0, 0.0, 0.0, 30.51, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 25.78], ["thunk", 15.15], ["hum", 14.59]], null, null, null, null, [["music", 40.62], ["speech", 34.58], ["didgeridoo", 2.38]], null, null, null], "duration": [0.72, 1.07, 0.77, 0.18, 0.72, 0.87, -0.21, 1.27, 3.59, 6.09, 2.7, 4.59, 0.73, 1.45, 1.06, 9.98, 0.43, 35.87, 0.99]} \ No newline at end of file diff --git a/annotations_filtered/tWuBw5082gI_filtered.json b/annotations_filtered/tWuBw5082gI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09584483663c57042b8c1a34b375ef623bfb29d4 --- /dev/null +++ b/annotations_filtered/tWuBw5082gI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[40.0, 50.79], [51.0, 92.97], [94.0, 171.27]], "keep_status": [true, false, false], "silence_prob": [29.91, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 33.77], ["music", 14.96], ["mains hum", 11.55]], null, null], "duration": [10.79, 41.97, 77.27]} \ No newline at end of file diff --git a/annotations_filtered/tX3qqCP99Tw_filtered.json b/annotations_filtered/tX3qqCP99Tw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..96b0bd6c5d59acb1b0b8a510fc144a2fe1077fe5 --- /dev/null +++ b/annotations_filtered/tX3qqCP99Tw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[43.0, 72.67], [74.0, 84.52], [85.0, 86.54], [87.0, 112.43], [114.0, 120.39], [121.0, 123.06], [125.0, 124.77], [127.0, 129.15], [131.0, 132.19], [133.0, 134.52], [135.0, 137.29], [143.0, 145.35], [148.0, 149.17], [150.0, 150.92], [159.0, 159.38], [164.0, 166.36], [168.0, 171.17], [172.0, 172.81], [175.0, 180.44], [181.0, 180.69], [181.0, 195.98], [197.0, 199.71]], "keep_status": [true, true, false, true, true, false, false, false, false, false, false, false, false, false, false, true, true, false, true, false, true, true], "silence_prob": [34.23, 35.49, 0.0, 34.1, 37.99, 97.43, 0.0, 67.13, 0.0, 0.0, 56.03, 58.72, 0.0, 0.0, 0.0, 47.94, 39.38, 0.0, 37.95, 0.0, 35.98, 47.94], "audiomae_on_audioset": [[["mains hum", 17.47], ["buzz", 17.0], ["hum", 16.51]], [["speech", 30.99], ["music", 25.39], ["buzz", 7.79]], null, [["fly, housefly", 24.98], ["livestock, farm animals, working animals", 18.03], ["insect", 13.53]], [["music", 33.89], ["throbbing", 15.96], ["whack, thwack", 9.17]], null, null, null, null, null, null, null, null, null, null, [["hum", 25.12], ["mains hum", 13.13], ["sine wave", 10.53]], [["gong", 33.62], ["music", 25.68], ["gasp", 10.68]], null, [["gong", 21.95], ["speech", 19.47], ["machine gun", 6.93]], null, [["music", 22.19], ["noise", 9.12], ["electric shaver, electric razor", 5.84]], [["music", 37.09], ["hum", 7.64], ["speech", 7.47]]], "duration": [29.67, 10.52, 1.54, 25.43, 6.39, 2.06, -0.23, 2.15, 1.19, 1.52, 2.29, 2.35, 1.17, 0.92, 0.38, 2.36, 3.17, 0.81, 5.44, -0.31, 14.98, 2.71]} \ No newline at end of file diff --git a/annotations_filtered/tX74H9IuYdM_filtered.json b/annotations_filtered/tX74H9IuYdM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ccaf40a5e574848754ecedd46496b3ae9941a8e9 --- /dev/null +++ b/annotations_filtered/tX74H9IuYdM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.32], [9.0, 22.44], [23.0, 33.08], [34.0, 34.82], [36.0, 41.37], [43.0, 43.09], [48.0, 48.98], [51.0, 52.73], [55.0, 55.83], [60.0, 60.49], [64.0, 64.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.82, 68.15, 96.04, 0.0, 73.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [2.32, 13.44, 10.08, 0.82, 5.37, 0.09, 0.98, 1.73, 0.83, 0.49, 0.96]} \ No newline at end of file diff --git a/annotations_filtered/tXF23iSwW3I_filtered.json b/annotations_filtered/tXF23iSwW3I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..383bb02a1f53557dfe18b9f11bf41914543cc25d --- /dev/null +++ b/annotations_filtered/tXF23iSwW3I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 31.19], [36.0, 36.59]], "keep_status": [false, false], "silence_prob": [33.95, 0.0], "audiomae_on_audioset": [[["music", 44.19], ["hum", 24.1], ["throbbing", 12.37]], null], "duration": [23.19, 0.59]} \ No newline at end of file diff --git a/annotations_filtered/tXNMNMLQzwg_filtered.json b/annotations_filtered/tXNMNMLQzwg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ee4db71196b4f23eec1bd4292add410ee09116fa --- /dev/null +++ b/annotations_filtered/tXNMNMLQzwg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 24.92], [34.0, 34.2], [36.0, 36.85], [38.0, 38.31], [47.0, 47.04], [57.0, 57.2], [63.0, 65.28], [67.0, 66.83], [68.0, 67.81], [80.0, 80.47], [85.0, 85.73], [86.0, 86.61], [93.0, 95.35], [127.0, 126.96], [140.0, 139.68], [140.0, 139.97], [144.0, 144.32], [147.0, 146.79], [150.0, 149.76], [156.0, 156.64], [157.0, 159.76], [165.0, 168.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.71, 0.0, 0.0, 0.0, 0.0, 0.0, 92.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.17, 99.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.08, 0.2, 0.85, 0.31, 0.04, 0.2, 2.28, -0.17, -0.19, 0.47, 0.73, 0.61, 2.35, -0.04, -0.32, -0.03, 0.32, -0.21, -0.24, 0.64, 2.76, 3.51]} \ No newline at end of file diff --git a/annotations_filtered/tXhTaL04ByA_filtered.json b/annotations_filtered/tXhTaL04ByA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a6350de73e52b9a0adf867c7cfe9181f91f51859 --- /dev/null +++ b/annotations_filtered/tXhTaL04ByA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.18], [8.0, 8.78], [9.0, 9.64], [11.0, 13.12], [13.0, 16.51], [17.0, 17.37], [19.0, 20.43], [21.0, 21.47], [25.0, 25.41], [32.0, 37.64], [39.0, 40.58], [42.0, 50.8], [52.0, 52.51], [53.0, 62.07], [63.0, 75.44], [76.0, 80.55], [81.0, 81.21], [84.0, 84.32], [86.0, 93.06], [93.0, 93.88], [99.0, 99.22], [100.0, 100.48], [101.0, 101.39], [103.0, 103.91], [109.0, 109.78], [111.0, 111.23], [112.0, 112.67], [114.0, 115.57]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 50.66, 43.35, 0.0, 0.0, 0.0, 0.0, 48.65, 0.0, 35.2, 0.0, 46.75, 31.05, 33.2, 0.0, 0.0, 34.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 66.6], ["telephone", 10.35], ["sidetone", 9.51]], null, null, null, null, [["music", 31.02], ["theremin", 20.11], ["hum", 10.04]], null, [["music", 50.23], ["theremin", 24.25], ["musical instrument", 6.87]], null, [["theremin", 45.3], ["hum", 19.09], ["music", 13.7]], [["theremin", 57.13], ["music", 29.48], ["musical instrument", 3.07]], [["music", 28.92], ["foghorn", 7.98], ["speech", 7.23]], null, null, [["theremin", 23.36], ["music", 17.12], ["synthesizer", 10.42]], null, null, null, null, null, null, null, null, null], "duration": [1.18, 0.78, 0.64, 2.12, 3.51, 0.37, 1.43, 0.47, 0.41, 5.64, 1.58, 8.8, 0.51, 9.07, 12.44, 4.55, 0.21, 0.32, 7.06, 0.88, 0.22, 0.48, 0.39, 0.91, 0.78, 0.23, 0.67, 1.57]} \ No newline at end of file diff --git a/annotations_filtered/tXp79rAS5JQ_filtered.json b/annotations_filtered/tXp79rAS5JQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9de762be58f0f6e12582cd6d8b06d75ccc5f89be --- /dev/null +++ b/annotations_filtered/tXp79rAS5JQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 6.44], [7.0, 17.56], [19.0, 30.21], [31.0, 34.53], [36.0, 63.36], [67.0, 67.0], [72.0, 75.19], [76.0, 87.64], [94.0, 97.43], [120.0, 124.65], [127.0, 127.57], [131.0, 131.33], [136.0, 139.13], [142.0, 141.78], [146.0, 146.69], [153.0, 153.06]], "keep_status": [false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [36.89, 40.64, 46.61, 50.26, 31.7, 0.0, 64.75, 38.37, 39.19, 49.59, 0.0, 0.0, 48.65, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["theremin", 39.41], ["music", 33.9], ["synthesizer", 8.55]], [["rumble", 15.7], ["music", 13.28], ["hum", 11.81]], [["whale vocalization", 81.06], ["speech", 6.78], ["singing bowl", 2.44]], null, [["hum", 34.12], ["music", 32.72], ["throbbing", 9.14]], null, null, [["music", 43.05], ["singing bowl", 11.19], ["ambient music", 10.92]], [["speech", 60.8], ["music", 13.72], ["hum", 1.95]], [["whale vocalization", 94.62], ["music", 1.85], ["hum", 0.58]], null, null, [["whale vocalization", 40.6], ["music", 31.09], ["theremin", 5.77]], null, null, null], "duration": [5.44, 10.56, 11.21, 3.53, 27.36, 0.0, 3.19, 11.64, 3.43, 4.65, 0.57, 0.33, 3.13, -0.22, 0.69, 0.06]} \ No newline at end of file diff --git a/annotations_filtered/tXrxBy-CDPc_filtered.json b/annotations_filtered/tXrxBy-CDPc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e222f7cba26b3f6dcc0adf161925dc05bc1cb62d --- /dev/null +++ b/annotations_filtered/tXrxBy-CDPc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.92], [10.0, 11.65], [12.0, 13.56], [16.0, 18.64], [20.0, 20.58], [21.0, 23.09], [25.0, 28.58], [30.0, 35.7], [37.0, 37.17], [39.0, 39.19], [41.0, 44.1], [45.0, 46.21], [48.0, 50.25], [51.0, 51.71], [52.0, 51.8], [52.0, 52.15], [53.0, 53.49], [54.0, 56.57], [57.0, 57.38], [58.0, 58.72], [59.0, 59.86], [63.0, 63.8], [66.0, 66.99], [74.0, 77.43], [82.0, 83.49], [85.0, 85.72], [87.0, 88.62], [91.0, 91.07], [92.0, 92.7], [94.0, 94.76], [96.0, 97.04], [99.0, 101.61], [103.0, 104.46], [114.0, 115.06], [116.0, 118.3], [120.0, 122.88], [125.0, 125.34], [126.0, 128.09], [131.0, 131.08], [131.0, 132.21], [134.0, 134.23], [138.0, 138.96], [139.0, 140.49], [141.0, 141.44], [142.0, 142.65], [145.0, 146.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 77.36, 0.0, 82.43, 99.84, 64.86, 0.0, 0.0, 69.61, 0.0, 63.31, 0.0, 0.0, 0.0, 0.0, 50.86, 0.0, 0.0, 0.0, 0.0, 0.0, 98.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.81, 0.0, 0.0, 82.07, 80.82, 0.0, 88.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.92, 1.65, 1.56, 2.64, 0.58, 2.09, 3.58, 5.7, 0.17, 0.19, 3.1, 1.21, 2.25, 0.71, -0.2, 0.15, 0.49, 2.57, 0.38, 0.72, 0.86, 0.8, 0.99, 3.43, 1.49, 0.72, 1.62, 0.07, 0.7, 0.76, 1.04, 2.61, 1.46, 1.06, 2.3, 2.88, 0.34, 2.09, 0.08, 1.21, 0.23, 0.96, 1.49, 0.44, 0.65, 1.65]} \ No newline at end of file diff --git a/annotations_filtered/tY5el7dZ9H0_filtered.json b/annotations_filtered/tY5el7dZ9H0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e22040669cd01f24fb537c48a12b740f59ff094d --- /dev/null +++ b/annotations_filtered/tY5el7dZ9H0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 21.02], [22.0, 22.94], [23.0, 24.14], [25.0, 26.65], [30.0, 31.45], [34.0, 34.97], [36.0, 36.85], [38.0, 39.02], [41.0, 42.2], [44.0, 45.49], [46.0, 46.57], [47.0, 47.73], [49.0, 50.3], [51.0, 51.63], [53.0, 54.26], [56.0, 60.54], [62.0, 62.21], [63.0, 63.73], [69.0, 69.33], [70.0, 70.95], [72.0, 73.03], [74.0, 75.34], [77.0, 76.87], [78.0, 77.73], [81.0, 81.51], [83.0, 83.93], [85.0, 86.14], [90.0, 90.51], [93.0, 93.56], [95.0, 96.45], [98.0, 99.3], [104.0, 106.81], [108.0, 117.86], [120.0, 120.8], [122.0, 126.32], [127.0, 128.26], [130.0, 130.79], [132.0, 132.65], [134.0, 135.24], [137.0, 173.79], [175.0, 176.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [65.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.4, 77.87, 0.0, 75.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [9.02, 0.94, 1.14, 1.65, 1.45, 0.97, 0.85, 1.02, 1.2, 1.49, 0.57, 0.73, 1.3, 0.63, 1.26, 4.54, 0.21, 0.73, 0.33, 0.95, 1.03, 1.34, -0.13, -0.27, 0.51, 0.93, 1.14, 0.51, 0.56, 1.45, 1.3, 2.81, 9.86, 0.8, 4.32, 1.26, 0.79, 0.65, 1.24, 36.79, 1.72]} \ No newline at end of file diff --git a/annotations_filtered/tYGiUUnoZhk_filtered.json b/annotations_filtered/tYGiUUnoZhk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b317e95fc523ee858ada594430b42cee5c5ab6b0 --- /dev/null +++ b/annotations_filtered/tYGiUUnoZhk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.38], [2.0, 2.57], [3.0, 4.31], [5.0, 5.21], [8.0, 8.34], [11.0, 11.18], [13.0, 13.44], [14.0, 14.66], [17.0, 16.83], [19.0, 20.98], [27.0, 27.63], [29.0, 30.01], [30.0, 31.45], [34.0, 34.65], [42.0, 42.26], [44.0, 46.09], [47.0, 50.63], [51.0, 52.07], [52.0, 56.02], [60.0, 61.8], [62.0, 65.25], [68.0, 70.38], [76.0, 77.84], [79.0, 80.82], [84.0, 85.19], [90.0, 90.88], [91.0, 91.91], [93.0, 94.59], [97.0, 106.49], [109.0, 124.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.27, 57.01, 0.0, 46.36, 0.0, 34.09, 45.49, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.63, 47.94], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 38.14], ["music", 17.61], ["hum", 13.11]], null, [["music", 51.28], ["speech", 29.29], ["didgeridoo", 3.66]], [["music", 58.34], ["synthesizer", 8.79], ["didgeridoo", 8.66]], null, null, null, null, null, null, [["hum", 21.36], ["mains hum", 16.42], ["buzz", 13.03]], [["throbbing", 14.55], ["fly, housefly", 7.98], ["speech", 5.49]]], "duration": [0.38, 0.57, 1.31, 0.21, 0.34, 0.18, 0.44, 0.66, -0.17, 1.98, 0.63, 1.01, 1.45, 0.65, 0.26, 2.09, 3.63, 1.07, 4.02, 1.8, 3.25, 2.38, 1.84, 1.82, 1.19, 0.88, 0.91, 1.59, 9.49, 15.34]} \ No newline at end of file diff --git a/annotations_filtered/tYPUzX8KTXw_filtered.json b/annotations_filtered/tYPUzX8KTXw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..32e9201e7882c5e430ef6e3d086e56f4b0124ed8 --- /dev/null +++ b/annotations_filtered/tYPUzX8KTXw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.82], [3.0, 4.28], [8.0, 37.18], [44.0, 43.56], [44.0, 44.31], [45.0, 46.04], [51.0, 50.9], [52.0, 52.84], [54.0, 54.13], [54.0, 57.67], [65.0, 65.43], [66.0, 65.75], [67.0, 67.88], [71.0, 71.64], [73.0, 73.4], [76.0, 77.26], [79.0, 79.79], [82.0, 81.92], [86.0, 87.0], [92.0, 91.83], [93.0, 92.69], [95.0, 95.77], [96.0, 96.53], [106.0, 105.97], [108.0, 108.58], [111.0, 111.84], [113.0, 113.41], [114.0, 114.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 35.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 67.35], ["synthesizer", 6.64], ["theremin", 3.74]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.82, 1.28, 29.18, -0.44, 0.31, 1.04, -0.1, 0.84, 0.13, 3.67, 0.43, -0.25, 0.88, 0.64, 0.4, 1.26, 0.79, -0.08, 1.0, -0.17, -0.31, 0.77, 0.53, -0.03, 0.58, 0.84, 0.41, 0.44]} \ No newline at end of file diff --git a/annotations_filtered/tYRzkKtCRuY_filtered.json b/annotations_filtered/tYRzkKtCRuY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..98d5b70cb27e3efe8f796442528716a0164a129f --- /dev/null +++ b/annotations_filtered/tYRzkKtCRuY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.15], [10.0, 10.08], [11.0, 13.37], [15.0, 15.9], [18.0, 19.18], [20.0, 22.03], [25.0, 28.36], [31.0, 32.86], [34.0, 35.55], [36.0, 39.78], [40.0, 41.55], [43.0, 43.65], [47.0, 48.96]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [68.8, 0.0, 71.57, 0.0, 0.0, 37.49, 81.71, 0.0, 0.0, 40.61, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 32.39], ["music", 29.25], ["musical instrument", 3.08]], null, null, null, [["music", 41.02], ["speech", 16.1], ["mains hum", 7.58]], null, null, null], "duration": [4.15, 0.08, 2.37, 0.9, 1.18, 2.03, 3.36, 1.86, 1.55, 3.78, 1.55, 0.65, 1.96]} \ No newline at end of file diff --git a/annotations_filtered/tYf5ENc39dQ_filtered.json b/annotations_filtered/tYf5ENc39dQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b48d0219357da8c185327b5e2310b9bed3d0f3a --- /dev/null +++ b/annotations_filtered/tYf5ENc39dQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 15.3], [17.0, 24.11], [26.0, 30.94], [32.0, 34.84], [36.0, 50.36], [55.0, 63.09], [68.0, 91.22], [93.0, 93.01], [94.0, 103.69], [106.0, 109.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.05, 98.66, 72.31, 94.66, 55.39, 42.6, 63.42, 0.0, 56.55, 62.89], "audiomae_on_audioset": [null, null, null, null, null, [["music", 58.69], ["cello", 10.75], ["bowed string instrument", 5.54]], null, null, null, null], "duration": [3.3, 7.11, 4.94, 2.84, 14.36, 8.09, 23.22, 0.01, 9.69, 3.46]} \ No newline at end of file diff --git a/annotations_filtered/tYmvgGjSiN8_filtered.json b/annotations_filtered/tYmvgGjSiN8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..998bb0a9bb3d0405f7db5a3951d08f8eb36f2c12 --- /dev/null +++ b/annotations_filtered/tYmvgGjSiN8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.84], [42.0, 45.18], [61.0, 62.38], [64.0, 64.23], [69.0, 71.32], [89.0, 93.77], [116.0, 121.64]], "keep_status": [false, false, false, false, false, true, false], "silence_prob": [0.0, 35.99, 0.0, 0.0, 60.14, 36.17, 30.9], "audiomae_on_audioset": [null, [["music", 66.37], ["carnatic music", 12.4], ["mantra", 4.66]], null, null, null, [["music", 27.0], ["humming", 21.25], ["electronic tuner", 8.24]], [["music", 67.45], ["guitar", 6.9], ["musical instrument", 4.88]]], "duration": [0.84, 3.18, 1.38, 0.23, 2.32, 4.77, 5.64]} \ No newline at end of file diff --git a/annotations_filtered/tYs7uguB_JQ_filtered.json b/annotations_filtered/tYs7uguB_JQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef26e039d4e3db916cb8071eac674e3fad5a1702 --- /dev/null +++ b/annotations_filtered/tYs7uguB_JQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.05], [3.0, 3.08], [4.0, 36.24], [39.0, 120.33], [121.0, 122.18], [125.0, 137.61], [139.0, 160.46], [160.0, 160.52], [161.0, 160.59], [161.0, 163.8], [165.0, 165.97]], "keep_status": [false, false, false, false, false, true, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 32.14, 32.56, 0.0, 0.0, 49.87, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 36.75], ["throbbing", 17.77], ["speech", 13.98]], [["livestock, farm animals, working animals", 25.67], ["cattle, bovinae", 22.56], ["moo", 14.7]], null, null, [["music", 11.5], ["mosquito", 11.49], ["frog", 11.11]], null], "duration": [0.05, 0.08, 32.24, 81.33, 1.18, 12.61, 21.46, 0.52, -0.41, 2.8, 0.97]} \ No newline at end of file diff --git a/annotations_filtered/tZ97edZTrHQ_filtered.json b/annotations_filtered/tZ97edZTrHQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2184c4f1680863032605b7d88d7947ce58bcf5d6 --- /dev/null +++ b/annotations_filtered/tZ97edZTrHQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 22.13], [23.0, 25.98], [28.0, 29.24], [32.0, 39.58], [40.0, 41.34], [46.0, 50.18], [57.0, 57.59]], "keep_status": [false, true, false, false, false, true, false], "silence_prob": [0.0, 32.94, 0.0, 35.62, 0.0, 34.89, 0.0], "audiomae_on_audioset": [null, [["music", 31.21], ["speech", 13.91], ["didgeridoo", 12.73]], null, [["music", 66.15], ["musical instrument", 11.43], ["synthesizer", 4.67]], null, [["music", 29.74], ["sidetone", 13.59], ["speech", 13.49]], null], "duration": [1.13, 2.98, 1.24, 7.58, 1.34, 4.18, 0.59]} \ No newline at end of file diff --git a/annotations_filtered/t_9GTwEOdkY_filtered.json b/annotations_filtered/t_9GTwEOdkY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f824d6da33bab22cdc9c7ac4416e92d70c23fd7f --- /dev/null +++ b/annotations_filtered/t_9GTwEOdkY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 26.0], [27.0, 31.92], [37.0, 37.86], [44.0, 52.68], [54.0, 55.7], [57.0, 110.47], [111.0, 112.67], [114.0, 114.51], [118.0, 132.88], [141.0, 141.86], [143.0, 173.58]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 42.37, 0.0, 53.65, 0.0, 0.0, 0.0, 0.0, 41.32, 0.0, 0.0], "audiomae_on_audioset": [null, [["singing bowl", 41.27], ["gong", 18.72], ["music", 8.97]], null, null, null, null, null, null, [["hum", 39.41], ["mains hum", 27.16], ["music", 12.84]], null, null], "duration": [1.0, 4.92, 0.86, 8.68, 1.7, 53.47, 1.67, 0.51, 14.88, 0.86, 30.58]} \ No newline at end of file diff --git a/annotations_filtered/t_BSGcc9XkY_filtered.json b/annotations_filtered/t_BSGcc9XkY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..44bfe43aec6b922b125c613e789e5b2feb68865f --- /dev/null +++ b/annotations_filtered/t_BSGcc9XkY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.23], [9.0, 10.35], [12.0, 12.75], [13.0, 13.54], [14.0, 26.96], [35.0, 42.47], [44.0, 49.52], [52.0, 53.4], [55.0, 63.22], [64.0, 66.02], [67.0, 91.3], [92.0, 92.52], [93.0, 94.63], [95.0, 97.39], [98.0, 99.23], [100.0, 107.52], [109.0, 109.19], [112.0, 119.91], [122.0, 123.58], [125.0, 125.22], [126.0, 126.27], [127.0, 127.45], [129.0, 130.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 52.1, 54.9, 61.77, 0.0, 67.13, 59.24, 52.98, 0.0, 0.0, 92.8, 0.0, 45.82, 0.0, 52.8, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 30.97], ["electric shaver, electric razor", 13.99], ["radio", 7.2]], null, null, null, null, null, null, null], "duration": [1.23, 1.35, 0.75, 0.54, 12.96, 7.47, 5.52, 1.4, 8.22, 2.02, 24.3, 0.52, 1.63, 2.39, 1.23, 7.52, 0.19, 7.91, 1.58, 0.22, 0.27, 0.45, 1.44]} \ No newline at end of file diff --git a/annotations_filtered/t_FRWUPcR7Y_filtered.json b/annotations_filtered/t_FRWUPcR7Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dc91e2d29b7313b6e7a2700a60713d85f0d8acad --- /dev/null +++ b/annotations_filtered/t_FRWUPcR7Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.12], [13.0, 18.76], [22.0, 22.18], [27.0, 28.19], [36.0, 36.69], [38.0, 38.08], [39.0, 39.55], [41.0, 41.03]], "keep_status": [true, true, false, false, false, false, false, false], "silence_prob": [39.78, 41.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 30.56], ["bouncing", 9.11], ["music", 4.43]], [["noise", 18.0], ["hum", 6.67], ["thunk", 6.63]], null, null, null, null, null, null], "duration": [2.12, 5.76, 0.18, 1.19, 0.69, 0.08, 0.55, 0.03]} \ No newline at end of file diff --git a/annotations_filtered/t_JOKNfSn1w_filtered.json b/annotations_filtered/t_JOKNfSn1w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4fd8cc60c2821295a3c912ac6f7642b51bf11c40 --- /dev/null +++ b/annotations_filtered/t_JOKNfSn1w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 52.32], [53.0, 53.18], [54.0, 54.95], [56.0, 58.94], [60.0, 69.03], [70.0, 71.34], [74.0, 78.38], [79.0, 114.3], [116.0, 135.62], [136.0, 140.16], [141.0, 140.95], [141.0, 169.25], [170.0, 172.91], [173.0, 181.84], [182.0, 186.46]], "keep_status": [false, false, false, true, false, false, true, false, true, false, false, false, true, true, true], "silence_prob": [0.0, 0.0, 0.0, 42.96, 31.82, 0.0, 28.77, 0.0, 29.49, 37.03, 0.0, 29.7, 28.75, 29.38, 30.02], "audiomae_on_audioset": [null, null, null, [["hum", 14.07], ["fly, housefly", 11.28], ["moo", 9.39]], [["mains hum", 38.35], ["hum", 28.03], ["fly, housefly", 9.47]], null, [["music", 20.81], ["sound effect", 7.95], ["whoosh, swoosh, swish", 6.27]], null, [["music", 17.71], ["livestock, farm animals, working animals", 10.01], ["throbbing", 7.8]], [["music", 63.28], ["squish", 8.44], ["crackle", 3.46]], null, [["music", 60.42], ["speech", 7.78], ["electronic music", 7.72]], [["rumble", 25.23], ["speech", 11.95], ["music", 6.26]], [["animal", 39.0], ["music", 12.86], ["speech", 6.81]], [["music", 51.09], ["throbbing", 2.45], ["musical instrument", 2.35]]], "duration": [49.32, 0.18, 0.95, 2.94, 9.03, 1.34, 4.38, 35.3, 19.62, 4.16, -0.05, 28.25, 2.91, 8.84, 4.46]} \ No newline at end of file diff --git a/annotations_filtered/t_NZNgm66xI_filtered.json b/annotations_filtered/t_NZNgm66xI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..71407d5d5448e38ebe31b283142a7827516493b8 --- /dev/null +++ b/annotations_filtered/t_NZNgm66xI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 22.71], [27.0, 27.85], [32.0, 33.4], [35.0, 35.88], [40.0, 42.85], [43.0, 45.3], [48.0, 48.81], [54.0, 55.56], [57.0, 58.78], [61.0, 62.6], [65.0, 66.78], [69.0, 70.36], [73.0, 74.68], [76.0, 78.75], [80.0, 82.07], [84.0, 85.83], [87.0, 99.62], [108.0, 108.53], [110.0, 115.26], [120.0, 131.31], [131.0, 131.45]], "keep_status": [true, false, false, false, true, true, false, false, false, false, false, false, false, true, false, false, true, false, true, true, false], "silence_prob": [41.74, 0.0, 0.0, 0.0, 44.78, 48.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.87, 52.86, 0.0, 33.88, 0.0, 33.39, 29.73, 0.0], "audiomae_on_audioset": [[["animal", 15.84], ["frog", 12.1], ["speech", 8.77]], null, null, null, [["whimper", 19.62], ["speech", 13.1], ["sine wave", 8.5]], [["cattle, bovinae", 14.94], ["moo", 13.47], ["animal", 12.0]], null, null, null, null, null, null, null, [["music", 26.39], ["speech", 19.1], ["hum", 6.97]], null, null, [["music", 39.47], ["brass instrument", 9.28], ["speech", 8.71]], null, [["foghorn", 41.59], ["speech", 13.48], ["music", 9.96]], [["theremin", 36.86], ["music", 23.02], ["echo", 5.89]], null], "duration": [12.71, 0.85, 1.4, 0.88, 2.85, 2.3, 0.81, 1.56, 1.78, 1.6, 1.78, 1.36, 1.68, 2.75, 2.07, 1.83, 12.62, 0.53, 5.26, 11.31, 0.45]} \ No newline at end of file diff --git a/annotations_filtered/t_wR8zbM5VI_filtered.json b/annotations_filtered/t_wR8zbM5VI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9055c27a95e19268bc9149046c60d069895f7718 --- /dev/null +++ b/annotations_filtered/t_wR8zbM5VI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.95], [18.0, 20.26], [27.0, 37.34], [38.0, 64.37], [70.0, 71.93], [74.0, 81.77], [91.0, 93.18], [98.0, 105.75], [109.0, 118.99], [121.0, 123.84], [127.0, 132.36], [135.0, 136.07]], "keep_status": [false, true, true, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 39.27, 41.56, 87.55, 0.0, 59.77, 40.55, 66.51, 94.07, 79.07, 44.66, 0.0], "audiomae_on_audioset": [null, [["music", 39.49], ["chant", 5.94], ["speech", 4.82]], [["sheep", 22.27], ["speech", 21.11], ["music", 17.84]], null, null, null, [["speech", 79.53], ["grunt", 3.07], ["boing", 2.17]], null, null, null, [["music", 57.53], ["speech", 4.21], ["percussion", 2.47]], null], "duration": [1.95, 2.26, 10.34, 26.37, 1.93, 7.77, 2.18, 7.75, 9.99, 2.84, 5.36, 1.07]} \ No newline at end of file diff --git a/annotations_filtered/taL06OVt4kQ_filtered.json b/annotations_filtered/taL06OVt4kQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b818dee21c70fc49eb88fb7dba630262bc40a57 --- /dev/null +++ b/annotations_filtered/taL06OVt4kQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 15.13], [16.0, 16.88], [18.0, 38.1], [38.0, 39.14], [40.0, 41.17], [42.0, 64.4], [66.0, 67.02], [69.0, 84.91], [85.0, 94.26], [94.0, 138.77], [139.0, 143.95], [146.0, 150.85], [152.0, 159.8], [161.0, 160.83]], "keep_status": [true, false, true, false, false, true, false, true, false, false, false, false, false, false], "silence_prob": [40.28, 0.0, 29.89, 0.0, 0.0, 31.16, 0.0, 46.43, 47.7, 0.0, 78.72, 60.6, 37.88, 0.0], "audiomae_on_audioset": [[["livestock, farm animals, working animals", 25.6], ["animal", 12.83], ["cattle, bovinae", 12.23]], null, [["music", 25.34], ["hum", 20.81], ["mains hum", 14.99]], null, null, [["explosion", 16.39], ["cattle, bovinae", 12.38], ["burst, pop", 9.78]], null, [["music", 35.67], ["speech", 8.48], ["cough", 8.21]], [["mains hum", 45.38], ["hum", 41.19], ["music", 3.23]], null, null, null, [["music", 47.62], ["mantra", 25.98], ["chant", 13.55]], null], "duration": [13.13, 0.88, 20.1, 1.14, 1.17, 22.4, 1.02, 15.91, 9.26, 44.77, 4.95, 4.85, 7.8, -0.17]} \ No newline at end of file diff --git a/annotations_filtered/taOda6ZwWyw_filtered.json b/annotations_filtered/taOda6ZwWyw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..57e228c333302d889d30f22517105d1afc2e0a7c --- /dev/null +++ b/annotations_filtered/taOda6ZwWyw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.13], [22.0, 24.66], [26.0, 26.37], [27.0, 31.9], [57.0, 57.94], [82.0, 84.52], [89.0, 90.93], [93.0, 109.27], [109.0, 109.46], [109.0, 113.32], [114.0, 118.08], [119.0, 118.98]], "keep_status": [false, false, false, true, false, true, false, true, false, true, true, false], "silence_prob": [0.0, 46.02, 0.0, 31.46, 0.0, 29.92, 0.0, 29.35, 0.0, 29.48, 35.1, 0.0], "audiomae_on_audioset": [null, [["music", 61.17], ["musical instrument", 10.79], ["speech", 7.12]], null, [["music", 30.25], ["speech", 24.51], ["musical instrument", 7.26]], null, [["music", 35.64], ["speech", 10.25], ["throbbing", 7.03]], null, [["music", 41.32], ["animal", 11.02], ["speech", 6.91]], null, [["moo", 27.94], ["music", 21.2], ["livestock, farm animals, working animals", 20.67]], [["music", 24.01], ["didgeridoo", 21.86], ["foghorn", 5.46]], null], "duration": [1.13, 2.66, 0.37, 4.9, 0.94, 2.52, 1.93, 16.27, 0.46, 4.32, 4.08, -0.02]} \ No newline at end of file diff --git a/annotations_filtered/tab4Nxd8GlY_filtered.json b/annotations_filtered/tab4Nxd8GlY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4b9b42f83f77c724b0c3a90040a23115e0b17acc --- /dev/null +++ b/annotations_filtered/tab4Nxd8GlY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[73.0, 83.59]], "keep_status": [false], "silence_prob": [50.81], "audiomae_on_audioset": [null], "duration": [10.59]} \ No newline at end of file diff --git a/annotations_filtered/taf0MZ5VgDc_filtered.json b/annotations_filtered/taf0MZ5VgDc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d0fa991726e7d567a79b83f335b99a5edf0cc1c --- /dev/null +++ b/annotations_filtered/taf0MZ5VgDc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.48], [4.0, 3.75], [4.0, 6.42], [15.0, 14.59], [15.0, 14.62], [22.0, 24.85], [29.0, 44.71], [47.0, 52.74], [55.0, 65.72], [67.0, 67.46], [71.0, 79.78], [83.0, 83.86], [94.0, 95.08], [96.0, 97.19], [102.0, 101.98], [108.0, 113.91]], "keep_status": [false, false, true, false, false, false, false, true, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 43.03, 0.0, 0.0, 60.05, 30.53, 49.68, 32.05, 0.0, 37.86, 0.0, 0.0, 0.0, 0.0, 30.59], "audiomae_on_audioset": [null, null, [["music", 38.66], ["throbbing", 14.01], ["animal", 10.53]], null, null, null, [["music", 70.05], ["throbbing", 5.23], ["whack, thwack", 2.79]], [["hum", 27.87], ["music", 23.8], ["throbbing", 11.17]], [["music", 25.51], ["throbbing", 18.38], ["hum", 9.46]], null, [["speech", 41.88], ["music", 34.31], ["boing", 5.28]], null, null, null, null, [["electric shaver, electric razor", 10.26], ["whack, thwack", 9.4], ["speech", 6.87]]], "duration": [0.48, -0.25, 2.42, -0.41, -0.38, 2.85, 15.71, 5.74, 10.72, 0.46, 8.78, 0.86, 1.08, 1.19, -0.02, 5.91]} \ No newline at end of file diff --git a/annotations_filtered/tagDBoX24S0_filtered.json b/annotations_filtered/tagDBoX24S0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..903e9a3ab1efdca5c5ecef6584c4d449efc07d01 --- /dev/null +++ b/annotations_filtered/tagDBoX24S0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.58], [6.0, 28.41], [29.0, 32.19], [34.0, 54.13], [55.0, 56.91], [58.0, 71.95], [73.0, 73.33], [74.0, 82.05], [84.0, 90.71], [91.0, 94.0], [94.0, 96.03], [97.0, 97.24], [99.0, 100.41], [101.0, 107.08], [108.0, 109.75], [114.0, 115.82], [117.0, 120.72], [122.0, 125.47], [127.0, 127.48], [129.0, 135.99], [144.0, 151.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.98, 100.0, 99.76, 0.0, 100.0, 0.0, 99.88, 100.0, 100.0, 92.64, 0.0, 0.0, 99.8, 0.0, 0.0, 96.66, 95.09, 0.0, 99.91, 84.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.58, 22.41, 3.19, 20.13, 1.91, 13.95, 0.33, 8.05, 6.71, 3.0, 2.03, 0.24, 1.41, 6.08, 1.75, 1.82, 3.72, 3.47, 0.48, 6.99, 7.11]} \ No newline at end of file diff --git a/annotations_filtered/tb9kVTItw3I_filtered.json b/annotations_filtered/tb9kVTItw3I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e156a5971c2feb27d3fc238a66aa3e7899dd87b --- /dev/null +++ b/annotations_filtered/tb9kVTItw3I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 34.35], [38.0, 47.48], [48.0, 48.79], [53.0, 53.28], [54.0, 54.92], [61.0, 62.34], [72.0, 75.27], [76.0, 77.06], [78.0, 94.9], [99.0, 116.48], [116.0, 116.51], [118.0, 132.88], [134.0, 138.15], [144.0, 149.61]], "keep_status": [true, false, false, false, false, false, true, false, true, true, false, false, true, true], "silence_prob": [29.69, 32.2, 0.0, 0.0, 0.0, 0.0, 32.4, 0.0, 30.21, 31.72, 0.0, 30.56, 31.48, 31.54], "audiomae_on_audioset": [[["whale vocalization", 22.14], ["fart", 8.4], ["fly, housefly", 7.31]], [["music", 64.52], ["didgeridoo", 3.02], ["whale vocalization", 2.71]], null, null, null, null, [["livestock, farm animals, working animals", 24.03], ["cattle, bovinae", 19.9], ["moo", 13.53]], null, [["livestock, farm animals, working animals", 27.56], ["speech", 21.23], ["animal", 12.02]], [["speech", 43.39], ["buzz", 6.9], ["hum", 3.12]], null, [["music", 77.24], ["boing", 2.6], ["didgeridoo", 2.51]], [["music", 20.91], ["cattle, bovinae", 8.43], ["groan", 8.14]], [["roaring cats (lions, tigers)", 23.24], ["wild animals", 20.71], ["music", 16.6]]], "duration": [8.35, 9.48, 0.79, 0.28, 0.92, 1.34, 3.27, 1.06, 16.9, 17.48, 0.51, 14.88, 4.15, 5.61]} \ No newline at end of file diff --git a/annotations_filtered/tbdHhLOzT-Y_filtered.json b/annotations_filtered/tbdHhLOzT-Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..707ba6e09e496a27ba46f024f7bbbf509d64bbbb --- /dev/null +++ b/annotations_filtered/tbdHhLOzT-Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 18.74], [20.0, 21.54], [37.0, 49.81], [52.0, 60.66], [62.0, 82.51]], "keep_status": [true, false, false, true, true], "silence_prob": [35.54, 0.0, 31.21, 31.06, 32.11], "audiomae_on_audioset": [[["moo", 15.08], ["cattle, bovinae", 12.02], ["insect", 11.51]], null, [["music", 56.75], ["buzz", 21.69], ["animal", 2.22]], [["speech", 24.02], ["animal", 14.31], ["mosquito", 12.94]], [["music", 22.23], ["speech", 21.47], ["explosion", 8.66]]], "duration": [11.74, 1.54, 12.81, 8.66, 20.51]} \ No newline at end of file diff --git a/annotations_filtered/tc4zPfUtP8A_filtered.json b/annotations_filtered/tc4zPfUtP8A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e6d26a0a1c64b8b2b0bff6fb9bda3bf2add47b48 --- /dev/null +++ b/annotations_filtered/tc4zPfUtP8A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.92], [4.0, 5.37], [7.0, 7.69], [9.0, 11.33], [12.0, 12.72], [16.0, 18.06], [19.0, 19.65], [25.0, 26.16], [28.0, 28.56], [39.0, 39.58], [50.0, 50.25], [64.0, 64.2], [67.0, 69.79], [70.0, 71.98], [73.0, 75.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 97.54, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.87, 0.0, 88.28], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.92, 1.37, 0.69, 2.33, 0.72, 2.06, 0.65, 1.16, 0.56, 0.58, 0.25, 0.2, 2.79, 1.98, 2.73]} \ No newline at end of file diff --git a/annotations_filtered/tcCo38aP8qc_filtered.json b/annotations_filtered/tcCo38aP8qc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..23255cd74686b5dec2654667d8a601eb7ce08d94 --- /dev/null +++ b/annotations_filtered/tcCo38aP8qc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.05], [4.0, 4.33], [7.0, 7.48], [8.0, 9.42], [13.0, 13.96], [15.0, 15.99], [17.0, 16.88], [19.0, 20.14], [21.0, 21.74], [23.0, 23.84], [26.0, 27.24], [28.0, 29.02], [35.0, 36.56], [40.0, 43.55], [47.0, 51.07], [60.0, 60.27], [63.0, 64.17], [66.0, 66.88], [70.0, 70.5], [72.0, 72.01], [85.0, 86.1], [88.0, 88.96], [91.0, 92.42], [94.0, 95.18], [102.0, 102.27], [108.0, 108.33], [109.0, 109.11], [112.0, 112.02], [117.0, 118.23], [120.0, 119.96], [122.0, 123.7], [125.0, 126.17], [127.0, 128.07], [131.0, 131.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.96, 73.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.05, 0.33, 0.48, 1.42, 0.96, 0.99, -0.12, 1.14, 0.74, 0.84, 1.24, 1.02, 1.56, 3.55, 4.07, 0.27, 1.17, 0.88, 0.5, 0.01, 1.1, 0.96, 1.42, 1.18, 0.27, 0.33, 0.11, 0.02, 1.23, -0.04, 1.7, 1.17, 1.07, 0.36]} \ No newline at end of file diff --git a/annotations_filtered/tcIaT5D4Iwc_filtered.json b/annotations_filtered/tcIaT5D4Iwc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..889d5a894adfea88544adc46f8ecec764f4b82ff --- /dev/null +++ b/annotations_filtered/tcIaT5D4Iwc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.99], [15.0, 16.5], [17.0, 17.61], [19.0, 20.53], [23.0, 23.8], [29.0, 28.97], [37.0, 42.48], [49.0, 51.46], [60.0, 60.99], [71.0, 71.71], [76.0, 76.52], [81.0, 81.18], [82.0, 83.2], [84.0, 85.06], [87.0, 88.62], [92.0, 92.33], [94.0, 94.02], [96.0, 97.92], [99.0, 100.65], [101.0, 107.62], [108.0, 110.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.65, 69.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.67, 52.22], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 74.0], ["horse", 4.99], ["clip-clop", 3.2]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 87.58], ["sidetone", 5.75], ["beatboxing", 0.89]], null], "duration": [0.99, 1.5, 0.61, 1.53, 0.8, -0.03, 5.48, 2.46, 0.99, 0.71, 0.52, 0.18, 1.2, 1.06, 1.62, 0.33, 0.02, 1.92, 1.65, 6.62, 2.0]} \ No newline at end of file diff --git a/annotations_filtered/tcR7LgBVTNE_filtered.json b/annotations_filtered/tcR7LgBVTNE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b82af30968ec45e6f12b1f98befd75a26499d22 --- /dev/null +++ b/annotations_filtered/tcR7LgBVTNE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.78], [8.0, 7.89], [8.0, 11.79], [13.0, 13.63], [15.0, 34.5], [37.0, 37.84], [38.0, 39.53], [41.0, 42.84], [45.0, 45.96], [46.0, 46.89], [48.0, 76.33], [94.0, 94.37], [99.0, 99.49], [105.0, 106.14], [108.0, 109.95], [111.0, 115.38], [116.0, 117.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 40.21, 0.0, 34.12, 0.0, 0.0, 0.0, 0.0, 0.0, 39.93, 0.0, 0.0, 0.0, 0.0, 37.35, 0.0], "audiomae_on_audioset": [null, null, [["speech", 71.52], ["sidetone", 6.57], ["stomach rumble", 5.85]], null, [["speech", 60.71], ["cat", 7.79], ["animal", 7.61]], null, null, null, null, null, [["sine wave", 36.28], ["dial tone", 12.36], ["sidetone", 11.6]], null, null, null, null, [["speech", 44.8], ["explosion", 18.33], ["burst, pop", 6.54]], null], "duration": [0.78, -0.11, 3.79, 0.63, 19.5, 0.84, 1.53, 1.84, 0.96, 0.89, 28.33, 0.37, 0.49, 1.14, 1.95, 4.38, 1.9]} \ No newline at end of file diff --git a/annotations_filtered/td3p2XKHP2M_filtered.json b/annotations_filtered/td3p2XKHP2M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6dc1828e1d7caeb6dffb7d63a9ac4913b7bfd35d --- /dev/null +++ b/annotations_filtered/td3p2XKHP2M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.25], [9.0, 8.88], [11.0, 12.66], [14.0, 14.57], [16.0, 17.05], [18.0, 17.96], [19.0, 20.85], [27.0, 27.14], [31.0, 31.21], [33.0, 33.91], [35.0, 35.5], [38.0, 37.94], [41.0, 41.13], [43.0, 43.61], [45.0, 45.76], [63.0, 62.9], [69.0, 69.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.25, -0.12, 1.66, 0.57, 1.05, -0.04, 1.85, 0.14, 0.21, 0.91, 0.5, -0.06, 0.13, 0.61, 0.76, -0.1, 0.92]} \ No newline at end of file diff --git a/annotations_filtered/tdADTzvJtSY_filtered.json b/annotations_filtered/tdADTzvJtSY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..872be4a9694b114280101b48733916e45cd833bc --- /dev/null +++ b/annotations_filtered/tdADTzvJtSY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.17], [10.0, 12.6], [14.0, 15.4], [18.0, 18.96], [22.0, 23.45], [25.0, 26.57], [27.0, 28.75], [32.0, 33.18], [36.0, 38.47], [40.0, 41.18], [42.0, 43.17], [45.0, 47.28], [48.0, 49.57], [51.0, 51.39], [53.0, 61.7], [63.0, 64.13], [66.0, 67.24], [69.0, 69.9], [73.0, 75.14], [77.0, 77.85], [79.0, 80.1], [82.0, 82.9], [89.0, 90.31], [92.0, 94.02], [95.0, 96.18], [97.0, 98.31], [100.0, 103.23], [105.0, 106.1], [110.0, 112.19], [113.0, 113.17], [114.0, 114.4], [115.0, 120.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.4, 99.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 75.39, 0.0, 0.0, 0.0, 0.0, 88.28, 0.0, 0.0, 100.0, 0.0, 73.67, 0.0, 0.0, 75.88], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.17, 2.6, 1.4, 0.96, 1.45, 1.57, 1.75, 1.18, 2.47, 1.18, 1.17, 2.28, 1.57, 0.39, 8.7, 1.13, 1.24, 0.9, 2.14, 0.85, 1.1, 0.9, 1.31, 2.02, 1.18, 1.31, 3.23, 1.1, 2.19, 0.17, 0.4, 5.48]} \ No newline at end of file diff --git a/annotations_filtered/tdCot34--pc_filtered.json b/annotations_filtered/tdCot34--pc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e4cc9a31826f1c709f54d286c89e3f907963c284 --- /dev/null +++ b/annotations_filtered/tdCot34--pc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.84], [3.0, 5.73], [9.0, 11.26], [13.0, 15.03], [16.0, 17.17], [20.0, 21.03], [26.0, 28.05], [29.0, 30.0], [30.0, 32.07], [33.0, 37.0], [40.0, 41.52], [45.0, 44.9], [47.0, 47.75], [49.0, 50.99], [52.0, 53.97], [57.0, 59.26], [60.0, 61.26], [62.0, 62.92], [65.0, 68.96], [69.0, 70.55], [72.0, 72.99], [76.0, 76.33], [79.0, 79.68], [81.0, 81.57], [83.0, 84.54], [86.0, 87.18], [89.0, 90.59], [96.0, 98.15], [100.0, 100.63], [102.0, 102.47], [104.0, 105.95], [109.0, 132.07], [133.0, 135.67], [137.0, 138.59], [141.0, 157.82], [160.0, 161.08], [166.0, 168.12], [169.0, 170.36], [172.0, 172.81]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 44.78, 69.34, 66.39, 0.0, 0.0, 68.41, 0.0, 42.51, 66.76, 0.0, 0.0, 0.0, 0.0, 0.0, 51.12, 0.0, 0.0, 66.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.97, 0.0, 0.0, 0.0, 66.51, 74.44, 0.0, 65.44, 0.0, 74.92, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 42.82], ["sidetone", 22.67], ["hum", 4.52]], null, null, null, null, null, null, [["hum", 25.16], ["sidetone", 19.02], ["mains hum", 9.69]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.84, 2.73, 2.26, 2.03, 1.17, 1.03, 2.05, 1.0, 2.07, 4.0, 1.52, -0.1, 0.75, 1.99, 1.97, 2.26, 1.26, 0.92, 3.96, 1.55, 0.99, 0.33, 0.68, 0.57, 1.54, 1.18, 1.59, 2.15, 0.63, 0.47, 1.95, 23.07, 2.67, 1.59, 16.82, 1.08, 2.12, 1.36, 0.81]} \ No newline at end of file diff --git a/annotations_filtered/tdMF1i45oks_filtered.json b/annotations_filtered/tdMF1i45oks_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1875ef36596643f25a8fa17057524635869da5e0 --- /dev/null +++ b/annotations_filtered/tdMF1i45oks_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 6.96], [8.0, 9.37], [10.0, 16.26], [17.0, 17.51], [18.0, 18.71], [19.0, 20.6], [23.0, 23.35], [27.0, 28.12], [29.0, 29.74], [35.0, 38.23], [40.0, 40.59], [48.0, 60.51], [62.0, 70.8], [74.0, 74.75], [76.0, 76.1], [76.0, 79.69], [81.0, 108.95], [110.0, 111.11], [112.0, 112.99], [120.0, 120.83], [123.0, 124.8], [125.0, 129.05], [130.0, 131.52], [133.0, 133.62], [136.0, 137.02], [137.0, 139.19], [140.0, 143.55], [145.0, 146.82], [147.0, 149.2], [154.0, 156.57], [159.0, 167.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [44.29, 0.0, 55.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.39, 0.0, 32.84, 34.42, 0.0, 0.0, 38.59, 33.72, 0.0, 0.0, 0.0, 0.0, 40.36, 0.0, 0.0, 0.0, 79.94, 83.88, 0.0, 55.6, 55.67, 57.97], "audiomae_on_audioset": [[["music", 35.56], ["hum", 20.24], ["whale vocalization", 14.62]], null, null, null, null, null, null, null, null, null, null, [["speech", 46.32], ["music", 11.93], ["sidetone", 3.65]], [["speech", 40.94], ["music", 22.6], ["explosion", 9.03]], null, null, [["whale vocalization", 89.49], ["music", 3.69], ["hum", 1.85]], [["music", 40.35], ["whale vocalization", 18.78], ["hum", 7.88]], null, null, null, null, [["speech", 32.41], ["music", 19.05], ["theremin", 12.7]], null, null, null, null, null, null, null, null, null], "duration": [5.96, 1.37, 6.26, 0.51, 0.71, 1.6, 0.35, 1.12, 0.74, 3.23, 0.59, 12.51, 8.8, 0.75, 0.1, 3.69, 27.95, 1.11, 0.99, 0.83, 1.8, 4.05, 1.52, 0.62, 1.02, 2.19, 3.55, 1.82, 2.2, 2.57, 8.8]} \ No newline at end of file diff --git a/annotations_filtered/tdMQZ0g9ykE_filtered.json b/annotations_filtered/tdMQZ0g9ykE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60c5c9770955f23d68e0ad960de6ebc2b66c7a82 --- /dev/null +++ b/annotations_filtered/tdMQZ0g9ykE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 27.89], [28.0, 27.92], [28.0, 78.43], [81.0, 103.65]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.95], "audiomae_on_audioset": [null, null, null, [["music", 52.92], ["theremin", 18.71], ["didgeridoo", 8.25]]], "duration": [-0.11, -0.08, 50.43, 22.65]} \ No newline at end of file diff --git a/annotations_filtered/tdXshjACQx8_filtered.json b/annotations_filtered/tdXshjACQx8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1161fd278ad7ed4cf519ea06562673a5ef263a7c --- /dev/null +++ b/annotations_filtered/tdXshjACQx8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 18.66], [19.0, 18.94], [19.0, 19.26], [20.0, 31.58], [32.0, 32.44], [35.0, 34.79], [36.0, 35.95], [36.0, 37.23], [39.0, 39.21], [39.0, 41.05], [42.0, 42.62], [44.0, 46.8], [48.0, 49.18], [50.0, 51.34], [53.0, 61.38], [62.0, 62.13], [63.0, 63.19], [64.0, 66.56], [67.0, 67.36], [69.0, 70.14], [72.0, 78.56], [79.0, 79.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [56.03, 0.0, 0.0, 56.25, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 99.99, 0.0, 0.0, 32.24, 0.0, 0.0, 35.06, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sonar", 17.07], ["synthesizer", 13.33], ["musical instrument", 9.25]], null, null, [["sidetone", 48.56], ["busy signal", 11.59], ["music", 8.02]], null], "duration": [13.66, -0.06, 0.26, 11.58, 0.44, -0.21, -0.05, 1.23, 0.21, 2.05, 0.62, 2.8, 1.18, 1.34, 8.38, 0.13, 0.19, 2.56, 0.36, 1.14, 6.56, 0.1]} \ No newline at end of file diff --git a/annotations_filtered/tdcUxHh3tAc_filtered.json b/annotations_filtered/tdcUxHh3tAc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b316bfeed8db67e01554b647e6b1800106203c94 --- /dev/null +++ b/annotations_filtered/tdcUxHh3tAc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.96], [18.0, 19.52], [23.0, 23.16], [26.0, 27.77], [42.0, 43.11], [45.0, 45.74], [51.0, 51.71], [59.0, 59.54], [66.0, 68.4], [75.0, 76.37], [83.0, 84.74], [92.0, 92.87], [108.0, 109.32], [119.0, 119.75], [121.0, 121.49], [124.0, 125.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["trombone", 33.3], ["music", 26.96], ["brass instrument", 17.18]], null, null, null, null, null, null, null], "duration": [0.96, 1.52, 0.16, 1.77, 1.11, 0.74, 0.71, 0.54, 2.4, 1.37, 1.74, 0.87, 1.32, 0.75, 0.49, 1.29]} \ No newline at end of file diff --git a/annotations_filtered/tdvj1iOOUE0_filtered.json b/annotations_filtered/tdvj1iOOUE0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92b0d631d21eeb6f3c924e473e8bb1d20c213546 --- /dev/null +++ b/annotations_filtered/tdvj1iOOUE0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.3], [19.0, 19.35], [20.0, 21.68], [35.0, 36.78], [38.0, 39.53], [40.0, 41.3], [62.0, 63.14], [65.0, 67.34], [68.0, 70.31], [73.0, 74.83], [79.0, 79.96], [85.0, 85.09], [91.0, 91.99], [94.0, 94.44], [97.0, 97.11], [98.0, 99.6], [104.0, 104.84], [105.0, 113.24], [124.0, 128.36], [130.0, 130.38], [131.0, 132.43], [149.0, 149.96], [153.0, 155.6]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.49, 39.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.9, 30.96, 0.0, 0.0, 0.0, 35.44], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["tick-tock", 29.14], ["speech", 27.42], ["tick", 17.78]], [["music", 46.16], ["speech", 6.62], ["groan", 6.54]], null, null, null, null, null, null, null, null, [["speech", 46.1], ["music", 26.5], ["boing", 8.67]], [["groan", 26.58], ["whack, thwack", 21.04], ["sound effect", 3.89]], null, null, null, [["throbbing", 24.75], ["music", 19.99], ["speech", 7.48]]], "duration": [0.3, 0.35, 1.68, 1.78, 1.53, 1.3, 1.14, 2.34, 2.31, 1.83, 0.96, 0.09, 0.99, 0.44, 0.11, 1.6, 0.84, 8.24, 4.36, 0.38, 1.43, 0.96, 2.6]} \ No newline at end of file diff --git a/annotations_filtered/tdzX5AKWiDw_filtered.json b/annotations_filtered/tdzX5AKWiDw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d715addd71c6291eccfbaaeae4791555c9a41a5 --- /dev/null +++ b/annotations_filtered/tdzX5AKWiDw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.38], [14.0, 14.52], [15.0, 16.66], [18.0, 18.71], [25.0, 25.88], [26.0, 26.86], [29.0, 30.05], [31.0, 33.24], [35.0, 35.6], [39.0, 40.29], [48.0, 48.17], [53.0, 54.65], [56.0, 57.16], [60.0, 61.84], [64.0, 65.35], [72.0, 72.15], [73.0, 74.01], [77.0, 78.76], [83.0, 83.61], [103.0, 104.85], [107.0, 107.77], [110.0, 111.2], [115.0, 116.58], [121.0, 122.77], [124.0, 125.32], [126.0, 127.25], [128.0, 130.59], [134.0, 135.26], [150.0, 150.62], [152.0, 152.51], [154.0, 155.14], [157.0, 164.51], [165.0, 166.06], [167.0, 168.71], [170.0, 171.49], [180.0, 180.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.3, 0.0, 0.0, 0.0, 0.0, 55.53, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.38, 0.52, 1.66, 0.71, 0.88, 0.86, 1.05, 2.24, 0.6, 1.29, 0.17, 1.65, 1.16, 1.84, 1.35, 0.15, 1.01, 1.76, 0.61, 1.85, 0.77, 1.2, 1.58, 1.77, 1.32, 1.25, 2.59, 1.26, 0.62, 0.51, 1.14, 7.51, 1.06, 1.71, 1.49, 0.5]} \ No newline at end of file diff --git a/annotations_filtered/te-hhtqatQk_filtered.json b/annotations_filtered/te-hhtqatQk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d410cf21f328e19edcf75bcc2cd64a6beb24a20d --- /dev/null +++ b/annotations_filtered/te-hhtqatQk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.82], [9.0, 13.17], [14.0, 19.57], [22.0, 36.02], [39.0, 47.44], [50.0, 55.07], [55.0, 91.88], [97.0, 104.03], [107.0, 119.2], [120.0, 120.06], [123.0, 125.02]], "keep_status": [false, false, false, false, true, true, false, false, false, false, false], "silence_prob": [84.43, 76.7, 42.19, 33.22, 33.83, 48.95, 0.0, 53.84, 79.24, 0.0, 99.88], "audiomae_on_audioset": [null, null, [["music", 49.28], ["speech", 13.03], ["sidetone", 9.33]], [["music", 40.3], ["speech", 22.42], ["cacophony", 10.73]], [["music", 48.7], ["electronic music", 6.7], ["speech", 6.47]], [["music", 25.43], ["speech", 22.63], ["sidetone", 5.7]], null, null, null, null, null], "duration": [2.82, 4.17, 5.57, 14.02, 8.44, 5.07, 36.88, 7.03, 12.2, 0.06, 2.02]} \ No newline at end of file diff --git a/annotations_filtered/te2WMrdJ3yQ_filtered.json b/annotations_filtered/te2WMrdJ3yQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..25ce5b90e764f125f949d3773b585129980844b0 --- /dev/null +++ b/annotations_filtered/te2WMrdJ3yQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 26.76], [27.0, 26.91], [27.0, 27.58], [29.0, 31.7], [33.0, 33.66], [34.0, 34.97], [36.0, 38.85], [41.0, 42.55], [53.0, 53.89], [60.0, 60.05], [61.0, 63.0], [66.0, 66.58], [68.0, 69.38], [71.0, 71.58], [74.0, 79.37], [82.0, 82.63], [83.0, 82.86], [88.0, 89.87], [97.0, 98.19], [102.0, 102.93], [104.0, 105.27], [107.0, 107.81], [108.0, 111.3], [116.0, 116.36], [121.0, 122.55], [127.0, 131.67], [141.0, 145.93], [146.0, 148.49], [151.0, 155.31], [158.0, 158.75], [159.0, 158.97], [159.0, 178.14], [180.0, 180.18]], "keep_status": [false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 49.87, 0.0, 0.0, 31.85, 0.0, 0.0, 0.0, 46.61, 0.0, 0.0, 0.0, 54.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.52, 0.0, 0.0, 70.16, 29.69, 34.94, 31.94, 0.0, 0.0, 30.62, 0.0], "audiomae_on_audioset": [null, null, null, [["whale vocalization", 22.0], ["rumble", 10.77], ["hum", 8.18]], null, null, [["fly, housefly", 40.82], ["mosquito", 21.64], ["insect", 19.11]], null, null, null, [["speech", 31.33], ["hum", 15.45], ["music", 13.26]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 31.63], ["hum", 15.08], ["throbbing", 10.96]], null, null, null, [["speech", 20.58], ["livestock, farm animals, working animals", 14.47], ["explosion", 9.46]], [["music", 28.27], ["groan", 13.71], ["cattle, bovinae", 6.02]], [["speech", 47.06], ["animal", 4.5], ["boing", 3.71]], null, null, [["music", 50.4], ["speech", 19.99], ["hum", 4.03]], null], "duration": [-0.24, -0.09, 0.58, 2.7, 0.66, 0.97, 2.85, 1.55, 0.89, 0.05, 2.0, 0.58, 1.38, 0.58, 5.37, 0.63, -0.14, 1.87, 1.19, 0.93, 1.27, 0.81, 3.3, 0.36, 1.55, 4.67, 4.93, 2.49, 4.31, 0.75, -0.03, 19.14, 0.18]} \ No newline at end of file diff --git a/annotations_filtered/te366vMoW0E_filtered.json b/annotations_filtered/te366vMoW0E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..be8d0f095c917e1cf8e489a594f41a73a0808d3b --- /dev/null +++ b/annotations_filtered/te366vMoW0E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.14], [12.0, 12.99], [18.0, 19.9], [21.0, 22.5], [27.0, 27.67], [29.0, 30.15], [32.0, 32.98], [34.0, 34.67], [45.0, 45.82], [63.0, 63.81], [72.0, 71.81], [74.0, 79.44], [83.0, 83.83], [87.0, 91.81], [93.0, 94.39], [96.0, 97.48], [100.0, 99.96], [101.0, 101.9], [105.0, 105.85], [109.0, 110.88], [121.0, 121.37], [122.0, 123.3], [125.0, 126.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.14, 0.99, 1.9, 1.5, 0.67, 1.15, 0.98, 0.67, 0.82, 0.81, -0.19, 5.44, 0.83, 4.81, 1.39, 1.48, -0.04, 0.9, 0.85, 1.88, 0.37, 1.3, 1.79]} \ No newline at end of file diff --git a/annotations_filtered/teZ52l28tys_filtered.json b/annotations_filtered/teZ52l28tys_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e55676790a584bed36aab085c3ab372ff08b7c80 --- /dev/null +++ b/annotations_filtered/teZ52l28tys_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 33.86], [34.0, 44.41], [46.0, 78.09], [78.0, 80.32], [82.0, 88.32], [90.0, 103.27], [104.0, 106.37], [108.0, 113.8], [121.0, 122.66], [124.0, 123.99], [125.0, 127.03], [128.0, 130.74]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, true], "silence_prob": [0.0, 52.33, 0.0, 84.25, 42.51, 35.59, 43.33, 42.98, 0.0, 0.0, 46.61, 45.49], "audiomae_on_audioset": [null, null, null, null, [["music", 58.63], ["musical instrument", 9.58], ["synthesizer", 6.11]], [["music", 62.32], ["synthesizer", 5.98], ["musical instrument", 4.27]], [["sonar", 15.66], ["synthesizer", 11.42], ["music", 9.38]], [["sine wave", 14.81], ["stomach rumble", 12.28], ["sheep", 6.35]], null, null, [["chirp tone", 38.96], ["sine wave", 32.0], ["singing bowl", 5.62]], [["music", 43.69], ["musical instrument", 7.81], ["effects unit", 7.78]]], "duration": [1.86, 10.41, 32.09, 2.32, 6.32, 13.27, 2.37, 5.8, 1.66, -0.01, 2.03, 2.74]} \ No newline at end of file diff --git a/annotations_filtered/tekVuL2mT7A_filtered.json b/annotations_filtered/tekVuL2mT7A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f2acf003e321781b8116225365b66bbf75d0b1fa --- /dev/null +++ b/annotations_filtered/tekVuL2mT7A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.23], [14.0, 14.17], [15.0, 14.64], [15.0, 14.69], [15.0, 14.94], [16.0, 41.5], [44.0, 46.87], [51.0, 51.38], [52.0, 52.22], [59.0, 63.37], [64.0, 65.5], [67.0, 81.19], [81.0, 82.22], [82.0, 83.62], [119.0, 119.26], [127.0, 128.98], [134.0, 134.08], [134.0, 136.39], [139.0, 142.64], [153.0, 153.22], [154.0, 156.1], [157.0, 158.94], [162.0, 164.86], [166.0, 166.82], [168.0, 172.81], [179.0, 193.56], [197.0, 199.35], [220.0, 222.32], [223.0, 223.4], [230.0, 234.27], [235.0, 236.38]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, true, false, true, false], "silence_prob": [95.37, 0.0, 0.0, 0.0, 0.0, 37.66, 35.99, 0.0, 0.0, 31.45, 0.0, 33.96, 0.0, 0.0, 0.0, 0.0, 0.0, 50.36, 63.96, 0.0, 37.55, 0.0, 29.1, 0.0, 29.02, 30.27, 40.47, 41.36, 0.0, 42.22, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 28.53], ["speech", 15.44], ["hum", 11.65]], [["speech", 44.31], ["music", 15.86], ["foghorn", 10.17]], null, null, [["speech", 43.49], ["music", 19.45], ["fart", 13.2]], null, [["fly, housefly", 22.9], ["music", 22.78], ["insect", 15.53]], null, null, null, null, null, null, null, null, [["speech", 56.15], ["moo", 10.12], ["cattle, bovinae", 8.72]], null, [["speech", 19.28], ["music", 19.18], ["cattle, bovinae", 8.39]], null, [["music", 56.34], ["throbbing", 10.7], ["hum", 7.38]], [["boing", 41.08], ["music", 28.09], ["whack, thwack", 8.56]], [["whale vocalization", 18.91], ["fly, housefly", 14.77], ["insect", 12.32]], [["animal", 16.35], ["speech", 13.54], ["canidae, dogs, wolves", 11.11]], null, [["livestock, farm animals, working animals", 18.15], ["cattle, bovinae", 17.2], ["moo", 16.86]], null], "duration": [4.23, 0.17, -0.36, -0.31, -0.06, 25.5, 2.87, 0.38, 0.22, 4.37, 1.5, 14.19, 1.22, 1.62, 0.26, 1.98, 0.08, 2.39, 3.64, 0.22, 2.1, 1.94, 2.86, 0.82, 4.81, 14.56, 2.35, 2.32, 0.4, 4.27, 1.38]} \ No newline at end of file diff --git a/annotations_filtered/teoyewW1bUY_filtered.json b/annotations_filtered/teoyewW1bUY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42f3bddf8005e7c4ff40637b262d53b31998f41d --- /dev/null +++ b/annotations_filtered/teoyewW1bUY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.9], [10.0, 11.13], [14.0, 16.56], [20.0, 20.76], [22.0, 22.79], [27.0, 28.36], [33.0, 33.99], [36.0, 36.76], [40.0, 40.47], [43.0, 43.5], [45.0, 46.21], [52.0, 53.32], [55.0, 57.77], [59.0, 60.39], [62.0, 64.37], [66.0, 67.0], [68.0, 68.27], [70.0, 70.09], [74.0, 75.3], [77.0, 76.92], [81.0, 81.26], [85.0, 86.81], [92.0, 94.07], [97.0, 99.5], [100.0, 103.54], [107.0, 108.67], [120.0, 121.59], [123.0, 124.17], [125.0, 126.44], [130.0, 131.28], [135.0, 136.39], [138.0, 138.28], [141.0, 141.59], [142.0, 143.78], [146.0, 146.62], [148.0, 150.38], [152.0, 152.34], [155.0, 155.38], [158.0, 158.45], [164.0, 164.86], [167.0, 168.79], [170.0, 171.46], [173.0, 176.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 59.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.76, 0.0, 98.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.71, 99.82, 85.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.82], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 36.54], ["singing bowl", 20.17], ["gong", 19.83]], null, null, null, null, null, null, [["music", 41.61], ["ambient music", 31.19], ["electronic music", 6.26]]], "duration": [0.9, 1.13, 2.56, 0.76, 0.79, 1.36, 0.99, 0.76, 0.47, 0.5, 1.21, 1.32, 2.77, 1.39, 2.37, 1.0, 0.27, 0.09, 1.3, -0.08, 0.26, 1.81, 2.07, 2.5, 3.54, 1.67, 1.59, 1.17, 1.44, 1.28, 1.39, 0.28, 0.59, 1.78, 0.62, 2.38, 0.34, 0.38, 0.45, 0.86, 1.79, 1.46, 3.22]} \ No newline at end of file diff --git a/annotations_filtered/tesqTwX7cpc_filtered.json b/annotations_filtered/tesqTwX7cpc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..47b0b8133c368c74ca6e70e869c9e242a2bbf75f --- /dev/null +++ b/annotations_filtered/tesqTwX7cpc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.87], [9.0, 9.83], [11.0, 16.92], [19.0, 27.77], [35.0, 35.5], [38.0, 45.18], [47.0, 48.91], [52.0, 52.69], [55.0, 69.47], [70.0, 70.44], [70.0, 75.83], [77.0, 91.76], [93.0, 116.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 67.51, 82.61, 0.0, 64.07, 0.0, 0.0, 65.44, 0.0, 83.52, 35.98, 30.62], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["hum", 38.0], ["mains hum", 23.26], ["music", 11.98]], [["music", 30.53], ["theremin", 24.62], ["brass instrument", 7.5]]], "duration": [1.87, 0.83, 5.92, 8.77, 0.5, 7.18, 1.91, 0.69, 14.47, 0.44, 5.83, 14.76, 23.01]} \ No newline at end of file diff --git a/annotations_filtered/tetwGGL997s_filtered.json b/annotations_filtered/tetwGGL997s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..29613fda661b484fb322e1736251276d71e42001 --- /dev/null +++ b/annotations_filtered/tetwGGL997s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.08], [4.0, 5.24], [6.0, 8.02], [10.0, 11.85], [18.0, 19.38], [22.0, 25.98], [28.0, 29.57], [32.0, 33.89], [37.0, 37.98], [39.0, 39.07], [39.0, 41.07], [42.0, 43.11], [45.0, 47.34], [49.0, 50.38], [54.0, 54.11], [55.0, 55.19], [56.0, 56.83], [58.0, 58.5], [60.0, 60.89], [62.0, 62.07], [64.0, 64.1], [66.0, 66.31], [68.0, 70.29], [73.0, 74.12], [78.0, 81.19], [82.0, 83.81], [85.0, 85.95], [86.0, 87.1], [88.0, 90.9], [92.0, 94.24], [95.0, 96.15], [97.0, 98.54], [102.0, 104.72], [106.0, 106.05], [107.0, 107.22], [110.0, 114.0], [115.0, 121.07], [123.0, 126.89], [130.0, 130.13], [133.0, 133.64], [135.0, 135.46], [137.0, 137.84], [140.0, 140.8], [143.0, 143.18], [145.0, 146.2], [149.0, 150.6], [151.0, 156.12], [159.0, 160.19], [161.0, 161.96], [164.0, 166.38], [168.0, 170.26], [172.0, 173.35]], "keep_status": [false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [47.31, 0.0, 44.6, 0.0, 0.0, 52.62, 0.0, 0.0, 0.0, 0.0, 40.54, 0.0, 50.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.6, 0.0, 54.04, 0.0, 0.0, 0.0, 58.13, 34.04, 0.0, 0.0, 50.16, 0.0, 0.0, 59.07, 37.3, 47.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.71, 0.0, 0.0, 55.89, 71.72, 0.0], "audiomae_on_audioset": [[["radio", 32.03], ["sidetone", 26.5], ["speech", 13.98]], null, [["whale vocalization", 24.09], ["hum", 14.17], ["mains hum", 6.79]], null, null, null, null, null, null, null, [["sidetone", 33.92], ["fly, housefly", 9.65], ["hum", 9.29]], null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 18.19], ["speech", 15.66], ["radio", 8.04]], null, null, null, null, null, null, [["whale vocalization", 37.1], ["hum", 14.89], ["music", 8.46]], null, null, null, null, null, null, [["sidetone", 73.77], ["radio", 10.89], ["speech", 7.55]], [["hum", 7.27], ["noise", 4.08], ["thunderstorm", 4.03]], null, null, null, null, null, null, null, null, [["hum", 38.51], ["mains hum", 27.45], ["speech", 11.36]], null, null, null, null, null], "duration": [2.08, 1.24, 2.02, 1.85, 1.38, 3.98, 1.57, 1.89, 0.98, 0.07, 2.07, 1.11, 2.34, 1.38, 0.11, 0.19, 0.83, 0.5, 0.89, 0.07, 0.1, 0.31, 2.29, 1.12, 3.19, 1.81, 0.95, 1.1, 2.9, 2.24, 1.15, 1.54, 2.72, 0.05, 0.22, 4.0, 6.07, 3.89, 0.13, 0.64, 0.46, 0.84, 0.8, 0.18, 1.2, 1.6, 5.12, 1.19, 0.96, 2.38, 2.26, 1.35]} \ No newline at end of file diff --git a/annotations_filtered/tfGpUcIEIf0_filtered.json b/annotations_filtered/tfGpUcIEIf0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..81d52a00a233f82c82f30b9e46f98caf974b7798 --- /dev/null +++ b/annotations_filtered/tfGpUcIEIf0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.56], [7.0, 8.73], [17.0, 18.12], [33.0, 32.68], [34.0, 40.14], [47.0, 46.75], [62.0, 65.35]], "keep_status": [false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 34.09, 0.0, 29.56], "audiomae_on_audioset": [null, null, null, null, [["music", 39.64], ["speech", 14.23], ["theremin", 7.2]], null, [["speech", 31.02], ["music", 26.38], ["helicopter", 12.85]]], "duration": [1.56, 1.73, 1.12, -0.32, 6.14, -0.25, 3.35]} \ No newline at end of file diff --git a/annotations_filtered/tfL5f6cZlk8_filtered.json b/annotations_filtered/tfL5f6cZlk8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4123b6f356d033250375b52b5759e3c301452616 --- /dev/null +++ b/annotations_filtered/tfL5f6cZlk8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.54], [6.0, 7.13], [9.0, 9.53], [10.0, 10.67], [11.0, 11.6], [12.0, 13.59], [14.0, 14.88], [20.0, 19.92], [20.0, 20.87], [22.0, 23.84], [26.0, 27.36], [29.0, 32.51], [34.0, 35.34], [39.0, 39.02], [40.0, 41.93], [42.0, 44.0], [45.0, 46.01], [47.0, 47.83], [52.0, 55.11], [57.0, 64.76], [72.0, 72.47], [78.0, 80.7], [88.0, 88.42], [91.0, 91.08], [98.0, 99.44], [101.0, 101.33], [102.0, 105.07], [105.0, 105.51], [111.0, 112.18], [115.0, 115.65], [120.0, 119.99], [123.0, 123.5], [124.0, 124.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.29, 0.0, 0.0, 0.0, 33.48, 0.0, 0.0, 71.29, 31.44, 0.0, 40.06, 0.0, 0.0, 0.0, 0.0, 72.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 27.9], ["music", 26.7], ["cello", 8.12]], null, null, null, [["speech", 46.97], ["sidetone", 18.91], ["music", 6.25]], null, null, null, [["hum", 38.03], ["music", 14.62], ["throbbing", 13.49]], null, [["speech", 47.67], ["music", 12.06], ["hum", 8.16]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.54, 1.13, 0.53, 0.67, 0.6, 1.59, 0.88, -0.08, 0.87, 1.84, 1.36, 3.51, 1.34, 0.02, 1.93, 2.0, 1.01, 0.83, 3.11, 7.76, 0.47, 2.7, 0.42, 0.08, 1.44, 0.33, 3.07, 0.51, 1.18, 0.65, -0.01, 0.5, 0.29]} \ No newline at end of file diff --git a/annotations_filtered/tf_RRItKJm0_filtered.json b/annotations_filtered/tf_RRItKJm0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..badd399cb41239e2c0d582af5567f18eb5aafbef --- /dev/null +++ b/annotations_filtered/tf_RRItKJm0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 17.17], [20.0, 22.69], [25.0, 48.14], [51.0, 69.52], [74.0, 77.82], [79.0, 79.37], [80.0, 90.53], [98.0, 99.05], [106.0, 106.44], [107.0, 111.59], [122.0, 137.69], [143.0, 146.53]], "keep_status": [true, false, false, false, true, false, true, false, false, true, false, true], "silence_prob": [40.47, 42.53, 32.48, 46.79, 40.84, 0.0, 33.72, 0.0, 0.0, 38.52, 32.48, 32.09], "audiomae_on_audioset": [[["rumble", 28.95], ["hum", 24.54], ["music", 13.81]], [["hum", 31.55], ["music", 22.66], ["throbbing", 18.05]], [["hum", 45.16], ["mains hum", 30.35], ["music", 11.27]], [["music", 77.34], ["ambient music", 3.75], ["theremin", 2.97]], [["music", 48.37], ["electronic music", 12.31], ["hum", 5.73]], null, [["speech", 28.57], ["music", 9.03], ["hum", 8.26]], null, null, [["music", 55.32], ["electronic music", 10.0], ["hum", 3.27]], [["hum", 51.08], ["throbbing", 19.2], ["mains hum", 17.87]], [["music", 36.43], ["speech", 28.48], ["electronic music", 3.97]]], "duration": [4.17, 2.69, 23.14, 18.52, 3.82, 0.37, 10.53, 1.05, 0.44, 4.59, 15.69, 3.53]} \ No newline at end of file diff --git a/annotations_filtered/tff_EEQt79s_filtered.json b/annotations_filtered/tff_EEQt79s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..022df198d46d2199f47e3601fc18c184b84a2a2c --- /dev/null +++ b/annotations_filtered/tff_EEQt79s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.5], [8.0, 50.45], [51.0, 79.29], [85.0, 85.43], [86.0, 116.67], [120.0, 132.54]], "keep_status": [false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 32.33, 0.0, 0.0, 30.71], "audiomae_on_audioset": [null, null, [["throbbing", 56.55], ["hum", 22.91], ["music", 7.81]], null, null, [["music", 41.58], ["crowd", 7.95], ["mosquito", 3.69]]], "duration": [0.5, 42.45, 28.29, 0.43, 30.67, 12.54]} \ No newline at end of file diff --git a/annotations_filtered/tfvoOEa1OOI_filtered.json b/annotations_filtered/tfvoOEa1OOI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5db78a1d1fee58772785f1e7833fa2c73e29642e --- /dev/null +++ b/annotations_filtered/tfvoOEa1OOI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 25.93], [26.0, 27.09], [29.0, 29.29], [30.0, 31.95], [33.0, 34.75], [36.0, 36.9], [45.0, 48.12], [51.0, 65.45], [67.0, 67.37], [68.0, 69.11], [73.0, 74.17], [74.0, 74.92], [75.0, 76.47], [80.0, 81.14], [86.0, 87.35], [88.0, 88.48], [91.0, 90.98], [91.0, 92.64], [95.0, 95.4], [95.0, 96.43], [100.0, 99.96], [100.0, 100.8], [104.0, 105.78], [106.0, 106.27], [107.0, 108.35], [112.0, 113.31], [117.0, 119.03], [122.0, 129.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [61.67, 0.0, 0.0, 0.0, 0.0, 0.0, 95.09, 64.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.3, 90.25], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [14.93, 1.09, 0.29, 1.95, 1.75, 0.9, 3.12, 14.45, 0.37, 1.11, 1.17, 0.92, 1.47, 1.14, 1.35, 0.48, -0.02, 1.64, 0.4, 1.43, -0.04, 0.8, 1.78, 0.27, 1.35, 1.31, 2.03, 7.24]} \ No newline at end of file diff --git a/annotations_filtered/tfvptl5VS08_filtered.json b/annotations_filtered/tfvptl5VS08_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18950a3341cb843e2bcc635e7d3a276e304ef2b2 --- /dev/null +++ b/annotations_filtered/tfvptl5VS08_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 32.71], [34.0, 46.16], [48.0, 65.65], [67.0, 67.41], [69.0, 70.21], [72.0, 85.01], [87.0, 92.03], [94.0, 94.86], [97.0, 99.23]], "keep_status": [false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 57.72, 66.03, 0.0, 0.0, 45.43, 60.7, 0.0, 75.72], "audiomae_on_audioset": [null, null, null, null, null, [["music", 22.69], ["didgeridoo", 22.34], ["cattle, bovinae", 4.76]], null, null, null], "duration": [0.71, 12.16, 17.65, 0.41, 1.21, 13.01, 5.03, 0.86, 2.23]} \ No newline at end of file diff --git a/annotations_filtered/tg2X2RZsGy4_filtered.json b/annotations_filtered/tg2X2RZsGy4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f7cecb8bf1bc9ec50e6f3060445f32d7a33bbd8e --- /dev/null +++ b/annotations_filtered/tg2X2RZsGy4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.02], [8.0, 9.0], [50.0, 50.14], [81.0, 81.75], [82.0, 82.63], [107.0, 108.24], [109.0, 109.29], [112.0, 112.6], [113.0, 114.56]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [2.02, 1.0, 0.14, 0.75, 0.63, 1.24, 0.29, 0.6, 1.56]} \ No newline at end of file diff --git a/annotations_filtered/tg4jLJ6OiDY_filtered.json b/annotations_filtered/tg4jLJ6OiDY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f416cded8c3172a8b6f336aab3c548a33f81ea0a --- /dev/null +++ b/annotations_filtered/tg4jLJ6OiDY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.72], [5.0, 6.13], [7.0, 8.65], [10.0, 10.89], [12.0, 19.16], [22.0, 23.18], [24.0, 24.19], [25.0, 25.52], [26.0, 29.24], [39.0, 39.45], [43.0, 45.39], [48.0, 47.85], [50.0, 49.96], [53.0, 54.04], [62.0, 64.67], [66.0, 66.93], [74.0, 73.94], [80.0, 80.33], [82.0, 85.41], [86.0, 86.83], [88.0, 88.45], [89.0, 97.24], [100.0, 103.11], [111.0, 112.45], [123.0, 123.82], [128.0, 129.19]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 57.97, 0.0, 0.0, 0.0, 45.43, 0.0, 45.82, 0.0, 0.0, 0.0, 46.02, 0.0, 0.0, 0.0, 60.51, 0.0, 0.0, 76.37, 57.64, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["dog", 20.92], ["bow-wow", 14.8], ["animal", 12.26]], null, [["music", 49.41], ["speech", 22.31], ["musical instrument", 5.72]], null, null, null, [["music", 72.44], ["synthesizer", 4.64], ["sidetone", 4.29]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.72, 1.13, 1.65, 0.89, 7.16, 1.18, 0.19, 0.52, 3.24, 0.45, 2.39, -0.15, -0.04, 1.04, 2.67, 0.93, -0.06, 0.33, 3.41, 0.83, 0.45, 8.24, 3.11, 1.45, 0.82, 1.19]} \ No newline at end of file diff --git a/annotations_filtered/tgHcYxKjwVE_filtered.json b/annotations_filtered/tgHcYxKjwVE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d96b3048d9fc723d821c92202f193a7b0d13b622 --- /dev/null +++ b/annotations_filtered/tgHcYxKjwVE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.09], [16.0, 16.29], [17.0, 18.59], [20.0, 20.8], [22.0, 25.25], [27.0, 28.44], [29.0, 30.0], [31.0, 32.12], [32.0, 33.15], [34.0, 36.76], [37.0, 38.67], [39.0, 39.75], [41.0, 44.88], [46.0, 46.77], [49.0, 49.25], [50.0, 50.75], [52.0, 53.55], [55.0, 58.89], [65.0, 65.5], [68.0, 68.22], [69.0, 69.89], [73.0, 74.16], [79.0, 88.25], [89.0, 91.0], [91.0, 91.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 37.81, 0.0, 0.0, 0.0, 0.0, 34.29, 0.0, 0.0, 49.82, 0.0, 0.0, 0.0, 0.0, 41.98, 0.0, 0.0, 0.0, 0.0, 88.83, 40.64, 0.0], "audiomae_on_audioset": [null, null, null, null, [["sidetone", 61.78], ["speech", 14.85], ["whale vocalization", 6.03]], null, null, null, null, [["speech", 57.1], ["sidetone", 20.68], ["dial tone", 5.01]], null, null, [["sidetone", 42.4], ["speech", 25.28], ["chirp tone", 8.31]], null, null, null, null, [["speech", 49.39], ["dial tone", 6.19], ["telephone", 5.09]], null, null, null, null, null, [["livestock, farm animals, working animals", 30.47], ["cattle, bovinae", 14.26], ["fly, housefly", 8.26]], null], "duration": [1.09, 0.29, 1.59, 0.8, 3.25, 1.44, 1.0, 1.12, 1.15, 2.76, 1.67, 0.75, 3.88, 0.77, 0.25, 0.75, 1.55, 3.89, 0.5, 0.22, 0.89, 1.16, 9.25, 2.0, 0.54]} \ No newline at end of file diff --git a/annotations_filtered/thSPQDFYyiE_filtered.json b/annotations_filtered/thSPQDFYyiE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aec77f2f11cd40116a91311d1804b3dcf5de8276 --- /dev/null +++ b/annotations_filtered/thSPQDFYyiE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.66], [3.0, 3.62], [5.0, 6.35], [8.0, 11.43], [13.0, 13.95], [15.0, 16.02], [19.0, 19.21], [20.0, 20.12], [22.0, 22.03], [23.0, 24.26], [24.0, 27.41], [28.0, 28.88], [30.0, 31.36], [33.0, 35.56], [36.0, 36.1], [38.0, 39.02], [41.0, 43.92], [45.0, 45.96], [48.0, 60.12], [60.0, 61.1], [62.0, 62.73], [66.0, 66.5], [69.0, 70.66], [72.0, 72.05], [73.0, 74.14], [76.0, 76.65], [79.0, 79.37], [83.0, 84.65], [85.0, 87.17], [87.0, 88.11], [88.0, 88.69], [90.0, 90.0], [90.0, 92.48], [94.0, 94.27], [96.0, 97.07], [97.0, 98.41], [99.0, 100.77], [104.0, 105.49], [107.0, 108.57], [109.0, 109.92], [113.0, 117.34], [118.0, 121.8], [123.0, 123.42], [125.0, 125.56], [126.0, 127.38], [128.0, 128.61], [129.0, 129.32], [130.0, 130.4], [131.0, 132.04], [133.0, 135.03], [136.0, 138.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 99.44, 0.0, 0.0, 100.0, 0.0, 98.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.52, 69.07], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.66, 0.62, 1.35, 3.43, 0.95, 1.02, 0.21, 0.12, 0.03, 1.26, 3.41, 0.88, 1.36, 2.56, 0.1, 1.02, 2.92, 0.96, 12.12, 1.1, 0.73, 0.5, 1.66, 0.05, 1.14, 0.65, 0.37, 1.65, 2.17, 1.11, 0.69, 0.0, 2.48, 0.27, 1.07, 1.41, 1.77, 1.49, 1.57, 0.92, 4.34, 3.8, 0.42, 0.56, 1.38, 0.61, 0.32, 0.4, 1.04, 2.03, 2.79]} \ No newline at end of file diff --git a/annotations_filtered/thhYv6-lz9A_filtered.json b/annotations_filtered/thhYv6-lz9A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..901d087cf5aa4357ea684eb4e38775e2be727696 --- /dev/null +++ b/annotations_filtered/thhYv6-lz9A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.95], [10.0, 11.28], [14.0, 16.06], [17.0, 17.56], [19.0, 21.86], [24.0, 26.54], [29.0, 30.79], [34.0, 35.6], [37.0, 38.35], [40.0, 42.4], [46.0, 47.44]], "keep_status": [false, false, true, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 47.74, 0.0, 36.94, 55.18, 0.0, 0.0, 0.0, 58.98, 0.0], "audiomae_on_audioset": [null, null, [["music", 25.51], ["hum", 17.79], ["mains hum", 10.52]], null, [["whale vocalization", 37.37], ["music", 11.99], ["hum", 6.46]], null, null, null, null, null, null], "duration": [0.95, 1.28, 2.06, 0.56, 2.86, 2.54, 1.79, 1.6, 1.35, 2.4, 1.44]} \ No newline at end of file diff --git a/annotations_filtered/ti2qUYIgpjM_filtered.json b/annotations_filtered/ti2qUYIgpjM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4cd7c5ecc9715c9074602654bc1c013671c9308b --- /dev/null +++ b/annotations_filtered/ti2qUYIgpjM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 11.99], [12.0, 14.66], [16.0, 41.45], [44.0, 52.95], [56.0, 57.69], [64.0, 63.69], [64.0, 65.55], [67.0, 68.3], [69.0, 69.13], [79.0, 78.73], [82.0, 82.8], [84.0, 85.14], [86.0, 87.61], [90.0, 91.05], [93.0, 93.93], [95.0, 96.31], [99.0, 99.52], [105.0, 106.1], [114.0, 117.66], [128.0, 128.11]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [36.81, 55.53, 49.0, 36.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.9, 0.0], "audiomae_on_audioset": [[["speech", 20.97], ["music", 18.39], ["whale vocalization", 9.65]], null, [["mains hum", 26.1], ["music", 22.02], ["speech", 18.5]], [["speech", 58.59], ["music", 16.42], ["didgeridoo", 2.75]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.99, 2.66, 25.45, 8.95, 1.69, -0.31, 1.55, 1.3, 0.13, -0.27, 0.8, 1.14, 1.61, 1.05, 0.93, 1.31, 0.52, 1.1, 3.66, 0.11]} \ No newline at end of file diff --git a/annotations_filtered/ti39GhRZkrw_filtered.json b/annotations_filtered/ti39GhRZkrw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f6219e447cbc518f24705c867bd9f8845df41696 --- /dev/null +++ b/annotations_filtered/ti39GhRZkrw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.06], [9.0, 9.32], [11.0, 13.68], [15.0, 16.41], [22.0, 25.56], [28.0, 31.08], [31.0, 33.61], [38.0, 38.48], [40.0, 40.59], [43.0, 44.04], [46.0, 48.63], [51.0, 51.63], [53.0, 53.62], [56.0, 56.24], [58.0, 59.24], [63.0, 63.24], [68.0, 68.4], [71.0, 71.41], [72.0, 74.49], [76.0, 76.05], [79.0, 79.84], [83.0, 84.42], [88.0, 88.67], [94.0, 95.59], [123.0, 123.06], [124.0, 124.68], [131.0, 130.89], [136.0, 136.36], [142.0, 143.77], [148.0, 150.01], [155.0, 156.22], [161.0, 161.96], [164.0, 163.68]], "keep_status": [false, false, true, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 42.58, 0.0, 41.87, 45.36, 30.24, 0.0, 0.0, 0.0, 48.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.56, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 35.61], ["hum", 16.0], ["mains hum", 8.31]], null, [["speech", 43.97], ["music", 20.85], ["sonar", 5.39]], [["whip", 30.18], ["sidetone", 10.0], ["crack", 6.5]], [["mains hum", 42.44], ["hum", 22.49], ["music", 7.17]], null, null, null, [["didgeridoo", 32.06], ["music", 29.29], ["whale vocalization", 4.86]], null, null, null, null, null, null, null, [["electric shaver, electric razor", 62.98], ["speech", 25.25], ["mains hum", 3.02]], null, null, null, null, null, null, null, null, null, null, [["music", 27.1], ["hum", 22.76], ["mains hum", 12.03]], null, null, null], "duration": [1.06, 0.32, 2.68, 1.41, 3.56, 3.08, 2.61, 0.48, 0.59, 1.04, 2.63, 0.63, 0.62, 0.24, 1.24, 0.24, 0.4, 0.41, 2.49, 0.05, 0.84, 1.42, 0.67, 1.59, 0.06, 0.68, -0.11, 0.36, 1.77, 2.01, 1.22, 0.96, -0.32]} \ No newline at end of file diff --git a/annotations_filtered/ti3HSBmEoVU_filtered.json b/annotations_filtered/ti3HSBmEoVU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c21c6084506c698bfd607483ccd26a5be4b46171 --- /dev/null +++ b/annotations_filtered/ti3HSBmEoVU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.74], [8.0, 9.05], [12.0, 15.53], [16.0, 20.39], [21.0, 22.54], [26.0, 26.99], [33.0, 33.54], [35.0, 35.68], [36.0, 36.54], [37.0, 37.76], [38.0, 38.69], [39.0, 45.55], [48.0, 48.42], [49.0, 51.53], [52.0, 53.7], [55.0, 67.14], [68.0, 84.33], [85.0, 86.88], [88.0, 117.24], [121.0, 131.5], [135.0, 141.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.36, 0.0, 84.07, 78.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.45, 0.0, 59.15, 0.0, 70.3, 93.45, 0.0, 31.61, 31.94, 32.22], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 69.43], ["musical instrument", 2.65], ["wind instrument, woodwind instrument", 1.99]], [["music", 82.91], ["musical instrument", 1.84], ["guitar", 1.29]], [["music", 65.04], ["didgeridoo", 7.91], ["mosquito", 1.93]]], "duration": [3.74, 1.05, 3.53, 4.39, 1.54, 0.99, 0.54, 0.68, 0.54, 0.76, 0.69, 6.55, 0.42, 2.53, 1.7, 12.14, 16.33, 1.88, 29.24, 10.5, 6.62]} \ No newline at end of file diff --git a/annotations_filtered/ti42vZVtgvY_filtered.json b/annotations_filtered/ti42vZVtgvY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4407c9ee63682b518852837b0486b71a82c362d6 --- /dev/null +++ b/annotations_filtered/ti42vZVtgvY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.07], [13.0, 13.07], [17.0, 16.78], [29.0, 29.57], [32.0, 34.72], [38.0, 39.39], [41.0, 41.32], [56.0, 55.98], [57.0, 57.59], [58.0, 58.89], [62.0, 62.53], [63.0, 64.96], [69.0, 70.17], [71.0, 72.72], [76.0, 82.66], [94.0, 94.24], [97.0, 97.51], [106.0, 108.63], [110.0, 111.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 37.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.62, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 40.69], ["music", 25.06], ["musical instrument", 5.74]], null, null, null, null, null, null, null, null, null, [["speech", 75.6], ["music", 5.38], ["synthesizer", 2.05]], null, null, null, null], "duration": [0.07, 0.07, -0.22, 0.57, 2.72, 1.39, 0.32, -0.02, 0.59, 0.89, 0.53, 1.96, 1.17, 1.72, 6.66, 0.24, 0.51, 2.63, 1.45]} \ No newline at end of file diff --git a/annotations_filtered/ti9jg0JOK2I_filtered.json b/annotations_filtered/ti9jg0JOK2I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..32918c2e0a131babd4b9a01b2f9adb73bc9aa424 --- /dev/null +++ b/annotations_filtered/ti9jg0JOK2I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.61], [19.0, 25.1], [29.0, 28.92], [29.0, 52.19], [53.0, 55.65], [57.0, 57.43], [59.0, 95.37], [98.0, 98.91], [104.0, 106.76], [109.0, 109.02], [111.0, 113.91], [115.0, 115.89], [120.0, 121.2], [132.0, 135.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 29.5, 0.0, 27.89, 28.22, 0.0, 0.0, 0.0, 27.99, 0.0, 32.0, 0.0, 0.0, 28.04], "audiomae_on_audioset": [null, [["throbbing", 38.41], ["music", 18.65], ["hum", 14.85]], null, [["speech", 44.2], ["music", 20.7], ["buzz", 7.89]], [["music", 83.05], ["cacophony", 2.39], ["speech", 1.63]], null, null, null, [["breaking", 87.23], ["music", 4.55], ["smash, crash", 2.13]], null, [["music", 27.37], ["speech", 20.77], ["throbbing", 13.91]], null, null, [["music", 58.67], ["boing", 4.66], ["didgeridoo", 3.39]]], "duration": [0.61, 6.1, -0.08, 23.19, 2.65, 0.43, 36.37, 0.91, 2.76, 0.02, 2.91, 0.89, 1.2, 3.46]} \ No newline at end of file diff --git a/annotations_filtered/tiYXgCsoqaA_filtered.json b/annotations_filtered/tiYXgCsoqaA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5cbeecd878ee4a2d926d20631b94dbb4de4a911 --- /dev/null +++ b/annotations_filtered/tiYXgCsoqaA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.94], [11.0, 12.28], [14.0, 14.37], [25.0, 29.03], [34.0, 34.8], [47.0, 52.88], [61.0, 62.04], [64.0, 64.3], [65.0, 69.57], [72.0, 72.33], [74.0, 78.78], [80.0, 80.54], [86.0, 86.32], [87.0, 87.91], [91.0, 91.74], [98.0, 98.85], [102.0, 108.89], [109.0, 110.71], [112.0, 112.77], [115.0, 115.92], [118.0, 118.99], [119.0, 119.79], [120.0, 123.97]], "keep_status": [true, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.22, 0.0, 0.0, 41.03, 0.0, 30.41, 0.0, 0.0, 95.37, 0.0, 75.72, 0.0, 0.0, 0.0, 0.0, 0.0, 64.63, 0.0, 0.0, 0.0, 0.0, 0.0, 74.6], "audiomae_on_audioset": [[["speech", 27.54], ["livestock, farm animals, working animals", 17.88], ["moo", 6.6]], null, null, [["speech", 19.17], ["fart", 11.07], ["mosquito", 6.64]], null, [["music", 42.13], ["musical instrument", 12.75], ["didgeridoo", 10.69]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.94, 1.28, 0.37, 4.03, 0.8, 5.88, 1.04, 0.3, 4.57, 0.33, 4.78, 0.54, 0.32, 0.91, 0.74, 0.85, 6.89, 1.71, 0.77, 0.92, 0.99, 0.79, 3.97]} \ No newline at end of file diff --git a/annotations_filtered/tifUOGFTOBM_filtered.json b/annotations_filtered/tifUOGFTOBM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f466698b57d176c540a3496c691daf56c252bb74 --- /dev/null +++ b/annotations_filtered/tifUOGFTOBM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.91], [11.0, 16.38], [32.0, 32.54], [33.0, 37.59], [39.0, 39.39], [45.0, 45.6]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 58.05, 0.0, 55.39, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.91, 5.38, 0.54, 4.59, 0.39, 0.6]} \ No newline at end of file diff --git a/annotations_filtered/tippFPLwGgI_filtered.json b/annotations_filtered/tippFPLwGgI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e065be34cb65b9925f8cc302a74c619293dc0b2 --- /dev/null +++ b/annotations_filtered/tippFPLwGgI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 23.82], [44.0, 44.27], [47.0, 47.44], [52.0, 53.89], [59.0, 58.95], [66.0, 66.23]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.82, 0.27, 0.44, 1.89, -0.05, 0.23]} \ No newline at end of file diff --git a/annotations_filtered/tj3Trywp_zk_filtered.json b/annotations_filtered/tj3Trywp_zk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..07c3accb0fadb408fd9a2d96ba8a5fdbbd11aafc --- /dev/null +++ b/annotations_filtered/tj3Trywp_zk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.05], [14.0, 14.28], [18.0, 18.99], [21.0, 21.39], [27.0, 27.23], [28.0, 30.25], [31.0, 32.31], [39.0, 39.77], [43.0, 43.82], [51.0, 54.16], [63.0, 65.72], [67.0, 68.72], [70.0, 70.44], [72.0, 81.33], [84.0, 86.48], [89.0, 92.89], [96.0, 97.98], [100.0, 101.39], [104.0, 106.08], [109.0, 118.15], [122.0, 122.99], [127.0, 127.25], [130.0, 130.96], [132.0, 133.2], [136.0, 135.77], [138.0, 140.83], [148.0, 148.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 82.97, 0.0, 0.0, 0.0, 45.69, 93.13, 0.0, 0.0, 34.96, 80.64, 50.71, 0.0, 0.0, 46.86, 47.54, 0.0, 0.0, 0.0, 0.0, 0.0, 79.59, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 41.31], ["whale vocalization", 21.05], ["speech", 16.85]], null, null, null, [["music", 50.86], ["hum", 18.7], ["mains hum", 8.6]], null, null, null, null, [["music", 40.07], ["ambient music", 7.03], ["synthesizer", 6.55]], [["gong", 52.67], ["music", 13.48], ["singing bowl", 12.3]], null, null, null, null, null, null, null], "duration": [1.05, 0.28, 0.99, 0.39, 0.23, 2.25, 1.31, 0.77, 0.82, 3.16, 2.72, 1.72, 0.44, 9.33, 2.48, 3.89, 1.98, 1.39, 2.08, 9.15, 0.99, 0.25, 0.96, 1.2, -0.23, 2.83, 0.1]} \ No newline at end of file diff --git a/annotations_filtered/tjRYZON0o9w_filtered.json b/annotations_filtered/tjRYZON0o9w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d35fa09692d78fe4254769afe84314364a3518c6 --- /dev/null +++ b/annotations_filtered/tjRYZON0o9w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 16.33], [20.0, 20.07], [25.0, 24.75], [27.0, 29.19], [30.0, 34.15], [38.0, 41.12], [43.0, 45.23], [47.0, 49.03], [51.0, 55.51], [57.0, 61.92], [64.0, 72.54], [73.0, 74.07], [76.0, 100.99], [102.0, 101.83], [103.0, 106.25], [108.0, 118.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [53.84, 0.0, 0.0, 50.26, 56.03, 57.89, 55.39, 54.9, 72.46, 88.28, 78.21, 0.0, 49.87, 0.0, 64.86, 34.74], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 31.01], ["sidetone", 29.38], ["rumble", 9.28]], null, null, [["music", 26.9], ["cacophony", 15.21], ["buzz", 8.13]]], "duration": [4.33, 0.07, -0.25, 2.19, 4.15, 3.12, 2.23, 2.03, 4.51, 4.92, 8.54, 1.07, 24.99, -0.17, 3.25, 10.25]} \ No newline at end of file diff --git a/annotations_filtered/tjsQP94DIfM_filtered.json b/annotations_filtered/tjsQP94DIfM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8be3ffc28c63ba34abdc4de18aab33bfe37fb37d --- /dev/null +++ b/annotations_filtered/tjsQP94DIfM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.3], [5.0, 5.48], [8.0, 14.08], [15.0, 16.8], [17.0, 17.73], [21.0, 21.96], [23.0, 23.26], [25.0, 27.43], [33.0, 33.44], [36.0, 37.4], [38.0, 38.58], [40.0, 41.12], [42.0, 43.24], [44.0, 45.42], [52.0, 52.24], [52.0, 53.82], [57.0, 57.4], [58.0, 59.0], [60.0, 60.52], [61.0, 61.1], [67.0, 66.58], [67.0, 68.25], [83.0, 89.9], [92.0, 94.09], [95.0, 96.52], [98.0, 98.81], [102.0, 103.64], [104.0, 105.9], [106.0, 107.18], [108.0, 108.41], [109.0, 110.08], [112.0, 113.53], [114.0, 114.88], [116.0, 117.07], [120.0, 120.82], [125.0, 125.95], [130.0, 134.45], [136.0, 137.46], [138.0, 145.18], [146.0, 148.51]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 44.6, 0.0, 0.0, 0.0, 0.0, 82.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.2, 85.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.55, 0.0, 49.64, 31.44], "audiomae_on_audioset": [null, null, [["speech", 47.97], ["electric shaver, electric razor", 7.92], ["telephone", 6.97]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["electric shaver, electric razor", 30.83], ["hum", 16.18], ["speech", 15.84]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 17.62], ["mains hum", 10.04], ["thunk", 7.29]], [["cattle, bovinae", 15.72], ["moo", 13.82], ["animal", 11.4]]], "duration": [0.3, 0.48, 6.08, 1.8, 0.73, 0.96, 0.26, 2.43, 0.44, 1.4, 0.58, 1.12, 1.24, 1.42, 0.24, 1.82, 0.4, 1.0, 0.52, 0.1, -0.42, 1.25, 6.9, 2.09, 1.52, 0.81, 1.64, 1.9, 1.18, 0.41, 1.08, 1.53, 0.88, 1.07, 0.82, 0.95, 4.45, 1.46, 7.18, 2.51]} \ No newline at end of file diff --git a/annotations_filtered/tk2vET4aFW8_filtered.json b/annotations_filtered/tk2vET4aFW8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6cd2ae964f777ae74914e185f90c5ec4ad6dabe9 --- /dev/null +++ b/annotations_filtered/tk2vET4aFW8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 49.27], [50.0, 50.97], [53.0, 53.92], [55.0, 58.33], [59.0, 59.86], [61.0, 62.51], [66.0, 67.91], [70.0, 70.58], [74.0, 74.78], [77.0, 78.34], [83.0, 83.44], [85.0, 89.6], [90.0, 91.91]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [39.12, 0.0, 0.0, 39.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.99, 0.0], "audiomae_on_audioset": [[["music", 42.78], ["guitar", 11.37], ["speech", 10.56]], null, null, [["music", 66.03], ["musical instrument", 7.12], ["guitar", 6.6]], null, null, null, null, null, null, null, null, null], "duration": [13.27, 0.97, 0.92, 3.33, 0.86, 1.51, 1.91, 0.58, 0.78, 1.34, 0.44, 4.6, 1.91]} \ No newline at end of file diff --git a/annotations_filtered/tkDK_YLfTO0_filtered.json b/annotations_filtered/tkDK_YLfTO0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a6ab601c0f86bc4ea1868b358ca86a2f3437c1f1 --- /dev/null +++ b/annotations_filtered/tkDK_YLfTO0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 18.74], [22.0, 26.96], [30.0, 32.85], [37.0, 46.68], [48.0, 48.47], [56.0, 56.98], [68.0, 68.98], [70.0, 70.93], [71.0, 72.08], [73.0, 73.06], [75.0, 75.88], [79.0, 79.51], [81.0, 81.35], [83.0, 83.49], [92.0, 94.69], [101.0, 101.85], [102.0, 102.88], [104.0, 104.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [89.54, 52.86, 78.38, 74.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.15, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 58.73], ["noise", 8.22], ["radio", 4.84]], null, null, null], "duration": [2.74, 4.96, 2.85, 9.68, 0.47, 0.98, 0.98, 0.93, 1.08, 0.06, 0.88, 0.51, 0.35, 0.49, 2.69, 0.85, 0.88, 0.06]} \ No newline at end of file diff --git a/annotations_filtered/tkN8fCU-rzU_filtered.json b/annotations_filtered/tkN8fCU-rzU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0ffce97daadb195210f2832b316e820005518b45 --- /dev/null +++ b/annotations_filtered/tkN8fCU-rzU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.11], [5.0, 6.29], [10.0, 11.62], [13.0, 14.37], [17.0, 17.52], [23.0, 24.21], [28.0, 31.35], [32.0, 34.16], [37.0, 38.33], [38.0, 43.34], [47.0, 55.59], [56.0, 56.67], [58.0, 58.94], [61.0, 60.86], [62.0, 63.56], [65.0, 68.52], [73.0, 73.77], [77.0, 76.84], [79.0, 81.06], [85.0, 84.94], [92.0, 98.07], [99.0, 99.13], [100.0, 100.43], [103.0, 103.5], [106.0, 109.7], [110.0, 111.3]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.89, 37.41, 0.0, 45.82, 35.7, 0.0, 0.0, 0.0, 0.0, 69.2, 0.0, 0.0, 66.76, 0.0, 40.14, 0.0, 0.0, 0.0, 57.17, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 39.87], ["buzzer", 17.25], ["fire alarm", 5.13]], [["buzzer", 37.57], ["fire alarm", 11.07], ["speech", 10.25]], null, [["speech", 31.79], ["hum", 30.84], ["mains hum", 11.04]], [["speech", 73.65], ["knock", 7.23], ["music", 4.8]], null, null, null, null, null, null, null, null, null, [["speech", 38.43], ["sidetone", 14.29], ["sine wave", 8.54]], null, null, null, null, null], "duration": [1.11, 1.29, 1.62, 1.37, 0.52, 1.21, 3.35, 2.16, 1.33, 5.34, 8.59, 0.67, 0.94, -0.14, 1.56, 3.52, 0.77, -0.16, 2.06, -0.06, 6.07, 0.13, 0.43, 0.5, 3.7, 1.3]} \ No newline at end of file diff --git a/annotations_filtered/tkRvLFdrbTU_filtered.json b/annotations_filtered/tkRvLFdrbTU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de87c2b78c7bf857f96f47a0d678f1095b0954e9 --- /dev/null +++ b/annotations_filtered/tkRvLFdrbTU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 38.21], [46.0, 47.38], [57.0, 57.97], [60.0, 60.86], [62.0, 63.96], [68.0, 68.3], [69.0, 72.82]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [30.85, 0.0, 0.0, 0.0, 0.0, 0.0, 99.96], "audiomae_on_audioset": [[["music", 44.38], ["speech", 14.69], ["sidetone", 13.82]], null, null, null, null, null, null], "duration": [5.21, 1.38, 0.97, 0.86, 1.96, 0.3, 3.82]} \ No newline at end of file diff --git a/annotations_filtered/tkWWtYRbnq8_filtered.json b/annotations_filtered/tkWWtYRbnq8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..308c5a18d34e7b4033df4f7faae59347026ab95e --- /dev/null +++ b/annotations_filtered/tkWWtYRbnq8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.85], [17.0, 22.03], [23.0, 28.46], [31.0, 31.31], [44.0, 43.92], [48.0, 49.91], [53.0, 54.5], [56.0, 56.66], [59.0, 59.05], [61.0, 62.95], [64.0, 68.08], [70.0, 83.96], [88.0, 101.92], [106.0, 114.15], [124.0, 142.97], [145.0, 147.99], [148.0, 148.31], [152.0, 155.28]], "keep_status": [false, true, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 42.6, 88.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.43, 43.13, 37.46, 42.02, 33.93, 88.1, 0.0, 63.74], "audiomae_on_audioset": [null, [["speech", 37.67], ["whale vocalization", 14.11], ["music", 13.21]], null, null, null, null, null, null, null, null, [["music", 33.6], ["harp", 18.78], ["speech", 6.88]], [["music", 50.93], ["quack", 21.67], ["duck", 3.75]], [["music", 61.77], ["synthesizer", 6.27], ["speech", 5.27]], [["music", 30.33], ["mains hum", 16.93], ["hum", 13.83]], [["music", 33.07], ["cattle, bovinae", 26.1], ["moo", 19.25]], null, null, null], "duration": [1.85, 5.03, 5.46, 0.31, -0.08, 1.91, 1.5, 0.66, 0.05, 1.95, 4.08, 13.96, 13.92, 8.15, 18.97, 2.99, 0.31, 3.28]} \ No newline at end of file diff --git a/annotations_filtered/tkj3klWMn5E_filtered.json b/annotations_filtered/tkj3klWMn5E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..961a2e06d4668943dc4082ce9335c7b427c1379f --- /dev/null +++ b/annotations_filtered/tkj3klWMn5E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[89.0, 89.8], [90.0, 92.47], [107.0, 108.45], [117.0, 117.83], [118.0, 118.49], [119.0, 119.92], [121.0, 121.42]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 87.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [0.8, 2.47, 1.45, 0.83, 0.49, 0.92, 0.42]} \ No newline at end of file diff --git a/annotations_filtered/tktoOXBmflI_filtered.json b/annotations_filtered/tktoOXBmflI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba2cdf43ecc73f8c4190c0625bd81d9421eb0824 --- /dev/null +++ b/annotations_filtered/tktoOXBmflI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 12.83], [14.0, 23.06], [24.0, 24.66], [25.0, 27.28], [28.0, 31.41], [32.0, 37.66], [38.0, 52.35], [54.0, 59.73], [61.0, 62.23], [63.0, 63.96], [66.0, 70.61], [73.0, 73.72], [76.0, 76.49], [77.0, 78.31], [82.0, 85.65], [87.0, 96.3], [97.0, 109.17], [110.0, 110.15], [110.0, 111.45], [115.0, 123.67], [128.0, 128.85], [133.0, 135.21], [137.0, 138.01]], "keep_status": [false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [96.89, 70.44, 0.0, 51.66, 49.18, 76.37, 81.17, 99.21, 0.0, 0.0, 31.85, 0.0, 0.0, 0.0, 59.96, 33.82, 53.97, 0.0, 0.0, 79.24, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["boing", 42.32], ["noise", 12.8], ["speech", 8.53]], null, null, null, null, null, [["speech", 60.55], ["echo", 3.77], ["boing", 3.08]], null, null, null, null, [["music", 42.48], ["synthesizer", 8.48], ["musical instrument", 4.6]], null, null, null, null, null, null, null], "duration": [5.83, 9.06, 0.66, 2.28, 3.41, 5.66, 14.35, 5.73, 1.23, 0.96, 4.61, 0.72, 0.49, 1.31, 3.65, 9.3, 12.17, 0.15, 1.45, 8.67, 0.85, 2.21, 1.01]} \ No newline at end of file diff --git a/annotations_filtered/tlE5yK4l34o_filtered.json b/annotations_filtered/tlE5yK4l34o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..61bc709243be633de44aa75df96bb8ec0e26dcb3 --- /dev/null +++ b/annotations_filtered/tlE5yK4l34o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 15.25], [19.0, 21.44], [23.0, 30.75], [33.0, 40.27], [41.0, 41.22], [41.0, 41.27], [41.0, 41.32], [41.0, 43.53], [44.0, 45.3], [46.0, 46.68], [48.0, 51.95]], "keep_status": [false, false, true, true, false, false, false, true, false, false, true], "silence_prob": [34.5, 71.0, 31.35, 35.54, 0.0, 0.0, 0.0, 38.25, 0.0, 0.0, 41.14], "audiomae_on_audioset": [[["crowd", 46.75], ["cheering", 22.63], ["music", 4.6]], null, [["vehicle", 24.63], ["livestock, farm animals, working animals", 12.78], ["sound effect", 6.85]], [["grunt", 30.09], ["whale vocalization", 10.01], ["animal", 6.84]], null, null, null, [["insect", 24.86], ["fly, housefly", 22.16], ["mosquito", 10.19]], null, null, [["burping, eructation", 20.47], ["grunt", 16.87], ["groan", 16.72]]], "duration": [10.25, 2.44, 7.75, 7.27, 0.22, 0.27, 0.32, 2.53, 1.3, 0.68, 3.95]} \ No newline at end of file diff --git a/annotations_filtered/tlI--ATerwo_filtered.json b/annotations_filtered/tlI--ATerwo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fd8a6c5b7ff8289e24f9c8197b9819aa82f72d70 --- /dev/null +++ b/annotations_filtered/tlI--ATerwo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.3], [12.0, 13.27], [14.0, 14.89], [16.0, 16.01], [17.0, 17.17], [22.0, 22.52], [26.0, 26.25], [27.0, 27.7], [29.0, 29.2], [38.0, 38.74], [39.0, 42.03], [43.0, 43.34], [48.0, 47.78], [49.0, 53.97], [56.0, 57.21], [58.0, 58.35], [59.0, 59.81], [61.0, 61.3], [68.0, 68.84], [70.0, 71.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.76, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.3, 1.27, 0.89, 0.01, 0.17, 0.52, 0.25, 0.7, 0.2, 0.74, 3.03, 0.34, -0.22, 4.97, 1.21, 0.35, 0.81, 0.3, 0.84, 1.02]} \ No newline at end of file diff --git a/annotations_filtered/tlJM0tgXu5Q_filtered.json b/annotations_filtered/tlJM0tgXu5Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5516980b7f4325da16b6306e719896f7e68fec59 --- /dev/null +++ b/annotations_filtered/tlJM0tgXu5Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.76], [3.0, 112.41]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [0.76, 109.41]} \ No newline at end of file diff --git a/annotations_filtered/tlLSqeVA_no_filtered.json b/annotations_filtered/tlLSqeVA_no_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7318273d8cd0a91287e9724359dc28ca9479a076 --- /dev/null +++ b/annotations_filtered/tlLSqeVA_no_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.26], [21.0, 21.2], [22.0, 22.82], [34.0, 34.26], [35.0, 45.33], [47.0, 51.33], [53.0, 54.57], [57.0, 57.54], [60.0, 66.77], [69.0, 89.73], [90.0, 90.49], [106.0, 106.47], [107.0, 108.46], [112.0, 112.95], [120.0, 120.51], [123.0, 124.16], [128.0, 128.22], [131.0, 135.95]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 39.27, 100.0, 0.0, 0.0, 32.27, 31.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.89], "audiomae_on_audioset": [null, null, null, null, [["crow", 29.48], ["animal", 20.93], ["caw", 14.87]], null, null, null, [["speech", 62.73], ["quack", 6.48], ["duck", 4.72]], [["cattle, bovinae", 40.42], ["livestock, farm animals, working animals", 25.43], ["moo", 14.12]], null, null, null, null, null, null, null, null], "duration": [1.26, 0.2, 0.82, 0.26, 10.33, 4.33, 1.57, 0.54, 6.77, 20.73, 0.49, 0.47, 1.46, 0.95, 0.51, 1.16, 0.22, 4.95]} \ No newline at end of file diff --git a/annotations_filtered/tlNLhuxeDJQ_filtered.json b/annotations_filtered/tlNLhuxeDJQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9034d7956f59451e2d11529e8dd1bb2cf77d373 --- /dev/null +++ b/annotations_filtered/tlNLhuxeDJQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 8.95], [21.0, 21.2], [40.0, 40.04], [55.0, 55.41], [62.0, 62.11], [66.0, 66.9], [70.0, 95.32], [96.0, 96.2], [100.0, 101.04], [102.0, 111.27], [115.0, 118.66]], "keep_status": [false, false, false, false, false, false, true, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.72, 0.0, 0.0, 30.24, 45.85], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 57.84], ["ambient music", 4.39], ["electronic music", 3.63]], null, null, [["music", 33.63], ["gong", 13.65], ["didgeridoo", 10.57]], [["music", 43.11], ["theremin", 7.68], ["singing bowl", 5.87]]], "duration": [-0.05, 0.2, 0.04, 0.41, 0.11, 0.9, 25.32, 0.2, 1.04, 9.27, 3.66]} \ No newline at end of file diff --git a/annotations_filtered/tlSZa51g_rc_filtered.json b/annotations_filtered/tlSZa51g_rc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..86613507cab4c44b9c29e379075e6508d7c3250e --- /dev/null +++ b/annotations_filtered/tlSZa51g_rc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.8], [2.0, 3.81], [14.0, 17.71], [19.0, 21.84], [26.0, 26.47], [30.0, 30.57], [32.0, 34.57], [45.0, 44.88], [47.0, 47.41], [49.0, 50.09], [53.0, 53.03], [55.0, 55.29], [60.0, 60.3], [70.0, 75.61], [77.0, 79.34], [82.0, 81.97], [84.0, 84.57], [87.0, 88.13], [89.0, 90.91], [93.0, 93.72], [96.0, 96.99], [102.0, 119.33]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 44.49, 44.09, 0.0, 0.0, 76.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.57, 90.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.18], "audiomae_on_audioset": [null, null, [["music", 32.88], ["speech", 23.39], ["musical instrument", 6.88]], [["music", 69.89], ["musical instrument", 3.96], ["guitar", 2.83]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.2, 1.81, 3.71, 2.84, 0.47, 0.57, 2.57, -0.12, 0.41, 1.09, 0.03, 0.29, 0.3, 5.61, 2.34, -0.03, 0.57, 1.13, 1.91, 0.72, 0.99, 17.33]} \ No newline at end of file diff --git a/annotations_filtered/tlSscKeO9Cc_filtered.json b/annotations_filtered/tlSscKeO9Cc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb9130c7f3d95367cbe625953ca1c4dbfd30a16f --- /dev/null +++ b/annotations_filtered/tlSscKeO9Cc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 18.91], [26.0, 27.18], [28.0, 28.63], [29.0, 31.45], [33.0, 33.35], [35.0, 54.09], [56.0, 63.75], [68.0, 76.47], [78.0, 78.43], [80.0, 85.41], [86.0, 92.91], [97.0, 112.04], [114.0, 119.52], [124.0, 131.31], [138.0, 147.77]], "keep_status": [true, false, false, true, false, false, false, true, false, true, false, true, true, true, true], "silence_prob": [29.72, 0.0, 0.0, 31.8, 0.0, 28.73, 28.53, 28.55, 0.0, 29.22, 28.25, 28.37, 30.89, 29.14, 28.65], "audiomae_on_audioset": [[["speech", 36.22], ["aircraft", 11.23], ["vehicle", 9.18]], null, null, [["speech", 17.78], ["music", 17.2], ["mains hum", 4.87]], null, [["music", 72.79], ["synthesizer", 5.33], ["electronic music", 3.88]], [["music", 45.16], ["speech", 13.43], ["hum", 13.0]], [["vehicle", 23.56], ["music", 13.87], ["speech", 11.24]], null, [["vehicle", 29.97], ["speech", 10.6], ["car", 10.36]], [["motorcycle", 62.21], ["vehicle", 8.74], ["speech", 6.45]], [["vehicle", 38.21], ["car", 13.13], ["speech", 11.31]], [["music", 49.09], ["synthesizer", 13.11], ["speech", 5.93]], [["music", 32.66], ["throbbing", 18.22], ["hum", 13.03]], [["music", 32.53], ["speech", 24.53], ["outside, rural or natural", 5.82]]], "duration": [6.91, 1.18, 0.63, 2.45, 0.35, 19.09, 7.75, 8.47, 0.43, 5.41, 6.91, 15.04, 5.52, 7.31, 9.77]} \ No newline at end of file diff --git a/annotations_filtered/tm6qzug9AS8_filtered.json b/annotations_filtered/tm6qzug9AS8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9822a619e73d52b0533d4634833bbb20db85b833 --- /dev/null +++ b/annotations_filtered/tm6qzug9AS8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.38], [9.0, 9.91], [13.0, 13.81], [19.0, 19.99], [26.0, 27.19], [33.0, 33.61], [41.0, 41.74], [47.0, 47.33], [51.0, 53.45], [56.0, 56.37], [61.0, 62.95], [84.0, 86.66], [131.0, 134.03], [139.0, 140.0], [144.0, 145.47], [151.0, 152.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.99, 0.0, 0.0, 38.0, 56.7, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 54.4], ["speech", 5.83], ["trombone", 3.49]], null, null, null, null], "duration": [0.38, 0.91, 0.81, 0.99, 1.19, 0.61, 0.74, 0.33, 2.45, 0.37, 1.95, 2.66, 3.03, 1.0, 1.47, 1.46]} \ No newline at end of file diff --git a/annotations_filtered/tmUleIek9Fc_filtered.json b/annotations_filtered/tmUleIek9Fc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f66384053978ff86a3b8d3a4dafb499f3736e969 --- /dev/null +++ b/annotations_filtered/tmUleIek9Fc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.84], [17.0, 17.47], [18.0, 39.41], [41.0, 41.86], [42.0, 46.21], [48.0, 49.71], [51.0, 51.61], [55.0, 61.72], [64.0, 74.38], [77.0, 77.19], [81.0, 81.65], [85.0, 86.27], [87.0, 88.67], [91.0, 93.5], [94.0, 98.05], [98.0, 99.66], [100.0, 102.66], [104.0, 106.64], [107.0, 107.54], [108.0, 110.15], [111.0, 112.9], [114.0, 115.25], [116.0, 119.35], [120.0, 123.97], [127.0, 129.76], [130.0, 133.81], [135.0, 137.66], [138.0, 140.54], [141.0, 146.77], [147.0, 149.67]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 42.0, 0.0, 53.22, 0.0, 0.0, 63.1, 70.44, 0.0, 0.0, 0.0, 0.0, 99.26, 82.79, 0.0, 98.86, 100.0, 0.0, 93.91, 0.0, 0.0, 96.17, 77.53, 99.85, 61.97, 98.8, 48.14, 91.13, 80.46], "audiomae_on_audioset": [null, null, [["music", 18.13], ["animal", 13.93], ["hum", 9.31]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 23.05], ["music", 22.09], ["hum", 17.41]], null, null], "duration": [0.84, 0.47, 21.41, 0.86, 4.21, 1.71, 0.61, 6.72, 10.38, 0.19, 0.65, 1.27, 1.67, 2.5, 4.05, 1.66, 2.66, 2.64, 0.54, 2.15, 1.9, 1.25, 3.35, 3.97, 2.76, 3.81, 2.66, 2.54, 5.77, 2.67]} \ No newline at end of file diff --git a/annotations_filtered/tmZiGfLVs8w_filtered.json b/annotations_filtered/tmZiGfLVs8w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4df59c2bccb51e4b97ebebdd9e558e925da86b93 --- /dev/null +++ b/annotations_filtered/tmZiGfLVs8w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 17.46], [19.0, 19.6], [21.0, 21.64], [23.0, 29.51], [31.0, 31.58], [32.0, 32.71], [34.0, 35.46], [36.0, 40.59], [42.0, 42.25], [43.0, 43.33], [46.0, 50.45], [54.0, 55.32], [57.0, 57.42], [60.0, 60.62], [61.0, 60.66], [66.0, 65.82], [68.0, 69.16], [71.0, 72.1], [73.0, 73.26], [75.0, 93.38], [95.0, 95.15], [98.0, 98.79], [104.0, 104.63], [106.0, 107.11], [108.0, 109.59], [111.0, 111.2], [112.0, 112.73], [113.0, 117.26]], "keep_status": [true, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [43.25, 0.0, 0.0, 39.67, 0.0, 0.0, 0.0, 42.33, 0.0, 0.0, 48.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.98], "audiomae_on_audioset": [[["music", 38.36], ["ambient music", 16.72], ["whale vocalization", 7.43]], null, null, [["hum", 36.0], ["music", 29.88], ["mains hum", 17.67]], null, null, null, [["speech", 34.92], ["music", 23.64], ["whale vocalization", 8.61]], null, null, [["music", 41.83], ["whale vocalization", 13.54], ["electronic music", 9.39]], null, null, null, null, null, null, null, null, [["music", 53.05], ["scary music", 13.39], ["single-lens reflex camera", 5.24]], null, null, null, null, null, null, null, [["music", 75.07], ["theremin", 3.41], ["synthesizer", 2.67]]], "duration": [4.46, 0.6, 0.64, 6.51, 0.58, 0.71, 1.46, 4.59, 0.25, 0.33, 4.45, 1.32, 0.42, 0.62, -0.34, -0.18, 1.16, 1.1, 0.26, 18.38, 0.15, 0.79, 0.63, 1.11, 1.59, 0.2, 0.73, 4.26]} \ No newline at end of file diff --git a/annotations_filtered/tm_W36kWahM_filtered.json b/annotations_filtered/tm_W36kWahM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84f938de9916d744c6b94c1287ddaf08b855370b --- /dev/null +++ b/annotations_filtered/tm_W36kWahM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 15.6], [16.0, 15.65], [17.0, 17.39], [19.0, 19.57], [33.0, 33.79], [34.0, 38.47], [40.0, 40.81], [41.0, 42.01], [43.0, 44.39], [47.0, 48.66], [51.0, 52.25], [54.0, 54.5], [58.0, 58.51], [60.0, 59.8], [63.0, 67.19], [68.0, 69.65], [76.0, 76.87], [77.0, 80.06], [81.0, 82.39], [87.0, 100.7], [102.0, 102.56], [104.0, 107.2], [109.0, 116.04], [118.0, 120.93], [122.0, 137.17], [138.0, 150.23], [152.0, 154.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [37.2, 0.0, 0.0, 0.0, 0.0, 55.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.36, 0.0, 0.0, 48.31, 0.0, 99.99, 0.0, 49.36, 97.11, 82.25, 99.16, 66.27, 99.96], "audiomae_on_audioset": [[["speech", 54.1], ["sidetone", 12.59], ["hum", 8.05]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 43.73], ["music", 9.99], ["chirp tone", 9.32]], null, null, null, [["speech", 61.64], ["singing bowl", 13.46], ["music", 4.59]], null, null, null, null, null], "duration": [3.6, -0.35, 0.39, 0.57, 0.79, 4.47, 0.81, 1.01, 1.39, 1.66, 1.25, 0.5, 0.51, -0.2, 4.19, 1.65, 0.87, 3.06, 1.39, 13.7, 0.56, 3.2, 7.04, 2.93, 15.17, 12.23, 2.92]} \ No newline at end of file diff --git a/annotations_filtered/tmwSUyoEItk_filtered.json b/annotations_filtered/tmwSUyoEItk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e970ff2198afb7d014300e97d07f3215e87ede32 --- /dev/null +++ b/annotations_filtered/tmwSUyoEItk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.62], [22.0, 33.67], [34.0, 38.25], [38.0, 51.11], [53.0, 53.59], [61.0, 61.92], [72.0, 72.27]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 45.08, 50.51, 34.12, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 75.88], ["ambient music", 3.15], ["synthesizer", 2.91]], null, [["speech", 51.3], ["music", 15.27], ["outside, rural or natural", 5.21]], null, null, null], "duration": [0.62, 11.67, 4.25, 13.11, 0.59, 0.92, 0.27]} \ No newline at end of file diff --git a/annotations_filtered/tnhW2iYL25k_filtered.json b/annotations_filtered/tnhW2iYL25k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ab1a53ee5e64a01de7f9650f7941bde2264d7be7 --- /dev/null +++ b/annotations_filtered/tnhW2iYL25k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.94], [5.0, 10.39], [15.0, 15.6], [16.0, 35.48], [42.0, 48.14]], "keep_status": [false, false, false, false, true], "silence_prob": [0.0, 42.26, 0.0, 35.52, 32.42], "audiomae_on_audioset": [null, [["hum", 42.14], ["mains hum", 33.5], ["music", 6.56]], null, [["speech", 52.08], ["music", 11.05], ["rumble", 10.2]], [["throbbing", 25.36], ["hum", 23.66], ["music", 19.66]]], "duration": [0.94, 5.39, 0.6, 19.48, 6.14]} \ No newline at end of file diff --git a/annotations_filtered/toAOUXtlXXc_filtered.json b/annotations_filtered/toAOUXtlXXc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f3038a9dde4291ec752028d872fd3aa8fda94c3 --- /dev/null +++ b/annotations_filtered/toAOUXtlXXc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[118.0, 118.29], [120.0, 131.52]], "keep_status": [false, false], "silence_prob": [0.0, 63.31], "audiomae_on_audioset": [null, null], "duration": [0.29, 11.52]} \ No newline at end of file diff --git a/annotations_filtered/toctHJpW6no_filtered.json b/annotations_filtered/toctHJpW6no_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd931ef681047bfb4e6ab5425d620ca3120d3448 --- /dev/null +++ b/annotations_filtered/toctHJpW6no_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.83], [8.0, 12.92], [15.0, 17.34], [26.0, 26.69], [31.0, 32.37], [34.0, 35.24], [36.0, 37.02], [38.0, 38.97], [41.0, 44.95], [46.0, 46.18], [51.0, 53.16], [61.0, 62.28], [63.0, 63.9], [65.0, 67.58], [68.0, 70.29], [75.0, 75.81], [77.0, 77.58], [78.0, 79.73], [81.0, 82.46], [83.0, 84.54], [87.0, 88.67], [90.0, 91.69], [99.0, 100.08], [101.0, 107.81], [109.0, 110.13], [111.0, 118.2], [119.0, 120.21], [123.0, 125.46], [126.0, 128.09], [129.0, 137.91], [145.0, 163.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [89.19, 79.24, 55.31, 0.0, 0.0, 0.0, 0.0, 0.0, 50.46, 0.0, 45.46, 0.0, 0.0, 88.46, 69.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.65, 0.0, 93.76, 0.0, 95.64, 99.16, 84.25, 55.25], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["sidetone", 33.33], ["whale vocalization", 7.48], ["music", 7.26]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.83, 4.92, 2.34, 0.69, 1.37, 1.24, 1.02, 0.97, 3.95, 0.18, 2.16, 1.28, 0.9, 2.58, 2.29, 0.81, 0.58, 1.73, 1.46, 1.54, 1.67, 1.69, 1.08, 6.81, 1.13, 7.2, 1.21, 2.46, 2.09, 8.91, 18.17]} \ No newline at end of file diff --git a/annotations_filtered/toq0HYc9mmg_filtered.json b/annotations_filtered/toq0HYc9mmg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8feba2a76fb5d581d6e32cfb322f73069b785d4b --- /dev/null +++ b/annotations_filtered/toq0HYc9mmg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.88], [7.0, 8.31], [10.0, 22.55], [23.0, 24.17], [26.0, 26.11], [26.0, 26.65], [27.0, 27.06], [32.0, 32.9], [40.0, 42.08], [46.0, 47.04]], "keep_status": [false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 29.36, 0.0, 0.0, 0.0, 0.0, 0.0, 36.63, 0.0], "audiomae_on_audioset": [null, null, [["music", 59.11], ["cattle, bovinae", 4.85], ["speech", 4.55]], null, null, null, null, null, [["music", 75.32], ["musical instrument", 3.91], ["guitar", 3.09]], null], "duration": [1.88, 1.31, 12.55, 1.17, 0.11, 0.65, 0.06, 0.9, 2.08, 1.04]} \ No newline at end of file diff --git a/annotations_filtered/tp1eVLXEXm8_filtered.json b/annotations_filtered/tp1eVLXEXm8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9eac2edfc5c1619693e0d9339cee79b7016c6d5f --- /dev/null +++ b/annotations_filtered/tp1eVLXEXm8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.61], [14.0, 20.92], [21.0, 26.89], [34.0, 52.52], [56.0, 59.37], [62.0, 62.99], [71.0, 72.62], [81.0, 95.05], [111.0, 116.9], [119.0, 122.77], [124.0, 128.46], [131.0, 131.89], [133.0, 135.04], [136.0, 138.47], [139.0, 138.54], [140.0, 147.16]], "keep_status": [false, true, true, false, false, false, false, false, true, true, false, false, false, false, false, true], "silence_prob": [0.0, 37.01, 36.61, 33.24, 36.69, 0.0, 0.0, 32.41, 31.82, 36.99, 57.72, 0.0, 35.48, 34.14, 0.0, 31.65], "audiomae_on_audioset": [null, [["music", 25.68], ["boing", 21.45], ["speech", 18.34]], [["music", 42.67], ["speech", 15.3], ["animal", 4.12]], [["music", 61.94], ["theremin", 16.68], ["speech", 4.14]], [["music", 48.54], ["guitar", 19.03], ["musical instrument", 8.47]], null, null, [["music", 60.04], ["boing", 7.09], ["speech", 5.96]], [["boing", 28.46], ["music", 19.82], ["speech", 13.86]], [["boing", 23.73], ["music", 12.46], ["speech", 11.2]], null, null, [["whale vocalization", 48.77], ["music", 17.06], ["speech", 7.27]], [["fly, housefly", 49.71], ["mosquito", 23.65], ["insect", 18.67]], null, [["music", 38.48], ["speech", 5.21], ["hum", 4.44]]], "duration": [0.61, 6.92, 5.89, 18.52, 3.37, 0.99, 1.62, 14.05, 5.9, 3.77, 4.46, 0.89, 2.04, 2.47, -0.46, 7.16]} \ No newline at end of file diff --git a/annotations_filtered/tp7ss_bTP4Y_filtered.json b/annotations_filtered/tp7ss_bTP4Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b6087384a71d54aa84870c0c423913ce23c70d16 --- /dev/null +++ b/annotations_filtered/tp7ss_bTP4Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.51], [40.0, 42.8], [48.0, 74.28], [75.0, 81.21], [82.0, 83.52], [84.0, 84.75], [90.0, 91.3], [96.0, 97.43], [100.0, 101.98], [104.0, 104.95], [108.0, 108.62], [113.0, 115.37]], "keep_status": [false, true, true, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 38.11, 35.08, 44.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.27], "audiomae_on_audioset": [null, [["speech", 41.56], ["hum", 10.63], ["throbbing", 8.71]], [["music", 31.92], ["throbbing", 17.56], ["hum", 14.03]], [["thunk", 12.97], ["music", 10.79], ["noise", 9.43]], null, null, null, null, null, null, null, null], "duration": [0.51, 2.8, 26.28, 6.21, 1.52, 0.75, 1.3, 1.43, 1.98, 0.95, 0.62, 2.37]} \ No newline at end of file diff --git a/annotations_filtered/tpfOhYRYv80_filtered.json b/annotations_filtered/tpfOhYRYv80_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d264c2a5db61778e5af4c2ffebc5be1e6fc5db82 --- /dev/null +++ b/annotations_filtered/tpfOhYRYv80_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.78], [22.0, 22.13], [23.0, 24.14], [25.0, 25.35], [27.0, 27.8], [29.0, 29.24], [33.0, 33.98], [36.0, 36.68], [37.0, 37.91], [40.0, 41.42], [43.0, 44.96], [45.0, 46.7], [49.0, 50.13], [53.0, 53.23], [62.0, 62.06], [64.0, 64.45], [65.0, 85.23], [88.0, 93.29], [99.0, 99.52], [100.0, 100.87], [104.0, 106.05], [108.0, 108.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.92, 49.45, 0.0, 0.0, 88.1, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 58.11], ["music", 7.89], ["mains hum", 7.67]], [["speech", 22.04], ["fart", 11.23], ["hum", 5.78]], null, null, null, null], "duration": [0.78, 0.13, 1.14, 0.35, 0.8, 0.24, 0.98, 0.68, 0.91, 1.42, 1.96, 1.7, 1.13, 0.23, 0.06, 0.45, 20.23, 5.29, 0.52, 0.87, 2.05, 0.67]} \ No newline at end of file diff --git a/annotations_filtered/tpkTStVMv_Q_filtered.json b/annotations_filtered/tpkTStVMv_Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bed78f3109a48fe794ec80c07bacd76f2a9f72ed --- /dev/null +++ b/annotations_filtered/tpkTStVMv_Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.42], [10.0, 16.12], [17.0, 18.76], [23.0, 24.12], [33.0, 37.57], [40.0, 45.5], [48.0, 50.19], [52.0, 53.62], [55.0, 57.92], [60.0, 61.77], [66.0, 66.28], [66.0, 66.39], [67.0, 68.12], [70.0, 70.55], [75.0, 78.07], [80.0, 82.32], [83.0, 84.03], [90.0, 90.71], [93.0, 93.75], [95.0, 96.72], [97.0, 99.59], [100.0, 101.9], [105.0, 106.76], [108.0, 109.48], [111.0, 111.89], [113.0, 115.53], [116.0, 123.01], [124.0, 124.73], [126.0, 127.6], [128.0, 141.62], [145.0, 149.42], [150.0, 167.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.99, 0.0, 0.0, 99.78, 99.96, 99.98, 0.0, 99.82, 0.0, 0.0, 0.0, 0.0, 0.0, 99.71, 100.0, 0.0, 0.0, 0.0, 0.0, 99.05, 0.0, 0.0, 0.0, 0.0, 99.99, 99.94, 0.0, 0.0, 98.01, 98.73, 99.9], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.42, 6.12, 1.76, 1.12, 4.57, 5.5, 2.19, 1.62, 2.92, 1.77, 0.28, 0.39, 1.12, 0.55, 3.07, 2.32, 1.03, 0.71, 0.75, 1.72, 2.59, 1.9, 1.76, 1.48, 0.89, 2.53, 7.01, 0.73, 1.6, 13.62, 4.42, 17.22]} \ No newline at end of file diff --git a/annotations_filtered/tpsGUGc8Ri8_filtered.json b/annotations_filtered/tpsGUGc8Ri8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..152d5825cbf25b68de588ff88db5727a2933258b --- /dev/null +++ b/annotations_filtered/tpsGUGc8Ri8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 11.87], [17.0, 31.23], [35.0, 35.21], [39.0, 39.39], [40.0, 41.79], [45.0, 45.32], [45.0, 48.0], [58.0, 59.58], [60.0, 63.37], [64.0, 63.78], [64.0, 76.79], [79.0, 87.52], [88.0, 93.16], [94.0, 99.01], [101.0, 109.09], [109.0, 109.71], [112.0, 150.26], [159.0, 174.8]], "keep_status": [true, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [34.88, 31.3, 0.0, 0.0, 0.0, 0.0, 31.12, 0.0, 31.96, 0.0, 30.99, 29.54, 30.36, 29.52, 29.01, 0.0, 0.0, 29.58], "audiomae_on_audioset": [[["sidetone", 36.57], ["speech", 21.45], ["music", 11.88]], [["music", 71.03], ["throbbing", 6.27], ["hum", 5.55]], null, null, null, null, [["music", 51.38], ["speech", 7.04], ["electronic music", 5.05]], null, [["music", 26.7], ["speech", 14.37], ["sidetone", 10.66]], null, [["hum", 33.89], ["throbbing", 24.99], ["mains hum", 24.67]], [["music", 64.25], ["throbbing", 16.23], ["hum", 6.04]], [["music", 73.36], ["speech", 3.59], ["electronic music", 2.44]], [["music", 31.1], ["speech", 21.35], ["breaking", 19.06]], [["music", 70.67], ["speech", 14.8], ["throbbing", 4.18]], null, null, [["music", 61.83], ["hum", 12.24], ["throbbing", 10.77]]], "duration": [4.87, 14.23, 0.21, 0.39, 1.79, 0.32, 3.0, 1.58, 3.37, -0.22, 12.79, 8.52, 5.16, 5.01, 8.09, 0.71, 38.26, 15.8]} \ No newline at end of file diff --git a/annotations_filtered/tpyZHmGRPuE_filtered.json b/annotations_filtered/tpyZHmGRPuE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7fb85562f362f4a290e56210a887633ff1e00e78 --- /dev/null +++ b/annotations_filtered/tpyZHmGRPuE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 40.59], [42.0, 52.42], [53.0, 53.91], [55.0, 56.56], [58.0, 70.29], [71.0, 116.83]], "keep_status": [true, true, false, false, false, false], "silence_prob": [36.14, 38.21, 0.0, 0.0, 51.39, 0.0], "audiomae_on_audioset": [[["whale vocalization", 40.96], ["hum", 11.82], ["fart", 7.23]], [["hum", 23.41], ["throbbing", 13.86], ["speech", 13.13]], null, null, null, null], "duration": [2.59, 10.42, 0.91, 1.56, 12.29, 45.83]} \ No newline at end of file diff --git a/annotations_filtered/tqfFZYur4sM_filtered.json b/annotations_filtered/tqfFZYur4sM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6da2afea43ac31501b73786a4c0b616d0701a4aa --- /dev/null +++ b/annotations_filtered/tqfFZYur4sM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.12], [9.0, 9.83], [13.0, 25.44], [27.0, 39.66], [43.0, 43.75]], "keep_status": [false, false, false, true, false], "silence_prob": [0.0, 0.0, 31.02, 37.23, 0.0], "audiomae_on_audioset": [null, null, [["throbbing", 43.17], ["hum", 18.28], ["music", 16.6]], [["music", 41.51], ["throbbing", 8.15], ["electronic music", 7.24]], null], "duration": [0.12, 0.83, 12.44, 12.66, 0.75]} \ No newline at end of file diff --git a/annotations_filtered/tqmbgqyc1bc_filtered.json b/annotations_filtered/tqmbgqyc1bc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3522141ce643831fd9eb20414d764e26f6018920 --- /dev/null +++ b/annotations_filtered/tqmbgqyc1bc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 12.73], [14.0, 14.35], [15.0, 22.69], [28.0, 29.44], [33.0, 34.59], [46.0, 87.88], [95.0, 108.9], [112.0, 127.28], [133.0, 139.08], [142.0, 145.4], [147.0, 147.56], [149.0, 150.48], [151.0, 153.39], [154.0, 154.95], [156.0, 158.58], [159.0, 161.03], [162.0, 164.0], [166.0, 176.94]], "keep_status": [false, false, true, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [50.31, 0.0, 39.8, 0.0, 0.0, 0.0, 29.26, 29.73, 75.88, 41.91, 0.0, 0.0, 59.42, 0.0, 56.33, 57.4, 67.76, 52.1], "audiomae_on_audioset": [null, null, [["music", 32.57], ["speech", 21.39], ["throbbing", 9.28]], null, null, null, [["music", 72.57], ["throbbing", 3.51], ["electronic music", 2.23]], [["music", 46.88], ["mains hum", 7.11], ["speech", 4.65]], null, [["speech", 28.11], ["music", 16.35], ["fly, housefly", 8.77]], null, null, null, null, null, null, null, null], "duration": [5.73, 0.35, 7.69, 1.44, 1.59, 41.88, 13.9, 15.28, 6.08, 3.4, 0.56, 1.48, 2.39, 0.95, 2.58, 2.03, 2.0, 10.94]} \ No newline at end of file diff --git a/annotations_filtered/tqqSIT1D0vU_filtered.json b/annotations_filtered/tqqSIT1D0vU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..66209ea5fe1c4b9ed8b437004bb014cab6d670e2 --- /dev/null +++ b/annotations_filtered/tqqSIT1D0vU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.62], [1.0, 0.75], [1.0, 0.78], [1.0, 26.32], [30.0, 47.75], [50.0, 52.95], [58.0, 127.01], [130.0, 135.6], [139.0, 140.04]], "keep_status": [false, false, false, false, true, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 30.53, 30.2, 47.35, 0.0, 40.22, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 65.8], ["throbbing", 8.66], ["hum", 6.14]], [["music", 25.09], ["smash, crash", 12.5], ["throbbing", 7.82]], [["mains hum", 13.51], ["hum", 9.53], ["engine", 6.65]], null, [["music", 24.4], ["rumble", 13.21], ["hum", 9.95]], null], "duration": [0.62, -0.25, -0.22, 25.32, 17.75, 2.95, 69.01, 5.6, 1.04]} \ No newline at end of file diff --git a/annotations_filtered/tqtqEZqGg5A_filtered.json b/annotations_filtered/tqtqEZqGg5A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9e7cea8ba32d6bb1b90010d0f5898702dede047 --- /dev/null +++ b/annotations_filtered/tqtqEZqGg5A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.33], [3.0, 3.06], [4.0, 15.55], [17.0, 17.24], [21.0, 24.73], [30.0, 32.16], [35.0, 38.01], [38.0, 49.92], [51.0, 52.93], [55.0, 87.4], [88.0, 92.97], [96.0, 98.79], [99.0, 100.35], [105.0, 116.06]], "keep_status": [false, false, false, false, true, false, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 35.17, 0.0, 38.56, 46.29, 43.51, 42.91, 0.0, 0.0, 91.64, 98.19, 0.0, 48.23], "audiomae_on_audioset": [null, null, [["hum", 50.72], ["throbbing", 25.11], ["music", 9.34]], null, [["whack, thwack", 26.97], ["smash, crash", 22.07], ["music", 12.96]], [["music", 58.95], ["didgeridoo", 15.88], ["musical instrument", 7.05]], [["speech", 21.75], ["fly, housefly", 15.27], ["whale vocalization", 7.98]], [["throbbing", 41.1], ["speech", 19.45], ["music", 16.22]], null, null, null, null, null, [["speech", 18.26], ["sidetone", 18.12], ["fly, housefly", 17.98]]], "duration": [0.33, 0.06, 11.55, 0.24, 3.73, 2.16, 3.01, 11.92, 1.93, 32.4, 4.97, 2.79, 1.35, 11.06]} \ No newline at end of file diff --git a/annotations_filtered/tr2hYRUEkHk_filtered.json b/annotations_filtered/tr2hYRUEkHk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d56a3310a5d74e16e5e68abc351abc5101edb161 --- /dev/null +++ b/annotations_filtered/tr2hYRUEkHk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.87], [2.0, 3.82], [5.0, 5.39], [6.0, 8.6], [9.0, 9.15], [12.0, 12.83], [13.0, 13.2], [14.0, 13.85], [15.0, 20.55], [22.0, 23.03], [27.0, 27.41], [28.0, 29.44], [30.0, 30.64], [31.0, 45.6], [47.0, 49.82], [52.0, 57.13], [58.0, 59.46], [60.0, 65.52], [68.0, 70.53], [75.0, 78.27], [80.0, 81.31], [85.0, 85.4], [87.0, 87.45], [90.0, 102.68], [104.0, 109.22], [111.0, 115.77], [117.0, 121.81], [122.0, 123.85], [126.0, 131.95], [133.0, 133.64], [135.0, 135.62], [136.0, 141.15], [142.0, 149.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 98.59, 0.0, 0.0, 0.0, 0.0, 92.64, 0.0, 0.0, 0.0, 0.0, 99.78, 99.52, 99.99, 0.0, 99.87, 99.91, 100.0, 0.0, 0.0, 0.0, 99.52, 99.99, 100.0, 99.99, 0.0, 99.91, 0.0, 0.0, 99.31, 99.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.13, 1.82, 0.39, 2.6, 0.15, 0.83, 0.2, -0.15, 5.55, 1.03, 0.41, 1.44, 0.64, 14.6, 2.82, 5.13, 1.46, 5.52, 2.53, 3.27, 1.31, 0.4, 0.45, 12.68, 5.22, 4.77, 4.81, 1.85, 5.95, 0.64, 0.62, 5.15, 7.55]} \ No newline at end of file diff --git a/annotations_filtered/tr3ORGLT_W8_filtered.json b/annotations_filtered/tr3ORGLT_W8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a1315c5bcedfca7ffe57d819961127dbf824a85 --- /dev/null +++ b/annotations_filtered/tr3ORGLT_W8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.67], [14.0, 18.3], [23.0, 24.12], [26.0, 26.06], [27.0, 27.63], [29.0, 29.2], [30.0, 30.72], [36.0, 37.79], [43.0, 44.46], [52.0, 52.27], [54.0, 53.92], [55.0, 55.56], [57.0, 57.06], [60.0, 60.4], [61.0, 76.77], [79.0, 78.98], [79.0, 83.79], [90.0, 90.32], [95.0, 96.23], [98.0, 98.09], [102.0, 102.86], [107.0, 113.17], [113.0, 125.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.63, 0.0, 32.98, 0.0, 0.0, 0.0, 0.0, 33.51, 32.03], "audiomae_on_audioset": [null, [["music", 71.76], ["musical instrument", 3.93], ["didgeridoo", 1.67]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 86.77], ["musical instrument", 1.85], ["effects unit", 1.43]], null, [["music", 73.37], ["musical instrument", 3.72], ["didgeridoo", 2.12]], null, null, null, null, [["music", 62.2], ["didgeridoo", 14.38], ["musical instrument", 4.28]], [["music", 77.71], ["didgeridoo", 2.82], ["boing", 1.98]]], "duration": [0.67, 4.3, 1.12, 0.06, 0.63, 0.2, 0.72, 1.79, 1.46, 0.27, -0.08, 0.56, 0.06, 0.4, 15.77, -0.02, 4.79, 0.32, 1.23, 0.09, 0.86, 6.17, 12.49]} \ No newline at end of file diff --git a/annotations_filtered/tr4beSTsJ1E_filtered.json b/annotations_filtered/tr4beSTsJ1E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..25956faa05f066bc1ded40e8c9c7f1d4232e5539 --- /dev/null +++ b/annotations_filtered/tr4beSTsJ1E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[51.0, 74.76], [75.0, 79.07], [79.0, 79.17], [79.0, 98.51], [99.0, 100.09], [103.0, 109.34], [112.0, 120.45], [121.0, 123.28], [124.0, 163.58]], "keep_status": [true, true, false, true, false, true, false, false, false], "silence_prob": [30.78, 35.06, 0.0, 30.65, 0.0, 40.26, 63.53, 56.93, 0.0], "audiomae_on_audioset": [[["music", 19.85], ["beatboxing", 8.85], ["whack, thwack", 7.26]], [["speech", 14.4], ["music", 9.36], ["whale vocalization", 9.08]], null, [["speech", 22.23], ["music", 17.29], ["whack, thwack", 11.26]], null, [["music", 19.41], ["speech", 13.5], ["frog", 10.91]], null, null, null], "duration": [23.76, 4.07, 0.17, 19.51, 1.09, 6.34, 8.45, 2.28, 39.58]} \ No newline at end of file diff --git a/annotations_filtered/trGyimjcGRI_filtered.json b/annotations_filtered/trGyimjcGRI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f74a8b886fc9f8ae83ff09454a92cce49e7fa57a --- /dev/null +++ b/annotations_filtered/trGyimjcGRI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.9], [9.0, 10.59], [13.0, 13.41], [20.0, 21.0], [23.0, 23.33], [24.0, 26.01], [32.0, 32.12], [36.0, 36.19], [37.0, 37.93], [40.0, 40.2], [41.0, 42.04], [43.0, 43.97], [45.0, 45.96], [60.0, 61.15], [62.0, 64.37], [65.0, 72.86], [81.0, 82.17], [84.0, 86.43], [91.0, 93.66], [94.0, 94.96], [105.0, 105.73], [107.0, 108.6], [109.0, 110.84], [114.0, 115.74], [121.0, 120.75], [121.0, 122.59], [123.0, 124.29], [125.0, 126.74], [128.0, 129.79], [140.0, 140.27], [143.0, 151.31], [151.0, 151.68], [157.0, 158.14], [159.0, 162.45], [164.0, 166.01], [170.0, 171.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 64.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.37, 42.06, 0.0, 63.64, 89.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.29, 0.0, 0.0, 65.67, 76.2, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 35.24], ["throbbing", 31.76], ["mains hum", 10.58]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 80.53], ["sidetone", 4.2], ["hum", 1.39]], null, null, null, null, null], "duration": [1.9, 1.59, 0.41, 1.0, 0.33, 2.01, 0.12, 0.19, 0.93, 0.2, 1.04, 0.97, 0.96, 1.15, 2.37, 7.86, 1.17, 2.43, 2.66, 0.96, 0.73, 1.6, 1.84, 1.74, -0.25, 1.59, 1.29, 1.74, 1.79, 0.27, 8.31, 0.68, 1.14, 3.45, 2.01, 1.53]} \ No newline at end of file diff --git a/annotations_filtered/trLRP0-zvtU_filtered.json b/annotations_filtered/trLRP0-zvtU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1975f100d07fd397671d41e811b5207268b34604 --- /dev/null +++ b/annotations_filtered/trLRP0-zvtU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 21.37], [28.0, 29.73], [40.0, 46.67], [49.0, 53.32], [55.0, 57.18], [59.0, 60.08], [61.0, 61.77], [66.0, 69.01]], "keep_status": [false, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 34.9, 75.07, 98.51, 0.0, 0.0, 31.65], "audiomae_on_audioset": [null, null, [["hum", 24.74], ["speech", 23.36], ["throbbing", 10.08]], null, null, null, null, [["music", 19.3], ["noise", 12.64], ["synthesizer", 7.18]]], "duration": [1.37, 1.73, 6.67, 4.32, 2.18, 1.08, 0.77, 3.01]} \ No newline at end of file diff --git a/annotations_filtered/trPOKL7Nguo_filtered.json b/annotations_filtered/trPOKL7Nguo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..83abab88d168b306bf70b17f1f794cc67132d7cf --- /dev/null +++ b/annotations_filtered/trPOKL7Nguo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 77.6], [81.0, 96.35], [97.0, 121.88]], "keep_status": [false, true, true], "silence_prob": [0.0, 30.52, 31.75], "audiomae_on_audioset": [null, [["music", 23.47], ["speech", 10.18], ["electric shaver, electric razor", 6.81]], [["music", 23.82], ["whip", 10.8], ["speech", 6.79]]], "duration": [72.6, 15.35, 24.88]} \ No newline at end of file diff --git a/annotations_filtered/trgDVhZHIrc_filtered.json b/annotations_filtered/trgDVhZHIrc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..386816f0439b6183f514a0d900f240d9a7546823 --- /dev/null +++ b/annotations_filtered/trgDVhZHIrc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 12.88], [13.0, 16.9], [20.0, 21.74], [25.0, 25.76], [27.0, 28.38], [31.0, 34.48], [37.0, 38.16], [41.0, 41.2], [44.0, 44.79], [49.0, 50.7], [53.0, 54.28], [57.0, 66.02], [70.0, 72.12], [75.0, 99.59], [103.0, 108.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [98.01, 95.51, 0.0, 0.0, 0.0, 55.11, 0.0, 0.0, 0.0, 0.0, 0.0, 77.87, 35.68, 40.11, 96.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 60.27], ["chirp tone", 15.13], ["sine wave", 5.66]], [["speech", 31.78], ["sidetone", 12.67], ["hum", 8.81]], null], "duration": [3.88, 3.9, 1.74, 0.76, 1.38, 3.48, 1.16, 0.2, 0.79, 1.7, 1.28, 9.02, 2.12, 24.59, 5.23]} \ No newline at end of file diff --git a/annotations_filtered/tru0WMH7yic_filtered.json b/annotations_filtered/tru0WMH7yic_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..16a4e7a27159863fd94f9786cd4b1c45ca03d5bd --- /dev/null +++ b/annotations_filtered/tru0WMH7yic_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.44], [13.0, 14.69], [20.0, 20.55], [23.0, 24.98], [26.0, 26.59], [27.0, 31.53], [32.0, 31.62], [33.0, 51.58], [56.0, 116.85], [118.0, 119.47], [122.0, 132.02], [133.0, 133.32], [134.0, 139.04], [139.0, 142.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 52.8, 0.0, 38.05, 0.0, 0.0, 45.05, 0.0, 96.42, 32.56], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["hum", 46.7], ["mains hum", 25.57], ["music", 6.37]], null, null, [["smash, crash", 27.1], ["breaking", 23.68], ["speech", 6.39]], null, null, [["clang", 19.88], ["speech", 10.74], ["ding", 8.12]]], "duration": [0.44, 1.69, 0.55, 1.98, 0.59, 4.53, -0.38, 18.58, 60.85, 1.47, 10.02, 0.32, 5.04, 3.4]} \ No newline at end of file diff --git a/annotations_filtered/trxN4ftuxKQ_filtered.json b/annotations_filtered/trxN4ftuxKQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..494daad03d5f47c6650d1142904dbd083295ed23 --- /dev/null +++ b/annotations_filtered/trxN4ftuxKQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.79], [16.0, 17.69], [24.0, 25.29], [27.0, 27.48], [29.0, 30.38], [54.0, 57.64], [92.0, 95.54], [99.0, 100.2], [102.0, 103.98], [105.0, 107.5], [110.0, 132.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.96, 81.0, 0.0, 0.0, 99.65, 97.54], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [0.79, 1.69, 1.29, 0.48, 1.38, 3.64, 3.54, 1.2, 1.98, 2.5, 22.61]} \ No newline at end of file diff --git a/annotations_filtered/ts4gt7f_rek_filtered.json b/annotations_filtered/ts4gt7f_rek_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a56047e3293d6ec303a6e939852b548e0d2ab5e4 --- /dev/null +++ b/annotations_filtered/ts4gt7f_rek_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.05], [9.0, 9.34], [10.0, 12.46], [17.0, 17.47], [18.0, 18.52], [22.0, 24.66], [40.0, 40.74], [46.0, 50.18], [54.0, 55.49], [59.0, 59.44], [63.0, 67.56], [73.0, 73.85], [81.0, 85.35], [91.0, 91.88], [93.0, 95.66], [100.0, 102.66], [104.0, 104.09], [104.0, 106.34], [110.0, 110.62], [112.0, 112.29], [113.0, 113.64], [116.0, 124.31], [125.0, 125.46], [127.0, 128.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 74.44, 0.0, 0.0, 92.97, 0.0, 98.01, 0.0, 0.0, 52.39, 0.0, 71.57, 0.0, 81.53, 82.07, 0.0, 75.55, 0.0, 0.0, 0.0, 57.97, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.05, 0.34, 2.46, 0.47, 0.52, 2.66, 0.74, 4.18, 1.49, 0.44, 4.56, 0.85, 4.35, 0.88, 2.66, 2.66, 0.09, 2.34, 0.62, 0.29, 0.64, 8.31, 0.46, 1.09]} \ No newline at end of file diff --git a/annotations_filtered/tsIYleoAQpY_filtered.json b/annotations_filtered/tsIYleoAQpY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3dd003385573d59147b779a5476bec3395f15772 --- /dev/null +++ b/annotations_filtered/tsIYleoAQpY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 31.72], [35.0, 55.65], [57.0, 82.49], [83.0, 90.63], [93.0, 112.95], [113.0, 113.97], [115.0, 115.26]], "keep_status": [true, true, true, true, false, false, false], "silence_prob": [30.5, 28.99, 30.3, 30.87, 32.63, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 52.16], ["hum", 8.3], ["buzz", 7.06]], [["hum", 22.4], ["mains hum", 12.64], ["throbbing", 10.4]], [["explosion", 46.09], ["speech", 6.86], ["burst, pop", 6.53]], [["clang", 32.59], ["ding", 26.8], ["speech", 7.39]], [["music", 49.65], ["synthesizer", 20.99], ["electronic music", 4.21]], null, null], "duration": [12.72, 20.65, 25.49, 7.63, 19.95, 0.97, 0.26]} \ No newline at end of file diff --git a/annotations_filtered/tskpXGAJMhw_filtered.json b/annotations_filtered/tskpXGAJMhw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e71b4f04ccd22fc31b75b2805b05ff8ba43013d1 --- /dev/null +++ b/annotations_filtered/tskpXGAJMhw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.25], [6.0, 6.15], [10.0, 10.67], [12.0, 12.07], [16.0, 16.11], [17.0, 17.56], [22.0, 22.54], [29.0, 29.34], [32.0, 33.71], [35.0, 35.46], [37.0, 36.86], [50.0, 51.29], [52.0, 52.56], [66.0, 66.16], [68.0, 68.4], [71.0, 71.29], [77.0, 77.21], [79.0, 79.0], [83.0, 83.44], [87.0, 91.35], [92.0, 95.15], [100.0, 102.05], [110.0, 111.16], [116.0, 116.26], [117.0, 118.64], [122.0, 121.88], [131.0, 131.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.24, 72.01, 35.98, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["whale vocalization", 20.79], ["speech", 9.29], ["caterwaul", 4.7]], null, null, null, null, null], "duration": [0.25, 0.15, 0.67, 0.07, 0.11, 0.56, 0.54, 0.34, 1.71, 0.46, -0.14, 1.29, 0.56, 0.16, 0.4, 0.29, 0.21, 0.0, 0.44, 4.35, 3.15, 2.05, 1.16, 0.26, 1.64, -0.12, 0.43]} \ No newline at end of file diff --git a/annotations_filtered/tskuP_9J2RY_filtered.json b/annotations_filtered/tskuP_9J2RY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a87ac352480013bf21a74fb4734a626802965801 --- /dev/null +++ b/annotations_filtered/tskuP_9J2RY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.03], [12.0, 12.97], [14.0, 15.89], [18.0, 20.07], [22.0, 23.38], [24.0, 25.96], [27.0, 31.92], [35.0, 36.34], [37.0, 42.65], [43.0, 44.74], [47.0, 48.27], [60.0, 60.37], [62.0, 63.17], [72.0, 71.79], [78.0, 86.0], [88.0, 89.82], [103.0, 105.92], [107.0, 107.91], [110.0, 110.44], [115.0, 116.29], [122.0, 134.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [73.21, 0.0, 0.0, 48.95, 0.0, 0.0, 73.82, 0.0, 94.37, 0.0, 0.0, 0.0, 0.0, 0.0, 93.6, 0.0, 67.51, 0.0, 0.0, 0.0, 62.47], "audiomae_on_audioset": [null, null, null, [["speech", 64.06], ["hum", 5.04], ["music", 4.1]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.03, 0.97, 1.89, 2.07, 1.38, 1.96, 4.92, 1.34, 5.65, 1.74, 1.27, 0.37, 1.17, -0.21, 8.0, 1.82, 2.92, 0.91, 0.44, 1.29, 12.03]} \ No newline at end of file diff --git a/annotations_filtered/ttEZ7b4Cf9w_filtered.json b/annotations_filtered/ttEZ7b4Cf9w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c182c3d7f3ebfd39ab4129a052b6b7d53df81c6 --- /dev/null +++ b/annotations_filtered/ttEZ7b4Cf9w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 38.15], [39.0, 43.5], [44.0, 45.47], [46.0, 50.63], [52.0, 55.71], [57.0, 58.06], [58.0, 58.92], [60.0, 61.91], [64.0, 114.74], [118.0, 160.91], [168.0, 168.62]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 43.98, 0.0, 46.97, 51.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 30.72], ["hum", 24.75], ["gong", 11.56]], null, [["speech", 53.22], ["music", 25.2], ["hum", 1.91]], null, null, null, null, null, null, null], "duration": [0.15, 4.5, 1.47, 4.63, 3.71, 1.06, 0.92, 1.91, 50.74, 42.91, 0.62]} \ No newline at end of file diff --git a/annotations_filtered/ttIN2nLcy6s_filtered.json b/annotations_filtered/ttIN2nLcy6s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e76537c833db183974dd13801ea6a1f21ceea264 --- /dev/null +++ b/annotations_filtered/ttIN2nLcy6s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.0], [2.0, 2.89], [6.0, 7.42], [8.0, 17.29], [31.0, 38.7], [40.0, 41.25], [43.0, 50.13], [51.0, 53.08], [56.0, 58.77], [59.0, 59.0], [59.0, 60.22], [62.0, 71.78], [73.0, 89.24], [90.0, 91.3], [92.0, 95.05], [104.0, 104.28], [105.0, 105.63], [106.0, 106.57], [115.0, 116.23], [117.0, 118.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 94.66, 94.52, 0.0, 97.73, 98.27, 99.59, 0.0, 0.0, 39.98, 30.53, 0.0, 54.9, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["hum", 53.32], ["throbbing", 29.01], ["mains hum", 7.95]], [["music", 50.39], ["whip", 5.99], ["crowd", 5.27]], null, null, null, null, null, null, null], "duration": [0.0, 0.89, 1.42, 9.29, 7.7, 1.25, 7.13, 2.08, 2.77, 0.0, 1.22, 9.78, 16.24, 1.3, 3.05, 0.28, 0.63, 0.57, 1.23, 1.25]} \ No newline at end of file diff --git a/annotations_filtered/ttOuvmYYeps_filtered.json b/annotations_filtered/ttOuvmYYeps_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09428c86e6ad795942c7429b013a039b83ac5a1a --- /dev/null +++ b/annotations_filtered/ttOuvmYYeps_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.24], [9.0, 9.32], [11.0, 11.72], [15.0, 15.2], [47.0, 48.39], [61.0, 61.43], [72.0, 71.76], [74.0, 74.71], [75.0, 76.71], [80.0, 79.96], [84.0, 84.97], [86.0, 86.22], [92.0, 92.47], [94.0, 94.1], [95.0, 94.8], [105.0, 105.73], [113.0, 114.13], [120.0, 123.16], [123.0, 123.5], [124.0, 123.55], [124.0, 123.79], [129.0, 129.14], [146.0, 147.58], [156.0, 156.95], [158.0, 158.46], [171.0, 172.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 72.21], ["speech", 4.87], ["sampler", 2.56]], null, null, null, null, null, null, null, null], "duration": [1.24, 0.32, 0.72, 0.2, 1.39, 0.43, -0.24, 0.71, 1.71, -0.04, 0.97, 0.22, 0.47, 0.1, -0.2, 0.73, 1.13, 3.16, 0.5, -0.45, -0.21, 0.14, 1.58, 0.95, 0.46, 1.02]} \ No newline at end of file diff --git a/annotations_filtered/ttTyXqwsP0o_filtered.json b/annotations_filtered/ttTyXqwsP0o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..294721e6a85234f34825e488fa7b0457a3e0b1a4 --- /dev/null +++ b/annotations_filtered/ttTyXqwsP0o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.04], [9.0, 9.37], [12.0, 11.87], [15.0, 15.5], [17.0, 17.31], [19.0, 23.04], [26.0, 29.94], [31.0, 32.12], [34.0, 34.67], [43.0, 50.58], [52.0, 52.22], [54.0, 54.45], [59.0, 59.64], [62.0, 62.8], [66.0, 66.38], [67.0, 68.49], [70.0, 73.55], [74.0, 75.05], [76.0, 76.5], [78.0, 81.75], [84.0, 85.38], [88.0, 93.8], [95.0, 96.48], [99.0, 100.84], [103.0, 104.19], [106.0, 106.88], [111.0, 112.14]], "keep_status": [false, false, false, false, false, true, true, false, false, true, false, false, false, false, false, false, true, false, false, true, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 32.13, 30.33, 0.0, 0.0, 31.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.29, 0.0, 0.0, 34.36, 0.0, 31.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["cattle, bovinae", 19.17], ["speech", 16.77], ["moo", 11.83]], [["hum", 11.04], ["music", 5.95], ["cacophony", 4.42]], null, null, [["noise", 21.7], ["buzz", 12.21], ["vehicle", 10.39]], null, null, null, null, null, null, [["noise", 17.78], ["music", 12.35], ["white noise", 6.55]], null, null, [["speech", 41.07], ["horse", 5.66], ["radio", 5.49]], null, [["vehicle", 17.54], ["fly, housefly", 14.49], ["buzz", 8.98]], null, null, null, null, null], "duration": [1.04, 0.37, -0.13, 0.5, 0.31, 4.04, 3.94, 1.12, 0.67, 7.58, 0.22, 0.45, 0.64, 0.8, 0.38, 1.49, 3.55, 1.05, 0.5, 3.75, 1.38, 5.8, 1.48, 1.84, 1.19, 0.88, 1.14]} \ No newline at end of file diff --git a/annotations_filtered/ttU5gs0lj38_filtered.json b/annotations_filtered/ttU5gs0lj38_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..69f17400717c4e8ad253908747896d681ef5fce4 --- /dev/null +++ b/annotations_filtered/ttU5gs0lj38_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.63], [15.0, 15.28], [15.0, 30.6], [32.0, 32.41], [35.0, 35.77], [39.0, 41.3], [41.0, 45.62], [49.0, 59.36], [60.0, 77.87], [78.0, 84.6], [86.0, 86.91], [88.0, 88.89], [89.0, 114.91], [115.0, 115.65], [116.0, 117.07], [118.0, 123.77], [125.0, 140.63], [146.0, 146.2]], "keep_status": [false, false, false, false, false, true, true, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.1, 0.0, 0.0, 31.63, 29.59, 32.78, 30.87, 32.05, 0.0, 0.0, 34.21, 0.0, 0.0, 37.84, 30.64, 0.0], "audiomae_on_audioset": [null, null, [["speech", 53.18], ["music", 25.34], ["buzz", 4.29]], null, null, [["music", 19.45], ["hum", 17.87], ["throbbing", 10.02]], [["music", 46.88], ["theremin", 6.23], ["speech", 5.31]], [["music", 18.0], ["buzz", 10.75], ["mains hum", 9.13]], [["music", 28.78], ["speech", 7.96], ["animal", 7.38]], [["speech", 59.1], ["hum", 5.73], ["vehicle", 5.31]], null, null, [["music", 36.85], ["speech", 24.45], ["hum", 10.29]], null, null, [["electric shaver, electric razor", 78.1], ["hum", 5.7], ["mains hum", 4.17]], [["speech", 68.11], ["music", 8.37], ["sidetone", 5.93]], null], "duration": [0.63, 0.28, 15.6, 0.41, 0.77, 2.3, 4.62, 10.36, 17.87, 6.6, 0.91, 0.89, 25.91, 0.65, 1.07, 5.77, 15.63, 0.2]} \ No newline at end of file diff --git a/annotations_filtered/ttiEgVcV-Xo_filtered.json b/annotations_filtered/ttiEgVcV-Xo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..264a3edfc8dbf9842097d5962688eb2d56d5de54 --- /dev/null +++ b/annotations_filtered/ttiEgVcV-Xo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 35.8], [37.0, 39.16], [44.0, 44.86], [52.0, 54.45], [57.0, 63.07], [64.0, 64.54], [66.0, 65.99], [67.0, 74.09], [77.0, 77.23], [78.0, 80.4], [81.0, 83.54], [84.0, 90.58], [92.0, 101.66], [102.0, 110.81], [111.0, 113.83], [115.0, 121.93], [124.0, 124.9], [127.0, 130.2], [130.0, 133.39], [135.0, 136.56], [138.0, 139.18], [141.0, 153.59], [155.0, 158.03], [158.0, 160.74], [161.0, 164.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 48.06, 0.0, 96.17, 99.87, 0.0, 0.0, 36.26, 0.0, 98.73, 90.95, 91.13, 99.21, 85.54, 66.76, 68.67, 0.0, 64.18, 44.72, 0.0, 0.0, 92.97, 99.48, 94.22, 62.58], "audiomae_on_audioset": [null, [["hum", 66.13], ["mains hum", 30.83], ["speech", 0.62]], null, null, null, null, null, [["thunk", 63.3], ["speech", 31.27], ["thump, thud", 2.78]], null, null, null, null, null, null, null, null, null, null, [["speech", 49.38], ["music", 24.22], ["singing bowl", 4.11]], null, null, null, null, null, null], "duration": [30.8, 2.16, 0.86, 2.45, 6.07, 0.54, -0.01, 7.09, 0.23, 2.4, 2.54, 6.58, 9.66, 8.81, 2.83, 6.93, 0.9, 3.2, 3.39, 1.56, 1.18, 12.59, 3.03, 2.74, 3.13]} \ No newline at end of file diff --git a/annotations_filtered/tu-cxDG2mW8_filtered.json b/annotations_filtered/tu-cxDG2mW8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0ff65ed011dd6d0662b62551bc4f60ba438f9be2 --- /dev/null +++ b/annotations_filtered/tu-cxDG2mW8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.24], [16.0, 67.14], [68.0, 70.26], [71.0, 74.24]], "keep_status": [true, false, false, false], "silence_prob": [38.82, 0.0, 99.62, 99.96], "audiomae_on_audioset": [[["music", 45.32], ["foghorn", 11.64], ["vehicle", 4.15]], null, null, null], "duration": [4.24, 51.14, 2.26, 3.24]} \ No newline at end of file diff --git a/annotations_filtered/tu0NflL0_9c_filtered.json b/annotations_filtered/tu0NflL0_9c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3947f07ebb47826d8ee411384b78f4460084e95c --- /dev/null +++ b/annotations_filtered/tu0NflL0_9c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.7], [8.0, 9.46], [13.0, 13.19], [15.0, 17.39], [22.0, 22.49], [24.0, 24.53], [33.0, 33.79], [39.0, 39.33], [42.0, 43.38], [46.0, 46.36], [48.0, 50.31], [58.0, 61.69], [66.0, 67.56], [69.0, 68.86], [72.0, 72.69], [74.0, 75.54], [80.0, 82.98], [88.0, 90.17], [93.0, 96.82], [98.0, 101.22], [109.0, 113.02], [118.0, 118.47], [120.0, 120.18], [120.0, 120.72], [124.0, 125.15], [126.0, 127.52], [129.0, 129.46], [131.0, 130.76], [132.0, 133.46], [134.0, 136.44], [138.0, 140.93], [145.0, 145.32], [148.0, 155.26], [156.0, 156.64], [157.0, 158.08], [159.0, 158.95], [160.0, 160.79], [163.0, 164.3], [166.0, 165.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 88.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.21, 99.91, 0.0, 0.0, 0.0, 0.0, 98.8, 68.02, 54.23, 99.76, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.19, 99.4, 0.0, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.3, 1.46, 0.19, 2.39, 0.49, 0.53, 0.79, 0.33, 1.38, 0.36, 2.31, 3.69, 1.56, -0.14, 0.69, 1.54, 2.98, 2.17, 3.82, 3.22, 4.02, 0.47, 0.18, 0.72, 1.15, 1.52, 0.46, -0.24, 1.46, 2.44, 2.93, 0.32, 7.26, 0.64, 1.08, -0.05, 0.79, 1.3, -0.3]} \ No newline at end of file diff --git a/annotations_filtered/tu6FDI4JBDY_filtered.json b/annotations_filtered/tu6FDI4JBDY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a379b64ddf3e72e3ac0d70b4338cf21a97ed85de --- /dev/null +++ b/annotations_filtered/tu6FDI4JBDY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.61], [23.0, 25.51], [27.0, 26.82], [27.0, 35.01], [42.0, 43.7], [44.0, 43.73], [46.0, 56.57], [61.0, 66.46], [68.0, 73.18], [73.0, 74.19], [86.0, 87.34], [89.0, 90.05], [94.0, 94.47], [99.0, 102.68]], "keep_status": [false, true, false, true, false, false, false, true, true, false, false, false, false, true], "silence_prob": [0.0, 30.16, 0.0, 28.97, 0.0, 0.0, 29.29, 29.76, 29.66, 0.0, 0.0, 0.0, 0.0, 31.3], "audiomae_on_audioset": [null, [["throbbing", 24.17], ["hum", 11.64], ["rumble", 11.03]], null, [["music", 27.34], ["hum", 17.71], ["breaking", 9.67]], null, null, [["speech", 39.87], ["music", 32.61], ["smash, crash", 5.89]], [["rumble", 20.91], ["music", 14.44], ["foghorn", 13.14]], [["music", 25.93], ["whack, thwack", 23.6], ["fly, housefly", 7.02]], null, null, null, null, [["speech", 39.53], ["music", 9.43], ["vehicle", 9.11]]], "duration": [0.61, 2.51, -0.18, 8.01, 1.7, -0.27, 10.57, 5.46, 5.18, 1.19, 1.34, 1.05, 0.47, 3.68]} \ No newline at end of file diff --git a/annotations_filtered/tuXSqMrfVW8_filtered.json b/annotations_filtered/tuXSqMrfVW8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4da216c2b930b0e887a90ffe8f5e6d5c8021cfb3 --- /dev/null +++ b/annotations_filtered/tuXSqMrfVW8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[101.0, 110.42], [111.0, 117.22]], "keep_status": [true, false], "silence_prob": [42.84, 40.73], "audiomae_on_audioset": [[["music", 44.81], ["speech", 6.76], ["buzz", 4.76]], [["music", 54.02], ["grunt", 17.96], ["speech", 3.36]]], "duration": [9.42, 6.22]} \ No newline at end of file diff --git a/annotations_filtered/tuusFUTcCO8_filtered.json b/annotations_filtered/tuusFUTcCO8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b2c811b4d713bd0d49d5b181cf174cad154853f --- /dev/null +++ b/annotations_filtered/tuusFUTcCO8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.18], [12.0, 13.09], [14.0, 15.63], [20.0, 24.22], [44.0, 45.3], [46.0, 47.46], [48.0, 49.47], [58.0, 74.43], [74.0, 74.95], [76.0, 83.83], [89.0, 89.85], [101.0, 101.12], [102.0, 106.79], [126.0, 126.79]], "keep_status": [true, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [33.38, 0.0, 0.0, 33.34, 0.0, 0.0, 0.0, 31.32, 0.0, 30.83, 0.0, 0.0, 33.77, 0.0], "audiomae_on_audioset": [[["speech", 33.62], ["music", 12.41], ["hum", 10.79]], null, null, [["speech", 49.05], ["throbbing", 16.25], ["hum", 6.09]], null, null, null, [["speech", 39.3], ["hum", 20.13], ["mains hum", 15.88]], null, [["sidetone", 30.03], ["speech", 26.05], ["music", 10.67]], null, null, [["didgeridoo", 55.97], ["music", 29.07], ["speech", 5.9]], null], "duration": [2.18, 1.09, 1.63, 4.22, 1.3, 1.46, 1.47, 16.43, 0.95, 7.83, 0.85, 0.12, 4.79, 0.79]} \ No newline at end of file diff --git a/annotations_filtered/tv25UVPcgxY_filtered.json b/annotations_filtered/tv25UVPcgxY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..323be25a2e95a9a36e118e0a47f49f82ca99e333 --- /dev/null +++ b/annotations_filtered/tv25UVPcgxY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.61], [10.0, 11.16], [12.0, 12.97], [14.0, 15.4], [17.0, 17.24], [19.0, 23.65], [27.0, 26.82], [28.0, 32.1], [33.0, 34.26], [35.0, 36.41], [37.0, 37.96], [41.0, 41.59], [47.0, 48.2], [50.0, 50.79], [52.0, 52.84], [55.0, 55.05], [56.0, 58.38], [59.0, 60.32], [61.0, 61.45], [63.0, 72.15], [73.0, 91.57], [103.0, 111.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 99.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.31, 0.0, 0.0, 99.92, 100.0, 91.47], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.61, 1.16, 0.97, 1.4, 0.24, 4.65, -0.18, 4.1, 1.26, 1.41, 0.96, 0.59, 1.2, 0.79, 0.84, 0.05, 2.38, 1.32, 0.45, 9.15, 18.57, 8.32]} \ No newline at end of file diff --git a/annotations_filtered/tvCjr63AgtM_filtered.json b/annotations_filtered/tvCjr63AgtM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e57b212fe15c734792fb206be09ce8acd842e1fb --- /dev/null +++ b/annotations_filtered/tvCjr63AgtM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.81], [7.0, 8.65], [18.0, 18.79], [24.0, 23.84], [36.0, 35.87], [43.0, 43.43], [45.0, 46.23], [48.0, 48.49], [55.0, 55.44], [56.0, 59.48], [61.0, 62.41], [64.0, 70.44], [72.0, 74.73], [78.0, 78.39], [82.0, 82.83], [83.0, 84.45], [85.0, 88.48], [91.0, 92.89], [95.0, 95.2], [96.0, 100.23], [101.0, 102.93], [104.0, 104.89], [107.0, 107.6], [108.0, 108.23], [109.0, 109.41], [121.0, 121.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.59, 0.0, 99.95, 84.98, 0.0, 0.0, 0.0, 98.66, 0.0, 0.0, 96.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.81, 1.65, 0.79, -0.16, -0.13, 0.43, 1.23, 0.49, 0.44, 3.48, 1.41, 6.44, 2.73, 0.39, 0.83, 1.45, 3.48, 1.89, 0.2, 4.23, 1.93, 0.89, 0.6, 0.23, 0.41, 0.85]} \ No newline at end of file diff --git a/annotations_filtered/tvGHSvfnlsQ_filtered.json b/annotations_filtered/tvGHSvfnlsQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..93af513ac86996e6302f6c1a8eef02e9b966555c --- /dev/null +++ b/annotations_filtered/tvGHSvfnlsQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.77], [11.0, 18.1], [20.0, 21.57], [23.0, 23.68], [27.0, 27.41], [29.0, 30.55], [34.0, 34.84], [36.0, 38.11], [42.0, 45.37], [46.0, 47.14], [48.0, 51.51], [53.0, 62.68], [64.0, 113.24], [115.0, 115.65], [123.0, 126.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 97.54, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 100.0, 50.66, 0.0, 0.0, 96.54], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.77, 7.1, 1.57, 0.68, 0.41, 1.55, 0.84, 2.11, 3.37, 1.14, 3.51, 9.68, 49.24, 0.65, 3.0]} \ No newline at end of file diff --git a/annotations_filtered/tvIE50OJfxM_filtered.json b/annotations_filtered/tvIE50OJfxM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02d70f87a4f5c258969fe4cc6ebba788e4b48d5b --- /dev/null +++ b/annotations_filtered/tvIE50OJfxM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.98], [14.0, 14.15], [15.0, 24.93], [26.0, 29.12], [30.0, 33.0], [48.0, 48.22], [52.0, 78.17], [78.0, 85.21], [87.0, 92.4], [93.0, 104.92], [106.0, 109.0], [110.0, 111.37], [112.0, 113.76], [115.0, 116.9], [118.0, 118.22], [123.0, 123.58], [127.0, 128.9]], "keep_status": [false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 43.93, 36.76, 51.07, 0.0, 53.59, 80.82, 93.91, 92.48, 98.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 31.4], ["hum", 18.6], ["ambient music", 10.16]], [["music", 35.4], ["sidetone", 16.83], ["throbbing", 5.65]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.98, 0.15, 9.93, 3.12, 3.0, 0.22, 26.17, 7.21, 5.4, 11.92, 3.0, 1.37, 1.76, 1.9, 0.22, 0.58, 1.9]} \ No newline at end of file diff --git a/annotations_filtered/tvKzyYy6qvY_filtered.json b/annotations_filtered/tvKzyYy6qvY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d56b08a1e805f7aec1580a836db679422b19ab8 --- /dev/null +++ b/annotations_filtered/tvKzyYy6qvY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.43], [13.0, 13.83], [15.0, 18.99], [23.0, 23.38], [25.0, 25.64], [28.0, 33.37], [40.0, 40.59], [53.0, 54.35], [56.0, 56.29], [59.0, 60.98], [62.0, 62.9], [65.0, 65.37], [70.0, 72.06], [72.0, 72.12], [73.0, 73.55], [75.0, 78.24], [80.0, 80.99], [82.0, 82.36], [82.0, 82.66], [85.0, 86.24], [88.0, 90.17], [94.0, 94.1], [96.0, 96.92], [99.0, 100.23], [103.0, 104.13], [106.0, 107.1]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 45.78, 0.0, 0.0, 55.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.81, 0.0, 0.0, 31.22, 0.0, 0.0, 0.0, 0.0, 36.28, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 28.86], ["speech", 9.79], ["cello", 9.12]], null, null, null, null, null, null, null, null, null, [["music", 43.96], ["theremin", 7.69], ["foghorn", 5.67]], null, null, [["music", 29.26], ["speech", 18.95], ["theremin", 9.56]], null, null, null, null, [["music", 63.27], ["ambient music", 2.33], ["musical instrument", 2.2]], null, null, null, null, null], "duration": [1.43, 0.83, 3.99, 0.38, 0.64, 5.37, 0.59, 1.35, 0.29, 1.98, 0.9, 0.37, 2.06, 0.12, 0.55, 3.24, 0.99, 0.36, 0.66, 1.24, 2.17, 0.1, 0.92, 1.23, 1.13, 1.1]} \ No newline at end of file diff --git a/annotations_filtered/tv_xMisf9oc_filtered.json b/annotations_filtered/tv_xMisf9oc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a0aaaa07762ab0f162420fe465420af8d2222ce7 --- /dev/null +++ b/annotations_filtered/tv_xMisf9oc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 61.62], [67.0, 66.85], [70.0, 71.12], [73.0, 73.68], [77.0, 77.5], [78.0, 79.79], [88.0, 87.99], [90.0, 90.58], [93.0, 92.87], [95.0, 95.5], [100.0, 101.55], [104.0, 104.9], [109.0, 108.94], [111.0, 113.31], [114.0, 116.68], [118.0, 119.62], [123.0, 128.22], [135.0, 135.24], [138.0, 138.67], [143.0, 143.8], [146.0, 148.95], [150.0, 151.68], [153.0, 156.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.73, 59.15, 0.0, 40.92, 0.0, 0.0, 0.0, 35.55, 0.0, 93.29], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.18], ["speech", 29.84], ["electronic music", 5.21]], null, null, [["speech", 21.32], ["music", 17.41], ["hum", 7.87]], null, null, null, [["music", 65.04], ["electronic music", 3.51], ["gong", 3.21]], null, null], "duration": [55.62, -0.15, 1.12, 0.68, 0.5, 1.79, -0.01, 0.58, -0.13, 0.5, 1.55, 0.9, -0.06, 2.31, 2.68, 1.62, 5.22, 0.24, 0.67, 0.8, 2.95, 1.68, 3.19]} \ No newline at end of file diff --git a/annotations_filtered/tvj61hwINaE_filtered.json b/annotations_filtered/tvj61hwINaE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4b7c102509aeba42514bcdbd252e28c786658c5e --- /dev/null +++ b/annotations_filtered/tvj61hwINaE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 45.0], [47.0, 62.6], [63.0, 64.18], [65.0, 124.65], [125.0, 126.49], [127.0, 129.14], [135.0, 135.18], [139.0, 138.97], [140.0, 141.25], [142.0, 149.72], [151.0, 151.63], [154.0, 159.04]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 29.46, 0.0, 0.0, 0.0, 34.15, 0.0, 0.0, 0.0, 35.88, 0.0, 36.46], "audiomae_on_audioset": [null, [["music", 61.19], ["speech", 8.13], ["grunt", 3.61]], null, null, null, [["music", 22.33], ["hum", 14.42], ["mains hum", 8.75]], null, null, null, [["music", 28.26], ["hum", 27.21], ["throbbing", 17.98]], null, [["music", 35.1], ["brass instrument", 4.72], ["hum", 2.77]]], "duration": [34.0, 15.6, 1.18, 59.65, 1.49, 2.14, 0.18, -0.03, 1.25, 7.72, 0.63, 5.04]} \ No newline at end of file diff --git a/annotations_filtered/tvxjJd08MMc_filtered.json b/annotations_filtered/tvxjJd08MMc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ffe76d041c9ca51c77699eee4462373853a8751 --- /dev/null +++ b/annotations_filtered/tvxjJd08MMc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 43.28], [47.0, 63.69], [65.0, 65.35], [67.0, 86.36], [87.0, 96.21], [97.0, 105.19], [107.0, 106.95], [107.0, 118.13], [122.0, 122.57], [126.0, 127.13]], "keep_status": [true, false, false, false, false, true, false, true, false, false], "silence_prob": [34.41, 33.06, 0.0, 33.87, 36.2, 43.15, 0.0, 47.23, 0.0, 0.0], "audiomae_on_audioset": [[["music", 51.18], ["brass instrument", 8.31], ["wind instrument, woodwind instrument", 4.7]], [["music", 67.02], ["brass instrument", 2.92], ["hum", 2.7]], null, [["music", 48.12], ["theremin", 18.99], ["clarinet", 6.29]], [["music", 63.23], ["theremin", 6.45], ["wind instrument, woodwind instrument", 5.8]], [["music", 53.33], ["fart", 5.64], ["didgeridoo", 4.29]], null, [["speech", 35.53], ["wail, moan", 8.95], ["beatboxing", 7.89]], null, null], "duration": [15.28, 16.69, 0.35, 19.36, 9.21, 8.19, -0.05, 11.13, 0.57, 1.13]} \ No newline at end of file diff --git a/annotations_filtered/tvy0nfXbStY_filtered.json b/annotations_filtered/tvy0nfXbStY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..086465562549405248b7d03b14b97bfe60fb095f --- /dev/null +++ b/annotations_filtered/tvy0nfXbStY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.03], [7.0, 7.67], [9.0, 9.64], [14.0, 13.91], [16.0, 15.97], [16.0, 16.71], [72.0, 72.32], [73.0, 73.31], [74.0, 74.61], [76.0, 76.77], [78.0, 79.07], [84.0, 85.4], [86.0, 86.53], [89.0, 89.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.03, 0.67, 0.64, -0.09, -0.03, 0.71, 0.32, 0.31, 0.61, 0.77, 1.07, 1.4, 0.53, 0.29]} \ No newline at end of file diff --git a/annotations_filtered/tw84SFLxC_o_filtered.json b/annotations_filtered/tw84SFLxC_o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cbba6e5c04fc67b1557cd18be855c02d30644fa5 --- /dev/null +++ b/annotations_filtered/tw84SFLxC_o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 21.69], [23.0, 28.49]], "keep_status": [false, false], "silence_prob": [93.6, 90.25], "audiomae_on_audioset": [null, null], "duration": [8.69, 5.49]} \ No newline at end of file diff --git a/annotations_filtered/twkjN0xQsWw_filtered.json b/annotations_filtered/twkjN0xQsWw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..65e3e672ed9b248f86191d27bf803792db15124e --- /dev/null +++ b/annotations_filtered/twkjN0xQsWw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.99], [18.0, 20.9], [24.0, 26.25], [28.0, 44.19], [47.0, 49.44], [50.0, 56.4], [57.0, 64.57], [66.0, 72.67], [75.0, 77.75], [79.0, 79.44], [82.0, 84.47], [86.0, 88.59], [91.0, 94.29], [99.0, 100.57], [101.0, 112.38], [113.0, 117.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 95.37, 99.97, 100.0, 98.59, 99.84, 98.86, 99.87, 0.0, 99.59, 99.98, 99.44, 0.0, 97.11, 99.9], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.99, 2.9, 2.25, 16.19, 2.44, 6.4, 7.57, 6.67, 2.75, 0.44, 2.47, 2.59, 3.29, 1.57, 11.38, 4.76]} \ No newline at end of file diff --git a/annotations_filtered/txHNcE_d7ro_filtered.json b/annotations_filtered/txHNcE_d7ro_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a36de67c450a6e8b0fe2e24aa1a2e2eb78ee863 --- /dev/null +++ b/annotations_filtered/txHNcE_d7ro_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 47.85], [49.0, 100.45], [102.0, 103.23]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [44.85, 51.45, 1.23]} \ No newline at end of file diff --git a/annotations_filtered/txQcaXvbRB8_filtered.json b/annotations_filtered/txQcaXvbRB8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..327bbe699912fdc25f2a65951f865a5e4cda9f7e --- /dev/null +++ b/annotations_filtered/txQcaXvbRB8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.97], [13.0, 13.73], [14.0, 13.88], [20.0, 21.17], [22.0, 25.86], [29.0, 28.93], [33.0, 32.8], [38.0, 37.81], [40.0, 46.94], [48.0, 74.58], [77.0, 78.38], [79.0, 79.12], [82.0, 82.39], [91.0, 91.67], [101.0, 101.33], [102.0, 102.81], [108.0, 110.08], [110.0, 111.0], [111.0, 111.89], [116.0, 116.14]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.6, 0.0, 0.0, 0.0, 31.05, 30.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 35.26], ["music", 32.79], ["animal", 3.72]], null, null, null, [["music", 30.42], ["speech", 25.08], ["sidetone", 13.82]], [["music", 57.1], ["vehicle", 8.8], ["speech", 3.89]], null, null, null, null, null, null, null, null, null, null], "duration": [0.97, 0.73, -0.12, 1.17, 3.86, -0.07, -0.2, -0.19, 6.94, 26.58, 1.38, 0.12, 0.39, 0.67, 0.33, 0.81, 2.08, 1.0, 0.89, 0.14]} \ No newline at end of file diff --git a/annotations_filtered/ty68MEZQPS0_filtered.json b/annotations_filtered/ty68MEZQPS0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..605eae00a31148e60a6a0dfa6804be3c4684f2d4 --- /dev/null +++ b/annotations_filtered/ty68MEZQPS0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.01], [4.0, 4.72], [5.0, 8.07], [9.0, 9.81], [11.0, 12.73], [19.0, 19.41], [22.0, 22.94], [38.0, 39.28], [40.0, 40.95], [43.0, 43.01], [49.0, 50.16], [51.0, 51.8], [52.0, 52.62], [57.0, 57.01], [60.0, 60.98], [79.0, 79.08], [83.0, 85.56], [86.0, 87.1], [88.0, 89.16], [92.0, 92.01], [94.0, 94.53], [99.0, 100.43], [102.0, 102.49], [106.0, 107.16], [108.0, 107.91], [109.0, 109.46], [117.0, 117.12], [121.0, 121.2], [142.0, 143.21], [148.0, 148.42], [158.0, 162.28], [163.0, 163.49], [165.0, 165.33], [166.0, 166.6], [169.0, 175.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [44.34, 0.0, 31.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.58, 0.0, 0.0, 0.0, 35.4], "audiomae_on_audioset": [[["hum", 30.25], ["throbbing", 29.98], ["sidetone", 10.29]], null, [["throbbing", 31.91], ["heart sounds, heartbeat", 23.83], ["hum", 22.96]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 27.06], ["insect", 17.19], ["bee, wasp, etc.", 16.46]], null, null, null, [["speech", 22.63], ["boat, water vehicle", 7.26], ["vehicle", 6.65]]], "duration": [2.01, 0.72, 3.07, 0.81, 1.73, 0.41, 0.94, 1.28, 0.95, 0.01, 1.16, 0.8, 0.62, 0.01, 0.98, 0.08, 2.56, 1.1, 1.16, 0.01, 0.53, 1.43, 0.49, 1.16, -0.09, 0.46, 0.12, 0.2, 1.21, 0.42, 4.28, 0.49, 0.33, 0.6, 6.14]} \ No newline at end of file diff --git a/annotations_filtered/ty_jbbvZDkQ_filtered.json b/annotations_filtered/ty_jbbvZDkQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9e7e8298faf685c3a28cefeb682b1e6e3e4f17ed --- /dev/null +++ b/annotations_filtered/ty_jbbvZDkQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.93], [12.0, 12.28], [13.0, 14.0], [16.0, 17.9], [18.0, 24.63], [27.0, 28.73], [30.0, 30.75], [35.0, 36.17], [38.0, 37.99], [41.0, 48.19], [49.0, 50.52], [53.0, 56.29], [57.0, 71.44], [77.0, 77.23], [78.0, 87.59], [90.0, 90.58], [98.0, 98.52], [101.0, 102.1], [105.0, 108.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 52.56, 0.0, 0.0, 0.0, 0.0, 42.98, 0.0, 40.62, 82.61, 0.0, 54.9, 0.0, 0.0, 0.0, 40.07], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 61.43], ["radio", 11.88], ["music", 5.17]], null, [["wood", 20.61], ["hum", 13.01], ["mains hum", 11.7]], null, null, null, null, null, null, [["music", 53.51], ["didgeridoo", 4.67], ["synthesizer", 4.28]]], "duration": [-0.07, 0.28, 1.0, 1.9, 6.63, 1.73, 0.75, 1.17, -0.01, 7.19, 1.52, 3.29, 14.44, 0.23, 9.59, 0.58, 0.52, 1.1, 3.89]} \ No newline at end of file diff --git a/annotations_filtered/tyazEYlueAw_filtered.json b/annotations_filtered/tyazEYlueAw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..880ec694d84a842069ad0bd122bf84024eb69b5b --- /dev/null +++ b/annotations_filtered/tyazEYlueAw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.08], [7.0, 6.98], [8.0, 15.62], [16.0, 17.79], [19.0, 19.58], [20.0, 21.25], [23.0, 24.58], [25.0, 53.06], [54.0, 54.67], [56.0, 57.01], [62.0, 63.29], [70.0, 75.19], [77.0, 95.5], [97.0, 96.9], [100.0, 107.59], [109.0, 109.97], [113.0, 114.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 50.06, 0.0, 0.0, 0.0, 47.05, 51.88, 0.0, 63.1, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["stomach rumble", 16.58], ["rowboat, canoe, kayak", 9.38], ["boat, water vehicle", 7.8]], null, null, null, null, null], "duration": [1.08, -0.02, 7.62, 1.79, 0.58, 1.25, 1.58, 28.06, 0.67, 1.01, 1.29, 5.19, 18.5, -0.1, 7.59, 0.97, 1.34]} \ No newline at end of file diff --git a/annotations_filtered/tyyPSnHcthg_filtered.json b/annotations_filtered/tyyPSnHcthg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c7e2a0f5fb9041d7d43e36811275e2a459d22aa --- /dev/null +++ b/annotations_filtered/tyyPSnHcthg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 11.08], [14.0, 17.56], [18.0, 20.16], [21.0, 22.69], [26.0, 33.67], [36.0, 46.47], [47.0, 48.37], [51.0, 52.89], [57.0, 58.92], [61.0, 63.46], [64.0, 69.8], [72.0, 74.41], [80.0, 96.36], [97.0, 97.73], [99.0, 98.91], [105.0, 104.55], [109.0, 108.84], [110.0, 111.67], [113.0, 113.8], [115.0, 118.74], [120.0, 119.7], [123.0, 125.73], [127.0, 127.01], [133.0, 136.12], [138.0, 137.96], [139.0, 139.33], [139.0, 139.87], [150.0, 151.92], [154.0, 158.52], [159.0, 163.46], [166.0, 167.21], [168.0, 172.94], [176.0, 176.62], [178.0, 178.71], [180.0, 181.52]], "keep_status": [false, true, false, false, true, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [33.86, 30.53, 32.56, 0.0, 30.76, 30.61, 0.0, 0.0, 0.0, 33.04, 28.95, 30.84, 29.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.36, 0.0, 39.86, 0.0, 82.43, 0.0, 0.0, 0.0, 0.0, 41.6, 80.64, 0.0, 36.2, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 52.88], ["throbbing", 23.36], ["hum", 10.39]], [["music", 28.46], ["speech", 17.13], ["hum", 7.95]], [["music", 29.74], ["hum", 24.08], ["mains hum", 18.19]], null, [["music", 49.46], ["hum", 7.15], ["throbbing", 6.91]], [["music", 59.58], ["vehicle", 6.94], ["hum", 4.16]], null, null, null, [["music", 80.03], ["throbbing", 4.33], ["musical instrument", 2.46]], [["music", 35.94], ["vehicle", 14.92], ["speech", 9.55]], [["music", 73.69], ["guitar", 6.26], ["musical instrument", 4.55]], [["vehicle", 31.0], ["car", 20.07], ["music", 12.5]], null, null, null, null, null, null, null, null, [["speech", 58.85], ["music", 13.32], ["buzzer", 5.31]], null, null, null, null, null, null, [["cattle, bovinae", 46.39], ["livestock, farm animals, working animals", 27.82], ["moo", 24.07]], null, null, [["fly, housefly", 50.42], ["insect", 15.56], ["mosquito", 9.5]], null, null, null], "duration": [4.08, 3.56, 2.16, 1.69, 7.67, 10.47, 1.37, 1.89, 1.92, 2.46, 5.8, 2.41, 16.36, 0.73, -0.09, -0.45, -0.16, 1.67, 0.8, 3.74, -0.3, 2.73, 0.01, 3.12, -0.04, 0.33, 0.87, 1.92, 4.52, 4.46, 1.21, 4.94, 0.62, 0.71, 1.52]} \ No newline at end of file diff --git a/annotations_filtered/tz-XJMspLOA_filtered.json b/annotations_filtered/tz-XJMspLOA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e2eca302e6bad5143ae5cef30503628b6e3dcbf --- /dev/null +++ b/annotations_filtered/tz-XJMspLOA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.34], [10.0, 30.2], [31.0, 33.84], [36.0, 53.05], [54.0, 56.62], [58.0, 64.76], [66.0, 75.34], [76.0, 88.7], [92.0, 93.75], [95.0, 96.06], [97.0, 97.36], [98.0, 98.96], [100.0, 101.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 59.42, 80.11, 87.0, 70.02, 89.36, 95.64, 71.72, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.34, 20.2, 2.84, 17.05, 2.62, 6.76, 9.34, 12.7, 1.75, 1.06, 0.36, 0.96, 1.33]} \ No newline at end of file diff --git a/annotations_filtered/tz6dNnahwCI_filtered.json b/annotations_filtered/tz6dNnahwCI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43bbfc3a96677cce57c2e4f2e80437d57f18817e --- /dev/null +++ b/annotations_filtered/tz6dNnahwCI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.82], [16.0, 16.9], [28.0, 33.2], [35.0, 55.02], [56.0, 72.79], [75.0, 83.52], [86.0, 86.26], [89.0, 92.23], [93.0, 94.54], [96.0, 96.16], [99.0, 98.91], [101.0, 102.0], [103.0, 103.42]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 30.8, 30.99, 31.54, 36.85, 0.0, 31.18, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 56.86], ["speech", 28.98], ["sidetone", 0.94]], [["music", 66.64], ["speech", 14.61], ["skateboard", 2.28]], [["speech", 39.72], ["music", 37.28], ["synthesizer", 2.0]], [["speech", 39.9], ["music", 35.08], ["guitar", 1.71]], null, [["vehicle", 28.54], ["car", 19.61], ["race car, auto racing", 11.05]], null, null, null, null, null], "duration": [0.82, 0.9, 5.2, 20.02, 16.79, 8.52, 0.26, 3.23, 1.54, 0.16, -0.09, 1.0, 0.42]} \ No newline at end of file